Nam Nguyen
committed on
Update handler.py
Browse files - handler.py +7 -1
handler.py
CHANGED
@@ -36,6 +36,12 @@ class EndpointHandler:
|
|
36 |
).to("cuda")
|
37 |
|
38 |
with torch.backends.cuda.sdp_kernel(enable_flash=True, enable_math=False, enable_mem_efficient=False):
|
39 |
-
outputs = self.model.generate(
|
|
|
|
|
|
|
|
|
|
|
|
|
40 |
|
41 |
return self.tokenizer.decode(outputs[0], skip_special_tokens=True)
|
|
|
36 |
).to("cuda")
|
37 |
|
38 |
with torch.backends.cuda.sdp_kernel(enable_flash=True, enable_math=False, enable_mem_efficient=False):
|
39 |
+
outputs = self.model.generate(
|
40 |
+
input_ids=inputs,
|
41 |
+
max_new_tokens=64,
|
42 |
+
use_cache=True,
|
43 |
+
temperature=1.5,
|
44 |
+
min_p=0.1,
|
45 |
+
)
|
46 |
|
47 |
return self.tokenizer.decode(outputs[0], skip_special_tokens=True)
|