Nam Nguyen committed on
Commit
9522763
·
verified ·
1 Parent(s): 3dea10e

Update handler.py

Browse files
Files changed (1) hide show
  1. handler.py +7 -1
handler.py CHANGED
@@ -36,6 +36,12 @@ class EndpointHandler:
36
  ).to("cuda")
37
 
38
  with torch.backends.cuda.sdp_kernel(enable_flash=True, enable_math=False, enable_mem_efficient=False):
39
- outputs = self.model.generate(**inputs)
 
 
 
 
 
 
40
 
41
  return self.tokenizer.decode(outputs[0], skip_special_tokens=True)
 
36
  ).to("cuda")
37
 
38
  with torch.backends.cuda.sdp_kernel(enable_flash=True, enable_math=False, enable_mem_efficient=False):
39
+ outputs = self.model.generate(
40
+ input_ids=inputs,
41
+ max_new_tokens=64,
42
+ use_cache=True,
43
+ temperature=1.5,
44
+ min_p=0.1,
45
+ )
46
 
47
  return self.tokenizer.decode(outputs[0], skip_special_tokens=True)