Nam Nguyen committed on
Commit
1eb2656
·
verified ·
1 Parent(s): 73dabdc

Update handler.py

Browse files
Files changed (1) hide show
  1. handler.py +0 -5
handler.py CHANGED
@@ -14,15 +14,10 @@ def extract_assistant_response_simple(response_text):
14
 
15
  class EndpointHandler:
16
  def __init__(self, path=""):
17
- quantization_config = BitsAndBytesConfig(
18
- load_in_4bit=True,
19
- bnb_4bit_compute_dtype=torch.float16
20
- )
21
  self.tokenizer = AutoTokenizer.from_pretrained(path)
22
  model = AutoModelForCausalLM.from_pretrained(
23
  path,
24
  torch_dtype="auto",
25
- quantization_config=quantization_config
26
  )
27
  self.model = model.to_bettertransformer()
28
 
 
14
 
15
  class EndpointHandler:
16
  def __init__(self, path=""):
 
 
 
 
17
  self.tokenizer = AutoTokenizer.from_pretrained(path)
18
  model = AutoModelForCausalLM.from_pretrained(
19
  path,
20
  torch_dtype="auto",
 
21
  )
22
  self.model = model.to_bettertransformer()
23