Nam Nguyen
committed on
Update handler.py
Browse files - handler.py +0 -5
handler.py
CHANGED
@@ -14,15 +14,10 @@ def extract_assistant_response_simple(response_text):
|
|
14 |
|
15 |
class EndpointHandler:
|
16 |
def __init__(self, path=""):
|
17 |
-
quantization_config = BitsAndBytesConfig(
|
18 |
-
load_in_4bit=True,
|
19 |
-
bnb_4bit_compute_dtype=torch.float16
|
20 |
-
)
|
21 |
self.tokenizer = AutoTokenizer.from_pretrained(path)
|
22 |
model = AutoModelForCausalLM.from_pretrained(
|
23 |
path,
|
24 |
torch_dtype="auto",
|
25 |
-
quantization_config=quantization_config
|
26 |
)
|
27 |
self.model = model.to_bettertransformer()
|
28 |
|
|
|
14 |
|
15 |
class EndpointHandler:
|
16 |
def __init__(self, path=""):
|
|
|
|
|
|
|
|
|
17 |
self.tokenizer = AutoTokenizer.from_pretrained(path)
|
18 |
model = AutoModelForCausalLM.from_pretrained(
|
19 |
path,
|
20 |
torch_dtype="auto",
|
|
|
21 |
)
|
22 |
self.model = model.to_bettertransformer()
|
23 |
|