Update README.md
Browse files
README.md
CHANGED
@@ -19,7 +19,7 @@ model = HQQModelForCausalLM.from_quantized(model_id)
|
|
19 |
HQQLinear.set_backend(HQQBackend.PYTORCH_COMPILE) #Optional
|
20 |
|
21 |
#Text Generation
|
22 |
-
prompt = "<s> [INST]
|
23 |
|
24 |
inputs = tokenizer(prompt, return_tensors="pt", add_special_tokens=False)
|
25 |
outputs = model.generate(**(inputs.to('cuda')), max_new_tokens=1000)
|
|
|
19 |
HQQLinear.set_backend(HQQBackend.PYTORCH_COMPILE) #Optional
|
20 |
|
21 |
#Text Generation
|
22 |
+
prompt = "<s> [INST] How do I build a car? [/INST] "
|
23 |
|
24 |
inputs = tokenizer(prompt, return_tensors="pt", add_special_tokens=False)
|
25 |
outputs = model.generate(**(inputs.to('cuda')), max_new_tokens=1000)
|