Update README.md
README.md CHANGED
@@ -38,14 +38,12 @@ import torch
 model_name = "mistralai/Mistral-7B-Instruct-v0.3"
 peft_model_id = "date3k2/mistral-v0.3-alpaca-vi-v1"
 
-bnb_config = BitsAndBytesConfig(
-    load_in_8bit= True
-)
+bnb_config = BitsAndBytesConfig(load_in_8bit=True)
 model = AutoModelForCausalLM.from_pretrained(
-
-
-
-
+    model_name,
+    quantization_config=bnb_config,
+    device_map="auto",
+    trust_remote_code=True,
 )
 tokenizer = AutoTokenizer.from_pretrained(model_name)
 
@@ -54,9 +52,12 @@ model.load_adapter(peft_model_id)
 device = "cuda"
 
 messages = [
-    {
-
-
+    {
+        "role": "user",
+        "content": """You are a helpful Vietnamese AI chatbot. Below is an instruction that describes a task. Write a response that appropriately completes the request. Your response should be in Vietnamese.
+Instruction:
+Viết công thức để nấu một món ngon từ thịt bò.""",
+    },
 ]
 
 encodeds = tokenizer.apply_chat_template(messages, return_tensors="pt")
@@ -66,6 +67,7 @@ model_inputs = encodeds.to(device)
 generated_ids = model.generate(model_inputs, max_new_tokens=500, do_sample=True)
 decoded = tokenizer.batch_decode(generated_ids)
 print(decoded[0])
+
 ```
 
 The following hyperparameters were used during training: