Spaces:

jljiu
/

nekoa

Sleeping

jljiu committed on Dec 26, 2024

Commit

201a793

verified ·

1 Parent(s): 3423340

Update train.py

Files changed (1) hide show

train.py CHANGED Viewed

@@ -14,12 +14,16 @@ class ModelTrainer:
         with open(system_prompts_path, 'r', encoding='utf-8') as f:
             self.system_prompts = json.load(f)
-        # 初始化tokenizer和model - 移除GPU相关设置
-        self.tokenizer = AutoTokenizer.from_pretrained(model_id)
         self.model = AutoModelForCausalLM.from_pretrained(
             model_id,
-            low_cpu_mem_usage=True,    # 降低内存使用
-            torch_dtype='float32'      # 使用float32而不是float16
         )
         # 使用更轻量的LoRA配置

         with open(system_prompts_path, 'r', encoding='utf-8') as f:
             self.system_prompts = json.load(f)
+        # 初始化tokenizer和model - 添加trust_remote_code=True
+        self.tokenizer = AutoTokenizer.from_pretrained(
+            model_id,
+            trust_remote_code=True  # 添加此参数
+        )
         self.model = AutoModelForCausalLM.from_pretrained(
             model_id,
+            trust_remote_code=True,  # 添加此参数
+            low_cpu_mem_usage=True,
+            torch_dtype='float32'
         )
         # 使用更轻量的LoRA配置