Spaces:

Dovakiins
/

qwerrwe

Build error

winglian committed on Apr 30, 2023

Commit

9190ada

1 Parent(s): 4dbef09

8bit and deepspeed changes

Files changed (2) hide show

ds_config.json CHANGED Viewed

@@ -20,10 +20,12 @@
     }
   },
   "scheduler": {
-    "type": "OneCycle",
     "params": {
-      "cycle_min_lr": 1e-7,
-      "cycle_max_lr": 1e-4
     }
   },
   "zero_optimization": {

     }
   },
   "scheduler": {
+    "type": "WarmupDecayLR",
     "params": {
+      "warmup_min_lr": "auto",
+      "warmup_max_lr": "auto",
+      "warmup_num_steps": "auto",
+      "total_num_steps": "auto"
     }
   },
   "zero_optimization": {

src/axolotl/utils/models.py CHANGED Viewed

@@ -101,19 +101,12 @@ def load_model(
             )
             load_in_8bit = False
         elif is_llama_derived_model and "LlamaForCausalLM" in globals():
-            if not cfg.load_in_8bit:
-                model = LlamaForCausalLM.from_pretrained(
-                    base_model,
-                    device_map=cfg.device_map,
-                )
-            else:
-                model = LlamaForCausalLM.from_pretrained(
-                    base_model,
-                    load_in_8bit=cfg.load_in_8bit and cfg.adapter is not None,
-                    torch_dtype=torch_dtype,
-                    device_map=cfg.device_map,
-                )
         elif model_type:
             model = getattr(transformers, model_type).from_pretrained(
                 base_model,

             )
             load_in_8bit = False
         elif is_llama_derived_model and "LlamaForCausalLM" in globals():
+            model = LlamaForCausalLM.from_pretrained(
+                base_model,
+                load_in_8bit=cfg.load_in_8bit and cfg.adapter is not None,
+                torch_dtype=torch_dtype,
+                device_map=cfg.device_map,
+            )
         elif model_type:
             model = getattr(transformers, model_type).from_pretrained(
                 base_model,