emdemor committed on
Commit
7e02fb9
·
verified ·
1 Parent(s): 55fb309

Training in progress, step 2750

Browse files
Files changed (3) hide show
  1. adapter_model.safetensors +1 -1
  2. metrics.json +1 -0
  3. state.json +18 -3
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24985e82bf76520307e5bc7c5d88100c0a4c123052eefa641905271c0098c921
3
  size 35668592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13d1f7d583dfc0f47ccb619dbbe99b944e5ee767d070c60d516fdd9cbbd41a76
3
  size 35668592
metrics.json CHANGED
@@ -52,3 +52,4 @@
52
  {"Step":2600,"eval_loss":1.7732738256,"eval_runtime":29.4165,"eval_samples_per_second":3.399,"eval_steps_per_second":0.442,"epoch":2.0424194815}
53
  {"Step":2650,"eval_loss":1.7721085548,"eval_runtime":29.5171,"eval_samples_per_second":3.388,"eval_steps_per_second":0.44,"epoch":2.0816967793}
54
  {"Step":2700,"eval_loss":1.7694271803,"eval_runtime":29.9036,"eval_samples_per_second":3.344,"eval_steps_per_second":0.435,"epoch":2.120974077}
 
 
52
  {"Step":2600,"eval_loss":1.7732738256,"eval_runtime":29.4165,"eval_samples_per_second":3.399,"eval_steps_per_second":0.442,"epoch":2.0424194815}
53
  {"Step":2650,"eval_loss":1.7721085548,"eval_runtime":29.5171,"eval_samples_per_second":3.388,"eval_steps_per_second":0.44,"epoch":2.0816967793}
54
  {"Step":2700,"eval_loss":1.7694271803,"eval_runtime":29.9036,"eval_samples_per_second":3.344,"eval_steps_per_second":0.435,"epoch":2.120974077}
55
+ {"Step":2750,"eval_loss":1.7644474506,"eval_runtime":29.5003,"eval_samples_per_second":3.39,"eval_steps_per_second":0.441,"epoch":2.1602513747}
state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.1209740769835035,
5
  "eval_steps": 50,
6
- "global_step": 2700,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -802,6 +802,21 @@
802
  "eval_samples_per_second": 3.388,
803
  "eval_steps_per_second": 0.44,
804
  "step": 2650
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
805
  }
806
  ],
807
  "logging_steps": 50,
@@ -821,7 +836,7 @@
821
  "attributes": {}
822
  }
823
  },
824
- "total_flos": 3.3322595280384e+16,
825
  "train_batch_size": 8,
826
  "trial_name": null,
827
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.16025137470542,
5
  "eval_steps": 50,
6
+ "global_step": 2750,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
802
  "eval_samples_per_second": 3.388,
803
  "eval_steps_per_second": 0.44,
804
  "step": 2650
805
+ },
806
+ {
807
+ "epoch": 2.1209740769835035,
808
+ "grad_norm": 0.2122960090637207,
809
+ "learning_rate": 0.00016278731451847543,
810
+ "loss": 1.7821,
811
+ "step": 2700
812
+ },
813
+ {
814
+ "epoch": 2.1209740769835035,
815
+ "eval_loss": 1.7694271802902222,
816
+ "eval_runtime": 29.9036,
817
+ "eval_samples_per_second": 3.344,
818
+ "eval_steps_per_second": 0.435,
819
+ "step": 2700
820
  }
821
  ],
822
  "logging_steps": 50,
 
836
  "attributes": {}
837
  }
838
  },
839
+ "total_flos": 3.39324703067136e+16,
840
  "train_batch_size": 8,
841
  "trial_name": null,
842
  "trial_params": null