emdemor committed on
Commit
dfbd051
·
verified ·
1 Parent(s): 0697fa4

Training in progress, step 2900

Browse files
Files changed (3) hide show
  1. adapter_model.safetensors +1 -1
  2. metrics.json +1 -0
  3. state.json +18 -3
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5a441d7626d2dcc89857225abb72e5e945117611169865fb3c04a312eeb0019
3
  size 35668592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ac1e1d1c32b00d6d777fa3c34d41acfc1b48d7d6be55be71fe48d5fd32f9a52
3
  size 35668592
metrics.json CHANGED
@@ -55,3 +55,4 @@
55
  {"Step":2750,"eval_loss":1.7644474506,"eval_runtime":29.5003,"eval_samples_per_second":3.39,"eval_steps_per_second":0.441,"epoch":2.1602513747}
56
  {"Step":2800,"eval_loss":1.76300776,"eval_runtime":29.3837,"eval_samples_per_second":3.403,"eval_steps_per_second":0.442,"epoch":2.1995286724}
57
  {"Step":2850,"eval_loss":1.760255456,"eval_runtime":29.4586,"eval_samples_per_second":3.395,"eval_steps_per_second":0.441,"epoch":2.2388059701}
 
 
55
  {"Step":2750,"eval_loss":1.7644474506,"eval_runtime":29.5003,"eval_samples_per_second":3.39,"eval_steps_per_second":0.441,"epoch":2.1602513747}
56
  {"Step":2800,"eval_loss":1.76300776,"eval_runtime":29.3837,"eval_samples_per_second":3.403,"eval_steps_per_second":0.442,"epoch":2.1995286724}
57
  {"Step":2850,"eval_loss":1.760255456,"eval_runtime":29.4586,"eval_samples_per_second":3.395,"eval_steps_per_second":0.441,"epoch":2.2388059701}
58
+ {"Step":2900,"eval_loss":1.7579619884,"eval_runtime":29.3692,"eval_samples_per_second":3.405,"eval_steps_per_second":0.443,"epoch":2.2780832679}
state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.2388059701492535,
5
  "eval_steps": 50,
6
- "global_step": 2850,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -847,6 +847,21 @@
847
  "eval_samples_per_second": 3.403,
848
  "eval_steps_per_second": 0.442,
849
  "step": 2800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
850
  }
851
  ],
852
  "logging_steps": 50,
@@ -866,7 +881,7 @@
866
  "attributes": {}
867
  }
868
  },
869
- "total_flos": 3.518249022117888e+16,
870
  "train_batch_size": 8,
871
  "trial_name": null,
872
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.27808326787117,
5
  "eval_steps": 50,
6
+ "global_step": 2900,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
847
  "eval_samples_per_second": 3.403,
848
  "eval_steps_per_second": 0.442,
849
  "step": 2800
850
+ },
851
+ {
852
+ "epoch": 2.2388059701492535,
853
+ "grad_norm": 0.2436445653438568,
854
+ "learning_rate": 0.00014096595868489962,
855
+ "loss": 1.7616,
856
+ "step": 2850
857
+ },
858
+ {
859
+ "epoch": 2.2388059701492535,
860
+ "eval_loss": 1.7602554559707642,
861
+ "eval_runtime": 29.4586,
862
+ "eval_samples_per_second": 3.395,
863
+ "eval_steps_per_second": 0.441,
864
+ "step": 2850
865
  }
866
  ],
867
  "logging_steps": 50,
 
881
  "attributes": {}
882
  }
883
  },
884
+ "total_flos": 3.581672442624e+16,
885
  "train_batch_size": 8,
886
  "trial_name": null,
887
  "trial_params": null