emdemor committed on
Commit
492d947
·
verified ·
1 Parent(s): 6d16c73

Training in progress, step 3819

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. state.json +18 -3
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4126a86cedcc673291758a54cbca8d13b3b7d163ea1261dae62eb96e248768df
3
  size 35668592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac9d1260e3eb5e3e89c1771538bf89abfcb0bf3025fd9db1d0c2d3eae71a285b
3
  size 35668592
state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.9850746268656714,
5
  "eval_steps": 50,
6
- "global_step": 3800,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1132,6 +1132,21 @@
1132
  "eval_samples_per_second": 3.396,
1133
  "eval_steps_per_second": 0.441,
1134
  "step": 3750
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1135
  }
1136
  ],
1137
  "logging_steps": 50,
@@ -1151,7 +1166,7 @@
1151
  "attributes": {}
1152
  }
1153
  },
1154
- "total_flos": 4.720338670196736e+16,
1155
  "train_batch_size": 8,
1156
  "trial_name": null,
1157
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.0,
5
  "eval_steps": 50,
6
+ "global_step": 3819,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1132
  "eval_samples_per_second": 3.396,
1133
  "eval_steps_per_second": 0.441,
1134
  "step": 3750
1135
+ },
1136
+ {
1137
+ "epoch": 2.9850746268656714,
1138
+ "grad_norm": 0.23328797519207,
1139
+ "learning_rate": 2.764038405586267e-06,
1140
+ "loss": 1.7539,
1141
+ "step": 3800
1142
+ },
1143
+ {
1144
+ "epoch": 2.9850746268656714,
1145
+ "eval_loss": 1.73746657371521,
1146
+ "eval_runtime": 29.4954,
1147
+ "eval_samples_per_second": 3.39,
1148
+ "eval_steps_per_second": 0.441,
1149
+ "step": 3800
1150
  }
1151
  ],
1152
  "logging_steps": 50,
 
1166
  "attributes": {}
1167
  }
1168
  },
1169
+ "total_flos": 4.78476511570944e+16,
1170
  "train_batch_size": 8,
1171
  "trial_name": null,
1172
  "trial_params": null