emdemor committed on
Commit
a08b281
·
verified ·
1 Parent(s): 76a0b32

Training in progress, step 2650

Browse files
Files changed (3) hide show
  1. adapter_model.safetensors +1 -1
  2. metrics.json +1 -0
  3. state.json +18 -3
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3cfdcec4d41fe4ac86ec9ec7b6c3070b8a088d9a232f715ffbe3e94cea7d4adb
3
  size 35668592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15aef3d44cc29c204e8ca0fb979a8d9bbdf4e68623bbe2b0a744edf8777264dd
3
  size 35668592
metrics.json CHANGED
@@ -50,3 +50,4 @@
50
  {"Step":2500,"eval_loss":1.7779937983,"eval_runtime":29.5562,"eval_samples_per_second":3.383,"eval_steps_per_second":0.44,"epoch":1.9638648861}
51
  {"Step":2550,"eval_loss":1.7793732882,"eval_runtime":29.5808,"eval_samples_per_second":3.381,"eval_steps_per_second":0.439,"epoch":2.0031421838}
52
  {"Step":2600,"eval_loss":1.7732738256,"eval_runtime":29.4165,"eval_samples_per_second":3.399,"eval_steps_per_second":0.442,"epoch":2.0424194815}
 
 
50
  {"Step":2500,"eval_loss":1.7779937983,"eval_runtime":29.5562,"eval_samples_per_second":3.383,"eval_steps_per_second":0.44,"epoch":1.9638648861}
51
  {"Step":2550,"eval_loss":1.7793732882,"eval_runtime":29.5808,"eval_samples_per_second":3.381,"eval_steps_per_second":0.439,"epoch":2.0031421838}
52
  {"Step":2600,"eval_loss":1.7732738256,"eval_runtime":29.4165,"eval_samples_per_second":3.399,"eval_steps_per_second":0.442,"epoch":2.0424194815}
53
+ {"Step":2650,"eval_loss":1.7721085548,"eval_runtime":29.5171,"eval_samples_per_second":3.388,"eval_steps_per_second":0.44,"epoch":2.0816967793}
state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.04241948153967,
5
  "eval_steps": 50,
6
- "global_step": 2600,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -772,6 +772,21 @@
772
  "eval_samples_per_second": 3.381,
773
  "eval_steps_per_second": 0.439,
774
  "step": 2550
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
775
  }
776
  ],
777
  "logging_steps": 50,
@@ -791,7 +806,7 @@
791
  "attributes": {}
792
  }
793
  },
794
- "total_flos": 3.208869541066752e+16,
795
  "train_batch_size": 8,
796
  "trial_name": null,
797
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.081696779261587,
5
  "eval_steps": 50,
6
+ "global_step": 2650,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
772
  "eval_samples_per_second": 3.381,
773
  "eval_steps_per_second": 0.439,
774
  "step": 2550
775
+ },
776
+ {
777
+ "epoch": 2.04241948153967,
778
+ "grad_norm": 0.2194184958934784,
779
+ "learning_rate": 0.0001773348850741926,
780
+ "loss": 1.7922,
781
+ "step": 2600
782
+ },
783
+ {
784
+ "epoch": 2.04241948153967,
785
+ "eval_loss": 1.7732738256454468,
786
+ "eval_runtime": 29.4165,
787
+ "eval_samples_per_second": 3.399,
788
+ "eval_steps_per_second": 0.442,
789
+ "step": 2600
790
  }
791
  ],
792
  "logging_steps": 50,
 
806
  "attributes": {}
807
  }
808
  },
809
+ "total_flos": 3.269355531196416e+16,
810
  "train_batch_size": 8,
811
  "trial_name": null,
812
  "trial_params": null