prxy5608 committed on
Commit
88a33b6
·
verified ·
1 Parent(s): 28c21fe

Training in progress, step 151, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47d9a4a16fdc46bbc89f10c142edbc1e5936b4695667b90c838c25efe312e0c7
3
  size 671149168
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0540f2e663270d7b286adf364a4c5c89fc5048e95c951a845eed6f0ff29ea84
3
  size 671149168
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:56feeb9665ee04e9f2375c78123f291155a50d9e9fe263a4ee579e6d3373686f
3
  size 341314196
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8db9b0ba2385beafa45cd08c4cfef71f07e0c891e37249f4e660078960576ad
3
  size 341314196
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:200e1fbf02bb39ece07cfd621f3e0b4a5ed2afd2723f8d7313b94a6fd4c9bbb8
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d8fe7d9ddafff804fb27f268ff5b42d441929f36c7969d48f1e18f0898463d2
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed41efdd6283cc55a7eeb8c1b2afb10664f4494afd05738afd0d2d78da3d68f7
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f5e2b7252ed14bf7b200301efea19c6da8009c4b85d61545d95c12430694780
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.9624110460281372,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-100",
4
- "epoch": 2.9850746268656714,
5
  "eval_steps": 50,
6
- "global_step": 150,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1089,6 +1089,13 @@
1089
  "eval_samples_per_second": 13.367,
1090
  "eval_steps_per_second": 3.46,
1091
  "step": 150
 
 
 
 
 
 
 
1092
  }
1093
  ],
1094
  "logging_steps": 1,
@@ -1112,12 +1119,12 @@
1112
  "should_evaluate": false,
1113
  "should_log": false,
1114
  "should_save": true,
1115
- "should_training_stop": false
1116
  },
1117
  "attributes": {}
1118
  }
1119
  },
1120
- "total_flos": 2.262770368118784e+17,
1121
  "train_batch_size": 8,
1122
  "trial_name": null,
1123
  "trial_params": null
 
1
  {
2
  "best_metric": 0.9624110460281372,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-100",
4
+ "epoch": 3.0049751243781095,
5
  "eval_steps": 50,
6
+ "global_step": 151,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1089
  "eval_samples_per_second": 13.367,
1090
  "eval_steps_per_second": 3.46,
1091
  "step": 150
1092
+ },
1093
+ {
1094
+ "epoch": 3.0049751243781095,
1095
+ "grad_norm": 7.453361511230469,
1096
+ "learning_rate": 0.0,
1097
+ "loss": 2.4948,
1098
+ "step": 151
1099
  }
1100
  ],
1101
  "logging_steps": 1,
 
1119
  "should_evaluate": false,
1120
  "should_log": false,
1121
  "should_save": true,
1122
+ "should_training_stop": true
1123
  },
1124
  "attributes": {}
1125
  }
1126
  },
1127
+ "total_flos": 2.2778555039062426e+17,
1128
  "train_batch_size": 8,
1129
  "trial_name": null,
1130
  "trial_params": null