farmery committed on
Commit
427e12c
·
verified ·
1 Parent(s): 9c76520

Training in progress, step 18, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8e83e82304d93cfd449f178079cc3344684651d089e50e0548957df808f990a
3
  size 83115256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:610e55096f1da125f1df84825d249b8109653808909e01cd3a587d7d157523a3
3
  size 83115256
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82a4d8a52597fd98db42b5bbc8a000d2ead8caac057876ab38166359d21d1e60
3
  size 42608388
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f7735e853c7a0df3fe0dda1808c7785d5c7ad99ab57def927f2811184a9f9ac
3
  size 42608388
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5cc430eab98049d80eb0384f5c1ba23aed2937bdb5f4807726e825212bc972e3
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f2ae7796563de8707806556f3767ebfdf616adb061e5ceb7f9f970a57876ec6
3
  size 14960
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2975d7d46baeff645d2e6f0f86d7be145db90bf3fbb53a45b6e6a4d5eea42c6
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f020a27eca7ff90953e82532899c7d9cd3715cf48ee015ad662932d0be5fe643
3
  size 14960
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68c7c897b5ed1625323fa48d49e77bd6cb1241346b2e1c27d28b2edaebada7bf
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1940a318a83f821b72fa349a839b33b51f0dbfb4356182db57a54660938d1a2c
3
  size 14960
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:231ff6e08355287600ada4dab81dfdcf98a104528645cbebdaaec2f98ba021b9
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7044711c09638686dddd8afc36884335491e66001d1e4905e09e19e8021522b5
3
  size 14960
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1eca0ddb3ec890c90e8e6e7325bec40cdb8b59e4bebf5c0da8473b02809de875
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ed723721bc2dad2381ab5522e40123ba4aa738fa3e449c48809fa9c2697eb95
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.0038893690579083835,
5
  "eval_steps": 9,
6
- "global_step": 9,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -44,6 +44,35 @@
44
  "eval_samples_per_second": 117.988,
45
  "eval_steps_per_second": 3.694,
46
  "step": 9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
47
  }
48
  ],
49
  "logging_steps": 3,
@@ -63,7 +92,7 @@
63
  "attributes": {}
64
  }
65
  },
66
- "total_flos": 2.834941159984333e+16,
67
  "train_batch_size": 8,
68
  "trial_name": null,
69
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.007778738115816767,
5
  "eval_steps": 9,
6
+ "global_step": 18,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
44
  "eval_samples_per_second": 117.988,
45
  "eval_steps_per_second": 3.694,
46
  "step": 9
47
+ },
48
+ {
49
+ "epoch": 0.005185825410544511,
50
+ "grad_norm": 1.3412178754806519,
51
+ "learning_rate": 9.987820251299122e-05,
52
+ "loss": 1.829,
53
+ "step": 12
54
+ },
55
+ {
56
+ "epoch": 0.00648228176318064,
57
+ "grad_norm": 1.5588266849517822,
58
+ "learning_rate": 9.924038765061042e-05,
59
+ "loss": 1.7529,
60
+ "step": 15
61
+ },
62
+ {
63
+ "epoch": 0.007778738115816767,
64
+ "grad_norm": 1.1395800113677979,
65
+ "learning_rate": 9.806308479691595e-05,
66
+ "loss": 1.7135,
67
+ "step": 18
68
+ },
69
+ {
70
+ "epoch": 0.007778738115816767,
71
+ "eval_loss": 1.6603822708129883,
72
+ "eval_runtime": 132.0674,
73
+ "eval_samples_per_second": 118.038,
74
+ "eval_steps_per_second": 3.695,
75
+ "step": 18
76
  }
77
  ],
78
  "logging_steps": 3,
 
92
  "attributes": {}
93
  }
94
  },
95
+ "total_flos": 5.67993544254423e+16,
96
  "train_batch_size": 8,
97
  "trial_name": null,
98
  "trial_params": null