SystemAdmin123 commited on
Commit
d8968b4
·
verified ·
1 Parent(s): 199f020

Training in progress, step 40, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:356e77737e1ae57c572cefec580a243ff3bf580fbabb7d8184cf96c4dc8f3524
3
  size 723676832
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed1ed9d8dfa9dd55b199bc5e21c0811819d1ab75ccfaea1ddfdae9a96f62b60d
3
  size 723676832
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ceb1e871d2adeb06e378f9b3dd9f505b3cc3347052040d028a70c5698d6ed5f4
3
  size 735627290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c7997c91fa3548efba8ca037e07ebcad875744d69d906895ad8baef3f316380
3
  size 735627290
last-checkpoint/trainer_state.json CHANGED
@@ -11,53 +11,53 @@
11
  {
12
  "epoch": 0.001183431952662722,
13
  "eval_loss": 2.9618937969207764,
14
- "eval_runtime": 5.2129,
15
- "eval_samples_per_second": 288.133,
16
- "eval_steps_per_second": 18.032,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.011834319526627219,
21
  "grad_norm": 4.4375,
22
  "learning_rate": 1.6000000000000003e-05,
23
- "loss": 2.6559,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.023668639053254437,
28
  "grad_norm": 1.6328125,
29
  "learning_rate": 3.2000000000000005e-05,
30
- "loss": 2.7912,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.023668639053254437,
35
- "eval_loss": 2.9339327812194824,
36
- "eval_runtime": 5.5967,
37
- "eval_samples_per_second": 268.371,
38
- "eval_steps_per_second": 16.796,
39
  "step": 20
40
  },
41
  {
42
  "epoch": 0.03550295857988166,
43
  "grad_norm": 6.34375,
44
  "learning_rate": 4.8e-05,
45
- "loss": 2.8945,
46
  "step": 30
47
  },
48
  {
49
  "epoch": 0.047337278106508875,
50
  "grad_norm": 2.1875,
51
  "learning_rate": 6.400000000000001e-05,
52
- "loss": 2.7552,
53
  "step": 40
54
  },
55
  {
56
  "epoch": 0.047337278106508875,
57
- "eval_loss": 2.7184391021728516,
58
- "eval_runtime": 5.6084,
59
- "eval_samples_per_second": 267.814,
60
- "eval_steps_per_second": 16.761,
61
  "step": 40
62
  }
63
  ],
 
11
  {
12
  "epoch": 0.001183431952662722,
13
  "eval_loss": 2.9618937969207764,
14
+ "eval_runtime": 5.153,
15
+ "eval_samples_per_second": 291.48,
16
+ "eval_steps_per_second": 18.242,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.011834319526627219,
21
  "grad_norm": 4.4375,
22
  "learning_rate": 1.6000000000000003e-05,
23
+ "loss": 2.6542,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.023668639053254437,
28
  "grad_norm": 1.6328125,
29
  "learning_rate": 3.2000000000000005e-05,
30
+ "loss": 2.79,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.023668639053254437,
35
+ "eval_loss": 2.9338200092315674,
36
+ "eval_runtime": 5.4254,
37
+ "eval_samples_per_second": 276.844,
38
+ "eval_steps_per_second": 17.326,
39
  "step": 20
40
  },
41
  {
42
  "epoch": 0.03550295857988166,
43
  "grad_norm": 6.34375,
44
  "learning_rate": 4.8e-05,
45
+ "loss": 2.8939,
46
  "step": 30
47
  },
48
  {
49
  "epoch": 0.047337278106508875,
50
  "grad_norm": 2.1875,
51
  "learning_rate": 6.400000000000001e-05,
52
+ "loss": 2.7567,
53
  "step": 40
54
  },
55
  {
56
  "epoch": 0.047337278106508875,
57
+ "eval_loss": 2.7183806896209717,
58
+ "eval_runtime": 5.4234,
59
+ "eval_samples_per_second": 276.95,
60
+ "eval_steps_per_second": 17.332,
61
  "step": 40
62
  }
63
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7337b093c5d7d6a10f8669867e0be91b7b9af804f42fa136237f8529e7181224
3
  size 6840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55fb1fb11393c44950fb4dfab07de848902eaeb6dba9ba2c18239d02cde2e9ba
3
  size 6840