dzanbek commited on
Commit
b617ace
·
verified ·
1 Parent(s): b9dca12

Training in progress, step 30, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -20,12 +20,12 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "v_proj",
24
- "o_proj",
25
- "gate_proj",
26
- "k_proj",
27
  "q_proj",
 
 
28
  "down_proj",
 
 
29
  "up_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
 
 
 
23
  "q_proj",
24
+ "k_proj",
25
+ "o_proj",
26
  "down_proj",
27
+ "gate_proj",
28
+ "v_proj",
29
  "up_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
last-checkpoint/trainer_state.json CHANGED
@@ -11,9 +11,9 @@
11
  {
12
  "epoch": 5.649238765076406e-05,
13
  "eval_loss": NaN,
14
- "eval_runtime": 840.147,
15
- "eval_samples_per_second": 8.872,
16
- "eval_steps_per_second": 4.436,
17
  "step": 1
18
  },
19
  {
@@ -33,9 +33,9 @@
33
  {
34
  "epoch": 0.0004519391012061125,
35
  "eval_loss": NaN,
36
- "eval_runtime": 838.7263,
37
- "eval_samples_per_second": 8.887,
38
- "eval_steps_per_second": 4.444,
39
  "step": 8
40
  },
41
  {
@@ -62,9 +62,9 @@
62
  {
63
  "epoch": 0.000903878202412225,
64
  "eval_loss": NaN,
65
- "eval_runtime": 839.2896,
66
- "eval_samples_per_second": 8.881,
67
- "eval_steps_per_second": 4.441,
68
  "step": 16
69
  },
70
  {
@@ -91,9 +91,9 @@
91
  {
92
  "epoch": 0.0013558173036183373,
93
  "eval_loss": NaN,
94
- "eval_runtime": 839.2045,
95
- "eval_samples_per_second": 8.882,
96
- "eval_steps_per_second": 4.441,
97
  "step": 24
98
  },
99
  {
 
11
  {
12
  "epoch": 5.649238765076406e-05,
13
  "eval_loss": NaN,
14
+ "eval_runtime": 839.5498,
15
+ "eval_samples_per_second": 8.879,
16
+ "eval_steps_per_second": 4.439,
17
  "step": 1
18
  },
19
  {
 
33
  {
34
  "epoch": 0.0004519391012061125,
35
  "eval_loss": NaN,
36
+ "eval_runtime": 839.9171,
37
+ "eval_samples_per_second": 8.875,
38
+ "eval_steps_per_second": 4.437,
39
  "step": 8
40
  },
41
  {
 
62
  {
63
  "epoch": 0.000903878202412225,
64
  "eval_loss": NaN,
65
+ "eval_runtime": 840.0505,
66
+ "eval_samples_per_second": 8.873,
67
+ "eval_steps_per_second": 4.437,
68
  "step": 16
69
  },
70
  {
 
91
  {
92
  "epoch": 0.0013558173036183373,
93
  "eval_loss": NaN,
94
+ "eval_runtime": 1608.6872,
95
+ "eval_samples_per_second": 4.634,
96
+ "eval_steps_per_second": 2.317,
97
  "step": 24
98
  },
99
  {
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1943c7a77e2d339e91bedf96425c16c679b9e07aa0683e2aa27e5d0cf6d89fe0
3
  size 6712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67084735e3d06a13d05229e5cdbc391d9e578329a70de319caa246419a2f07b6
3
  size 6712