Jerry46 committed on
Commit
28e7de9
·
1 Parent(s): f74cf6b

Training in progress, epoch 1

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c4851d0fda021876b9eb5ecbd6ec0d108d643bb4b81a517a68af72134d8b407
3
  size 218138576
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9dcafb75e33763bcbb1dcac4844987b4bc4804afc8cd5a98e4c454d0a897ab4
3
  size 218138576
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
  "train_loss": 0.3465735912322998,
4
- "train_runtime": 27.423,
5
  "train_samples": 61966,
6
- "train_samples_per_second": 0.365,
7
- "train_steps_per_second": 0.036
8
  }
 
1
  {
2
  "epoch": 1.0,
3
  "train_loss": 0.3465735912322998,
4
+ "train_runtime": 17.6734,
5
  "train_samples": 61966,
6
+ "train_samples_per_second": 0.566,
7
+ "train_steps_per_second": 0.057
8
  }
runs/Dec10_16-11-47_uclaml03.cs.ucla.edu/events.out.tfevents.1702253602.uclaml03.cs.ucla.edu.2936686.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbabe86d1716cd7d30bd6450626a9baf98dacbe028cc8c3efe53008e1814d7c0
3
+ size 6089
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
  "train_loss": 0.3465735912322998,
4
- "train_runtime": 27.423,
5
  "train_samples": 61966,
6
- "train_samples_per_second": 0.365,
7
- "train_steps_per_second": 0.036
8
  }
 
1
  {
2
  "epoch": 1.0,
3
  "train_loss": 0.3465735912322998,
4
+ "train_runtime": 17.6734,
5
  "train_samples": 61966,
6
+ "train_samples_per_second": 0.566,
7
+ "train_steps_per_second": 0.057
8
  }
trainer_state.json CHANGED
@@ -24,18 +24,18 @@
24
  },
25
  {
26
  "epoch": 1.0,
27
- "eval_logits/chosen": -2.9331436157226562,
28
- "eval_logits/rejected": -3.0131616592407227,
29
- "eval_logps/chosen": -168.64442443847656,
30
- "eval_logps/rejected": -190.56906127929688,
31
  "eval_loss": 0.6931471824645996,
32
  "eval_rewards/accuracies": 0.0,
33
  "eval_rewards/chosen": 0.0,
34
  "eval_rewards/margins": 0.0,
35
  "eval_rewards/rejected": 0.0,
36
- "eval_runtime": 4.843,
37
- "eval_samples_per_second": 2.065,
38
- "eval_steps_per_second": 0.206,
39
  "step": 1
40
  },
41
  {
@@ -43,9 +43,9 @@
43
  "step": 1,
44
  "total_flos": 0.0,
45
  "train_loss": 0.3465735912322998,
46
- "train_runtime": 27.423,
47
- "train_samples_per_second": 0.365,
48
- "train_steps_per_second": 0.036
49
  }
50
  ],
51
  "logging_steps": 10,
 
24
  },
25
  {
26
  "epoch": 1.0,
27
+ "eval_logits/chosen": -3.0078587532043457,
28
+ "eval_logits/rejected": -3.042999744415283,
29
+ "eval_logps/chosen": -194.36697387695312,
30
+ "eval_logps/rejected": -179.82501220703125,
31
  "eval_loss": 0.6931471824645996,
32
  "eval_rewards/accuracies": 0.0,
33
  "eval_rewards/chosen": 0.0,
34
  "eval_rewards/margins": 0.0,
35
  "eval_rewards/rejected": 0.0,
36
+ "eval_runtime": 5.2287,
37
+ "eval_samples_per_second": 1.913,
38
+ "eval_steps_per_second": 0.383,
39
  "step": 1
40
  },
41
  {
 
43
  "step": 1,
44
  "total_flos": 0.0,
45
  "train_loss": 0.3465735912322998,
46
+ "train_runtime": 17.6734,
47
+ "train_samples_per_second": 0.566,
48
+ "train_steps_per_second": 0.057
49
  }
50
  ],
51
  "logging_steps": 10,