sedrickkeh commited on
Commit
991e0c3
·
verified ·
1 Parent(s): ef718d2

Training in progress, epoch 2

Browse files
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27a2090160045648b92b361d16391a4414d9f1ed06c34d567854d9d7323c5c72
3
  size 4943162336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ce7143e13c45e2b9591e3d0be06b9acacfd580f7d34e6487e42177bbedd28e4
3
  size 4943162336
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b0671bc2dd832ca2daecc3dd13fa9dbce9c9d22b4a6e324377c54c0a5b8a2ef
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81e9db3f26b42f3fcb899472b63ab9007a5ad41e903b9dc9f8fea33ac1fc6e99
3
  size 4999819336
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d661f5fca5f993a50603303fefcdf71682f4aaf03452ed3a78c4211aa3627299
3
  size 4540516344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3086868f5fce3f03b1a9e30ddbc8d01a1b526dc5a054d2e168b42d65f2cc522c
3
  size 4540516344
trainer_log.jsonl CHANGED
@@ -98,3 +98,52 @@
98
  {"current_steps": 970, "total_steps": 1479, "loss": 0.4821, "learning_rate": 5e-06, "epoch": 1.9645569620253165, "percentage": 65.58, "elapsed_time": "15:14:13", "remaining_time": "7:59:43"}
99
  {"current_steps": 980, "total_steps": 1479, "loss": 0.4823, "learning_rate": 5e-06, "epoch": 1.9848101265822784, "percentage": 66.26, "elapsed_time": "15:23:33", "remaining_time": "7:50:15"}
100
  {"current_steps": 987, "total_steps": 1479, "eval_loss": 0.06866108626127243, "epoch": 1.998987341772152, "percentage": 66.73, "elapsed_time": "15:38:54", "remaining_time": "7:48:01"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
98
  {"current_steps": 970, "total_steps": 1479, "loss": 0.4821, "learning_rate": 5e-06, "epoch": 1.9645569620253165, "percentage": 65.58, "elapsed_time": "15:14:13", "remaining_time": "7:59:43"}
99
  {"current_steps": 980, "total_steps": 1479, "loss": 0.4823, "learning_rate": 5e-06, "epoch": 1.9848101265822784, "percentage": 66.26, "elapsed_time": "15:23:33", "remaining_time": "7:50:15"}
100
  {"current_steps": 987, "total_steps": 1479, "eval_loss": 0.06866108626127243, "epoch": 1.998987341772152, "percentage": 66.73, "elapsed_time": "15:38:54", "remaining_time": "7:48:01"}
101
+ {"current_steps": 990, "total_steps": 1479, "loss": 0.4544, "learning_rate": 5e-06, "epoch": 2.0050632911392405, "percentage": 66.94, "elapsed_time": "15:42:24", "remaining_time": "7:45:29"}
102
+ {"current_steps": 1000, "total_steps": 1479, "loss": 0.3907, "learning_rate": 5e-06, "epoch": 2.0253164556962027, "percentage": 67.61, "elapsed_time": "15:51:44", "remaining_time": "7:35:53"}
103
+ {"current_steps": 1010, "total_steps": 1479, "loss": 0.3873, "learning_rate": 5e-06, "epoch": 2.0455696202531644, "percentage": 68.29, "elapsed_time": "16:01:04", "remaining_time": "7:26:16"}
104
+ {"current_steps": 1020, "total_steps": 1479, "loss": 0.3833, "learning_rate": 5e-06, "epoch": 2.0658227848101265, "percentage": 68.97, "elapsed_time": "16:10:24", "remaining_time": "7:16:41"}
105
+ {"current_steps": 1030, "total_steps": 1479, "loss": 0.3837, "learning_rate": 5e-06, "epoch": 2.0860759493670886, "percentage": 69.64, "elapsed_time": "16:19:45", "remaining_time": "7:07:05"}
106
+ {"current_steps": 1040, "total_steps": 1479, "loss": 0.3815, "learning_rate": 5e-06, "epoch": 2.1063291139240508, "percentage": 70.32, "elapsed_time": "16:29:05", "remaining_time": "6:57:30"}
107
+ {"current_steps": 1050, "total_steps": 1479, "loss": 0.3916, "learning_rate": 5e-06, "epoch": 2.1265822784810124, "percentage": 70.99, "elapsed_time": "16:38:24", "remaining_time": "6:47:55"}
108
+ {"current_steps": 1060, "total_steps": 1479, "loss": 0.3869, "learning_rate": 5e-06, "epoch": 2.1468354430379746, "percentage": 71.67, "elapsed_time": "16:47:43", "remaining_time": "6:38:20"}
109
+ {"current_steps": 1070, "total_steps": 1479, "loss": 0.3903, "learning_rate": 5e-06, "epoch": 2.1670886075949367, "percentage": 72.35, "elapsed_time": "16:57:03", "remaining_time": "6:28:45"}
110
+ {"current_steps": 1080, "total_steps": 1479, "loss": 0.3883, "learning_rate": 5e-06, "epoch": 2.187341772151899, "percentage": 73.02, "elapsed_time": "17:06:22", "remaining_time": "6:19:11"}
111
+ {"current_steps": 1090, "total_steps": 1479, "loss": 0.3849, "learning_rate": 5e-06, "epoch": 2.207594936708861, "percentage": 73.7, "elapsed_time": "17:15:41", "remaining_time": "6:09:37"}
112
+ {"current_steps": 1100, "total_steps": 1479, "loss": 0.3934, "learning_rate": 5e-06, "epoch": 2.2278481012658227, "percentage": 74.37, "elapsed_time": "17:25:01", "remaining_time": "6:00:03"}
113
+ {"current_steps": 1110, "total_steps": 1479, "loss": 0.3893, "learning_rate": 5e-06, "epoch": 2.248101265822785, "percentage": 75.05, "elapsed_time": "17:34:21", "remaining_time": "5:50:30"}
114
+ {"current_steps": 1120, "total_steps": 1479, "loss": 0.3916, "learning_rate": 5e-06, "epoch": 2.268354430379747, "percentage": 75.73, "elapsed_time": "17:43:41", "remaining_time": "5:40:57"}
115
+ {"current_steps": 1130, "total_steps": 1479, "loss": 0.3936, "learning_rate": 5e-06, "epoch": 2.2886075949367086, "percentage": 76.4, "elapsed_time": "17:53:01", "remaining_time": "5:31:24"}
116
+ {"current_steps": 1140, "total_steps": 1479, "loss": 0.39, "learning_rate": 5e-06, "epoch": 2.3088607594936708, "percentage": 77.08, "elapsed_time": "18:02:21", "remaining_time": "5:21:51"}
117
+ {"current_steps": 1150, "total_steps": 1479, "loss": 0.3967, "learning_rate": 5e-06, "epoch": 2.329113924050633, "percentage": 77.76, "elapsed_time": "18:11:42", "remaining_time": "5:12:19"}
118
+ {"current_steps": 1160, "total_steps": 1479, "loss": 0.3973, "learning_rate": 5e-06, "epoch": 2.349367088607595, "percentage": 78.43, "elapsed_time": "18:21:03", "remaining_time": "5:02:47"}
119
+ {"current_steps": 1170, "total_steps": 1479, "loss": 0.3981, "learning_rate": 5e-06, "epoch": 2.369620253164557, "percentage": 79.11, "elapsed_time": "18:30:25", "remaining_time": "4:53:15"}
120
+ {"current_steps": 1180, "total_steps": 1479, "loss": 0.3971, "learning_rate": 5e-06, "epoch": 2.389873417721519, "percentage": 79.78, "elapsed_time": "18:39:45", "remaining_time": "4:43:44"}
121
+ {"current_steps": 1190, "total_steps": 1479, "loss": 0.3958, "learning_rate": 5e-06, "epoch": 2.410126582278481, "percentage": 80.46, "elapsed_time": "18:49:06", "remaining_time": "4:34:12"}
122
+ {"current_steps": 1200, "total_steps": 1479, "loss": 0.3936, "learning_rate": 5e-06, "epoch": 2.430379746835443, "percentage": 81.14, "elapsed_time": "18:58:27", "remaining_time": "4:24:41"}
123
+ {"current_steps": 1210, "total_steps": 1479, "loss": 0.3936, "learning_rate": 5e-06, "epoch": 2.4506329113924052, "percentage": 81.81, "elapsed_time": "19:07:47", "remaining_time": "4:15:10"}
124
+ {"current_steps": 1220, "total_steps": 1479, "loss": 0.3963, "learning_rate": 5e-06, "epoch": 2.470886075949367, "percentage": 82.49, "elapsed_time": "19:17:08", "remaining_time": "4:05:39"}
125
+ {"current_steps": 1230, "total_steps": 1479, "loss": 0.3968, "learning_rate": 5e-06, "epoch": 2.491139240506329, "percentage": 83.16, "elapsed_time": "19:26:30", "remaining_time": "3:56:08"}
126
+ {"current_steps": 1240, "total_steps": 1479, "loss": 0.4012, "learning_rate": 5e-06, "epoch": 2.511392405063291, "percentage": 83.84, "elapsed_time": "19:35:50", "remaining_time": "3:46:38"}
127
+ {"current_steps": 1250, "total_steps": 1479, "loss": 0.3951, "learning_rate": 5e-06, "epoch": 2.5316455696202533, "percentage": 84.52, "elapsed_time": "19:45:11", "remaining_time": "3:37:07"}
128
+ {"current_steps": 1260, "total_steps": 1479, "loss": 0.3915, "learning_rate": 5e-06, "epoch": 2.5518987341772155, "percentage": 85.19, "elapsed_time": "19:54:30", "remaining_time": "3:27:37"}
129
+ {"current_steps": 1270, "total_steps": 1479, "loss": 0.3981, "learning_rate": 5e-06, "epoch": 2.572151898734177, "percentage": 85.87, "elapsed_time": "20:03:50", "remaining_time": "3:18:06"}
130
+ {"current_steps": 1280, "total_steps": 1479, "loss": 0.3999, "learning_rate": 5e-06, "epoch": 2.5924050632911393, "percentage": 86.54, "elapsed_time": "20:13:09", "remaining_time": "3:08:36"}
131
+ {"current_steps": 1290, "total_steps": 1479, "loss": 0.4049, "learning_rate": 5e-06, "epoch": 2.6126582278481014, "percentage": 87.22, "elapsed_time": "20:22:28", "remaining_time": "2:59:06"}
132
+ {"current_steps": 1300, "total_steps": 1479, "loss": 0.3997, "learning_rate": 5e-06, "epoch": 2.632911392405063, "percentage": 87.9, "elapsed_time": "20:31:48", "remaining_time": "2:49:36"}
133
+ {"current_steps": 1310, "total_steps": 1479, "loss": 0.3993, "learning_rate": 5e-06, "epoch": 2.6531645569620252, "percentage": 88.57, "elapsed_time": "20:41:08", "remaining_time": "2:40:07"}
134
+ {"current_steps": 1320, "total_steps": 1479, "loss": 0.4023, "learning_rate": 5e-06, "epoch": 2.6734177215189874, "percentage": 89.25, "elapsed_time": "20:50:28", "remaining_time": "2:30:37"}
135
+ {"current_steps": 1330, "total_steps": 1479, "loss": 0.4048, "learning_rate": 5e-06, "epoch": 2.6936708860759495, "percentage": 89.93, "elapsed_time": "20:59:48", "remaining_time": "2:21:08"}
136
+ {"current_steps": 1340, "total_steps": 1479, "loss": 0.4032, "learning_rate": 5e-06, "epoch": 2.7139240506329116, "percentage": 90.6, "elapsed_time": "21:09:08", "remaining_time": "2:11:39"}
137
+ {"current_steps": 1350, "total_steps": 1479, "loss": 0.4028, "learning_rate": 5e-06, "epoch": 2.7341772151898733, "percentage": 91.28, "elapsed_time": "21:18:28", "remaining_time": "2:02:09"}
138
+ {"current_steps": 1360, "total_steps": 1479, "loss": 0.3986, "learning_rate": 5e-06, "epoch": 2.7544303797468355, "percentage": 91.95, "elapsed_time": "21:27:49", "remaining_time": "1:52:41"}
139
+ {"current_steps": 1370, "total_steps": 1479, "loss": 0.4047, "learning_rate": 5e-06, "epoch": 2.7746835443037976, "percentage": 92.63, "elapsed_time": "21:37:09", "remaining_time": "1:43:12"}
140
+ {"current_steps": 1380, "total_steps": 1479, "loss": 0.4021, "learning_rate": 5e-06, "epoch": 2.7949367088607593, "percentage": 93.31, "elapsed_time": "21:46:29", "remaining_time": "1:33:43"}
141
+ {"current_steps": 1390, "total_steps": 1479, "loss": 0.4049, "learning_rate": 5e-06, "epoch": 2.8151898734177214, "percentage": 93.98, "elapsed_time": "21:55:48", "remaining_time": "1:24:15"}
142
+ {"current_steps": 1400, "total_steps": 1479, "loss": 0.3984, "learning_rate": 5e-06, "epoch": 2.8354430379746836, "percentage": 94.66, "elapsed_time": "22:05:08", "remaining_time": "1:14:46"}
143
+ {"current_steps": 1410, "total_steps": 1479, "loss": 0.4067, "learning_rate": 5e-06, "epoch": 2.8556962025316457, "percentage": 95.33, "elapsed_time": "22:14:28", "remaining_time": "1:05:18"}
144
+ {"current_steps": 1420, "total_steps": 1479, "loss": 0.4025, "learning_rate": 5e-06, "epoch": 2.875949367088608, "percentage": 96.01, "elapsed_time": "22:23:48", "remaining_time": "0:55:50"}
145
+ {"current_steps": 1430, "total_steps": 1479, "loss": 0.4036, "learning_rate": 5e-06, "epoch": 2.8962025316455695, "percentage": 96.69, "elapsed_time": "22:33:07", "remaining_time": "0:46:21"}
146
+ {"current_steps": 1440, "total_steps": 1479, "loss": 0.4057, "learning_rate": 5e-06, "epoch": 2.9164556962025316, "percentage": 97.36, "elapsed_time": "22:42:27", "remaining_time": "0:36:54"}
147
+ {"current_steps": 1450, "total_steps": 1479, "loss": 0.4145, "learning_rate": 5e-06, "epoch": 2.9367088607594938, "percentage": 98.04, "elapsed_time": "22:51:47", "remaining_time": "0:27:26"}
148
+ {"current_steps": 1460, "total_steps": 1479, "loss": 0.4023, "learning_rate": 5e-06, "epoch": 2.9569620253164555, "percentage": 98.72, "elapsed_time": "23:01:06", "remaining_time": "0:17:58"}
149
+ {"current_steps": 1470, "total_steps": 1479, "loss": 0.4067, "learning_rate": 5e-06, "epoch": 2.9772151898734176, "percentage": 99.39, "elapsed_time": "23:10:25", "remaining_time": "0:08:30"}