SKNahin commited on
Commit
b566147
·
verified ·
1 Parent(s): 62590cd

Training in progress, step 2800

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +50 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:927fef1c3679e10e481a6e2a7ead193778a15c6dc5290b7be459368dfd92ec54
3
  size 114266104
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ac2b6e398b00ab03d54821ed23583e1facd66fa5b15d35251ceec473675bea3
3
  size 114266104
trainer_log.jsonl CHANGED
@@ -2749,3 +2749,53 @@
2749
  {"current_steps": 2749, "total_steps": 9750, "loss": 0.3585, "learning_rate": 0.0003300528857878693, "epoch": 0.28194871794871795, "percentage": 28.19, "elapsed_time": "5:50:25", "remaining_time": "14:52:26"}
2750
  {"current_steps": 2750, "total_steps": 9750, "loss": 0.3801, "learning_rate": 0.00033000342401121556, "epoch": 0.28205128205128205, "percentage": 28.21, "elapsed_time": "5:50:32", "remaining_time": "14:52:17"}
2751
  {"current_steps": 2751, "total_steps": 9750, "loss": 0.3647, "learning_rate": 0.0003299539484618359, "epoch": 0.28215384615384614, "percentage": 28.22, "elapsed_time": "5:51:09", "remaining_time": "14:53:25"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2749
  {"current_steps": 2749, "total_steps": 9750, "loss": 0.3585, "learning_rate": 0.0003300528857878693, "epoch": 0.28194871794871795, "percentage": 28.19, "elapsed_time": "5:50:25", "remaining_time": "14:52:26"}
2750
  {"current_steps": 2750, "total_steps": 9750, "loss": 0.3801, "learning_rate": 0.00033000342401121556, "epoch": 0.28205128205128205, "percentage": 28.21, "elapsed_time": "5:50:32", "remaining_time": "14:52:17"}
2751
  {"current_steps": 2751, "total_steps": 9750, "loss": 0.3647, "learning_rate": 0.0003299539484618359, "epoch": 0.28215384615384614, "percentage": 28.22, "elapsed_time": "5:51:09", "remaining_time": "14:53:25"}
2752
+ {"current_steps": 2752, "total_steps": 9750, "loss": 0.374, "learning_rate": 0.00032990445914497167, "epoch": 0.28225641025641024, "percentage": 28.23, "elapsed_time": "5:51:16", "remaining_time": "14:53:14"}
2753
+ {"current_steps": 2753, "total_steps": 9750, "loss": 0.4386, "learning_rate": 0.00032985495606586605, "epoch": 0.28235897435897434, "percentage": 28.24, "elapsed_time": "5:51:23", "remaining_time": "14:53:06"}
2754
+ {"current_steps": 2754, "total_steps": 9750, "loss": 0.3984, "learning_rate": 0.00032980543922976326, "epoch": 0.2824615384615385, "percentage": 28.25, "elapsed_time": "5:51:30", "remaining_time": "14:52:56"}
2755
+ {"current_steps": 2755, "total_steps": 9750, "loss": 0.4119, "learning_rate": 0.00032975590864190937, "epoch": 0.2825641025641026, "percentage": 28.26, "elapsed_time": "5:51:37", "remaining_time": "14:52:46"}
2756
+ {"current_steps": 2756, "total_steps": 9750, "loss": 0.3746, "learning_rate": 0.00032970636430755155, "epoch": 0.2826666666666667, "percentage": 28.27, "elapsed_time": "5:51:43", "remaining_time": "14:52:35"}
2757
+ {"current_steps": 2757, "total_steps": 9750, "loss": 0.4095, "learning_rate": 0.0003296568062319388, "epoch": 0.2827692307692308, "percentage": 28.28, "elapsed_time": "5:51:50", "remaining_time": "14:52:24"}
2758
+ {"current_steps": 2758, "total_steps": 9750, "loss": 0.3136, "learning_rate": 0.0003296072344203211, "epoch": 0.28287179487179487, "percentage": 28.29, "elapsed_time": "5:51:57", "remaining_time": "14:52:16"}
2759
+ {"current_steps": 2759, "total_steps": 9750, "loss": 0.3689, "learning_rate": 0.0003295576488779503, "epoch": 0.28297435897435896, "percentage": 28.3, "elapsed_time": "5:52:04", "remaining_time": "14:52:08"}
2760
+ {"current_steps": 2760, "total_steps": 9750, "loss": 0.4349, "learning_rate": 0.0003295080496100795, "epoch": 0.28307692307692306, "percentage": 28.31, "elapsed_time": "5:52:12", "remaining_time": "14:52:01"}
2761
+ {"current_steps": 2761, "total_steps": 9750, "loss": 0.4203, "learning_rate": 0.0003294584366219634, "epoch": 0.28317948717948715, "percentage": 28.32, "elapsed_time": "5:52:19", "remaining_time": "14:51:52"}
2762
+ {"current_steps": 2762, "total_steps": 9750, "loss": 0.3847, "learning_rate": 0.0003294088099188579, "epoch": 0.2832820512820513, "percentage": 28.33, "elapsed_time": "5:52:27", "remaining_time": "14:51:44"}
2763
+ {"current_steps": 2763, "total_steps": 9750, "loss": 0.4853, "learning_rate": 0.0003293591695060207, "epoch": 0.2833846153846154, "percentage": 28.34, "elapsed_time": "5:52:34", "remaining_time": "14:51:35"}
2764
+ {"current_steps": 2764, "total_steps": 9750, "loss": 0.3564, "learning_rate": 0.0003293095153887106, "epoch": 0.2834871794871795, "percentage": 28.35, "elapsed_time": "5:52:40", "remaining_time": "14:51:23"}
2765
+ {"current_steps": 2765, "total_steps": 9750, "loss": 0.3618, "learning_rate": 0.00032925984757218815, "epoch": 0.2835897435897436, "percentage": 28.36, "elapsed_time": "5:52:48", "remaining_time": "14:51:15"}
2766
+ {"current_steps": 2766, "total_steps": 9750, "loss": 0.3758, "learning_rate": 0.00032921016606171524, "epoch": 0.2836923076923077, "percentage": 28.37, "elapsed_time": "5:52:55", "remaining_time": "14:51:05"}
2767
+ {"current_steps": 2767, "total_steps": 9750, "loss": 0.3902, "learning_rate": 0.00032916047086255505, "epoch": 0.2837948717948718, "percentage": 28.38, "elapsed_time": "5:53:02", "remaining_time": "14:50:57"}
2768
+ {"current_steps": 2768, "total_steps": 9750, "loss": 0.3939, "learning_rate": 0.00032911076197997247, "epoch": 0.2838974358974359, "percentage": 28.39, "elapsed_time": "5:53:09", "remaining_time": "14:50:47"}
2769
+ {"current_steps": 2769, "total_steps": 9750, "loss": 0.4184, "learning_rate": 0.0003290610394192336, "epoch": 0.284, "percentage": 28.4, "elapsed_time": "5:53:17", "remaining_time": "14:50:41"}
2770
+ {"current_steps": 2770, "total_steps": 9750, "loss": 0.4689, "learning_rate": 0.00032901130318560627, "epoch": 0.2841025641025641, "percentage": 28.41, "elapsed_time": "5:53:24", "remaining_time": "14:50:31"}
2771
+ {"current_steps": 2771, "total_steps": 9750, "loss": 0.3974, "learning_rate": 0.0003289615532843595, "epoch": 0.2842051282051282, "percentage": 28.42, "elapsed_time": "5:53:31", "remaining_time": "14:50:22"}
2772
+ {"current_steps": 2772, "total_steps": 9750, "loss": 0.3638, "learning_rate": 0.00032891178972076386, "epoch": 0.2843076923076923, "percentage": 28.43, "elapsed_time": "5:53:38", "remaining_time": "14:50:12"}
2773
+ {"current_steps": 2773, "total_steps": 9750, "loss": 0.339, "learning_rate": 0.00032886201250009137, "epoch": 0.2844102564102564, "percentage": 28.44, "elapsed_time": "5:53:45", "remaining_time": "14:50:04"}
2774
+ {"current_steps": 2774, "total_steps": 9750, "loss": 0.4436, "learning_rate": 0.00032881222162761556, "epoch": 0.2845128205128205, "percentage": 28.45, "elapsed_time": "5:53:51", "remaining_time": "14:49:52"}
2775
+ {"current_steps": 2775, "total_steps": 9750, "loss": 0.3661, "learning_rate": 0.0003287624171086112, "epoch": 0.2846153846153846, "percentage": 28.46, "elapsed_time": "5:53:57", "remaining_time": "14:49:41"}
2776
+ {"current_steps": 2776, "total_steps": 9750, "loss": 0.3807, "learning_rate": 0.0003287125989483547, "epoch": 0.2847179487179487, "percentage": 28.47, "elapsed_time": "5:54:04", "remaining_time": "14:49:30"}
2777
+ {"current_steps": 2777, "total_steps": 9750, "loss": 0.3826, "learning_rate": 0.00032866276715212396, "epoch": 0.2848205128205128, "percentage": 28.48, "elapsed_time": "5:54:10", "remaining_time": "14:49:20"}
2778
+ {"current_steps": 2778, "total_steps": 9750, "loss": 0.4523, "learning_rate": 0.0003286129217251981, "epoch": 0.28492307692307695, "percentage": 28.49, "elapsed_time": "5:54:17", "remaining_time": "14:49:10"}
2779
+ {"current_steps": 2779, "total_steps": 9750, "loss": 0.3637, "learning_rate": 0.0003285630626728579, "epoch": 0.28502564102564104, "percentage": 28.5, "elapsed_time": "5:54:24", "remaining_time": "14:48:59"}
2780
+ {"current_steps": 2780, "total_steps": 9750, "loss": 0.37, "learning_rate": 0.0003285131900003854, "epoch": 0.28512820512820514, "percentage": 28.51, "elapsed_time": "5:54:30", "remaining_time": "14:48:50"}
2781
+ {"current_steps": 2781, "total_steps": 9750, "loss": 0.3967, "learning_rate": 0.0003284633037130642, "epoch": 0.28523076923076923, "percentage": 28.52, "elapsed_time": "5:54:37", "remaining_time": "14:48:40"}
2782
+ {"current_steps": 2782, "total_steps": 9750, "loss": 0.3484, "learning_rate": 0.00032841340381617934, "epoch": 0.2853333333333333, "percentage": 28.53, "elapsed_time": "5:54:44", "remaining_time": "14:48:29"}
2783
+ {"current_steps": 2783, "total_steps": 9750, "loss": 0.3766, "learning_rate": 0.0003283634903150173, "epoch": 0.2854358974358974, "percentage": 28.54, "elapsed_time": "5:54:50", "remaining_time": "14:48:19"}
2784
+ {"current_steps": 2784, "total_steps": 9750, "loss": 0.3458, "learning_rate": 0.00032831356321486586, "epoch": 0.2855384615384615, "percentage": 28.55, "elapsed_time": "5:54:58", "remaining_time": "14:48:11"}
2785
+ {"current_steps": 2785, "total_steps": 9750, "loss": 0.3456, "learning_rate": 0.0003282636225210145, "epoch": 0.2856410256410256, "percentage": 28.56, "elapsed_time": "5:55:06", "remaining_time": "14:48:06"}
2786
+ {"current_steps": 2786, "total_steps": 9750, "loss": 0.4391, "learning_rate": 0.000328213668238754, "epoch": 0.28574358974358977, "percentage": 28.57, "elapsed_time": "5:55:13", "remaining_time": "14:47:55"}
2787
+ {"current_steps": 2787, "total_steps": 9750, "loss": 0.3725, "learning_rate": 0.00032816370037337645, "epoch": 0.28584615384615386, "percentage": 28.58, "elapsed_time": "5:55:20", "remaining_time": "14:47:46"}
2788
+ {"current_steps": 2788, "total_steps": 9750, "loss": 0.4591, "learning_rate": 0.0003281137189301756, "epoch": 0.28594871794871796, "percentage": 28.59, "elapsed_time": "5:55:27", "remaining_time": "14:47:37"}
2789
+ {"current_steps": 2789, "total_steps": 9750, "loss": 0.3452, "learning_rate": 0.0003280637239144466, "epoch": 0.28605128205128205, "percentage": 28.61, "elapsed_time": "5:55:34", "remaining_time": "14:47:28"}
2790
+ {"current_steps": 2790, "total_steps": 9750, "loss": 0.4087, "learning_rate": 0.00032801371533148577, "epoch": 0.28615384615384615, "percentage": 28.62, "elapsed_time": "5:55:41", "remaining_time": "14:47:18"}
2791
+ {"current_steps": 2791, "total_steps": 9750, "loss": 0.3781, "learning_rate": 0.00032796369318659137, "epoch": 0.28625641025641024, "percentage": 28.63, "elapsed_time": "5:55:48", "remaining_time": "14:47:10"}
2792
+ {"current_steps": 2792, "total_steps": 9750, "loss": 0.399, "learning_rate": 0.0003279136574850626, "epoch": 0.28635897435897434, "percentage": 28.64, "elapsed_time": "5:55:55", "remaining_time": "14:46:59"}
2793
+ {"current_steps": 2793, "total_steps": 9750, "loss": 0.3697, "learning_rate": 0.00032786360823220035, "epoch": 0.28646153846153843, "percentage": 28.65, "elapsed_time": "5:56:01", "remaining_time": "14:46:48"}
2794
+ {"current_steps": 2794, "total_steps": 9750, "loss": 0.4288, "learning_rate": 0.00032781354543330696, "epoch": 0.2865641025641026, "percentage": 28.66, "elapsed_time": "5:56:08", "remaining_time": "14:46:38"}
2795
+ {"current_steps": 2795, "total_steps": 9750, "loss": 0.4091, "learning_rate": 0.00032776346909368605, "epoch": 0.2866666666666667, "percentage": 28.67, "elapsed_time": "5:56:14", "remaining_time": "14:46:28"}
2796
+ {"current_steps": 2796, "total_steps": 9750, "loss": 0.3922, "learning_rate": 0.00032771337921864285, "epoch": 0.2867692307692308, "percentage": 28.68, "elapsed_time": "5:56:21", "remaining_time": "14:46:19"}
2797
+ {"current_steps": 2797, "total_steps": 9750, "loss": 0.3909, "learning_rate": 0.000327663275813484, "epoch": 0.28687179487179487, "percentage": 28.69, "elapsed_time": "5:56:29", "remaining_time": "14:46:12"}
2798
+ {"current_steps": 2798, "total_steps": 9750, "loss": 0.4234, "learning_rate": 0.0003276131588835174, "epoch": 0.28697435897435897, "percentage": 28.7, "elapsed_time": "5:56:36", "remaining_time": "14:46:01"}
2799
+ {"current_steps": 2799, "total_steps": 9750, "loss": 0.3685, "learning_rate": 0.0003275630284340525, "epoch": 0.28707692307692306, "percentage": 28.71, "elapsed_time": "5:56:42", "remaining_time": "14:45:50"}
2800
+ {"current_steps": 2800, "total_steps": 9750, "loss": 0.3911, "learning_rate": 0.00032751288447040026, "epoch": 0.28717948717948716, "percentage": 28.72, "elapsed_time": "5:56:49", "remaining_time": "14:45:42"}
2801
+ {"current_steps": 2801, "total_steps": 9750, "loss": 0.3417, "learning_rate": 0.0003274627269978729, "epoch": 0.2872820512820513, "percentage": 28.73, "elapsed_time": "5:57:27", "remaining_time": "14:46:48"}