{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.40960436911327053, "eval_steps": 500, "global_step": 48000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 5e-06, "loss": 3.2684, "step": 5 }, { "epoch": 0.0, "learning_rate": 1e-05, "loss": 3.3273, "step": 10 }, { "epoch": 0.0, "learning_rate": 1.5e-05, "loss": 3.2418, "step": 15 }, { "epoch": 0.0, "learning_rate": 2e-05, "loss": 3.2584, "step": 20 }, { "epoch": 0.0, "learning_rate": 2.5e-05, "loss": 3.2362, "step": 25 }, { "epoch": 0.0, "learning_rate": 3e-05, "loss": 3.1811, "step": 30 }, { "epoch": 0.0, "learning_rate": 3.5e-05, "loss": 3.2123, "step": 35 }, { "epoch": 0.0, "learning_rate": 4e-05, "loss": 3.2072, "step": 40 }, { "epoch": 0.0, "learning_rate": 4.5e-05, "loss": 3.1808, "step": 45 }, { "epoch": 0.0, "learning_rate": 5e-05, "loss": 3.1338, "step": 50 }, { "epoch": 0.0, "learning_rate": 5.500000000000001e-05, "loss": 3.188, "step": 55 }, { "epoch": 0.0, "learning_rate": 6e-05, "loss": 3.2331, "step": 60 }, { "epoch": 0.0, "learning_rate": 6.500000000000001e-05, "loss": 3.0912, "step": 65 }, { "epoch": 0.0, "learning_rate": 7e-05, "loss": 3.1508, "step": 70 }, { "epoch": 0.0, "learning_rate": 7.500000000000001e-05, "loss": 3.1775, "step": 75 }, { "epoch": 0.0, "learning_rate": 8e-05, "loss": 3.109, "step": 80 }, { "epoch": 0.0, "learning_rate": 8.5e-05, "loss": 3.1145, "step": 85 }, { "epoch": 0.0, "learning_rate": 9e-05, "loss": 3.0888, "step": 90 }, { "epoch": 0.0, "learning_rate": 9.5e-05, "loss": 3.0755, "step": 95 }, { "epoch": 0.0, "learning_rate": 0.0001, "loss": 3.036, "step": 100 }, { "epoch": 0.0, "learning_rate": 9.999999955004424e-05, "loss": 3.164, "step": 105 }, { "epoch": 0.0, "learning_rate": 9.999999820017694e-05, "loss": 2.9222, "step": 110 }, { "epoch": 0.0, "learning_rate": 9.999999595039815e-05, "loss": 3.1212, "step": 115 }, { "epoch": 0.0, "learning_rate": 9.999999280070788e-05, "loss": 3.1119, "step": 120 }, { "epoch": 0.0, "learning_rate": 9.999998875110621e-05, "loss": 2.9637, "step": 125 }, { "epoch": 0.0, "learning_rate": 9.999998380159321e-05, "loss": 3.0579, "step": 130 }, { "epoch": 0.0, "learning_rate": 9.999997795216898e-05, "loss": 3.0606, "step": 135 }, { "epoch": 0.0, "learning_rate": 9.99999712028336e-05, "loss": 3.0103, "step": 140 }, { "epoch": 0.0, "learning_rate": 9.99999635535872e-05, "loss": 3.0002, "step": 145 }, { "epoch": 0.0, "learning_rate": 9.999995500442991e-05, "loss": 3.0608, "step": 150 }, { "epoch": 0.0, "learning_rate": 9.999994555536192e-05, "loss": 2.893, "step": 155 }, { "epoch": 0.0, "learning_rate": 9.999993520638335e-05, "loss": 3.0401, "step": 160 }, { "epoch": 0.0, "learning_rate": 9.999992395749442e-05, "loss": 2.9684, "step": 165 }, { "epoch": 0.0, "learning_rate": 9.999991180869534e-05, "loss": 2.974, "step": 170 }, { "epoch": 0.0, "learning_rate": 9.99998987599863e-05, "loss": 3.0205, "step": 175 }, { "epoch": 0.0, "learning_rate": 9.999988481136753e-05, "loss": 2.9529, "step": 180 }, { "epoch": 0.0, "learning_rate": 9.999986996283932e-05, "loss": 3.0358, "step": 185 }, { "epoch": 0.0, "learning_rate": 9.99998542144019e-05, "loss": 3.0013, "step": 190 }, { "epoch": 0.0, "learning_rate": 9.999983756605558e-05, "loss": 3.0335, "step": 195 }, { "epoch": 0.0, "learning_rate": 9.999982001780064e-05, "loss": 3.0333, "step": 200 }, { "epoch": 0.0, "learning_rate": 9.999980156963742e-05, "loss": 3.059, "step": 205 }, { "epoch": 0.0, "learning_rate": 9.999978222156622e-05, "loss": 2.9894, "step": 210 }, { "epoch": 0.0, "learning_rate": 9.99997619735874e-05, "loss": 3.0275, "step": 215 }, { "epoch": 0.0, "learning_rate": 9.999974082570134e-05, "loss": 3.0287, "step": 220 }, { "epoch": 0.0, "learning_rate": 9.999971877790841e-05, "loss": 2.9289, "step": 225 }, { "epoch": 0.0, "learning_rate": 9.9999695830209e-05, "loss": 2.9362, "step": 230 }, { "epoch": 0.0, "learning_rate": 9.999967198260354e-05, "loss": 3.0556, "step": 235 }, { "epoch": 0.0, "learning_rate": 9.999964723509243e-05, "loss": 2.9116, "step": 240 }, { "epoch": 0.0, "learning_rate": 9.999962158767615e-05, "loss": 2.9441, "step": 245 }, { "epoch": 0.0, "learning_rate": 9.999959504035513e-05, "loss": 2.8568, "step": 250 }, { "epoch": 0.0, "learning_rate": 9.999956759312987e-05, "loss": 3.0391, "step": 255 }, { "epoch": 0.0, "learning_rate": 9.999953924600087e-05, "loss": 2.9357, "step": 260 }, { "epoch": 0.0, "learning_rate": 9.999950999896861e-05, "loss": 2.977, "step": 265 }, { "epoch": 0.0, "learning_rate": 9.999947985203364e-05, "loss": 2.8533, "step": 270 }, { "epoch": 0.0, "learning_rate": 9.99994488051965e-05, "loss": 2.9165, "step": 275 }, { "epoch": 0.0, "learning_rate": 9.999941685845773e-05, "loss": 2.9564, "step": 280 }, { "epoch": 0.0, "learning_rate": 9.999938401181794e-05, "loss": 3.0019, "step": 285 }, { "epoch": 0.0, "learning_rate": 9.99993502652777e-05, "loss": 2.8855, "step": 290 }, { "epoch": 0.0, "learning_rate": 9.999931561883761e-05, "loss": 2.897, "step": 295 }, { "epoch": 0.0, "learning_rate": 9.99992800724983e-05, "loss": 2.869, "step": 300 }, { "epoch": 0.0, "learning_rate": 9.999924362626043e-05, "loss": 2.8128, "step": 305 }, { "epoch": 0.0, "learning_rate": 9.999920628012463e-05, "loss": 2.9596, "step": 310 }, { "epoch": 0.0, "learning_rate": 9.999916803409157e-05, "loss": 2.8131, "step": 315 }, { "epoch": 0.0, "learning_rate": 9.999912888816195e-05, "loss": 2.8911, "step": 320 }, { "epoch": 0.0, "learning_rate": 9.999908884233647e-05, "loss": 2.8701, "step": 325 }, { "epoch": 0.0, "learning_rate": 9.999904789661588e-05, "loss": 2.877, "step": 330 }, { "epoch": 0.0, "learning_rate": 9.999900605100085e-05, "loss": 2.9649, "step": 335 }, { "epoch": 0.0, "learning_rate": 9.99989633054922e-05, "loss": 2.9506, "step": 340 }, { "epoch": 0.0, "learning_rate": 9.999891966009068e-05, "loss": 2.7947, "step": 345 }, { "epoch": 0.0, "learning_rate": 9.999887511479705e-05, "loss": 2.8851, "step": 350 }, { "epoch": 0.0, "learning_rate": 9.999882966961213e-05, "loss": 2.8304, "step": 355 }, { "epoch": 0.0, "learning_rate": 9.999878332453676e-05, "loss": 2.7745, "step": 360 }, { "epoch": 0.0, "learning_rate": 9.999873607957173e-05, "loss": 2.9151, "step": 365 }, { "epoch": 0.0, "learning_rate": 9.999868793471791e-05, "loss": 2.7993, "step": 370 }, { "epoch": 0.0, "learning_rate": 9.99986388899762e-05, "loss": 2.8568, "step": 375 }, { "epoch": 0.0, "learning_rate": 9.999858894534743e-05, "loss": 2.9135, "step": 380 }, { "epoch": 0.0, "learning_rate": 9.999853810083253e-05, "loss": 2.8447, "step": 385 }, { "epoch": 0.0, "learning_rate": 9.99984863564324e-05, "loss": 2.8789, "step": 390 }, { "epoch": 0.0, "learning_rate": 9.999843371214797e-05, "loss": 2.8906, "step": 395 }, { "epoch": 0.0, "learning_rate": 9.999838016798021e-05, "loss": 2.8845, "step": 400 }, { "epoch": 0.0, "learning_rate": 9.999832572393006e-05, "loss": 2.8516, "step": 405 }, { "epoch": 0.0, "learning_rate": 9.999827037999852e-05, "loss": 2.8821, "step": 410 }, { "epoch": 0.0, "learning_rate": 9.999821413618657e-05, "loss": 2.7952, "step": 415 }, { "epoch": 0.0, "learning_rate": 9.999815699249522e-05, "loss": 2.8095, "step": 420 }, { "epoch": 0.0, "learning_rate": 9.999809894892551e-05, "loss": 2.8395, "step": 425 }, { "epoch": 0.0, "learning_rate": 9.999804000547848e-05, "loss": 2.9139, "step": 430 }, { "epoch": 0.0, "learning_rate": 9.999798016215519e-05, "loss": 2.8205, "step": 435 }, { "epoch": 0.0, "learning_rate": 9.999791941895671e-05, "loss": 2.8539, "step": 440 }, { "epoch": 0.0, "learning_rate": 9.999785777588415e-05, "loss": 2.8145, "step": 445 }, { "epoch": 0.0, "learning_rate": 9.999779523293862e-05, "loss": 2.8153, "step": 450 }, { "epoch": 0.0, "learning_rate": 9.999773179012121e-05, "loss": 2.8963, "step": 455 }, { "epoch": 0.0, "learning_rate": 9.999766744743311e-05, "loss": 2.9175, "step": 460 }, { "epoch": 0.0, "learning_rate": 9.999760220487547e-05, "loss": 2.8518, "step": 465 }, { "epoch": 0.0, "learning_rate": 9.999753606244942e-05, "loss": 2.8212, "step": 470 }, { "epoch": 0.0, "learning_rate": 9.99974690201562e-05, "loss": 2.9314, "step": 475 }, { "epoch": 0.0, "learning_rate": 9.999740107799698e-05, "loss": 2.7623, "step": 480 }, { "epoch": 0.0, "learning_rate": 9.999733223597302e-05, "loss": 2.8694, "step": 485 }, { "epoch": 0.0, "learning_rate": 9.999726249408553e-05, "loss": 2.818, "step": 490 }, { "epoch": 0.0, "learning_rate": 9.999719185233579e-05, "loss": 2.9023, "step": 495 }, { "epoch": 0.0, "learning_rate": 9.999712031072503e-05, "loss": 2.7819, "step": 500 }, { "epoch": 0.0, "learning_rate": 9.999704786925458e-05, "loss": 2.79, "step": 505 }, { "epoch": 0.0, "learning_rate": 9.999697452792572e-05, "loss": 2.7978, "step": 510 }, { "epoch": 0.0, "learning_rate": 9.999690028673978e-05, "loss": 2.804, "step": 515 }, { "epoch": 0.0, "learning_rate": 9.99968251456981e-05, "loss": 2.848, "step": 520 }, { "epoch": 0.0, "learning_rate": 9.999674910480203e-05, "loss": 2.7883, "step": 525 }, { "epoch": 0.0, "learning_rate": 9.999667216405293e-05, "loss": 2.8039, "step": 530 }, { "epoch": 0.0, "learning_rate": 9.999659432345218e-05, "loss": 2.824, "step": 535 }, { "epoch": 0.0, "learning_rate": 9.99965155830012e-05, "loss": 2.8508, "step": 540 }, { "epoch": 0.0, "learning_rate": 9.999643594270141e-05, "loss": 2.7649, "step": 545 }, { "epoch": 0.0, "learning_rate": 9.999635540255421e-05, "loss": 2.7521, "step": 550 }, { "epoch": 0.0, "learning_rate": 9.999627396256109e-05, "loss": 2.8065, "step": 555 }, { "epoch": 0.0, "learning_rate": 9.999619162272346e-05, "loss": 2.7224, "step": 560 }, { "epoch": 0.0, "learning_rate": 9.999610838304288e-05, "loss": 2.8257, "step": 565 }, { "epoch": 0.0, "learning_rate": 9.999602424352079e-05, "loss": 2.7952, "step": 570 }, { "epoch": 0.0, "learning_rate": 9.999593920415873e-05, "loss": 2.7375, "step": 575 }, { "epoch": 0.0, "learning_rate": 9.999585326495822e-05, "loss": 2.8044, "step": 580 }, { "epoch": 0.0, "learning_rate": 9.999576642592078e-05, "loss": 2.7798, "step": 585 }, { "epoch": 0.01, "learning_rate": 9.999567868704804e-05, "loss": 2.7935, "step": 590 }, { "epoch": 0.01, "learning_rate": 9.999559004834152e-05, "loss": 2.8489, "step": 595 }, { "epoch": 0.01, "learning_rate": 9.999550050980284e-05, "loss": 2.7763, "step": 600 }, { "epoch": 0.01, "learning_rate": 9.999541007143362e-05, "loss": 2.7516, "step": 605 }, { "epoch": 0.01, "learning_rate": 9.999531873323545e-05, "loss": 2.8091, "step": 610 }, { "epoch": 0.01, "learning_rate": 9.999522649521003e-05, "loss": 2.8186, "step": 615 }, { "epoch": 0.01, "learning_rate": 9.999513335735896e-05, "loss": 2.9302, "step": 620 }, { "epoch": 0.01, "learning_rate": 9.999503931968396e-05, "loss": 2.8585, "step": 625 }, { "epoch": 0.01, "learning_rate": 9.99949443821867e-05, "loss": 2.7785, "step": 630 }, { "epoch": 0.01, "learning_rate": 9.999484854486891e-05, "loss": 2.7453, "step": 635 }, { "epoch": 0.01, "learning_rate": 9.99947518077323e-05, "loss": 2.7573, "step": 640 }, { "epoch": 0.01, "learning_rate": 9.99946541707786e-05, "loss": 2.7858, "step": 645 }, { "epoch": 0.01, "learning_rate": 9.999455563400959e-05, "loss": 2.7026, "step": 650 }, { "epoch": 0.01, "learning_rate": 9.999445619742703e-05, "loss": 2.7864, "step": 655 }, { "epoch": 0.01, "learning_rate": 9.999435586103272e-05, "loss": 2.8037, "step": 660 }, { "epoch": 0.01, "learning_rate": 9.999425462482846e-05, "loss": 2.843, "step": 665 }, { "epoch": 0.01, "learning_rate": 9.999415248881605e-05, "loss": 2.7711, "step": 670 }, { "epoch": 0.01, "learning_rate": 9.999404945299738e-05, "loss": 2.7674, "step": 675 }, { "epoch": 0.01, "learning_rate": 9.999394551737424e-05, "loss": 2.734, "step": 680 }, { "epoch": 0.01, "learning_rate": 9.999384068194856e-05, "loss": 2.7064, "step": 685 }, { "epoch": 0.01, "learning_rate": 9.999373494672219e-05, "loss": 2.7465, "step": 690 }, { "epoch": 0.01, "learning_rate": 9.999362831169705e-05, "loss": 2.8157, "step": 695 }, { "epoch": 0.01, "learning_rate": 9.999352077687506e-05, "loss": 2.8563, "step": 700 }, { "epoch": 0.01, "learning_rate": 9.999341234225815e-05, "loss": 2.7637, "step": 705 }, { "epoch": 0.01, "learning_rate": 9.999330300784827e-05, "loss": 2.719, "step": 710 }, { "epoch": 0.01, "learning_rate": 9.999319277364736e-05, "loss": 2.7703, "step": 715 }, { "epoch": 0.01, "learning_rate": 9.999308163965745e-05, "loss": 2.7625, "step": 720 }, { "epoch": 0.01, "learning_rate": 9.999296960588054e-05, "loss": 2.6717, "step": 725 }, { "epoch": 0.01, "learning_rate": 9.999285667231861e-05, "loss": 2.7129, "step": 730 }, { "epoch": 0.01, "learning_rate": 9.999274283897372e-05, "loss": 2.8584, "step": 735 }, { "epoch": 0.01, "learning_rate": 9.99926281058479e-05, "loss": 2.7955, "step": 740 }, { "epoch": 0.01, "learning_rate": 9.999251247294326e-05, "loss": 2.796, "step": 745 }, { "epoch": 0.01, "learning_rate": 9.99923959402618e-05, "loss": 2.6882, "step": 750 }, { "epoch": 0.01, "learning_rate": 9.99922785078057e-05, "loss": 2.7468, "step": 755 }, { "epoch": 0.01, "learning_rate": 9.999216017557703e-05, "loss": 2.7458, "step": 760 }, { "epoch": 0.01, "learning_rate": 9.999204094357792e-05, "loss": 2.6784, "step": 765 }, { "epoch": 0.01, "learning_rate": 9.999192081181052e-05, "loss": 2.7402, "step": 770 }, { "epoch": 0.01, "learning_rate": 9.9991799780277e-05, "loss": 2.6681, "step": 775 }, { "epoch": 0.01, "learning_rate": 9.999167784897954e-05, "loss": 2.6943, "step": 780 }, { "epoch": 0.01, "learning_rate": 9.999155501792032e-05, "loss": 2.8471, "step": 785 }, { "epoch": 0.01, "learning_rate": 9.999143128710156e-05, "loss": 2.7478, "step": 790 }, { "epoch": 0.01, "learning_rate": 9.99913066565255e-05, "loss": 2.6906, "step": 795 }, { "epoch": 0.01, "learning_rate": 9.999118112619435e-05, "loss": 2.7223, "step": 800 }, { "epoch": 0.01, "learning_rate": 9.999105469611039e-05, "loss": 2.8674, "step": 805 }, { "epoch": 0.01, "learning_rate": 9.999092736627592e-05, "loss": 2.823, "step": 810 }, { "epoch": 0.01, "learning_rate": 9.999079913669318e-05, "loss": 2.7051, "step": 815 }, { "epoch": 0.01, "learning_rate": 9.99906700073645e-05, "loss": 2.8177, "step": 820 }, { "epoch": 0.01, "learning_rate": 9.999053997829222e-05, "loss": 2.7195, "step": 825 }, { "epoch": 0.01, "learning_rate": 9.999040904947868e-05, "loss": 2.7626, "step": 830 }, { "epoch": 0.01, "learning_rate": 9.999027722092621e-05, "loss": 2.7238, "step": 835 }, { "epoch": 0.01, "learning_rate": 9.99901444926372e-05, "loss": 2.6969, "step": 840 }, { "epoch": 0.01, "learning_rate": 9.999001086461404e-05, "loss": 2.7253, "step": 845 }, { "epoch": 0.01, "learning_rate": 9.998987633685913e-05, "loss": 2.6958, "step": 850 }, { "epoch": 0.01, "learning_rate": 9.998974090937489e-05, "loss": 2.7911, "step": 855 }, { "epoch": 0.01, "learning_rate": 9.998960458216376e-05, "loss": 2.7675, "step": 860 }, { "epoch": 0.01, "learning_rate": 9.998946735522819e-05, "loss": 2.7852, "step": 865 }, { "epoch": 0.01, "learning_rate": 9.998932922857066e-05, "loss": 2.6868, "step": 870 }, { "epoch": 0.01, "learning_rate": 9.998919020219364e-05, "loss": 2.7209, "step": 875 }, { "epoch": 0.01, "learning_rate": 9.998905027609966e-05, "loss": 2.7736, "step": 880 }, { "epoch": 0.01, "learning_rate": 9.99889094502912e-05, "loss": 2.8039, "step": 885 }, { "epoch": 0.01, "learning_rate": 9.998876772477083e-05, "loss": 2.773, "step": 890 }, { "epoch": 0.01, "learning_rate": 9.998862509954108e-05, "loss": 2.8195, "step": 895 }, { "epoch": 0.01, "learning_rate": 9.998848157460453e-05, "loss": 2.7481, "step": 900 }, { "epoch": 0.01, "learning_rate": 9.998833714996374e-05, "loss": 2.6684, "step": 905 }, { "epoch": 0.01, "learning_rate": 9.998819182562134e-05, "loss": 2.7226, "step": 910 }, { "epoch": 0.01, "learning_rate": 9.998804560157993e-05, "loss": 2.7816, "step": 915 }, { "epoch": 0.01, "learning_rate": 9.998789847784214e-05, "loss": 2.6872, "step": 920 }, { "epoch": 0.01, "learning_rate": 9.998775045441061e-05, "loss": 2.7133, "step": 925 }, { "epoch": 0.01, "learning_rate": 9.998760153128803e-05, "loss": 2.7296, "step": 930 }, { "epoch": 0.01, "learning_rate": 9.998745170847705e-05, "loss": 2.733, "step": 935 }, { "epoch": 0.01, "learning_rate": 9.998730098598039e-05, "loss": 2.7, "step": 940 }, { "epoch": 0.01, "learning_rate": 9.998714936380076e-05, "loss": 2.7425, "step": 945 }, { "epoch": 0.01, "learning_rate": 9.998699684194089e-05, "loss": 2.77, "step": 950 }, { "epoch": 0.01, "learning_rate": 9.998684342040349e-05, "loss": 2.7239, "step": 955 }, { "epoch": 0.01, "learning_rate": 9.998668909919138e-05, "loss": 2.7539, "step": 960 }, { "epoch": 0.01, "learning_rate": 9.998653387830729e-05, "loss": 2.7656, "step": 965 }, { "epoch": 0.01, "learning_rate": 9.998637775775403e-05, "loss": 2.7055, "step": 970 }, { "epoch": 0.01, "learning_rate": 9.998622073753443e-05, "loss": 2.7053, "step": 975 }, { "epoch": 0.01, "learning_rate": 9.998606281765127e-05, "loss": 2.7274, "step": 980 }, { "epoch": 0.01, "learning_rate": 9.998590399810744e-05, "loss": 2.7037, "step": 985 }, { "epoch": 0.01, "learning_rate": 9.998574427890577e-05, "loss": 2.6972, "step": 990 }, { "epoch": 0.01, "learning_rate": 9.998558366004914e-05, "loss": 2.6814, "step": 995 }, { "epoch": 0.01, "learning_rate": 9.998542214154046e-05, "loss": 2.668, "step": 1000 }, { "epoch": 0.01, "learning_rate": 9.99852597233826e-05, "loss": 2.6943, "step": 1005 }, { "epoch": 0.01, "learning_rate": 9.998509640557849e-05, "loss": 2.789, "step": 1010 }, { "epoch": 0.01, "learning_rate": 9.998493218813111e-05, "loss": 2.7209, "step": 1015 }, { "epoch": 0.01, "learning_rate": 9.998476707104339e-05, "loss": 2.7578, "step": 1020 }, { "epoch": 0.01, "learning_rate": 9.998460105431828e-05, "loss": 2.7564, "step": 1025 }, { "epoch": 0.01, "learning_rate": 9.99844341379588e-05, "loss": 2.7385, "step": 1030 }, { "epoch": 0.01, "learning_rate": 9.998426632196796e-05, "loss": 2.5883, "step": 1035 }, { "epoch": 0.01, "learning_rate": 9.998409760634874e-05, "loss": 2.6776, "step": 1040 }, { "epoch": 0.01, "learning_rate": 9.99839279911042e-05, "loss": 2.6983, "step": 1045 }, { "epoch": 0.01, "learning_rate": 9.998375747623741e-05, "loss": 2.7924, "step": 1050 }, { "epoch": 0.01, "learning_rate": 9.99835860617514e-05, "loss": 2.788, "step": 1055 }, { "epoch": 0.01, "learning_rate": 9.998341374764928e-05, "loss": 2.6687, "step": 1060 }, { "epoch": 0.01, "learning_rate": 9.998324053393416e-05, "loss": 2.6708, "step": 1065 }, { "epoch": 0.01, "learning_rate": 9.998306642060913e-05, "loss": 2.6863, "step": 1070 }, { "epoch": 0.01, "learning_rate": 9.998289140767736e-05, "loss": 2.7403, "step": 1075 }, { "epoch": 0.01, "learning_rate": 9.998271549514195e-05, "loss": 2.6659, "step": 1080 }, { "epoch": 0.01, "learning_rate": 9.998253868300613e-05, "loss": 2.6262, "step": 1085 }, { "epoch": 0.01, "learning_rate": 9.998236097127302e-05, "loss": 2.7425, "step": 1090 }, { "epoch": 0.01, "learning_rate": 9.998218235994585e-05, "loss": 2.7225, "step": 1095 }, { "epoch": 0.01, "learning_rate": 9.998200284902785e-05, "loss": 2.7585, "step": 1100 }, { "epoch": 0.01, "learning_rate": 9.998182243852221e-05, "loss": 2.6418, "step": 1105 }, { "epoch": 0.01, "learning_rate": 9.998164112843221e-05, "loss": 2.5976, "step": 1110 }, { "epoch": 0.01, "learning_rate": 9.99814589187611e-05, "loss": 2.706, "step": 1115 }, { "epoch": 0.01, "learning_rate": 9.998127580951216e-05, "loss": 2.7318, "step": 1120 }, { "epoch": 0.01, "learning_rate": 9.998109180068869e-05, "loss": 2.6858, "step": 1125 }, { "epoch": 0.01, "learning_rate": 9.998090689229398e-05, "loss": 2.7337, "step": 1130 }, { "epoch": 0.01, "learning_rate": 9.99807210843314e-05, "loss": 2.7004, "step": 1135 }, { "epoch": 0.01, "learning_rate": 9.998053437680426e-05, "loss": 2.7686, "step": 1140 }, { "epoch": 0.01, "learning_rate": 9.998034676971593e-05, "loss": 2.7342, "step": 1145 }, { "epoch": 0.01, "learning_rate": 9.998015826306979e-05, "loss": 2.6396, "step": 1150 }, { "epoch": 0.01, "learning_rate": 9.997996885686924e-05, "loss": 2.7647, "step": 1155 }, { "epoch": 0.01, "learning_rate": 9.997977855111767e-05, "loss": 2.7246, "step": 1160 }, { "epoch": 0.01, "learning_rate": 9.997958734581852e-05, "loss": 2.7415, "step": 1165 }, { "epoch": 0.01, "learning_rate": 9.997939524097523e-05, "loss": 2.6417, "step": 1170 }, { "epoch": 0.01, "learning_rate": 9.997920223659126e-05, "loss": 2.686, "step": 1175 }, { "epoch": 0.01, "learning_rate": 9.997900833267004e-05, "loss": 2.6321, "step": 1180 }, { "epoch": 0.01, "learning_rate": 9.997881352921513e-05, "loss": 2.6525, "step": 1185 }, { "epoch": 0.01, "learning_rate": 9.997861782623e-05, "loss": 2.6671, "step": 1190 }, { "epoch": 0.01, "learning_rate": 9.997842122371816e-05, "loss": 2.6689, "step": 1195 }, { "epoch": 0.01, "learning_rate": 9.99782237216832e-05, "loss": 2.6797, "step": 1200 }, { "epoch": 0.01, "learning_rate": 9.997802532012861e-05, "loss": 2.7244, "step": 1205 }, { "epoch": 0.01, "learning_rate": 9.9977826019058e-05, "loss": 2.68, "step": 1210 }, { "epoch": 0.01, "learning_rate": 9.997762581847494e-05, "loss": 2.7122, "step": 1215 }, { "epoch": 0.01, "learning_rate": 9.997742471838304e-05, "loss": 2.6829, "step": 1220 }, { "epoch": 0.01, "learning_rate": 9.997722271878593e-05, "loss": 2.6569, "step": 1225 }, { "epoch": 0.01, "learning_rate": 9.997701981968723e-05, "loss": 2.6833, "step": 1230 }, { "epoch": 0.01, "learning_rate": 9.997681602109059e-05, "loss": 2.738, "step": 1235 }, { "epoch": 0.01, "learning_rate": 9.997661132299969e-05, "loss": 2.6058, "step": 1240 }, { "epoch": 0.01, "learning_rate": 9.997640572541822e-05, "loss": 2.7016, "step": 1245 }, { "epoch": 0.01, "learning_rate": 9.997619922834985e-05, "loss": 2.5784, "step": 1250 }, { "epoch": 0.01, "learning_rate": 9.997599183179834e-05, "loss": 2.6936, "step": 1255 }, { "epoch": 0.01, "learning_rate": 9.997578353576737e-05, "loss": 2.769, "step": 1260 }, { "epoch": 0.01, "learning_rate": 9.997557434026075e-05, "loss": 2.6112, "step": 1265 }, { "epoch": 0.01, "learning_rate": 9.99753642452822e-05, "loss": 2.6588, "step": 1270 }, { "epoch": 0.01, "learning_rate": 9.99751532508355e-05, "loss": 2.7218, "step": 1275 }, { "epoch": 0.01, "learning_rate": 9.997494135692447e-05, "loss": 2.6465, "step": 1280 }, { "epoch": 0.01, "learning_rate": 9.997472856355293e-05, "loss": 2.6191, "step": 1285 }, { "epoch": 0.01, "learning_rate": 9.997451487072468e-05, "loss": 2.6553, "step": 1290 }, { "epoch": 0.01, "learning_rate": 9.997430027844359e-05, "loss": 2.6932, "step": 1295 }, { "epoch": 0.01, "learning_rate": 9.997408478671351e-05, "loss": 2.6119, "step": 1300 }, { "epoch": 0.01, "learning_rate": 9.997386839553833e-05, "loss": 2.6769, "step": 1305 }, { "epoch": 0.01, "learning_rate": 9.997365110492194e-05, "loss": 2.6237, "step": 1310 }, { "epoch": 0.01, "learning_rate": 9.997343291486823e-05, "loss": 2.6739, "step": 1315 }, { "epoch": 0.01, "learning_rate": 9.997321382538116e-05, "loss": 2.6284, "step": 1320 }, { "epoch": 0.01, "learning_rate": 9.997299383646466e-05, "loss": 2.7342, "step": 1325 }, { "epoch": 0.01, "learning_rate": 9.997277294812269e-05, "loss": 2.6317, "step": 1330 }, { "epoch": 0.01, "learning_rate": 9.99725511603592e-05, "loss": 2.6467, "step": 1335 }, { "epoch": 0.01, "learning_rate": 9.997232847317822e-05, "loss": 2.6555, "step": 1340 }, { "epoch": 0.01, "learning_rate": 9.997210488658375e-05, "loss": 2.5878, "step": 1345 }, { "epoch": 0.01, "learning_rate": 9.99718804005798e-05, "loss": 2.7179, "step": 1350 }, { "epoch": 0.01, "learning_rate": 9.997165501517042e-05, "loss": 2.6848, "step": 1355 }, { "epoch": 0.01, "learning_rate": 9.997142873035967e-05, "loss": 2.6474, "step": 1360 }, { "epoch": 0.01, "learning_rate": 9.99712015461516e-05, "loss": 2.5212, "step": 1365 }, { "epoch": 0.01, "learning_rate": 9.997097346255034e-05, "loss": 2.6337, "step": 1370 }, { "epoch": 0.01, "learning_rate": 9.997074447955994e-05, "loss": 2.7096, "step": 1375 }, { "epoch": 0.01, "learning_rate": 9.997051459718457e-05, "loss": 2.6061, "step": 1380 }, { "epoch": 0.01, "learning_rate": 9.997028381542835e-05, "loss": 2.6235, "step": 1385 }, { "epoch": 0.01, "learning_rate": 9.997005213429544e-05, "loss": 2.6584, "step": 1390 }, { "epoch": 0.01, "learning_rate": 9.996981955378999e-05, "loss": 2.6415, "step": 1395 }, { "epoch": 0.01, "learning_rate": 9.99695860739162e-05, "loss": 2.6817, "step": 1400 }, { "epoch": 0.01, "learning_rate": 9.996935169467828e-05, "loss": 2.659, "step": 1405 }, { "epoch": 0.01, "learning_rate": 9.996911641608045e-05, "loss": 2.6608, "step": 1410 }, { "epoch": 0.01, "learning_rate": 9.996888023812691e-05, "loss": 2.5826, "step": 1415 }, { "epoch": 0.01, "learning_rate": 9.996864316082195e-05, "loss": 2.7205, "step": 1420 }, { "epoch": 0.01, "learning_rate": 9.996840518416981e-05, "loss": 2.5722, "step": 1425 }, { "epoch": 0.01, "learning_rate": 9.996816630817481e-05, "loss": 2.6356, "step": 1430 }, { "epoch": 0.01, "learning_rate": 9.99679265328412e-05, "loss": 2.5992, "step": 1435 }, { "epoch": 0.01, "learning_rate": 9.996768585817333e-05, "loss": 2.6355, "step": 1440 }, { "epoch": 0.01, "learning_rate": 9.996744428417552e-05, "loss": 2.6305, "step": 1445 }, { "epoch": 0.01, "learning_rate": 9.996720181085211e-05, "loss": 2.6629, "step": 1450 }, { "epoch": 0.01, "learning_rate": 9.996695843820749e-05, "loss": 2.6352, "step": 1455 }, { "epoch": 0.01, "learning_rate": 9.996671416624602e-05, "loss": 2.6458, "step": 1460 }, { "epoch": 0.01, "learning_rate": 9.99664689949721e-05, "loss": 2.6106, "step": 1465 }, { "epoch": 0.01, "learning_rate": 9.996622292439015e-05, "loss": 2.648, "step": 1470 }, { "epoch": 0.01, "learning_rate": 9.996597595450459e-05, "loss": 2.6172, "step": 1475 }, { "epoch": 0.01, "learning_rate": 9.996572808531985e-05, "loss": 2.6345, "step": 1480 }, { "epoch": 0.01, "learning_rate": 9.996547931684042e-05, "loss": 2.6211, "step": 1485 }, { "epoch": 0.01, "learning_rate": 9.996522964907078e-05, "loss": 2.7069, "step": 1490 }, { "epoch": 0.01, "learning_rate": 9.996497908201538e-05, "loss": 2.6613, "step": 1495 }, { "epoch": 0.01, "learning_rate": 9.996472761567879e-05, "loss": 2.6585, "step": 1500 }, { "epoch": 0.01, "learning_rate": 9.996447525006549e-05, "loss": 2.6764, "step": 1505 }, { "epoch": 0.01, "learning_rate": 9.996422198518003e-05, "loss": 2.657, "step": 1510 }, { "epoch": 0.01, "learning_rate": 9.996396782102699e-05, "loss": 2.6641, "step": 1515 }, { "epoch": 0.01, "learning_rate": 9.996371275761091e-05, "loss": 2.6268, "step": 1520 }, { "epoch": 0.01, "learning_rate": 9.996345679493642e-05, "loss": 2.5883, "step": 1525 }, { "epoch": 0.01, "learning_rate": 9.996319993300812e-05, "loss": 2.6261, "step": 1530 }, { "epoch": 0.01, "learning_rate": 9.99629421718306e-05, "loss": 2.6468, "step": 1535 }, { "epoch": 0.01, "learning_rate": 9.996268351140851e-05, "loss": 2.6228, "step": 1540 }, { "epoch": 0.01, "learning_rate": 9.996242395174653e-05, "loss": 2.7123, "step": 1545 }, { "epoch": 0.01, "learning_rate": 9.996216349284932e-05, "loss": 2.6808, "step": 1550 }, { "epoch": 0.01, "learning_rate": 9.996190213472157e-05, "loss": 2.6004, "step": 1555 }, { "epoch": 0.01, "learning_rate": 9.996163987736796e-05, "loss": 2.6209, "step": 1560 }, { "epoch": 0.01, "learning_rate": 9.996137672079325e-05, "loss": 2.6626, "step": 1565 }, { "epoch": 0.01, "learning_rate": 9.996111266500214e-05, "loss": 2.5992, "step": 1570 }, { "epoch": 0.01, "learning_rate": 9.996084770999939e-05, "loss": 2.638, "step": 1575 }, { "epoch": 0.01, "learning_rate": 9.99605818557898e-05, "loss": 2.6652, "step": 1580 }, { "epoch": 0.01, "learning_rate": 9.996031510237811e-05, "loss": 2.681, "step": 1585 }, { "epoch": 0.01, "learning_rate": 9.996004744976916e-05, "loss": 2.6226, "step": 1590 }, { "epoch": 0.01, "learning_rate": 9.995977889796774e-05, "loss": 2.6131, "step": 1595 }, { "epoch": 0.01, "learning_rate": 9.99595094469787e-05, "loss": 2.7082, "step": 1600 }, { "epoch": 0.01, "learning_rate": 9.995923909680687e-05, "loss": 2.6557, "step": 1605 }, { "epoch": 0.01, "learning_rate": 9.995896784745715e-05, "loss": 2.5701, "step": 1610 }, { "epoch": 0.01, "learning_rate": 9.995869569893438e-05, "loss": 2.5943, "step": 1615 }, { "epoch": 0.01, "learning_rate": 9.995842265124349e-05, "loss": 2.6255, "step": 1620 }, { "epoch": 0.01, "learning_rate": 9.995814870438937e-05, "loss": 2.6324, "step": 1625 }, { "epoch": 0.01, "learning_rate": 9.995787385837698e-05, "loss": 2.5298, "step": 1630 }, { "epoch": 0.01, "learning_rate": 9.995759811321124e-05, "loss": 2.6668, "step": 1635 }, { "epoch": 0.01, "learning_rate": 9.995732146889713e-05, "loss": 2.5824, "step": 1640 }, { "epoch": 0.01, "learning_rate": 9.995704392543963e-05, "loss": 2.7284, "step": 1645 }, { "epoch": 0.01, "learning_rate": 9.995676548284371e-05, "loss": 2.64, "step": 1650 }, { "epoch": 0.01, "learning_rate": 9.995648614111441e-05, "loss": 2.6767, "step": 1655 }, { "epoch": 0.01, "learning_rate": 9.995620590025675e-05, "loss": 2.6645, "step": 1660 }, { "epoch": 0.01, "learning_rate": 9.995592476027576e-05, "loss": 2.6507, "step": 1665 }, { "epoch": 0.01, "learning_rate": 9.995564272117652e-05, "loss": 2.5787, "step": 1670 }, { "epoch": 0.01, "learning_rate": 9.99553597829641e-05, "loss": 2.6699, "step": 1675 }, { "epoch": 0.01, "learning_rate": 9.995507594564359e-05, "loss": 2.5304, "step": 1680 }, { "epoch": 0.01, "learning_rate": 9.995479120922009e-05, "loss": 2.6758, "step": 1685 }, { "epoch": 0.01, "learning_rate": 9.995450557369874e-05, "loss": 2.5318, "step": 1690 }, { "epoch": 0.01, "learning_rate": 9.995421903908467e-05, "loss": 2.6038, "step": 1695 }, { "epoch": 0.01, "learning_rate": 9.995393160538303e-05, "loss": 2.5682, "step": 1700 }, { "epoch": 0.01, "learning_rate": 9.995364327259902e-05, "loss": 2.5977, "step": 1705 }, { "epoch": 0.01, "learning_rate": 9.99533540407378e-05, "loss": 2.6053, "step": 1710 }, { "epoch": 0.01, "learning_rate": 9.995306390980461e-05, "loss": 2.5287, "step": 1715 }, { "epoch": 0.01, "learning_rate": 9.995277287980464e-05, "loss": 2.624, "step": 1720 }, { "epoch": 0.01, "learning_rate": 9.995248095074313e-05, "loss": 2.5875, "step": 1725 }, { "epoch": 0.01, "learning_rate": 9.995218812262535e-05, "loss": 2.6157, "step": 1730 }, { "epoch": 0.01, "learning_rate": 9.995189439545657e-05, "loss": 2.6657, "step": 1735 }, { "epoch": 0.01, "learning_rate": 9.995159976924206e-05, "loss": 2.5982, "step": 1740 }, { "epoch": 0.01, "learning_rate": 9.995130424398715e-05, "loss": 2.6523, "step": 1745 }, { "epoch": 0.01, "learning_rate": 9.995100781969713e-05, "loss": 2.5346, "step": 1750 }, { "epoch": 0.01, "learning_rate": 9.995071049637734e-05, "loss": 2.6491, "step": 1755 }, { "epoch": 0.02, "learning_rate": 9.995041227403314e-05, "loss": 2.5438, "step": 1760 }, { "epoch": 0.02, "learning_rate": 9.995011315266991e-05, "loss": 2.6009, "step": 1765 }, { "epoch": 0.02, "learning_rate": 9.994981313229301e-05, "loss": 2.5568, "step": 1770 }, { "epoch": 0.02, "learning_rate": 9.994951221290786e-05, "loss": 2.5353, "step": 1775 }, { "epoch": 0.02, "learning_rate": 9.994921039451985e-05, "loss": 2.645, "step": 1780 }, { "epoch": 0.02, "learning_rate": 9.994890767713445e-05, "loss": 2.6159, "step": 1785 }, { "epoch": 0.02, "learning_rate": 9.994860406075706e-05, "loss": 2.6486, "step": 1790 }, { "epoch": 0.02, "learning_rate": 9.994829954539318e-05, "loss": 2.6952, "step": 1795 }, { "epoch": 0.02, "learning_rate": 9.99479941310483e-05, "loss": 2.6425, "step": 1800 }, { "epoch": 0.02, "learning_rate": 9.994768781772787e-05, "loss": 2.6188, "step": 1805 }, { "epoch": 0.02, "learning_rate": 9.994738060543745e-05, "loss": 2.6257, "step": 1810 }, { "epoch": 0.02, "learning_rate": 9.994707249418254e-05, "loss": 2.6155, "step": 1815 }, { "epoch": 0.02, "learning_rate": 9.99467634839687e-05, "loss": 2.6829, "step": 1820 }, { "epoch": 0.02, "learning_rate": 9.994645357480148e-05, "loss": 2.6141, "step": 1825 }, { "epoch": 0.02, "learning_rate": 9.994614276668647e-05, "loss": 2.5479, "step": 1830 }, { "epoch": 0.02, "learning_rate": 9.994583105962927e-05, "loss": 2.5755, "step": 1835 }, { "epoch": 0.02, "learning_rate": 9.994551845363547e-05, "loss": 2.5798, "step": 1840 }, { "epoch": 0.02, "learning_rate": 9.994520494871072e-05, "loss": 2.6292, "step": 1845 }, { "epoch": 0.02, "learning_rate": 9.994489054486062e-05, "loss": 2.7222, "step": 1850 }, { "epoch": 0.02, "learning_rate": 9.994457524209089e-05, "loss": 2.6235, "step": 1855 }, { "epoch": 0.02, "learning_rate": 9.994425904040716e-05, "loss": 2.6464, "step": 1860 }, { "epoch": 0.02, "learning_rate": 9.994394193981512e-05, "loss": 2.5811, "step": 1865 }, { "epoch": 0.02, "learning_rate": 9.994362394032051e-05, "loss": 2.6411, "step": 1870 }, { "epoch": 0.02, "learning_rate": 9.994330504192901e-05, "loss": 2.6312, "step": 1875 }, { "epoch": 0.02, "learning_rate": 9.99429852446464e-05, "loss": 2.5424, "step": 1880 }, { "epoch": 0.02, "learning_rate": 9.994266454847842e-05, "loss": 2.5949, "step": 1885 }, { "epoch": 0.02, "learning_rate": 9.994234295343084e-05, "loss": 2.5919, "step": 1890 }, { "epoch": 0.02, "learning_rate": 9.994202045950944e-05, "loss": 2.658, "step": 1895 }, { "epoch": 0.02, "learning_rate": 9.994169706672006e-05, "loss": 2.5762, "step": 1900 }, { "epoch": 0.02, "learning_rate": 9.994137277506847e-05, "loss": 2.6026, "step": 1905 }, { "epoch": 0.02, "learning_rate": 9.994104758456053e-05, "loss": 2.5786, "step": 1910 }, { "epoch": 0.02, "learning_rate": 9.99407214952021e-05, "loss": 2.6079, "step": 1915 }, { "epoch": 0.02, "learning_rate": 9.994039450699906e-05, "loss": 2.6305, "step": 1920 }, { "epoch": 0.02, "learning_rate": 9.994006661995725e-05, "loss": 2.6244, "step": 1925 }, { "epoch": 0.02, "learning_rate": 9.993973783408262e-05, "loss": 2.6346, "step": 1930 }, { "epoch": 0.02, "learning_rate": 9.993940814938105e-05, "loss": 2.6247, "step": 1935 }, { "epoch": 0.02, "learning_rate": 9.993907756585851e-05, "loss": 2.6136, "step": 1940 }, { "epoch": 0.02, "learning_rate": 9.993874608352092e-05, "loss": 2.5771, "step": 1945 }, { "epoch": 0.02, "learning_rate": 9.993841370237424e-05, "loss": 2.6013, "step": 1950 }, { "epoch": 0.02, "learning_rate": 9.99380804224245e-05, "loss": 2.6514, "step": 1955 }, { "epoch": 0.02, "learning_rate": 9.993774624367764e-05, "loss": 2.6485, "step": 1960 }, { "epoch": 0.02, "learning_rate": 9.993741116613973e-05, "loss": 2.5071, "step": 1965 }, { "epoch": 0.02, "learning_rate": 9.993707518981675e-05, "loss": 2.6178, "step": 1970 }, { "epoch": 0.02, "learning_rate": 9.993673831471479e-05, "loss": 2.5945, "step": 1975 }, { "epoch": 0.02, "learning_rate": 9.993640054083988e-05, "loss": 2.6449, "step": 1980 }, { "epoch": 0.02, "learning_rate": 9.99360618681981e-05, "loss": 2.5947, "step": 1985 }, { "epoch": 0.02, "learning_rate": 9.993572229679557e-05, "loss": 2.6138, "step": 1990 }, { "epoch": 0.02, "learning_rate": 9.993538182663839e-05, "loss": 2.619, "step": 1995 }, { "epoch": 0.02, "learning_rate": 9.99350404577327e-05, "loss": 2.6323, "step": 2000 }, { "epoch": 0.02, "learning_rate": 9.993469819008461e-05, "loss": 2.5941, "step": 2005 }, { "epoch": 0.02, "learning_rate": 9.993435502370032e-05, "loss": 2.5948, "step": 2010 }, { "epoch": 0.02, "learning_rate": 9.993401095858599e-05, "loss": 2.6417, "step": 2015 }, { "epoch": 0.02, "learning_rate": 9.993366599474779e-05, "loss": 2.5835, "step": 2020 }, { "epoch": 0.02, "learning_rate": 9.993332013219196e-05, "loss": 2.5519, "step": 2025 }, { "epoch": 0.02, "learning_rate": 9.993297337092472e-05, "loss": 2.6831, "step": 2030 }, { "epoch": 0.02, "learning_rate": 9.99326257109523e-05, "loss": 2.5802, "step": 2035 }, { "epoch": 0.02, "learning_rate": 9.993227715228096e-05, "loss": 2.609, "step": 2040 }, { "epoch": 0.02, "learning_rate": 9.993192769491697e-05, "loss": 2.5794, "step": 2045 }, { "epoch": 0.02, "learning_rate": 9.993157733886664e-05, "loss": 2.5366, "step": 2050 }, { "epoch": 0.02, "learning_rate": 9.993122608413625e-05, "loss": 2.5959, "step": 2055 }, { "epoch": 0.02, "learning_rate": 9.993087393073214e-05, "loss": 2.6265, "step": 2060 }, { "epoch": 0.02, "learning_rate": 9.993052087866065e-05, "loss": 2.5569, "step": 2065 }, { "epoch": 0.02, "learning_rate": 9.993016692792812e-05, "loss": 2.5129, "step": 2070 }, { "epoch": 0.02, "learning_rate": 9.992981207854091e-05, "loss": 2.5272, "step": 2075 }, { "epoch": 0.02, "learning_rate": 9.992945633050544e-05, "loss": 2.6266, "step": 2080 }, { "epoch": 0.02, "learning_rate": 9.99290996838281e-05, "loss": 2.5359, "step": 2085 }, { "epoch": 0.02, "learning_rate": 9.992874213851528e-05, "loss": 2.5212, "step": 2090 }, { "epoch": 0.02, "learning_rate": 9.992838369457346e-05, "loss": 2.6058, "step": 2095 }, { "epoch": 0.02, "learning_rate": 9.992802435200908e-05, "loss": 2.5424, "step": 2100 }, { "epoch": 0.02, "learning_rate": 9.992766411082859e-05, "loss": 2.5178, "step": 2105 }, { "epoch": 0.02, "learning_rate": 9.992730297103847e-05, "loss": 2.5594, "step": 2110 }, { "epoch": 0.02, "learning_rate": 9.992694093264525e-05, "loss": 2.6155, "step": 2115 }, { "epoch": 0.02, "learning_rate": 9.992657799565541e-05, "loss": 2.6148, "step": 2120 }, { "epoch": 0.02, "learning_rate": 9.992621416007553e-05, "loss": 2.5317, "step": 2125 }, { "epoch": 0.02, "learning_rate": 9.99258494259121e-05, "loss": 2.4529, "step": 2130 }, { "epoch": 0.02, "learning_rate": 9.992548379317173e-05, "loss": 2.5954, "step": 2135 }, { "epoch": 0.02, "learning_rate": 9.992511726186098e-05, "loss": 2.5689, "step": 2140 }, { "epoch": 0.02, "learning_rate": 9.992474983198645e-05, "loss": 2.6419, "step": 2145 }, { "epoch": 0.02, "learning_rate": 9.992438150355475e-05, "loss": 2.6305, "step": 2150 }, { "epoch": 0.02, "learning_rate": 9.992401227657253e-05, "loss": 2.5389, "step": 2155 }, { "epoch": 0.02, "learning_rate": 9.99236421510464e-05, "loss": 2.5691, "step": 2160 }, { "epoch": 0.02, "learning_rate": 9.992327112698306e-05, "loss": 2.6171, "step": 2165 }, { "epoch": 0.02, "learning_rate": 9.992289920438915e-05, "loss": 2.419, "step": 2170 }, { "epoch": 0.02, "learning_rate": 9.99225263832714e-05, "loss": 2.5896, "step": 2175 }, { "epoch": 0.02, "learning_rate": 9.992215266363648e-05, "loss": 2.5738, "step": 2180 }, { "epoch": 0.02, "learning_rate": 9.992177804549116e-05, "loss": 2.6163, "step": 2185 }, { "epoch": 0.02, "learning_rate": 9.992140252884215e-05, "loss": 2.5989, "step": 2190 }, { "epoch": 0.02, "learning_rate": 9.992102611369623e-05, "loss": 2.5704, "step": 2195 }, { "epoch": 0.02, "learning_rate": 9.992064880006015e-05, "loss": 2.6467, "step": 2200 }, { "epoch": 0.02, "learning_rate": 9.992027058794073e-05, "loss": 2.4998, "step": 2205 }, { "epoch": 0.02, "learning_rate": 9.991989147734475e-05, "loss": 2.5535, "step": 2210 }, { "epoch": 0.02, "learning_rate": 9.991951146827906e-05, "loss": 2.5439, "step": 2215 }, { "epoch": 0.02, "learning_rate": 9.991913056075049e-05, "loss": 2.5745, "step": 2220 }, { "epoch": 0.02, "learning_rate": 9.991874875476587e-05, "loss": 2.5549, "step": 2225 }, { "epoch": 0.02, "learning_rate": 9.99183660503321e-05, "loss": 2.6127, "step": 2230 }, { "epoch": 0.02, "learning_rate": 9.991798244745607e-05, "loss": 2.5292, "step": 2235 }, { "epoch": 0.02, "learning_rate": 9.991759794614466e-05, "loss": 2.5606, "step": 2240 }, { "epoch": 0.02, "learning_rate": 9.991721254640483e-05, "loss": 2.6114, "step": 2245 }, { "epoch": 0.02, "learning_rate": 9.991682624824347e-05, "loss": 2.5909, "step": 2250 }, { "epoch": 0.02, "learning_rate": 9.991643905166756e-05, "loss": 2.5738, "step": 2255 }, { "epoch": 0.02, "learning_rate": 9.991605095668409e-05, "loss": 2.5892, "step": 2260 }, { "epoch": 0.02, "learning_rate": 9.991566196329999e-05, "loss": 2.5112, "step": 2265 }, { "epoch": 0.02, "learning_rate": 9.991527207152229e-05, "loss": 2.536, "step": 2270 }, { "epoch": 0.02, "learning_rate": 9.991488128135802e-05, "loss": 2.5791, "step": 2275 }, { "epoch": 0.02, "learning_rate": 9.99144895928142e-05, "loss": 2.5098, "step": 2280 }, { "epoch": 0.02, "learning_rate": 9.991409700589787e-05, "loss": 2.6071, "step": 2285 }, { "epoch": 0.02, "learning_rate": 9.99137035206161e-05, "loss": 2.6102, "step": 2290 }, { "epoch": 0.02, "learning_rate": 9.9913309136976e-05, "loss": 2.5383, "step": 2295 }, { "epoch": 0.02, "learning_rate": 9.991291385498465e-05, "loss": 2.647, "step": 2300 }, { "epoch": 0.02, "learning_rate": 9.991251767464915e-05, "loss": 2.5873, "step": 2305 }, { "epoch": 0.02, "learning_rate": 9.991212059597663e-05, "loss": 2.5787, "step": 2310 }, { "epoch": 0.02, "learning_rate": 9.991172261897426e-05, "loss": 2.564, "step": 2315 }, { "epoch": 0.02, "learning_rate": 9.99113237436492e-05, "loss": 2.61, "step": 2320 }, { "epoch": 0.02, "learning_rate": 9.99109239700086e-05, "loss": 2.4759, "step": 2325 }, { "epoch": 0.02, "learning_rate": 9.99105232980597e-05, "loss": 2.6339, "step": 2330 }, { "epoch": 0.02, "learning_rate": 9.991012172780967e-05, "loss": 2.6478, "step": 2335 }, { "epoch": 0.02, "learning_rate": 9.990971925926575e-05, "loss": 2.5417, "step": 2340 }, { "epoch": 0.02, "learning_rate": 9.99093158924352e-05, "loss": 2.6491, "step": 2345 }, { "epoch": 0.02, "learning_rate": 9.990891162732527e-05, "loss": 2.4709, "step": 2350 }, { "epoch": 0.02, "learning_rate": 9.990850646394323e-05, "loss": 2.5209, "step": 2355 }, { "epoch": 0.02, "learning_rate": 9.990810040229637e-05, "loss": 2.507, "step": 2360 }, { "epoch": 0.02, "learning_rate": 9.990769344239201e-05, "loss": 2.5453, "step": 2365 }, { "epoch": 0.02, "learning_rate": 9.990728558423747e-05, "loss": 2.6425, "step": 2370 }, { "epoch": 0.02, "learning_rate": 9.990687682784009e-05, "loss": 2.5893, "step": 2375 }, { "epoch": 0.02, "learning_rate": 9.990646717320723e-05, "loss": 2.5774, "step": 2380 }, { "epoch": 0.02, "learning_rate": 9.990605662034626e-05, "loss": 2.5898, "step": 2385 }, { "epoch": 0.02, "learning_rate": 9.990564516926456e-05, "loss": 2.5201, "step": 2390 }, { "epoch": 0.02, "learning_rate": 9.990523281996955e-05, "loss": 2.5209, "step": 2395 }, { "epoch": 0.02, "learning_rate": 9.990481957246865e-05, "loss": 2.5104, "step": 2400 }, { "epoch": 0.02, "learning_rate": 9.990440542676929e-05, "loss": 2.576, "step": 2405 }, { "epoch": 0.02, "learning_rate": 9.990399038287893e-05, "loss": 2.6075, "step": 2410 }, { "epoch": 0.02, "learning_rate": 9.990357444080503e-05, "loss": 2.5399, "step": 2415 }, { "epoch": 0.02, "learning_rate": 9.990315760055509e-05, "loss": 2.5951, "step": 2420 }, { "epoch": 0.02, "learning_rate": 9.990273986213661e-05, "loss": 2.558, "step": 2425 }, { "epoch": 0.02, "learning_rate": 9.99023212255571e-05, "loss": 2.5925, "step": 2430 }, { "epoch": 0.02, "learning_rate": 9.99019016908241e-05, "loss": 2.5635, "step": 2435 }, { "epoch": 0.02, "learning_rate": 9.990148125794518e-05, "loss": 2.5471, "step": 2440 }, { "epoch": 0.02, "learning_rate": 9.990105992692786e-05, "loss": 2.4935, "step": 2445 }, { "epoch": 0.02, "learning_rate": 9.990063769777977e-05, "loss": 2.634, "step": 2450 }, { "epoch": 0.02, "learning_rate": 9.990021457050847e-05, "loss": 2.5807, "step": 2455 }, { "epoch": 0.02, "learning_rate": 9.989979054512162e-05, "loss": 2.5659, "step": 2460 }, { "epoch": 0.02, "learning_rate": 9.98993656216268e-05, "loss": 2.5377, "step": 2465 }, { "epoch": 0.02, "learning_rate": 9.989893980003171e-05, "loss": 2.6041, "step": 2470 }, { "epoch": 0.02, "learning_rate": 9.989851308034398e-05, "loss": 2.5008, "step": 2475 }, { "epoch": 0.02, "learning_rate": 9.98980854625713e-05, "loss": 2.6363, "step": 2480 }, { "epoch": 0.02, "learning_rate": 9.989765694672136e-05, "loss": 2.5347, "step": 2485 }, { "epoch": 0.02, "learning_rate": 9.989722753280188e-05, "loss": 2.5808, "step": 2490 }, { "epoch": 0.02, "learning_rate": 9.989679722082059e-05, "loss": 2.5638, "step": 2495 }, { "epoch": 0.02, "learning_rate": 9.989636601078524e-05, "loss": 2.5986, "step": 2500 }, { "epoch": 0.02, "learning_rate": 9.989593390270357e-05, "loss": 2.6445, "step": 2505 }, { "epoch": 0.02, "learning_rate": 9.989550089658338e-05, "loss": 2.5364, "step": 2510 }, { "epoch": 0.02, "learning_rate": 9.989506699243245e-05, "loss": 2.5608, "step": 2515 }, { "epoch": 0.02, "learning_rate": 9.98946321902586e-05, "loss": 2.5724, "step": 2520 }, { "epoch": 0.02, "learning_rate": 9.989419649006963e-05, "loss": 2.5127, "step": 2525 }, { "epoch": 0.02, "learning_rate": 9.989375989187341e-05, "loss": 2.6087, "step": 2530 }, { "epoch": 0.02, "learning_rate": 9.989332239567781e-05, "loss": 2.5703, "step": 2535 }, { "epoch": 0.02, "learning_rate": 9.989288400149066e-05, "loss": 2.6146, "step": 2540 }, { "epoch": 0.02, "learning_rate": 9.989244470931988e-05, "loss": 2.5911, "step": 2545 }, { "epoch": 0.02, "learning_rate": 9.989200451917336e-05, "loss": 2.5173, "step": 2550 }, { "epoch": 0.02, "learning_rate": 9.989156343105905e-05, "loss": 2.5806, "step": 2555 }, { "epoch": 0.02, "learning_rate": 9.989112144498484e-05, "loss": 2.4601, "step": 2560 }, { "epoch": 0.02, "learning_rate": 9.989067856095875e-05, "loss": 2.5634, "step": 2565 }, { "epoch": 0.02, "learning_rate": 9.989023477898871e-05, "loss": 2.5839, "step": 2570 }, { "epoch": 0.02, "learning_rate": 9.988979009908271e-05, "loss": 2.532, "step": 2575 }, { "epoch": 0.02, "learning_rate": 9.988934452124875e-05, "loss": 2.5533, "step": 2580 }, { "epoch": 0.02, "learning_rate": 9.988889804549486e-05, "loss": 2.5219, "step": 2585 }, { "epoch": 0.02, "learning_rate": 9.988845067182908e-05, "loss": 2.5118, "step": 2590 }, { "epoch": 0.02, "learning_rate": 9.988800240025945e-05, "loss": 2.5528, "step": 2595 }, { "epoch": 0.02, "learning_rate": 9.988755323079404e-05, "loss": 2.596, "step": 2600 }, { "epoch": 0.02, "learning_rate": 9.988710316344094e-05, "loss": 2.508, "step": 2605 }, { "epoch": 0.02, "learning_rate": 9.988665219820825e-05, "loss": 2.615, "step": 2610 }, { "epoch": 0.02, "learning_rate": 9.98862003351041e-05, "loss": 2.6195, "step": 2615 }, { "epoch": 0.02, "learning_rate": 9.988574757413658e-05, "loss": 2.5631, "step": 2620 }, { "epoch": 0.02, "learning_rate": 9.988529391531388e-05, "loss": 2.5133, "step": 2625 }, { "epoch": 0.02, "learning_rate": 9.988483935864416e-05, "loss": 2.4823, "step": 2630 }, { "epoch": 0.02, "learning_rate": 9.988438390413557e-05, "loss": 2.5085, "step": 2635 }, { "epoch": 0.02, "learning_rate": 9.988392755179634e-05, "loss": 2.5093, "step": 2640 }, { "epoch": 0.02, "learning_rate": 9.988347030163469e-05, "loss": 2.6384, "step": 2645 }, { "epoch": 0.02, "learning_rate": 9.988301215365881e-05, "loss": 2.5972, "step": 2650 }, { "epoch": 0.02, "learning_rate": 9.988255310787698e-05, "loss": 2.5989, "step": 2655 }, { "epoch": 0.02, "learning_rate": 9.988209316429745e-05, "loss": 2.6323, "step": 2660 }, { "epoch": 0.02, "learning_rate": 9.988163232292849e-05, "loss": 2.4559, "step": 2665 }, { "epoch": 0.02, "learning_rate": 9.988117058377841e-05, "loss": 2.5604, "step": 2670 }, { "epoch": 0.02, "learning_rate": 9.988070794685552e-05, "loss": 2.563, "step": 2675 }, { "epoch": 0.02, "learning_rate": 9.988024441216813e-05, "loss": 2.4876, "step": 2680 }, { "epoch": 0.02, "learning_rate": 9.98797799797246e-05, "loss": 2.5866, "step": 2685 }, { "epoch": 0.02, "learning_rate": 9.987931464953329e-05, "loss": 2.624, "step": 2690 }, { "epoch": 0.02, "learning_rate": 9.987884842160255e-05, "loss": 2.5201, "step": 2695 }, { "epoch": 0.02, "learning_rate": 9.98783812959408e-05, "loss": 2.5592, "step": 2700 }, { "epoch": 0.02, "learning_rate": 9.987791327255644e-05, "loss": 2.5432, "step": 2705 }, { "epoch": 0.02, "learning_rate": 9.987744435145787e-05, "loss": 2.476, "step": 2710 }, { "epoch": 0.02, "learning_rate": 9.987697453265357e-05, "loss": 2.4934, "step": 2715 }, { "epoch": 0.02, "learning_rate": 9.987650381615197e-05, "loss": 2.4954, "step": 2720 }, { "epoch": 0.02, "learning_rate": 9.987603220196153e-05, "loss": 2.4859, "step": 2725 }, { "epoch": 0.02, "learning_rate": 9.987555969009078e-05, "loss": 2.4923, "step": 2730 }, { "epoch": 0.02, "learning_rate": 9.987508628054819e-05, "loss": 2.5804, "step": 2735 }, { "epoch": 0.02, "learning_rate": 9.98746119733423e-05, "loss": 2.5319, "step": 2740 }, { "epoch": 0.02, "learning_rate": 9.987413676848163e-05, "loss": 2.5914, "step": 2745 }, { "epoch": 0.02, "learning_rate": 9.987366066597474e-05, "loss": 2.5305, "step": 2750 }, { "epoch": 0.02, "learning_rate": 9.987318366583018e-05, "loss": 2.4987, "step": 2755 }, { "epoch": 0.02, "learning_rate": 9.987270576805658e-05, "loss": 2.4758, "step": 2760 }, { "epoch": 0.02, "learning_rate": 9.98722269726625e-05, "loss": 2.5311, "step": 2765 }, { "epoch": 0.02, "learning_rate": 9.987174727965659e-05, "loss": 2.4511, "step": 2770 }, { "epoch": 0.02, "learning_rate": 9.987126668904747e-05, "loss": 2.4898, "step": 2775 }, { "epoch": 0.02, "learning_rate": 9.987078520084376e-05, "loss": 2.603, "step": 2780 }, { "epoch": 0.02, "learning_rate": 9.987030281505418e-05, "loss": 2.5073, "step": 2785 }, { "epoch": 0.02, "learning_rate": 9.986981953168737e-05, "loss": 2.5923, "step": 2790 }, { "epoch": 0.02, "learning_rate": 9.986933535075204e-05, "loss": 2.6022, "step": 2795 }, { "epoch": 0.02, "learning_rate": 9.986885027225691e-05, "loss": 2.5324, "step": 2800 }, { "epoch": 0.02, "learning_rate": 9.98683642962107e-05, "loss": 2.5775, "step": 2805 }, { "epoch": 0.02, "learning_rate": 9.986787742262219e-05, "loss": 2.5751, "step": 2810 }, { "epoch": 0.02, "learning_rate": 9.986738965150008e-05, "loss": 2.5072, "step": 2815 }, { "epoch": 0.02, "learning_rate": 9.986690098285322e-05, "loss": 2.5306, "step": 2820 }, { "epoch": 0.02, "learning_rate": 9.986641141669036e-05, "loss": 2.4778, "step": 2825 }, { "epoch": 0.02, "learning_rate": 9.986592095302031e-05, "loss": 2.5631, "step": 2830 }, { "epoch": 0.02, "learning_rate": 9.986542959185193e-05, "loss": 2.5135, "step": 2835 }, { "epoch": 0.02, "learning_rate": 9.986493733319403e-05, "loss": 2.5256, "step": 2840 }, { "epoch": 0.02, "learning_rate": 9.986444417705549e-05, "loss": 2.5593, "step": 2845 }, { "epoch": 0.02, "learning_rate": 9.986395012344519e-05, "loss": 2.5996, "step": 2850 }, { "epoch": 0.02, "learning_rate": 9.986345517237199e-05, "loss": 2.5645, "step": 2855 }, { "epoch": 0.02, "learning_rate": 9.986295932384482e-05, "loss": 2.517, "step": 2860 }, { "epoch": 0.02, "learning_rate": 9.986246257787261e-05, "loss": 2.5808, "step": 2865 }, { "epoch": 0.02, "learning_rate": 9.986196493446432e-05, "loss": 2.53, "step": 2870 }, { "epoch": 0.02, "learning_rate": 9.986146639362886e-05, "loss": 2.4872, "step": 2875 }, { "epoch": 0.02, "learning_rate": 9.986096695537521e-05, "loss": 2.4942, "step": 2880 }, { "epoch": 0.02, "learning_rate": 9.98604666197124e-05, "loss": 2.4759, "step": 2885 }, { "epoch": 0.02, "learning_rate": 9.985996538664939e-05, "loss": 2.5729, "step": 2890 }, { "epoch": 0.02, "learning_rate": 9.985946325619524e-05, "loss": 2.518, "step": 2895 }, { "epoch": 0.02, "learning_rate": 9.985896022835895e-05, "loss": 2.4879, "step": 2900 }, { "epoch": 0.02, "learning_rate": 9.98584563031496e-05, "loss": 2.5916, "step": 2905 }, { "epoch": 0.02, "learning_rate": 9.985795148057624e-05, "loss": 2.4871, "step": 2910 }, { "epoch": 0.02, "learning_rate": 9.985744576064797e-05, "loss": 2.5427, "step": 2915 }, { "epoch": 0.02, "learning_rate": 9.98569391433739e-05, "loss": 2.5697, "step": 2920 }, { "epoch": 0.02, "learning_rate": 9.985643162876313e-05, "loss": 2.5436, "step": 2925 }, { "epoch": 0.03, "learning_rate": 9.985592321682479e-05, "loss": 2.5269, "step": 2930 }, { "epoch": 0.03, "learning_rate": 9.985541390756805e-05, "loss": 2.5097, "step": 2935 }, { "epoch": 0.03, "learning_rate": 9.985490370100208e-05, "loss": 2.5404, "step": 2940 }, { "epoch": 0.03, "learning_rate": 9.985439259713604e-05, "loss": 2.4923, "step": 2945 }, { "epoch": 0.03, "learning_rate": 9.985388059597915e-05, "loss": 2.517, "step": 2950 }, { "epoch": 0.03, "learning_rate": 9.98533676975406e-05, "loss": 2.5497, "step": 2955 }, { "epoch": 0.03, "learning_rate": 9.985285390182965e-05, "loss": 2.5446, "step": 2960 }, { "epoch": 0.03, "learning_rate": 9.985233920885552e-05, "loss": 2.4576, "step": 2965 }, { "epoch": 0.03, "learning_rate": 9.98518236186275e-05, "loss": 2.5134, "step": 2970 }, { "epoch": 0.03, "learning_rate": 9.985130713115485e-05, "loss": 2.4905, "step": 2975 }, { "epoch": 0.03, "learning_rate": 9.985078974644688e-05, "loss": 2.5458, "step": 2980 }, { "epoch": 0.03, "learning_rate": 9.985027146451288e-05, "loss": 2.5217, "step": 2985 }, { "epoch": 0.03, "learning_rate": 9.984975228536222e-05, "loss": 2.4857, "step": 2990 }, { "epoch": 0.03, "learning_rate": 9.98492322090042e-05, "loss": 2.5391, "step": 2995 }, { "epoch": 0.03, "learning_rate": 9.98487112354482e-05, "loss": 2.5577, "step": 3000 }, { "epoch": 0.03, "learning_rate": 9.984818936470359e-05, "loss": 2.529, "step": 3005 }, { "epoch": 0.03, "learning_rate": 9.984766659677978e-05, "loss": 2.5368, "step": 3010 }, { "epoch": 0.03, "learning_rate": 9.984714293168616e-05, "loss": 2.5845, "step": 3015 }, { "epoch": 0.03, "learning_rate": 9.984661836943216e-05, "loss": 2.4526, "step": 3020 }, { "epoch": 0.03, "learning_rate": 9.984609291002723e-05, "loss": 2.5491, "step": 3025 }, { "epoch": 0.03, "learning_rate": 9.984556655348081e-05, "loss": 2.5592, "step": 3030 }, { "epoch": 0.03, "learning_rate": 9.984503929980239e-05, "loss": 2.5626, "step": 3035 }, { "epoch": 0.03, "learning_rate": 9.984451114900144e-05, "loss": 2.519, "step": 3040 }, { "epoch": 0.03, "learning_rate": 9.984398210108749e-05, "loss": 2.555, "step": 3045 }, { "epoch": 0.03, "learning_rate": 9.984345215607004e-05, "loss": 2.5554, "step": 3050 }, { "epoch": 0.03, "learning_rate": 9.984292131395867e-05, "loss": 2.5744, "step": 3055 }, { "epoch": 0.03, "learning_rate": 9.984238957476288e-05, "loss": 2.5386, "step": 3060 }, { "epoch": 0.03, "learning_rate": 9.984185693849226e-05, "loss": 2.5063, "step": 3065 }, { "epoch": 0.03, "learning_rate": 9.984132340515642e-05, "loss": 2.5435, "step": 3070 }, { "epoch": 0.03, "learning_rate": 9.984078897476492e-05, "loss": 2.5597, "step": 3075 }, { "epoch": 0.03, "learning_rate": 9.98402536473274e-05, "loss": 2.4966, "step": 3080 }, { "epoch": 0.03, "learning_rate": 9.983971742285352e-05, "loss": 2.5858, "step": 3085 }, { "epoch": 0.03, "learning_rate": 9.983918030135289e-05, "loss": 2.5154, "step": 3090 }, { "epoch": 0.03, "learning_rate": 9.98386422828352e-05, "loss": 2.54, "step": 3095 }, { "epoch": 0.03, "learning_rate": 9.983810336731012e-05, "loss": 2.5314, "step": 3100 }, { "epoch": 0.03, "learning_rate": 9.983756355478736e-05, "loss": 2.6033, "step": 3105 }, { "epoch": 0.03, "learning_rate": 9.983702284527664e-05, "loss": 2.5007, "step": 3110 }, { "epoch": 0.03, "learning_rate": 9.983648123878768e-05, "loss": 2.501, "step": 3115 }, { "epoch": 0.03, "learning_rate": 9.983593873533024e-05, "loss": 2.5095, "step": 3120 }, { "epoch": 0.03, "learning_rate": 9.983539533491407e-05, "loss": 2.5012, "step": 3125 }, { "epoch": 0.03, "learning_rate": 9.983485103754896e-05, "loss": 2.5, "step": 3130 }, { "epoch": 0.03, "learning_rate": 9.98343058432447e-05, "loss": 2.5089, "step": 3135 }, { "epoch": 0.03, "learning_rate": 9.98337597520111e-05, "loss": 2.5215, "step": 3140 }, { "epoch": 0.03, "learning_rate": 9.983321276385802e-05, "loss": 2.4724, "step": 3145 }, { "epoch": 0.03, "learning_rate": 9.983266487879525e-05, "loss": 2.5578, "step": 3150 }, { "epoch": 0.03, "learning_rate": 9.983211609683271e-05, "loss": 2.482, "step": 3155 }, { "epoch": 0.03, "learning_rate": 9.983156641798023e-05, "loss": 2.5534, "step": 3160 }, { "epoch": 0.03, "learning_rate": 9.983101584224772e-05, "loss": 2.5881, "step": 3165 }, { "epoch": 0.03, "learning_rate": 9.98304643696451e-05, "loss": 2.598, "step": 3170 }, { "epoch": 0.03, "learning_rate": 9.982991200018228e-05, "loss": 2.5126, "step": 3175 }, { "epoch": 0.03, "learning_rate": 9.98293587338692e-05, "loss": 2.5399, "step": 3180 }, { "epoch": 0.03, "learning_rate": 9.982880457071584e-05, "loss": 2.5133, "step": 3185 }, { "epoch": 0.03, "learning_rate": 9.982824951073215e-05, "loss": 2.4601, "step": 3190 }, { "epoch": 0.03, "learning_rate": 9.982769355392813e-05, "loss": 2.538, "step": 3195 }, { "epoch": 0.03, "learning_rate": 9.98271367003138e-05, "loss": 2.5055, "step": 3200 }, { "epoch": 0.03, "learning_rate": 9.982657894989915e-05, "loss": 2.479, "step": 3205 }, { "epoch": 0.03, "learning_rate": 9.982602030269425e-05, "loss": 2.5595, "step": 3210 }, { "epoch": 0.03, "learning_rate": 9.982546075870913e-05, "loss": 2.5568, "step": 3215 }, { "epoch": 0.03, "learning_rate": 9.982490031795388e-05, "loss": 2.4733, "step": 3220 }, { "epoch": 0.03, "learning_rate": 9.982433898043857e-05, "loss": 2.5956, "step": 3225 }, { "epoch": 0.03, "learning_rate": 9.982377674617332e-05, "loss": 2.5731, "step": 3230 }, { "epoch": 0.03, "learning_rate": 9.982321361516825e-05, "loss": 2.4946, "step": 3235 }, { "epoch": 0.03, "learning_rate": 9.982264958743347e-05, "loss": 2.5119, "step": 3240 }, { "epoch": 0.03, "learning_rate": 9.982208466297915e-05, "loss": 2.5255, "step": 3245 }, { "epoch": 0.03, "learning_rate": 9.982151884181546e-05, "loss": 2.563, "step": 3250 }, { "epoch": 0.03, "learning_rate": 9.982095212395259e-05, "loss": 2.4737, "step": 3255 }, { "epoch": 0.03, "learning_rate": 9.982038450940072e-05, "loss": 2.4827, "step": 3260 }, { "epoch": 0.03, "learning_rate": 9.981981599817008e-05, "loss": 2.5569, "step": 3265 }, { "epoch": 0.03, "learning_rate": 9.981924659027088e-05, "loss": 2.4964, "step": 3270 }, { "epoch": 0.03, "learning_rate": 9.981867628571341e-05, "loss": 2.4834, "step": 3275 }, { "epoch": 0.03, "learning_rate": 9.98181050845079e-05, "loss": 2.4626, "step": 3280 }, { "epoch": 0.03, "learning_rate": 9.981753298666465e-05, "loss": 2.4948, "step": 3285 }, { "epoch": 0.03, "learning_rate": 9.981695999219394e-05, "loss": 2.4506, "step": 3290 }, { "epoch": 0.03, "learning_rate": 9.981638610110609e-05, "loss": 2.4532, "step": 3295 }, { "epoch": 0.03, "learning_rate": 9.981581131341142e-05, "loss": 2.4625, "step": 3300 }, { "epoch": 0.03, "learning_rate": 9.981523562912029e-05, "loss": 2.5395, "step": 3305 }, { "epoch": 0.03, "learning_rate": 9.981465904824308e-05, "loss": 2.5116, "step": 3310 }, { "epoch": 0.03, "learning_rate": 9.981408157079012e-05, "loss": 2.4772, "step": 3315 }, { "epoch": 0.03, "learning_rate": 9.981350319677184e-05, "loss": 2.5539, "step": 3320 }, { "epoch": 0.03, "learning_rate": 9.981292392619862e-05, "loss": 2.5725, "step": 3325 }, { "epoch": 0.03, "learning_rate": 9.981234375908092e-05, "loss": 2.5806, "step": 3330 }, { "epoch": 0.03, "learning_rate": 9.981176269542916e-05, "loss": 2.413, "step": 3335 }, { "epoch": 0.03, "learning_rate": 9.98111807352538e-05, "loss": 2.4985, "step": 3340 }, { "epoch": 0.03, "learning_rate": 9.981059787856531e-05, "loss": 2.4615, "step": 3345 }, { "epoch": 0.03, "learning_rate": 9.98100141253742e-05, "loss": 2.4946, "step": 3350 }, { "epoch": 0.03, "learning_rate": 9.980942947569097e-05, "loss": 2.5005, "step": 3355 }, { "epoch": 0.03, "learning_rate": 9.980884392952612e-05, "loss": 2.4794, "step": 3360 }, { "epoch": 0.03, "learning_rate": 9.980825748689023e-05, "loss": 2.4649, "step": 3365 }, { "epoch": 0.03, "learning_rate": 9.98076701477938e-05, "loss": 2.5995, "step": 3370 }, { "epoch": 0.03, "learning_rate": 9.980708191224745e-05, "loss": 2.5311, "step": 3375 }, { "epoch": 0.03, "learning_rate": 9.980649278026175e-05, "loss": 2.5033, "step": 3380 }, { "epoch": 0.03, "learning_rate": 9.980590275184729e-05, "loss": 2.5552, "step": 3385 }, { "epoch": 0.03, "learning_rate": 9.980531182701471e-05, "loss": 2.535, "step": 3390 }, { "epoch": 0.03, "learning_rate": 9.980472000577463e-05, "loss": 2.5854, "step": 3395 }, { "epoch": 0.03, "learning_rate": 9.980412728813772e-05, "loss": 2.5231, "step": 3400 }, { "epoch": 0.03, "learning_rate": 9.980353367411463e-05, "loss": 2.5777, "step": 3405 }, { "epoch": 0.03, "learning_rate": 9.980293916371605e-05, "loss": 2.5367, "step": 3410 }, { "epoch": 0.03, "learning_rate": 9.98023437569527e-05, "loss": 2.5149, "step": 3415 }, { "epoch": 0.03, "learning_rate": 9.980174745383526e-05, "loss": 2.5153, "step": 3420 }, { "epoch": 0.03, "learning_rate": 9.980115025437447e-05, "loss": 2.5555, "step": 3425 }, { "epoch": 0.03, "learning_rate": 9.98005521585811e-05, "loss": 2.4425, "step": 3430 }, { "epoch": 0.03, "learning_rate": 9.97999531664659e-05, "loss": 2.4868, "step": 3435 }, { "epoch": 0.03, "learning_rate": 9.979935327803966e-05, "loss": 2.5128, "step": 3440 }, { "epoch": 0.03, "learning_rate": 9.979875249331318e-05, "loss": 2.5039, "step": 3445 }, { "epoch": 0.03, "learning_rate": 9.979815081229724e-05, "loss": 2.5665, "step": 3450 }, { "epoch": 0.03, "learning_rate": 9.979754823500272e-05, "loss": 2.5048, "step": 3455 }, { "epoch": 0.03, "learning_rate": 9.979694476144042e-05, "loss": 2.5089, "step": 3460 }, { "epoch": 0.03, "learning_rate": 9.979634039162121e-05, "loss": 2.5841, "step": 3465 }, { "epoch": 0.03, "learning_rate": 9.979573512555598e-05, "loss": 2.4975, "step": 3470 }, { "epoch": 0.03, "learning_rate": 9.979512896325565e-05, "loss": 2.5363, "step": 3475 }, { "epoch": 0.03, "learning_rate": 9.979452190473106e-05, "loss": 2.4515, "step": 3480 }, { "epoch": 0.03, "learning_rate": 9.979391394999321e-05, "loss": 2.4219, "step": 3485 }, { "epoch": 0.03, "learning_rate": 9.979330509905301e-05, "loss": 2.5688, "step": 3490 }, { "epoch": 0.03, "learning_rate": 9.97926953519214e-05, "loss": 2.5865, "step": 3495 }, { "epoch": 0.03, "learning_rate": 9.979208470860937e-05, "loss": 2.4767, "step": 3500 }, { "epoch": 0.03, "learning_rate": 9.979147316912791e-05, "loss": 2.486, "step": 3505 }, { "epoch": 0.03, "learning_rate": 9.979086073348804e-05, "loss": 2.5187, "step": 3510 }, { "epoch": 0.03, "learning_rate": 9.979024740170076e-05, "loss": 2.5501, "step": 3515 }, { "epoch": 0.03, "learning_rate": 9.978963317377712e-05, "loss": 2.5865, "step": 3520 }, { "epoch": 0.03, "learning_rate": 9.97890180497282e-05, "loss": 2.4963, "step": 3525 }, { "epoch": 0.03, "learning_rate": 9.978840202956503e-05, "loss": 2.4653, "step": 3530 }, { "epoch": 0.03, "learning_rate": 9.978778511329871e-05, "loss": 2.5177, "step": 3535 }, { "epoch": 0.03, "learning_rate": 9.978716730094035e-05, "loss": 2.4696, "step": 3540 }, { "epoch": 0.03, "learning_rate": 9.978654859250107e-05, "loss": 2.5564, "step": 3545 }, { "epoch": 0.03, "learning_rate": 9.9785928987992e-05, "loss": 2.5667, "step": 3550 }, { "epoch": 0.03, "learning_rate": 9.978530848742429e-05, "loss": 2.5255, "step": 3555 }, { "epoch": 0.03, "learning_rate": 9.978468709080911e-05, "loss": 2.5091, "step": 3560 }, { "epoch": 0.03, "learning_rate": 9.978406479815765e-05, "loss": 2.587, "step": 3565 }, { "epoch": 0.03, "learning_rate": 9.978344160948111e-05, "loss": 2.5102, "step": 3570 }, { "epoch": 0.03, "learning_rate": 9.97828175247907e-05, "loss": 2.5658, "step": 3575 }, { "epoch": 0.03, "learning_rate": 9.978219254409766e-05, "loss": 2.5046, "step": 3580 }, { "epoch": 0.03, "learning_rate": 9.978156666741323e-05, "loss": 2.5485, "step": 3585 }, { "epoch": 0.03, "learning_rate": 9.978093989474867e-05, "loss": 2.4134, "step": 3590 }, { "epoch": 0.03, "learning_rate": 9.978031222611528e-05, "loss": 2.4835, "step": 3595 }, { "epoch": 0.03, "learning_rate": 9.977968366152435e-05, "loss": 2.5763, "step": 3600 }, { "epoch": 0.03, "learning_rate": 9.977905420098717e-05, "loss": 2.5271, "step": 3605 }, { "epoch": 0.03, "learning_rate": 9.97784238445151e-05, "loss": 2.5565, "step": 3610 }, { "epoch": 0.03, "learning_rate": 9.977779259211948e-05, "loss": 2.5905, "step": 3615 }, { "epoch": 0.03, "learning_rate": 9.977716044381164e-05, "loss": 2.4955, "step": 3620 }, { "epoch": 0.03, "learning_rate": 9.977652739960301e-05, "loss": 2.5364, "step": 3625 }, { "epoch": 0.03, "learning_rate": 9.977589345950495e-05, "loss": 2.5849, "step": 3630 }, { "epoch": 0.03, "learning_rate": 9.977525862352887e-05, "loss": 2.5816, "step": 3635 }, { "epoch": 0.03, "learning_rate": 9.97746228916862e-05, "loss": 2.447, "step": 3640 }, { "epoch": 0.03, "learning_rate": 9.977398626398839e-05, "loss": 2.4, "step": 3645 }, { "epoch": 0.03, "learning_rate": 9.977334874044688e-05, "loss": 2.457, "step": 3650 }, { "epoch": 0.03, "learning_rate": 9.977271032107317e-05, "loss": 2.5901, "step": 3655 }, { "epoch": 0.03, "learning_rate": 9.977207100587873e-05, "loss": 2.4407, "step": 3660 }, { "epoch": 0.03, "learning_rate": 9.977143079487508e-05, "loss": 2.4908, "step": 3665 }, { "epoch": 0.03, "learning_rate": 9.977078968807372e-05, "loss": 2.5797, "step": 3670 }, { "epoch": 0.03, "learning_rate": 9.977014768548622e-05, "loss": 2.4891, "step": 3675 }, { "epoch": 0.03, "learning_rate": 9.976950478712413e-05, "loss": 2.5632, "step": 3680 }, { "epoch": 0.03, "learning_rate": 9.976886099299898e-05, "loss": 2.4334, "step": 3685 }, { "epoch": 0.03, "learning_rate": 9.976821630312241e-05, "loss": 2.6227, "step": 3690 }, { "epoch": 0.03, "learning_rate": 9.976757071750599e-05, "loss": 2.4789, "step": 3695 }, { "epoch": 0.03, "learning_rate": 9.976692423616137e-05, "loss": 2.5535, "step": 3700 }, { "epoch": 0.03, "learning_rate": 9.976627685910013e-05, "loss": 2.5126, "step": 3705 }, { "epoch": 0.03, "learning_rate": 9.976562858633399e-05, "loss": 2.5453, "step": 3710 }, { "epoch": 0.03, "learning_rate": 9.976497941787458e-05, "loss": 2.4256, "step": 3715 }, { "epoch": 0.03, "learning_rate": 9.976432935373359e-05, "loss": 2.5531, "step": 3720 }, { "epoch": 0.03, "learning_rate": 9.976367839392272e-05, "loss": 2.5069, "step": 3725 }, { "epoch": 0.03, "learning_rate": 9.976302653845366e-05, "loss": 2.4931, "step": 3730 }, { "epoch": 0.03, "learning_rate": 9.97623737873382e-05, "loss": 2.4717, "step": 3735 }, { "epoch": 0.03, "learning_rate": 9.976172014058803e-05, "loss": 2.5408, "step": 3740 }, { "epoch": 0.03, "learning_rate": 9.976106559821495e-05, "loss": 2.5471, "step": 3745 }, { "epoch": 0.03, "learning_rate": 9.976041016023074e-05, "loss": 2.5037, "step": 3750 }, { "epoch": 0.03, "learning_rate": 9.975975382664719e-05, "loss": 2.546, "step": 3755 }, { "epoch": 0.03, "learning_rate": 9.975909659747609e-05, "loss": 2.4651, "step": 3760 }, { "epoch": 0.03, "learning_rate": 9.97584384727293e-05, "loss": 2.4565, "step": 3765 }, { "epoch": 0.03, "learning_rate": 9.975777945241867e-05, "loss": 2.4249, "step": 3770 }, { "epoch": 0.03, "learning_rate": 9.975711953655601e-05, "loss": 2.5319, "step": 3775 }, { "epoch": 0.03, "learning_rate": 9.975645872515327e-05, "loss": 2.5265, "step": 3780 }, { "epoch": 0.03, "learning_rate": 9.975579701822229e-05, "loss": 2.5427, "step": 3785 }, { "epoch": 0.03, "learning_rate": 9.975513441577502e-05, "loss": 2.5011, "step": 3790 }, { "epoch": 0.03, "learning_rate": 9.975447091782333e-05, "loss": 2.5706, "step": 3795 }, { "epoch": 0.03, "learning_rate": 9.97538065243792e-05, "loss": 2.4868, "step": 3800 }, { "epoch": 0.03, "learning_rate": 9.975314123545458e-05, "loss": 2.5237, "step": 3805 }, { "epoch": 0.03, "learning_rate": 9.975247505106147e-05, "loss": 2.5642, "step": 3810 }, { "epoch": 0.03, "learning_rate": 9.975180797121181e-05, "loss": 2.5397, "step": 3815 }, { "epoch": 0.03, "learning_rate": 9.975113999591764e-05, "loss": 2.5146, "step": 3820 }, { "epoch": 0.03, "learning_rate": 9.975047112519098e-05, "loss": 2.5382, "step": 3825 }, { "epoch": 0.03, "learning_rate": 9.974980135904386e-05, "loss": 2.5592, "step": 3830 }, { "epoch": 0.03, "learning_rate": 9.974913069748832e-05, "loss": 2.4641, "step": 3835 }, { "epoch": 0.03, "learning_rate": 9.974845914053647e-05, "loss": 2.433, "step": 3840 }, { "epoch": 0.03, "learning_rate": 9.974778668820037e-05, "loss": 2.4811, "step": 3845 }, { "epoch": 0.03, "learning_rate": 9.974711334049212e-05, "loss": 2.4864, "step": 3850 }, { "epoch": 0.03, "learning_rate": 9.974643909742386e-05, "loss": 2.5021, "step": 3855 }, { "epoch": 0.03, "learning_rate": 9.97457639590077e-05, "loss": 2.4827, "step": 3860 }, { "epoch": 0.03, "learning_rate": 9.974508792525581e-05, "loss": 2.5252, "step": 3865 }, { "epoch": 0.03, "learning_rate": 9.974441099618035e-05, "loss": 2.4895, "step": 3870 }, { "epoch": 0.03, "learning_rate": 9.974373317179351e-05, "loss": 2.5403, "step": 3875 }, { "epoch": 0.03, "learning_rate": 9.974305445210748e-05, "loss": 2.4934, "step": 3880 }, { "epoch": 0.03, "learning_rate": 9.974237483713448e-05, "loss": 2.5845, "step": 3885 }, { "epoch": 0.03, "learning_rate": 9.974169432688674e-05, "loss": 2.512, "step": 3890 }, { "epoch": 0.03, "learning_rate": 9.974101292137651e-05, "loss": 2.4567, "step": 3895 }, { "epoch": 0.03, "learning_rate": 9.974033062061605e-05, "loss": 2.4847, "step": 3900 }, { "epoch": 0.03, "learning_rate": 9.973964742461765e-05, "loss": 2.5205, "step": 3905 }, { "epoch": 0.03, "learning_rate": 9.973896333339359e-05, "loss": 2.5686, "step": 3910 }, { "epoch": 0.03, "learning_rate": 9.973827834695621e-05, "loss": 2.5187, "step": 3915 }, { "epoch": 0.03, "learning_rate": 9.973759246531782e-05, "loss": 2.4978, "step": 3920 }, { "epoch": 0.03, "learning_rate": 9.973690568849074e-05, "loss": 2.493, "step": 3925 }, { "epoch": 0.03, "learning_rate": 9.973621801648739e-05, "loss": 2.4811, "step": 3930 }, { "epoch": 0.03, "learning_rate": 9.97355294493201e-05, "loss": 2.5132, "step": 3935 }, { "epoch": 0.03, "learning_rate": 9.973483998700127e-05, "loss": 2.4443, "step": 3940 }, { "epoch": 0.03, "learning_rate": 9.973414962954332e-05, "loss": 2.479, "step": 3945 }, { "epoch": 0.03, "learning_rate": 9.973345837695868e-05, "loss": 2.5641, "step": 3950 }, { "epoch": 0.03, "learning_rate": 9.973276622925978e-05, "loss": 2.5967, "step": 3955 }, { "epoch": 0.03, "learning_rate": 9.973207318645908e-05, "loss": 2.5605, "step": 3960 }, { "epoch": 0.03, "learning_rate": 9.973137924856903e-05, "loss": 2.4804, "step": 3965 }, { "epoch": 0.03, "learning_rate": 9.973068441560216e-05, "loss": 2.4625, "step": 3970 }, { "epoch": 0.03, "learning_rate": 9.972998868757096e-05, "loss": 2.4964, "step": 3975 }, { "epoch": 0.03, "learning_rate": 9.972929206448796e-05, "loss": 2.4596, "step": 3980 }, { "epoch": 0.03, "learning_rate": 9.972859454636568e-05, "loss": 2.512, "step": 3985 }, { "epoch": 0.03, "learning_rate": 9.972789613321667e-05, "loss": 2.6149, "step": 3990 }, { "epoch": 0.03, "learning_rate": 9.972719682505353e-05, "loss": 2.458, "step": 3995 }, { "epoch": 0.03, "learning_rate": 9.972649662188882e-05, "loss": 2.5436, "step": 4000 }, { "epoch": 0.03, "learning_rate": 9.972579552373515e-05, "loss": 2.48, "step": 4005 }, { "epoch": 0.03, "learning_rate": 9.972509353060515e-05, "loss": 2.4441, "step": 4010 }, { "epoch": 0.03, "learning_rate": 9.972439064251144e-05, "loss": 2.5191, "step": 4015 }, { "epoch": 0.03, "learning_rate": 9.972368685946666e-05, "loss": 2.4809, "step": 4020 }, { "epoch": 0.03, "learning_rate": 9.972298218148353e-05, "loss": 2.4377, "step": 4025 }, { "epoch": 0.03, "learning_rate": 9.972227660857467e-05, "loss": 2.5085, "step": 4030 }, { "epoch": 0.03, "learning_rate": 9.972157014075281e-05, "loss": 2.4703, "step": 4035 }, { "epoch": 0.03, "learning_rate": 9.972086277803066e-05, "loss": 2.4797, "step": 4040 }, { "epoch": 0.03, "learning_rate": 9.972015452042094e-05, "loss": 2.5611, "step": 4045 }, { "epoch": 0.03, "learning_rate": 9.97194453679364e-05, "loss": 2.5073, "step": 4050 }, { "epoch": 0.03, "learning_rate": 9.971873532058984e-05, "loss": 2.5089, "step": 4055 }, { "epoch": 0.03, "learning_rate": 9.9718024378394e-05, "loss": 2.5581, "step": 4060 }, { "epoch": 0.03, "learning_rate": 9.971731254136167e-05, "loss": 2.5775, "step": 4065 }, { "epoch": 0.03, "learning_rate": 9.97165998095057e-05, "loss": 2.5019, "step": 4070 }, { "epoch": 0.03, "learning_rate": 9.971588618283889e-05, "loss": 2.512, "step": 4075 }, { "epoch": 0.03, "learning_rate": 9.97151716613741e-05, "loss": 2.5329, "step": 4080 }, { "epoch": 0.03, "learning_rate": 9.971445624512416e-05, "loss": 2.4537, "step": 4085 }, { "epoch": 0.03, "learning_rate": 9.971373993410199e-05, "loss": 2.4552, "step": 4090 }, { "epoch": 0.03, "learning_rate": 9.971302272832043e-05, "loss": 2.4378, "step": 4095 }, { "epoch": 0.03, "learning_rate": 9.971230462779246e-05, "loss": 2.5142, "step": 4100 }, { "epoch": 0.04, "learning_rate": 9.971158563253094e-05, "loss": 2.4914, "step": 4105 }, { "epoch": 0.04, "learning_rate": 9.971086574254882e-05, "loss": 2.5017, "step": 4110 }, { "epoch": 0.04, "learning_rate": 9.971014495785909e-05, "loss": 2.5178, "step": 4115 }, { "epoch": 0.04, "learning_rate": 9.970942327847468e-05, "loss": 2.4726, "step": 4120 }, { "epoch": 0.04, "learning_rate": 9.970870070440861e-05, "loss": 2.4858, "step": 4125 }, { "epoch": 0.04, "learning_rate": 9.970797723567389e-05, "loss": 2.492, "step": 4130 }, { "epoch": 0.04, "learning_rate": 9.970725287228352e-05, "loss": 2.5032, "step": 4135 }, { "epoch": 0.04, "learning_rate": 9.970652761425055e-05, "loss": 2.5209, "step": 4140 }, { "epoch": 0.04, "learning_rate": 9.970580146158801e-05, "loss": 2.4739, "step": 4145 }, { "epoch": 0.04, "learning_rate": 9.9705074414309e-05, "loss": 2.5719, "step": 4150 }, { "epoch": 0.04, "learning_rate": 9.97043464724266e-05, "loss": 2.5587, "step": 4155 }, { "epoch": 0.04, "learning_rate": 9.97036176359539e-05, "loss": 2.5098, "step": 4160 }, { "epoch": 0.04, "learning_rate": 9.970288790490404e-05, "loss": 2.5576, "step": 4165 }, { "epoch": 0.04, "learning_rate": 9.970215727929011e-05, "loss": 2.5108, "step": 4170 }, { "epoch": 0.04, "learning_rate": 9.970142575912529e-05, "loss": 2.5184, "step": 4175 }, { "epoch": 0.04, "learning_rate": 9.970069334442275e-05, "loss": 2.5033, "step": 4180 }, { "epoch": 0.04, "learning_rate": 9.969996003519566e-05, "loss": 2.4814, "step": 4185 }, { "epoch": 0.04, "learning_rate": 9.969922583145724e-05, "loss": 2.464, "step": 4190 }, { "epoch": 0.04, "learning_rate": 9.969849073322067e-05, "loss": 2.3991, "step": 4195 }, { "epoch": 0.04, "learning_rate": 9.969775474049919e-05, "loss": 2.5534, "step": 4200 }, { "epoch": 0.04, "learning_rate": 9.969701785330608e-05, "loss": 2.4318, "step": 4205 }, { "epoch": 0.04, "learning_rate": 9.969628007165455e-05, "loss": 2.4329, "step": 4210 }, { "epoch": 0.04, "learning_rate": 9.969554139555793e-05, "loss": 2.5021, "step": 4215 }, { "epoch": 0.04, "learning_rate": 9.969480182502947e-05, "loss": 2.5085, "step": 4220 }, { "epoch": 0.04, "learning_rate": 9.96940613600825e-05, "loss": 2.5431, "step": 4225 }, { "epoch": 0.04, "learning_rate": 9.969332000073038e-05, "loss": 2.4577, "step": 4230 }, { "epoch": 0.04, "learning_rate": 9.96925777469864e-05, "loss": 2.4801, "step": 4235 }, { "epoch": 0.04, "learning_rate": 9.969183459886393e-05, "loss": 2.4804, "step": 4240 }, { "epoch": 0.04, "learning_rate": 9.969109055637638e-05, "loss": 2.5241, "step": 4245 }, { "epoch": 0.04, "learning_rate": 9.96903456195371e-05, "loss": 2.4495, "step": 4250 }, { "epoch": 0.04, "learning_rate": 9.968959978835954e-05, "loss": 2.436, "step": 4255 }, { "epoch": 0.04, "learning_rate": 9.968885306285707e-05, "loss": 2.4977, "step": 4260 }, { "epoch": 0.04, "learning_rate": 9.968810544304318e-05, "loss": 2.4465, "step": 4265 }, { "epoch": 0.04, "learning_rate": 9.96873569289313e-05, "loss": 2.4992, "step": 4270 }, { "epoch": 0.04, "learning_rate": 9.96866075205349e-05, "loss": 2.529, "step": 4275 }, { "epoch": 0.04, "learning_rate": 9.968585721786747e-05, "loss": 2.4571, "step": 4280 }, { "epoch": 0.04, "learning_rate": 9.968510602094255e-05, "loss": 2.4026, "step": 4285 }, { "epoch": 0.04, "learning_rate": 9.96843539297736e-05, "loss": 2.4423, "step": 4290 }, { "epoch": 0.04, "learning_rate": 9.968360094437419e-05, "loss": 2.4916, "step": 4295 }, { "epoch": 0.04, "learning_rate": 9.968284706475787e-05, "loss": 2.4812, "step": 4300 }, { "epoch": 0.04, "learning_rate": 9.968209229093821e-05, "loss": 2.4468, "step": 4305 }, { "epoch": 0.04, "learning_rate": 9.968133662292877e-05, "loss": 2.5096, "step": 4310 }, { "epoch": 0.04, "learning_rate": 9.968058006074321e-05, "loss": 2.4709, "step": 4315 }, { "epoch": 0.04, "learning_rate": 9.967982260439507e-05, "loss": 2.4627, "step": 4320 }, { "epoch": 0.04, "learning_rate": 9.967906425389805e-05, "loss": 2.5209, "step": 4325 }, { "epoch": 0.04, "learning_rate": 9.967830500926576e-05, "loss": 2.5056, "step": 4330 }, { "epoch": 0.04, "learning_rate": 9.967754487051187e-05, "loss": 2.4931, "step": 4335 }, { "epoch": 0.04, "learning_rate": 9.967678383765007e-05, "loss": 2.4685, "step": 4340 }, { "epoch": 0.04, "learning_rate": 9.967602191069406e-05, "loss": 2.4474, "step": 4345 }, { "epoch": 0.04, "learning_rate": 9.967525908965755e-05, "loss": 2.524, "step": 4350 }, { "epoch": 0.04, "learning_rate": 9.967449537455425e-05, "loss": 2.441, "step": 4355 }, { "epoch": 0.04, "learning_rate": 9.967373076539793e-05, "loss": 2.5211, "step": 4360 }, { "epoch": 0.04, "learning_rate": 9.967296526220234e-05, "loss": 2.4122, "step": 4365 }, { "epoch": 0.04, "learning_rate": 9.967219886498128e-05, "loss": 2.5126, "step": 4370 }, { "epoch": 0.04, "learning_rate": 9.96714315737485e-05, "loss": 2.4836, "step": 4375 }, { "epoch": 0.04, "learning_rate": 9.967066338851785e-05, "loss": 2.475, "step": 4380 }, { "epoch": 0.04, "learning_rate": 9.966989430930314e-05, "loss": 2.4531, "step": 4385 }, { "epoch": 0.04, "learning_rate": 9.966912433611821e-05, "loss": 2.5134, "step": 4390 }, { "epoch": 0.04, "learning_rate": 9.966835346897692e-05, "loss": 2.5912, "step": 4395 }, { "epoch": 0.04, "learning_rate": 9.966758170789314e-05, "loss": 2.4994, "step": 4400 }, { "epoch": 0.04, "learning_rate": 9.966680905288077e-05, "loss": 2.4914, "step": 4405 }, { "epoch": 0.04, "learning_rate": 9.966603550395373e-05, "loss": 2.5062, "step": 4410 }, { "epoch": 0.04, "learning_rate": 9.96652610611259e-05, "loss": 2.4394, "step": 4415 }, { "epoch": 0.04, "learning_rate": 9.966448572441125e-05, "loss": 2.4598, "step": 4420 }, { "epoch": 0.04, "learning_rate": 9.966370949382373e-05, "loss": 2.4409, "step": 4425 }, { "epoch": 0.04, "learning_rate": 9.966293236937731e-05, "loss": 2.474, "step": 4430 }, { "epoch": 0.04, "learning_rate": 9.966215435108597e-05, "loss": 2.471, "step": 4435 }, { "epoch": 0.04, "learning_rate": 9.966137543896372e-05, "loss": 2.4899, "step": 4440 }, { "epoch": 0.04, "learning_rate": 9.966059563302458e-05, "loss": 2.476, "step": 4445 }, { "epoch": 0.04, "learning_rate": 9.965981493328259e-05, "loss": 2.5328, "step": 4450 }, { "epoch": 0.04, "learning_rate": 9.965903333975178e-05, "loss": 2.5145, "step": 4455 }, { "epoch": 0.04, "learning_rate": 9.965825085244625e-05, "loss": 2.4974, "step": 4460 }, { "epoch": 0.04, "learning_rate": 9.965746747138004e-05, "loss": 2.4638, "step": 4465 }, { "epoch": 0.04, "learning_rate": 9.96566831965673e-05, "loss": 2.4516, "step": 4470 }, { "epoch": 0.04, "learning_rate": 9.965589802802211e-05, "loss": 2.59, "step": 4475 }, { "epoch": 0.04, "learning_rate": 9.965511196575861e-05, "loss": 2.5525, "step": 4480 }, { "epoch": 0.04, "learning_rate": 9.965432500979094e-05, "loss": 2.5057, "step": 4485 }, { "epoch": 0.04, "learning_rate": 9.965353716013328e-05, "loss": 2.4954, "step": 4490 }, { "epoch": 0.04, "learning_rate": 9.965274841679981e-05, "loss": 2.4579, "step": 4495 }, { "epoch": 0.04, "learning_rate": 9.965195877980471e-05, "loss": 2.438, "step": 4500 }, { "epoch": 0.04, "learning_rate": 9.96511682491622e-05, "loss": 2.4294, "step": 4505 }, { "epoch": 0.04, "learning_rate": 9.965037682488652e-05, "loss": 2.4871, "step": 4510 }, { "epoch": 0.04, "learning_rate": 9.964958450699189e-05, "loss": 2.4602, "step": 4515 }, { "epoch": 0.04, "learning_rate": 9.964879129549258e-05, "loss": 2.5339, "step": 4520 }, { "epoch": 0.04, "learning_rate": 9.964799719040287e-05, "loss": 2.4847, "step": 4525 }, { "epoch": 0.04, "learning_rate": 9.964720219173707e-05, "loss": 2.5059, "step": 4530 }, { "epoch": 0.04, "learning_rate": 9.964640629950946e-05, "loss": 2.4615, "step": 4535 }, { "epoch": 0.04, "learning_rate": 9.964560951373438e-05, "loss": 2.4594, "step": 4540 }, { "epoch": 0.04, "learning_rate": 9.964481183442616e-05, "loss": 2.4522, "step": 4545 }, { "epoch": 0.04, "learning_rate": 9.964401326159917e-05, "loss": 2.5284, "step": 4550 }, { "epoch": 0.04, "learning_rate": 9.964321379526778e-05, "loss": 2.4941, "step": 4555 }, { "epoch": 0.04, "learning_rate": 9.964241343544635e-05, "loss": 2.4135, "step": 4560 }, { "epoch": 0.04, "learning_rate": 9.964161218214934e-05, "loss": 2.4809, "step": 4565 }, { "epoch": 0.04, "learning_rate": 9.964081003539113e-05, "loss": 2.519, "step": 4570 }, { "epoch": 0.04, "learning_rate": 9.964000699518617e-05, "loss": 2.5119, "step": 4575 }, { "epoch": 0.04, "learning_rate": 9.96392030615489e-05, "loss": 2.468, "step": 4580 }, { "epoch": 0.04, "learning_rate": 9.963839823449383e-05, "loss": 2.5046, "step": 4585 }, { "epoch": 0.04, "learning_rate": 9.963759251403539e-05, "loss": 2.4304, "step": 4590 }, { "epoch": 0.04, "learning_rate": 9.963678590018813e-05, "loss": 2.4754, "step": 4595 }, { "epoch": 0.04, "learning_rate": 9.963597839296653e-05, "loss": 2.484, "step": 4600 }, { "epoch": 0.04, "learning_rate": 9.963516999238514e-05, "loss": 2.4513, "step": 4605 }, { "epoch": 0.04, "learning_rate": 9.96343606984585e-05, "loss": 2.5207, "step": 4610 }, { "epoch": 0.04, "learning_rate": 9.96335505112012e-05, "loss": 2.4883, "step": 4615 }, { "epoch": 0.04, "learning_rate": 9.96327394306278e-05, "loss": 2.4677, "step": 4620 }, { "epoch": 0.04, "learning_rate": 9.96319274567529e-05, "loss": 2.4929, "step": 4625 }, { "epoch": 0.04, "learning_rate": 9.963111458959113e-05, "loss": 2.4564, "step": 4630 }, { "epoch": 0.04, "learning_rate": 9.963030082915711e-05, "loss": 2.4566, "step": 4635 }, { "epoch": 0.04, "learning_rate": 9.962948617546548e-05, "loss": 2.4174, "step": 4640 }, { "epoch": 0.04, "learning_rate": 9.962867062853091e-05, "loss": 2.4828, "step": 4645 }, { "epoch": 0.04, "learning_rate": 9.962785418836808e-05, "loss": 2.4641, "step": 4650 }, { "epoch": 0.04, "learning_rate": 9.962703685499169e-05, "loss": 2.4123, "step": 4655 }, { "epoch": 0.04, "learning_rate": 9.962621862841641e-05, "loss": 2.402, "step": 4660 }, { "epoch": 0.04, "learning_rate": 9.962539950865703e-05, "loss": 2.3983, "step": 4665 }, { "epoch": 0.04, "learning_rate": 9.962457949572823e-05, "loss": 2.4837, "step": 4670 }, { "epoch": 0.04, "learning_rate": 9.962375858964483e-05, "loss": 2.5136, "step": 4675 }, { "epoch": 0.04, "learning_rate": 9.962293679042156e-05, "loss": 2.4303, "step": 4680 }, { "epoch": 0.04, "learning_rate": 9.962211409807322e-05, "loss": 2.4622, "step": 4685 }, { "epoch": 0.04, "learning_rate": 9.962129051261464e-05, "loss": 2.4112, "step": 4690 }, { "epoch": 0.04, "learning_rate": 9.962046603406061e-05, "loss": 2.4751, "step": 4695 }, { "epoch": 0.04, "learning_rate": 9.961964066242599e-05, "loss": 2.5371, "step": 4700 }, { "epoch": 0.04, "learning_rate": 9.961881439772563e-05, "loss": 2.4708, "step": 4705 }, { "epoch": 0.04, "learning_rate": 9.96179872399744e-05, "loss": 2.5197, "step": 4710 }, { "epoch": 0.04, "learning_rate": 9.961715918918719e-05, "loss": 2.5012, "step": 4715 }, { "epoch": 0.04, "learning_rate": 9.961633024537888e-05, "loss": 2.4593, "step": 4720 }, { "epoch": 0.04, "learning_rate": 9.961550040856444e-05, "loss": 2.5532, "step": 4725 }, { "epoch": 0.04, "learning_rate": 9.961466967875876e-05, "loss": 2.5217, "step": 4730 }, { "epoch": 0.04, "learning_rate": 9.961383805597684e-05, "loss": 2.5183, "step": 4735 }, { "epoch": 0.04, "learning_rate": 9.961300554023358e-05, "loss": 2.453, "step": 4740 }, { "epoch": 0.04, "learning_rate": 9.961217213154401e-05, "loss": 2.4945, "step": 4745 }, { "epoch": 0.04, "learning_rate": 9.961133782992314e-05, "loss": 2.499, "step": 4750 }, { "epoch": 0.04, "learning_rate": 9.961050263538594e-05, "loss": 2.5177, "step": 4755 }, { "epoch": 0.04, "learning_rate": 9.960966654794748e-05, "loss": 2.4609, "step": 4760 }, { "epoch": 0.04, "learning_rate": 9.960882956762279e-05, "loss": 2.5098, "step": 4765 }, { "epoch": 0.04, "learning_rate": 9.960799169442695e-05, "loss": 2.4716, "step": 4770 }, { "epoch": 0.04, "learning_rate": 9.960715292837502e-05, "loss": 2.4821, "step": 4775 }, { "epoch": 0.04, "learning_rate": 9.960631326948211e-05, "loss": 2.4929, "step": 4780 }, { "epoch": 0.04, "learning_rate": 9.960547271776334e-05, "loss": 2.5458, "step": 4785 }, { "epoch": 0.04, "learning_rate": 9.960463127323382e-05, "loss": 2.4424, "step": 4790 }, { "epoch": 0.04, "learning_rate": 9.96037889359087e-05, "loss": 2.4133, "step": 4795 }, { "epoch": 0.04, "learning_rate": 9.960294570580314e-05, "loss": 2.4353, "step": 4800 }, { "epoch": 0.04, "learning_rate": 9.960210158293233e-05, "loss": 2.481, "step": 4805 }, { "epoch": 0.04, "learning_rate": 9.960125656731145e-05, "loss": 2.4639, "step": 4810 }, { "epoch": 0.04, "learning_rate": 9.960041065895569e-05, "loss": 2.5481, "step": 4815 }, { "epoch": 0.04, "learning_rate": 9.959956385788032e-05, "loss": 2.4553, "step": 4820 }, { "epoch": 0.04, "learning_rate": 9.959871616410055e-05, "loss": 2.4821, "step": 4825 }, { "epoch": 0.04, "learning_rate": 9.959786757763163e-05, "loss": 2.3928, "step": 4830 }, { "epoch": 0.04, "learning_rate": 9.959701809848887e-05, "loss": 2.465, "step": 4835 }, { "epoch": 0.04, "learning_rate": 9.959616772668752e-05, "loss": 2.4303, "step": 4840 }, { "epoch": 0.04, "learning_rate": 9.959531646224291e-05, "loss": 2.5281, "step": 4845 }, { "epoch": 0.04, "learning_rate": 9.959446430517034e-05, "loss": 2.5194, "step": 4850 }, { "epoch": 0.04, "learning_rate": 9.959361125548517e-05, "loss": 2.4481, "step": 4855 }, { "epoch": 0.04, "learning_rate": 9.959275731320274e-05, "loss": 2.5177, "step": 4860 }, { "epoch": 0.04, "learning_rate": 9.959190247833843e-05, "loss": 2.4696, "step": 4865 }, { "epoch": 0.04, "learning_rate": 9.959104675090762e-05, "loss": 2.5075, "step": 4870 }, { "epoch": 0.04, "learning_rate": 9.959019013092569e-05, "loss": 2.5278, "step": 4875 }, { "epoch": 0.04, "learning_rate": 9.958933261840809e-05, "loss": 2.5364, "step": 4880 }, { "epoch": 0.04, "learning_rate": 9.958847421337024e-05, "loss": 2.4234, "step": 4885 }, { "epoch": 0.04, "learning_rate": 9.95876149158276e-05, "loss": 2.4223, "step": 4890 }, { "epoch": 0.04, "learning_rate": 9.958675472579562e-05, "loss": 2.494, "step": 4895 }, { "epoch": 0.04, "learning_rate": 9.958589364328977e-05, "loss": 2.4057, "step": 4900 }, { "epoch": 0.04, "learning_rate": 9.958503166832558e-05, "loss": 2.4861, "step": 4905 }, { "epoch": 0.04, "learning_rate": 9.958416880091857e-05, "loss": 2.3945, "step": 4910 }, { "epoch": 0.04, "learning_rate": 9.958330504108421e-05, "loss": 2.4997, "step": 4915 }, { "epoch": 0.04, "learning_rate": 9.958244038883813e-05, "loss": 2.4622, "step": 4920 }, { "epoch": 0.04, "learning_rate": 9.958157484419581e-05, "loss": 2.4499, "step": 4925 }, { "epoch": 0.04, "learning_rate": 9.95807084071729e-05, "loss": 2.4802, "step": 4930 }, { "epoch": 0.04, "learning_rate": 9.957984107778494e-05, "loss": 2.4468, "step": 4935 }, { "epoch": 0.04, "learning_rate": 9.957897285604757e-05, "loss": 2.52, "step": 4940 }, { "epoch": 0.04, "learning_rate": 9.957810374197641e-05, "loss": 2.4403, "step": 4945 }, { "epoch": 0.04, "learning_rate": 9.957723373558709e-05, "loss": 2.5054, "step": 4950 }, { "epoch": 0.04, "learning_rate": 9.957636283689529e-05, "loss": 2.4495, "step": 4955 }, { "epoch": 0.04, "learning_rate": 9.957549104591668e-05, "loss": 2.4499, "step": 4960 }, { "epoch": 0.04, "learning_rate": 9.957461836266693e-05, "loss": 2.4737, "step": 4965 }, { "epoch": 0.04, "learning_rate": 9.957374478716177e-05, "loss": 2.4265, "step": 4970 }, { "epoch": 0.04, "learning_rate": 9.95728703194169e-05, "loss": 2.495, "step": 4975 }, { "epoch": 0.04, "learning_rate": 9.95719949594481e-05, "loss": 2.5261, "step": 4980 }, { "epoch": 0.04, "learning_rate": 9.957111870727108e-05, "loss": 2.4948, "step": 4985 }, { "epoch": 0.04, "learning_rate": 9.957024156290162e-05, "loss": 2.5162, "step": 4990 }, { "epoch": 0.04, "learning_rate": 9.956936352635552e-05, "loss": 2.5092, "step": 4995 }, { "epoch": 0.04, "learning_rate": 9.956848459764861e-05, "loss": 2.4781, "step": 5000 }, { "epoch": 0.04, "learning_rate": 9.956760477679665e-05, "loss": 2.5392, "step": 5005 }, { "epoch": 0.04, "learning_rate": 9.956672406381551e-05, "loss": 2.5247, "step": 5010 }, { "epoch": 0.04, "learning_rate": 9.956584245872104e-05, "loss": 2.477, "step": 5015 }, { "epoch": 0.04, "learning_rate": 9.956495996152909e-05, "loss": 2.4278, "step": 5020 }, { "epoch": 0.04, "learning_rate": 9.956407657225557e-05, "loss": 2.4858, "step": 5025 }, { "epoch": 0.04, "learning_rate": 9.956319229091635e-05, "loss": 2.4421, "step": 5030 }, { "epoch": 0.04, "learning_rate": 9.956230711752737e-05, "loss": 2.4838, "step": 5035 }, { "epoch": 0.04, "learning_rate": 9.956142105210455e-05, "loss": 2.5047, "step": 5040 }, { "epoch": 0.04, "learning_rate": 9.956053409466384e-05, "loss": 2.5019, "step": 5045 }, { "epoch": 0.04, "learning_rate": 9.955964624522121e-05, "loss": 2.4041, "step": 5050 }, { "epoch": 0.04, "learning_rate": 9.955875750379263e-05, "loss": 2.4899, "step": 5055 }, { "epoch": 0.04, "learning_rate": 9.955786787039409e-05, "loss": 2.5646, "step": 5060 }, { "epoch": 0.04, "learning_rate": 9.955697734504161e-05, "loss": 2.5458, "step": 5065 }, { "epoch": 0.04, "learning_rate": 9.955608592775124e-05, "loss": 2.4716, "step": 5070 }, { "epoch": 0.04, "learning_rate": 9.955519361853897e-05, "loss": 2.4992, "step": 5075 }, { "epoch": 0.04, "learning_rate": 9.955430041742091e-05, "loss": 2.5009, "step": 5080 }, { "epoch": 0.04, "learning_rate": 9.955340632441312e-05, "loss": 2.4889, "step": 5085 }, { "epoch": 0.04, "learning_rate": 9.95525113395317e-05, "loss": 2.4535, "step": 5090 }, { "epoch": 0.04, "learning_rate": 9.955161546279272e-05, "loss": 2.4777, "step": 5095 }, { "epoch": 0.04, "learning_rate": 9.955071869421236e-05, "loss": 2.5226, "step": 5100 }, { "epoch": 0.04, "learning_rate": 9.954982103380673e-05, "loss": 2.4502, "step": 5105 }, { "epoch": 0.04, "learning_rate": 9.954892248159197e-05, "loss": 2.4855, "step": 5110 }, { "epoch": 0.04, "learning_rate": 9.95480230375843e-05, "loss": 2.4894, "step": 5115 }, { "epoch": 0.04, "learning_rate": 9.954712270179987e-05, "loss": 2.4371, "step": 5120 }, { "epoch": 0.04, "learning_rate": 9.954622147425487e-05, "loss": 2.4997, "step": 5125 }, { "epoch": 0.04, "learning_rate": 9.954531935496558e-05, "loss": 2.497, "step": 5130 }, { "epoch": 0.04, "learning_rate": 9.954441634394818e-05, "loss": 2.4732, "step": 5135 }, { "epoch": 0.04, "learning_rate": 9.954351244121895e-05, "loss": 2.4595, "step": 5140 }, { "epoch": 0.04, "learning_rate": 9.954260764679416e-05, "loss": 2.4211, "step": 5145 }, { "epoch": 0.04, "learning_rate": 9.954170196069008e-05, "loss": 2.4826, "step": 5150 }, { "epoch": 0.04, "learning_rate": 9.954079538292303e-05, "loss": 2.4454, "step": 5155 }, { "epoch": 0.04, "learning_rate": 9.95398879135093e-05, "loss": 2.4941, "step": 5160 }, { "epoch": 0.04, "learning_rate": 9.953897955246525e-05, "loss": 2.4711, "step": 5165 }, { "epoch": 0.04, "learning_rate": 9.95380702998072e-05, "loss": 2.481, "step": 5170 }, { "epoch": 0.04, "learning_rate": 9.953716015555155e-05, "loss": 2.4282, "step": 5175 }, { "epoch": 0.04, "learning_rate": 9.953624911971466e-05, "loss": 2.4906, "step": 5180 }, { "epoch": 0.04, "learning_rate": 9.953533719231292e-05, "loss": 2.4746, "step": 5185 }, { "epoch": 0.04, "learning_rate": 9.953442437336276e-05, "loss": 2.487, "step": 5190 }, { "epoch": 0.04, "learning_rate": 9.953351066288062e-05, "loss": 2.5015, "step": 5195 }, { "epoch": 0.04, "learning_rate": 9.95325960608829e-05, "loss": 2.4545, "step": 5200 }, { "epoch": 0.04, "learning_rate": 9.953168056738609e-05, "loss": 2.4128, "step": 5205 }, { "epoch": 0.04, "learning_rate": 9.953076418240668e-05, "loss": 2.5159, "step": 5210 }, { "epoch": 0.04, "learning_rate": 9.952984690596115e-05, "loss": 2.5352, "step": 5215 }, { "epoch": 0.04, "learning_rate": 9.952892873806599e-05, "loss": 2.4698, "step": 5220 }, { "epoch": 0.04, "learning_rate": 9.952800967873775e-05, "loss": 2.3553, "step": 5225 }, { "epoch": 0.04, "learning_rate": 9.952708972799298e-05, "loss": 2.4699, "step": 5230 }, { "epoch": 0.04, "learning_rate": 9.95261688858482e-05, "loss": 2.4977, "step": 5235 }, { "epoch": 0.04, "learning_rate": 9.952524715232003e-05, "loss": 2.5266, "step": 5240 }, { "epoch": 0.04, "learning_rate": 9.952432452742501e-05, "loss": 2.3987, "step": 5245 }, { "epoch": 0.04, "learning_rate": 9.95234010111798e-05, "loss": 2.4933, "step": 5250 }, { "epoch": 0.04, "learning_rate": 9.952247660360099e-05, "loss": 2.5429, "step": 5255 }, { "epoch": 0.04, "learning_rate": 9.95215513047052e-05, "loss": 2.5, "step": 5260 }, { "epoch": 0.04, "learning_rate": 9.952062511450913e-05, "loss": 2.5134, "step": 5265 }, { "epoch": 0.04, "learning_rate": 9.95196980330294e-05, "loss": 2.4954, "step": 5270 }, { "epoch": 0.05, "learning_rate": 9.951877006028273e-05, "loss": 2.3691, "step": 5275 }, { "epoch": 0.05, "learning_rate": 9.951784119628582e-05, "loss": 2.4335, "step": 5280 }, { "epoch": 0.05, "learning_rate": 9.951691144105537e-05, "loss": 2.4506, "step": 5285 }, { "epoch": 0.05, "learning_rate": 9.951598079460813e-05, "loss": 2.4582, "step": 5290 }, { "epoch": 0.05, "learning_rate": 9.951504925696084e-05, "loss": 2.4093, "step": 5295 }, { "epoch": 0.05, "learning_rate": 9.951411682813027e-05, "loss": 2.4511, "step": 5300 }, { "epoch": 0.05, "learning_rate": 9.95131835081332e-05, "loss": 2.5227, "step": 5305 }, { "epoch": 0.05, "learning_rate": 9.951224929698643e-05, "loss": 2.4502, "step": 5310 }, { "epoch": 0.05, "learning_rate": 9.951131419470678e-05, "loss": 2.4087, "step": 5315 }, { "epoch": 0.05, "learning_rate": 9.951037820131108e-05, "loss": 2.4717, "step": 5320 }, { "epoch": 0.05, "learning_rate": 9.950944131681615e-05, "loss": 2.5178, "step": 5325 }, { "epoch": 0.05, "learning_rate": 9.950850354123888e-05, "loss": 2.4877, "step": 5330 }, { "epoch": 0.05, "learning_rate": 9.950756487459616e-05, "loss": 2.4898, "step": 5335 }, { "epoch": 0.05, "learning_rate": 9.950662531690484e-05, "loss": 2.4062, "step": 5340 }, { "epoch": 0.05, "learning_rate": 9.950568486818188e-05, "loss": 2.4894, "step": 5345 }, { "epoch": 0.05, "learning_rate": 9.950474352844416e-05, "loss": 2.4679, "step": 5350 }, { "epoch": 0.05, "learning_rate": 9.950380129770866e-05, "loss": 2.3394, "step": 5355 }, { "epoch": 0.05, "learning_rate": 9.950285817599232e-05, "loss": 2.4887, "step": 5360 }, { "epoch": 0.05, "learning_rate": 9.950191416331211e-05, "loss": 2.3972, "step": 5365 }, { "epoch": 0.05, "learning_rate": 9.950096925968505e-05, "loss": 2.4087, "step": 5370 }, { "epoch": 0.05, "learning_rate": 9.950002346512811e-05, "loss": 2.4986, "step": 5375 }, { "epoch": 0.05, "learning_rate": 9.949907677965833e-05, "loss": 2.4207, "step": 5380 }, { "epoch": 0.05, "learning_rate": 9.949812920329275e-05, "loss": 2.4622, "step": 5385 }, { "epoch": 0.05, "learning_rate": 9.949718073604841e-05, "loss": 2.5402, "step": 5390 }, { "epoch": 0.05, "learning_rate": 9.94962313779424e-05, "loss": 2.4924, "step": 5395 }, { "epoch": 0.05, "learning_rate": 9.949528112899179e-05, "loss": 2.5543, "step": 5400 }, { "epoch": 0.05, "learning_rate": 9.94943299892137e-05, "loss": 2.4092, "step": 5405 }, { "epoch": 0.05, "learning_rate": 9.949337795862523e-05, "loss": 2.5237, "step": 5410 }, { "epoch": 0.05, "learning_rate": 9.949242503724354e-05, "loss": 2.4711, "step": 5415 }, { "epoch": 0.05, "learning_rate": 9.949147122508575e-05, "loss": 2.4462, "step": 5420 }, { "epoch": 0.05, "learning_rate": 9.949051652216906e-05, "loss": 2.4688, "step": 5425 }, { "epoch": 0.05, "learning_rate": 9.948956092851063e-05, "loss": 2.4378, "step": 5430 }, { "epoch": 0.05, "learning_rate": 9.948860444412766e-05, "loss": 2.5383, "step": 5435 }, { "epoch": 0.05, "learning_rate": 9.948764706903737e-05, "loss": 2.4783, "step": 5440 }, { "epoch": 0.05, "learning_rate": 9.9486688803257e-05, "loss": 2.4679, "step": 5445 }, { "epoch": 0.05, "learning_rate": 9.948572964680378e-05, "loss": 2.5546, "step": 5450 }, { "epoch": 0.05, "learning_rate": 9.948476959969496e-05, "loss": 2.4304, "step": 5455 }, { "epoch": 0.05, "learning_rate": 9.948380866194788e-05, "loss": 2.4738, "step": 5460 }, { "epoch": 0.05, "learning_rate": 9.948284683357978e-05, "loss": 2.4205, "step": 5465 }, { "epoch": 0.05, "learning_rate": 9.948188411460799e-05, "loss": 2.5399, "step": 5470 }, { "epoch": 0.05, "learning_rate": 9.948092050504982e-05, "loss": 2.5107, "step": 5475 }, { "epoch": 0.05, "learning_rate": 9.947995600492263e-05, "loss": 2.5528, "step": 5480 }, { "epoch": 0.05, "learning_rate": 9.947899061424379e-05, "loss": 2.4803, "step": 5485 }, { "epoch": 0.05, "learning_rate": 9.947802433303065e-05, "loss": 2.4627, "step": 5490 }, { "epoch": 0.05, "learning_rate": 9.947705716130062e-05, "loss": 2.4871, "step": 5495 }, { "epoch": 0.05, "learning_rate": 9.947608909907109e-05, "loss": 2.4061, "step": 5500 }, { "epoch": 0.05, "learning_rate": 9.947512014635951e-05, "loss": 2.5276, "step": 5505 }, { "epoch": 0.05, "learning_rate": 9.947415030318329e-05, "loss": 2.4714, "step": 5510 }, { "epoch": 0.05, "learning_rate": 9.94731795695599e-05, "loss": 2.4526, "step": 5515 }, { "epoch": 0.05, "learning_rate": 9.947220794550683e-05, "loss": 2.5332, "step": 5520 }, { "epoch": 0.05, "learning_rate": 9.947123543104152e-05, "loss": 2.4814, "step": 5525 }, { "epoch": 0.05, "learning_rate": 9.947026202618152e-05, "loss": 2.4916, "step": 5530 }, { "epoch": 0.05, "learning_rate": 9.946928773094431e-05, "loss": 2.4031, "step": 5535 }, { "epoch": 0.05, "learning_rate": 9.946831254534748e-05, "loss": 2.473, "step": 5540 }, { "epoch": 0.05, "learning_rate": 9.946733646940852e-05, "loss": 2.4486, "step": 5545 }, { "epoch": 0.05, "learning_rate": 9.946635950314503e-05, "loss": 2.4993, "step": 5550 }, { "epoch": 0.05, "learning_rate": 9.94653816465746e-05, "loss": 2.4513, "step": 5555 }, { "epoch": 0.05, "learning_rate": 9.94644028997148e-05, "loss": 2.4931, "step": 5560 }, { "epoch": 0.05, "learning_rate": 9.946342326258329e-05, "loss": 2.4186, "step": 5565 }, { "epoch": 0.05, "learning_rate": 9.946244273519766e-05, "loss": 2.4841, "step": 5570 }, { "epoch": 0.05, "learning_rate": 9.946146131757557e-05, "loss": 2.477, "step": 5575 }, { "epoch": 0.05, "learning_rate": 9.94604790097347e-05, "loss": 2.4324, "step": 5580 }, { "epoch": 0.05, "learning_rate": 9.945949581169271e-05, "loss": 2.4592, "step": 5585 }, { "epoch": 0.05, "learning_rate": 9.945851172346732e-05, "loss": 2.5009, "step": 5590 }, { "epoch": 0.05, "learning_rate": 9.945752674507621e-05, "loss": 2.4214, "step": 5595 }, { "epoch": 0.05, "learning_rate": 9.945654087653713e-05, "loss": 2.45, "step": 5600 }, { "epoch": 0.05, "learning_rate": 9.945555411786782e-05, "loss": 2.4199, "step": 5605 }, { "epoch": 0.05, "learning_rate": 9.945456646908602e-05, "loss": 2.4377, "step": 5610 }, { "epoch": 0.05, "learning_rate": 9.945357793020953e-05, "loss": 2.4958, "step": 5615 }, { "epoch": 0.05, "learning_rate": 9.945258850125615e-05, "loss": 2.4613, "step": 5620 }, { "epoch": 0.05, "learning_rate": 9.945159818224365e-05, "loss": 2.436, "step": 5625 }, { "epoch": 0.05, "learning_rate": 9.945060697318991e-05, "loss": 2.4408, "step": 5630 }, { "epoch": 0.05, "learning_rate": 9.94496148741127e-05, "loss": 2.4406, "step": 5635 }, { "epoch": 0.05, "learning_rate": 9.944862188502995e-05, "loss": 2.5198, "step": 5640 }, { "epoch": 0.05, "learning_rate": 9.944762800595946e-05, "loss": 2.5166, "step": 5645 }, { "epoch": 0.05, "learning_rate": 9.944663323691917e-05, "loss": 2.5083, "step": 5650 }, { "epoch": 0.05, "learning_rate": 9.944563757792697e-05, "loss": 2.4511, "step": 5655 }, { "epoch": 0.05, "learning_rate": 9.944464102900077e-05, "loss": 2.3771, "step": 5660 }, { "epoch": 0.05, "learning_rate": 9.944364359015852e-05, "loss": 2.4299, "step": 5665 }, { "epoch": 0.05, "learning_rate": 9.944264526141816e-05, "loss": 2.4988, "step": 5670 }, { "epoch": 0.05, "learning_rate": 9.944164604279767e-05, "loss": 2.4645, "step": 5675 }, { "epoch": 0.05, "learning_rate": 9.944064593431502e-05, "loss": 2.3821, "step": 5680 }, { "epoch": 0.05, "learning_rate": 9.943964493598824e-05, "loss": 2.4324, "step": 5685 }, { "epoch": 0.05, "learning_rate": 9.94386430478353e-05, "loss": 2.5121, "step": 5690 }, { "epoch": 0.05, "learning_rate": 9.943764026987426e-05, "loss": 2.4217, "step": 5695 }, { "epoch": 0.05, "learning_rate": 9.943663660212316e-05, "loss": 2.4439, "step": 5700 }, { "epoch": 0.05, "learning_rate": 9.943563204460009e-05, "loss": 2.5319, "step": 5705 }, { "epoch": 0.05, "learning_rate": 9.94346265973231e-05, "loss": 2.4894, "step": 5710 }, { "epoch": 0.05, "learning_rate": 9.943362026031028e-05, "loss": 2.5165, "step": 5715 }, { "epoch": 0.05, "learning_rate": 9.943261303357978e-05, "loss": 2.4456, "step": 5720 }, { "epoch": 0.05, "learning_rate": 9.943160491714969e-05, "loss": 2.4767, "step": 5725 }, { "epoch": 0.05, "learning_rate": 9.943059591103818e-05, "loss": 2.4864, "step": 5730 }, { "epoch": 0.05, "learning_rate": 9.94295860152634e-05, "loss": 2.4943, "step": 5735 }, { "epoch": 0.05, "learning_rate": 9.942857522984352e-05, "loss": 2.4175, "step": 5740 }, { "epoch": 0.05, "learning_rate": 9.942756355479674e-05, "loss": 2.479, "step": 5745 }, { "epoch": 0.05, "learning_rate": 9.942655099014128e-05, "loss": 2.5032, "step": 5750 }, { "epoch": 0.05, "learning_rate": 9.942553753589534e-05, "loss": 2.4748, "step": 5755 }, { "epoch": 0.05, "learning_rate": 9.942452319207718e-05, "loss": 2.5326, "step": 5760 }, { "epoch": 0.05, "learning_rate": 9.942350795870506e-05, "loss": 2.4907, "step": 5765 }, { "epoch": 0.05, "learning_rate": 9.942249183579721e-05, "loss": 2.4209, "step": 5770 }, { "epoch": 0.05, "learning_rate": 9.942147482337197e-05, "loss": 2.4533, "step": 5775 }, { "epoch": 0.05, "learning_rate": 9.942045692144763e-05, "loss": 2.51, "step": 5780 }, { "epoch": 0.05, "learning_rate": 9.941943813004249e-05, "loss": 2.4663, "step": 5785 }, { "epoch": 0.05, "learning_rate": 9.941841844917492e-05, "loss": 2.4471, "step": 5790 }, { "epoch": 0.05, "learning_rate": 9.941739787886323e-05, "loss": 2.4822, "step": 5795 }, { "epoch": 0.05, "learning_rate": 9.941637641912582e-05, "loss": 2.4732, "step": 5800 }, { "epoch": 0.05, "learning_rate": 9.941535406998107e-05, "loss": 2.4121, "step": 5805 }, { "epoch": 0.05, "learning_rate": 9.941433083144738e-05, "loss": 2.4663, "step": 5810 }, { "epoch": 0.05, "learning_rate": 9.941330670354317e-05, "loss": 2.4559, "step": 5815 }, { "epoch": 0.05, "learning_rate": 9.941228168628685e-05, "loss": 2.4981, "step": 5820 }, { "epoch": 0.05, "learning_rate": 9.941125577969689e-05, "loss": 2.3376, "step": 5825 }, { "epoch": 0.05, "learning_rate": 9.941022898379175e-05, "loss": 2.4078, "step": 5830 }, { "epoch": 0.05, "learning_rate": 9.940920129858991e-05, "loss": 2.5301, "step": 5835 }, { "epoch": 0.05, "learning_rate": 9.940817272410986e-05, "loss": 2.5049, "step": 5840 }, { "epoch": 0.05, "learning_rate": 9.940714326037013e-05, "loss": 2.4892, "step": 5845 }, { "epoch": 0.05, "learning_rate": 9.940611290738921e-05, "loss": 2.4646, "step": 5850 }, { "epoch": 0.05, "learning_rate": 9.940508166518571e-05, "loss": 2.4216, "step": 5855 }, { "epoch": 0.05, "learning_rate": 9.940404953377813e-05, "loss": 2.4931, "step": 5860 }, { "epoch": 0.05, "learning_rate": 9.940301651318506e-05, "loss": 2.4804, "step": 5865 }, { "epoch": 0.05, "learning_rate": 9.940198260342513e-05, "loss": 2.4511, "step": 5870 }, { "epoch": 0.05, "learning_rate": 9.94009478045169e-05, "loss": 2.4749, "step": 5875 }, { "epoch": 0.05, "learning_rate": 9.939991211647901e-05, "loss": 2.4806, "step": 5880 }, { "epoch": 0.05, "learning_rate": 9.939887553933012e-05, "loss": 2.3555, "step": 5885 }, { "epoch": 0.05, "learning_rate": 9.939783807308887e-05, "loss": 2.4328, "step": 5890 }, { "epoch": 0.05, "learning_rate": 9.939679971777393e-05, "loss": 2.4251, "step": 5895 }, { "epoch": 0.05, "learning_rate": 9.939576047340398e-05, "loss": 2.4211, "step": 5900 }, { "epoch": 0.05, "learning_rate": 9.939472033999775e-05, "loss": 2.5302, "step": 5905 }, { "epoch": 0.05, "learning_rate": 9.939367931757396e-05, "loss": 2.4374, "step": 5910 }, { "epoch": 0.05, "learning_rate": 9.93926374061513e-05, "loss": 2.4753, "step": 5915 }, { "epoch": 0.05, "learning_rate": 9.939159460574859e-05, "loss": 2.4421, "step": 5920 }, { "epoch": 0.05, "learning_rate": 9.939055091638454e-05, "loss": 2.49, "step": 5925 }, { "epoch": 0.05, "learning_rate": 9.938950633807797e-05, "loss": 2.3406, "step": 5930 }, { "epoch": 0.05, "learning_rate": 9.938846087084767e-05, "loss": 2.3686, "step": 5935 }, { "epoch": 0.05, "learning_rate": 9.938741451471247e-05, "loss": 2.4836, "step": 5940 }, { "epoch": 0.05, "learning_rate": 9.938636726969117e-05, "loss": 2.4391, "step": 5945 }, { "epoch": 0.05, "learning_rate": 9.938531913580265e-05, "loss": 2.4496, "step": 5950 }, { "epoch": 0.05, "learning_rate": 9.938427011306575e-05, "loss": 2.4742, "step": 5955 }, { "epoch": 0.05, "learning_rate": 9.938322020149939e-05, "loss": 2.3849, "step": 5960 }, { "epoch": 0.05, "learning_rate": 9.938216940112242e-05, "loss": 2.5146, "step": 5965 }, { "epoch": 0.05, "learning_rate": 9.938111771195378e-05, "loss": 2.4734, "step": 5970 }, { "epoch": 0.05, "learning_rate": 9.938006513401237e-05, "loss": 2.4905, "step": 5975 }, { "epoch": 0.05, "learning_rate": 9.937901166731718e-05, "loss": 2.5077, "step": 5980 }, { "epoch": 0.05, "learning_rate": 9.937795731188713e-05, "loss": 2.4257, "step": 5985 }, { "epoch": 0.05, "learning_rate": 9.937690206774122e-05, "loss": 2.4544, "step": 5990 }, { "epoch": 0.05, "learning_rate": 9.937584593489844e-05, "loss": 2.4986, "step": 5995 }, { "epoch": 0.05, "learning_rate": 9.937478891337778e-05, "loss": 2.4787, "step": 6000 }, { "epoch": 0.05, "learning_rate": 9.937373100319829e-05, "loss": 2.4584, "step": 6005 }, { "epoch": 0.05, "learning_rate": 9.937267220437899e-05, "loss": 2.4404, "step": 6010 }, { "epoch": 0.05, "learning_rate": 9.937161251693895e-05, "loss": 2.4587, "step": 6015 }, { "epoch": 0.05, "learning_rate": 9.937055194089723e-05, "loss": 2.4687, "step": 6020 }, { "epoch": 0.05, "learning_rate": 9.936949047627294e-05, "loss": 2.5629, "step": 6025 }, { "epoch": 0.05, "learning_rate": 9.936842812308516e-05, "loss": 2.4743, "step": 6030 }, { "epoch": 0.05, "learning_rate": 9.936736488135304e-05, "loss": 2.3883, "step": 6035 }, { "epoch": 0.05, "learning_rate": 9.936630075109567e-05, "loss": 2.5167, "step": 6040 }, { "epoch": 0.05, "learning_rate": 9.936523573233224e-05, "loss": 2.4458, "step": 6045 }, { "epoch": 0.05, "learning_rate": 9.936416982508191e-05, "loss": 2.4466, "step": 6050 }, { "epoch": 0.05, "learning_rate": 9.936310302936387e-05, "loss": 2.3745, "step": 6055 }, { "epoch": 0.05, "learning_rate": 9.93620353451973e-05, "loss": 2.407, "step": 6060 }, { "epoch": 0.05, "learning_rate": 9.936096677260142e-05, "loss": 2.3991, "step": 6065 }, { "epoch": 0.05, "learning_rate": 9.935989731159549e-05, "loss": 2.4576, "step": 6070 }, { "epoch": 0.05, "learning_rate": 9.935882696219874e-05, "loss": 2.5316, "step": 6075 }, { "epoch": 0.05, "learning_rate": 9.935775572443044e-05, "loss": 2.4681, "step": 6080 }, { "epoch": 0.05, "learning_rate": 9.935668359830986e-05, "loss": 2.3924, "step": 6085 }, { "epoch": 0.05, "learning_rate": 9.935561058385629e-05, "loss": 2.5421, "step": 6090 }, { "epoch": 0.05, "learning_rate": 9.935453668108907e-05, "loss": 2.4704, "step": 6095 }, { "epoch": 0.05, "learning_rate": 9.935346189002752e-05, "loss": 2.5366, "step": 6100 }, { "epoch": 0.05, "learning_rate": 9.935238621069096e-05, "loss": 2.3864, "step": 6105 }, { "epoch": 0.05, "learning_rate": 9.935130964309876e-05, "loss": 2.4568, "step": 6110 }, { "epoch": 0.05, "learning_rate": 9.935023218727032e-05, "loss": 2.378, "step": 6115 }, { "epoch": 0.05, "learning_rate": 9.934915384322501e-05, "loss": 2.4063, "step": 6120 }, { "epoch": 0.05, "learning_rate": 9.934807461098224e-05, "loss": 2.4212, "step": 6125 }, { "epoch": 0.05, "learning_rate": 9.934699449056144e-05, "loss": 2.4076, "step": 6130 }, { "epoch": 0.05, "learning_rate": 9.934591348198205e-05, "loss": 2.4304, "step": 6135 }, { "epoch": 0.05, "learning_rate": 9.934483158526353e-05, "loss": 2.3961, "step": 6140 }, { "epoch": 0.05, "learning_rate": 9.934374880042534e-05, "loss": 2.4227, "step": 6145 }, { "epoch": 0.05, "learning_rate": 9.934266512748698e-05, "loss": 2.4069, "step": 6150 }, { "epoch": 0.05, "learning_rate": 9.934158056646794e-05, "loss": 2.4304, "step": 6155 }, { "epoch": 0.05, "learning_rate": 9.934049511738777e-05, "loss": 2.4231, "step": 6160 }, { "epoch": 0.05, "learning_rate": 9.933940878026596e-05, "loss": 2.5121, "step": 6165 }, { "epoch": 0.05, "learning_rate": 9.93383215551221e-05, "loss": 2.5052, "step": 6170 }, { "epoch": 0.05, "learning_rate": 9.933723344197574e-05, "loss": 2.4902, "step": 6175 }, { "epoch": 0.05, "learning_rate": 9.933614444084649e-05, "loss": 2.4069, "step": 6180 }, { "epoch": 0.05, "learning_rate": 9.933505455175391e-05, "loss": 2.462, "step": 6185 }, { "epoch": 0.05, "learning_rate": 9.933396377471765e-05, "loss": 2.4806, "step": 6190 }, { "epoch": 0.05, "learning_rate": 9.93328721097573e-05, "loss": 2.5231, "step": 6195 }, { "epoch": 0.05, "learning_rate": 9.933177955689256e-05, "loss": 2.3944, "step": 6200 }, { "epoch": 0.05, "learning_rate": 9.933068611614307e-05, "loss": 2.4424, "step": 6205 }, { "epoch": 0.05, "learning_rate": 9.932959178752851e-05, "loss": 2.4186, "step": 6210 }, { "epoch": 0.05, "learning_rate": 9.932849657106857e-05, "loss": 2.4763, "step": 6215 }, { "epoch": 0.05, "learning_rate": 9.932740046678298e-05, "loss": 2.4919, "step": 6220 }, { "epoch": 0.05, "learning_rate": 9.932630347469144e-05, "loss": 2.4552, "step": 6225 }, { "epoch": 0.05, "learning_rate": 9.932520559481372e-05, "loss": 2.4189, "step": 6230 }, { "epoch": 0.05, "learning_rate": 9.932410682716957e-05, "loss": 2.4456, "step": 6235 }, { "epoch": 0.05, "learning_rate": 9.932300717177875e-05, "loss": 2.4385, "step": 6240 }, { "epoch": 0.05, "learning_rate": 9.93219066286611e-05, "loss": 2.4866, "step": 6245 }, { "epoch": 0.05, "learning_rate": 9.932080519783638e-05, "loss": 2.4828, "step": 6250 }, { "epoch": 0.05, "learning_rate": 9.931970287932442e-05, "loss": 2.4773, "step": 6255 }, { "epoch": 0.05, "learning_rate": 9.931859967314507e-05, "loss": 2.4742, "step": 6260 }, { "epoch": 0.05, "learning_rate": 9.93174955793182e-05, "loss": 2.4324, "step": 6265 }, { "epoch": 0.05, "learning_rate": 9.931639059786365e-05, "loss": 2.5101, "step": 6270 }, { "epoch": 0.05, "learning_rate": 9.931528472880133e-05, "loss": 2.4803, "step": 6275 }, { "epoch": 0.05, "learning_rate": 9.931417797215114e-05, "loss": 2.5185, "step": 6280 }, { "epoch": 0.05, "learning_rate": 9.9313070327933e-05, "loss": 2.4241, "step": 6285 }, { "epoch": 0.05, "learning_rate": 9.931196179616684e-05, "loss": 2.4823, "step": 6290 }, { "epoch": 0.05, "learning_rate": 9.931085237687261e-05, "loss": 2.4589, "step": 6295 }, { "epoch": 0.05, "learning_rate": 9.930974207007029e-05, "loss": 2.4906, "step": 6300 }, { "epoch": 0.05, "learning_rate": 9.930863087577986e-05, "loss": 2.4773, "step": 6305 }, { "epoch": 0.05, "learning_rate": 9.930751879402131e-05, "loss": 2.4783, "step": 6310 }, { "epoch": 0.05, "learning_rate": 9.930640582481466e-05, "loss": 2.4179, "step": 6315 }, { "epoch": 0.05, "learning_rate": 9.930529196817995e-05, "loss": 2.5147, "step": 6320 }, { "epoch": 0.05, "learning_rate": 9.93041772241372e-05, "loss": 2.4384, "step": 6325 }, { "epoch": 0.05, "learning_rate": 9.930306159270653e-05, "loss": 2.4662, "step": 6330 }, { "epoch": 0.05, "learning_rate": 9.930194507390796e-05, "loss": 2.3976, "step": 6335 }, { "epoch": 0.05, "learning_rate": 9.93008276677616e-05, "loss": 2.4645, "step": 6340 }, { "epoch": 0.05, "learning_rate": 9.929970937428758e-05, "loss": 2.5019, "step": 6345 }, { "epoch": 0.05, "learning_rate": 9.929859019350602e-05, "loss": 2.4453, "step": 6350 }, { "epoch": 0.05, "learning_rate": 9.929747012543704e-05, "loss": 2.4874, "step": 6355 }, { "epoch": 0.05, "learning_rate": 9.929634917010084e-05, "loss": 2.433, "step": 6360 }, { "epoch": 0.05, "learning_rate": 9.929522732751757e-05, "loss": 2.4597, "step": 6365 }, { "epoch": 0.05, "learning_rate": 9.929410459770742e-05, "loss": 2.4762, "step": 6370 }, { "epoch": 0.05, "learning_rate": 9.929298098069062e-05, "loss": 2.3686, "step": 6375 }, { "epoch": 0.05, "learning_rate": 9.929185647648736e-05, "loss": 2.4437, "step": 6380 }, { "epoch": 0.05, "learning_rate": 9.92907310851179e-05, "loss": 2.3692, "step": 6385 }, { "epoch": 0.05, "learning_rate": 9.928960480660248e-05, "loss": 2.5251, "step": 6390 }, { "epoch": 0.05, "learning_rate": 9.92884776409614e-05, "loss": 2.4338, "step": 6395 }, { "epoch": 0.05, "learning_rate": 9.928734958821492e-05, "loss": 2.4584, "step": 6400 }, { "epoch": 0.05, "learning_rate": 9.928622064838335e-05, "loss": 2.4531, "step": 6405 }, { "epoch": 0.05, "learning_rate": 9.9285090821487e-05, "loss": 2.4608, "step": 6410 }, { "epoch": 0.05, "learning_rate": 9.928396010754623e-05, "loss": 2.4135, "step": 6415 }, { "epoch": 0.05, "learning_rate": 9.928282850658138e-05, "loss": 2.5093, "step": 6420 }, { "epoch": 0.05, "learning_rate": 9.928169601861281e-05, "loss": 2.4373, "step": 6425 }, { "epoch": 0.05, "learning_rate": 9.92805626436609e-05, "loss": 2.3967, "step": 6430 }, { "epoch": 0.05, "learning_rate": 9.927942838174605e-05, "loss": 2.4868, "step": 6435 }, { "epoch": 0.05, "learning_rate": 9.927829323288868e-05, "loss": 2.526, "step": 6440 }, { "epoch": 0.05, "learning_rate": 9.927715719710922e-05, "loss": 2.4827, "step": 6445 }, { "epoch": 0.06, "learning_rate": 9.927602027442812e-05, "loss": 2.4413, "step": 6450 }, { "epoch": 0.06, "learning_rate": 9.927488246486583e-05, "loss": 2.3708, "step": 6455 }, { "epoch": 0.06, "learning_rate": 9.927374376844285e-05, "loss": 2.4956, "step": 6460 }, { "epoch": 0.06, "learning_rate": 9.927260418517965e-05, "loss": 2.4334, "step": 6465 }, { "epoch": 0.06, "learning_rate": 9.927146371509676e-05, "loss": 2.4742, "step": 6470 }, { "epoch": 0.06, "learning_rate": 9.92703223582147e-05, "loss": 2.4319, "step": 6475 }, { "epoch": 0.06, "learning_rate": 9.926918011455401e-05, "loss": 2.4614, "step": 6480 }, { "epoch": 0.06, "learning_rate": 9.926803698413525e-05, "loss": 2.4143, "step": 6485 }, { "epoch": 0.06, "learning_rate": 9.926689296697899e-05, "loss": 2.4194, "step": 6490 }, { "epoch": 0.06, "learning_rate": 9.926574806310582e-05, "loss": 2.4775, "step": 6495 }, { "epoch": 0.06, "learning_rate": 9.926460227253636e-05, "loss": 2.4653, "step": 6500 }, { "epoch": 0.06, "learning_rate": 9.926345559529122e-05, "loss": 2.4857, "step": 6505 }, { "epoch": 0.06, "learning_rate": 9.926230803139104e-05, "loss": 2.4378, "step": 6510 }, { "epoch": 0.06, "learning_rate": 9.926115958085646e-05, "loss": 2.4402, "step": 6515 }, { "epoch": 0.06, "learning_rate": 9.92600102437082e-05, "loss": 2.4494, "step": 6520 }, { "epoch": 0.06, "learning_rate": 9.925886001996688e-05, "loss": 2.4621, "step": 6525 }, { "epoch": 0.06, "learning_rate": 9.925770890965324e-05, "loss": 2.4088, "step": 6530 }, { "epoch": 0.06, "learning_rate": 9.925655691278801e-05, "loss": 2.5148, "step": 6535 }, { "epoch": 0.06, "learning_rate": 9.925540402939189e-05, "loss": 2.4153, "step": 6540 }, { "epoch": 0.06, "learning_rate": 9.925425025948564e-05, "loss": 2.4682, "step": 6545 }, { "epoch": 0.06, "learning_rate": 9.925309560309003e-05, "loss": 2.4802, "step": 6550 }, { "epoch": 0.06, "learning_rate": 9.925194006022585e-05, "loss": 2.4943, "step": 6555 }, { "epoch": 0.06, "learning_rate": 9.925078363091389e-05, "loss": 2.3983, "step": 6560 }, { "epoch": 0.06, "learning_rate": 9.924962631517496e-05, "loss": 2.4785, "step": 6565 }, { "epoch": 0.06, "learning_rate": 9.924846811302989e-05, "loss": 2.3854, "step": 6570 }, { "epoch": 0.06, "learning_rate": 9.924730902449953e-05, "loss": 2.4651, "step": 6575 }, { "epoch": 0.06, "learning_rate": 9.924614904960474e-05, "loss": 2.4213, "step": 6580 }, { "epoch": 0.06, "learning_rate": 9.924498818836641e-05, "loss": 2.4192, "step": 6585 }, { "epoch": 0.06, "learning_rate": 9.924382644080541e-05, "loss": 2.4822, "step": 6590 }, { "epoch": 0.06, "learning_rate": 9.924266380694266e-05, "loss": 2.4393, "step": 6595 }, { "epoch": 0.06, "learning_rate": 9.92415002867991e-05, "loss": 2.4677, "step": 6600 }, { "epoch": 0.06, "learning_rate": 9.924033588039565e-05, "loss": 2.5251, "step": 6605 }, { "epoch": 0.06, "learning_rate": 9.923917058775328e-05, "loss": 2.5432, "step": 6610 }, { "epoch": 0.06, "learning_rate": 9.923800440889294e-05, "loss": 2.4972, "step": 6615 }, { "epoch": 0.06, "learning_rate": 9.923683734383564e-05, "loss": 2.3765, "step": 6620 }, { "epoch": 0.06, "learning_rate": 9.923566939260239e-05, "loss": 2.4249, "step": 6625 }, { "epoch": 0.06, "learning_rate": 9.92345005552142e-05, "loss": 2.4426, "step": 6630 }, { "epoch": 0.06, "learning_rate": 9.923333083169212e-05, "loss": 2.4205, "step": 6635 }, { "epoch": 0.06, "learning_rate": 9.92321602220572e-05, "loss": 2.4925, "step": 6640 }, { "epoch": 0.06, "learning_rate": 9.923098872633047e-05, "loss": 2.4316, "step": 6645 }, { "epoch": 0.06, "learning_rate": 9.922981634453306e-05, "loss": 2.4849, "step": 6650 }, { "epoch": 0.06, "learning_rate": 9.922864307668607e-05, "loss": 2.4133, "step": 6655 }, { "epoch": 0.06, "learning_rate": 9.92274689228106e-05, "loss": 2.4213, "step": 6660 }, { "epoch": 0.06, "learning_rate": 9.922629388292779e-05, "loss": 2.4854, "step": 6665 }, { "epoch": 0.06, "learning_rate": 9.922511795705878e-05, "loss": 2.4657, "step": 6670 }, { "epoch": 0.06, "learning_rate": 9.922394114522474e-05, "loss": 2.4387, "step": 6675 }, { "epoch": 0.06, "learning_rate": 9.922276344744686e-05, "loss": 2.4945, "step": 6680 }, { "epoch": 0.06, "learning_rate": 9.92215848637463e-05, "loss": 2.4662, "step": 6685 }, { "epoch": 0.06, "learning_rate": 9.922040539414432e-05, "loss": 2.4611, "step": 6690 }, { "epoch": 0.06, "learning_rate": 9.921922503866213e-05, "loss": 2.4298, "step": 6695 }, { "epoch": 0.06, "learning_rate": 9.921804379732098e-05, "loss": 2.391, "step": 6700 }, { "epoch": 0.06, "learning_rate": 9.92168616701421e-05, "loss": 2.4475, "step": 6705 }, { "epoch": 0.06, "learning_rate": 9.92156786571468e-05, "loss": 2.4494, "step": 6710 }, { "epoch": 0.06, "learning_rate": 9.921449475835637e-05, "loss": 2.4147, "step": 6715 }, { "epoch": 0.06, "learning_rate": 9.92133099737921e-05, "loss": 2.4187, "step": 6720 }, { "epoch": 0.06, "learning_rate": 9.921212430347533e-05, "loss": 2.3859, "step": 6725 }, { "epoch": 0.06, "learning_rate": 9.921093774742739e-05, "loss": 2.5082, "step": 6730 }, { "epoch": 0.06, "learning_rate": 9.920975030566964e-05, "loss": 2.428, "step": 6735 }, { "epoch": 0.06, "learning_rate": 9.920856197822344e-05, "loss": 2.4607, "step": 6740 }, { "epoch": 0.06, "learning_rate": 9.92073727651102e-05, "loss": 2.4254, "step": 6745 }, { "epoch": 0.06, "learning_rate": 9.920618266635131e-05, "loss": 2.4895, "step": 6750 }, { "epoch": 0.06, "learning_rate": 9.92049916819682e-05, "loss": 2.4326, "step": 6755 }, { "epoch": 0.06, "learning_rate": 9.920379981198229e-05, "loss": 2.4243, "step": 6760 }, { "epoch": 0.06, "learning_rate": 9.920260705641503e-05, "loss": 2.4296, "step": 6765 }, { "epoch": 0.06, "learning_rate": 9.92014134152879e-05, "loss": 2.4611, "step": 6770 }, { "epoch": 0.06, "learning_rate": 9.92002188886224e-05, "loss": 2.4589, "step": 6775 }, { "epoch": 0.06, "learning_rate": 9.919902347643999e-05, "loss": 2.4636, "step": 6780 }, { "epoch": 0.06, "learning_rate": 9.919782717876222e-05, "loss": 2.5009, "step": 6785 }, { "epoch": 0.06, "learning_rate": 9.919662999561059e-05, "loss": 2.4426, "step": 6790 }, { "epoch": 0.06, "learning_rate": 9.919543192700667e-05, "loss": 2.4982, "step": 6795 }, { "epoch": 0.06, "learning_rate": 9.919423297297201e-05, "loss": 2.4713, "step": 6800 }, { "epoch": 0.06, "learning_rate": 9.919303313352821e-05, "loss": 2.4243, "step": 6805 }, { "epoch": 0.06, "learning_rate": 9.919183240869684e-05, "loss": 2.4586, "step": 6810 }, { "epoch": 0.06, "learning_rate": 9.919063079849953e-05, "loss": 2.4042, "step": 6815 }, { "epoch": 0.06, "learning_rate": 9.91894283029579e-05, "loss": 2.4338, "step": 6820 }, { "epoch": 0.06, "learning_rate": 9.918822492209356e-05, "loss": 2.4956, "step": 6825 }, { "epoch": 0.06, "learning_rate": 9.918702065592825e-05, "loss": 2.4467, "step": 6830 }, { "epoch": 0.06, "learning_rate": 9.918581550448356e-05, "loss": 2.4257, "step": 6835 }, { "epoch": 0.06, "learning_rate": 9.91846094677812e-05, "loss": 2.4247, "step": 6840 }, { "epoch": 0.06, "learning_rate": 9.918340254584293e-05, "loss": 2.4751, "step": 6845 }, { "epoch": 0.06, "learning_rate": 9.918219473869041e-05, "loss": 2.4472, "step": 6850 }, { "epoch": 0.06, "learning_rate": 9.918098604634543e-05, "loss": 2.4681, "step": 6855 }, { "epoch": 0.06, "learning_rate": 9.917977646882968e-05, "loss": 2.4137, "step": 6860 }, { "epoch": 0.06, "learning_rate": 9.9178566006165e-05, "loss": 2.3918, "step": 6865 }, { "epoch": 0.06, "learning_rate": 9.917735465837312e-05, "loss": 2.3674, "step": 6870 }, { "epoch": 0.06, "learning_rate": 9.917614242547587e-05, "loss": 2.4256, "step": 6875 }, { "epoch": 0.06, "learning_rate": 9.917492930749506e-05, "loss": 2.4339, "step": 6880 }, { "epoch": 0.06, "learning_rate": 9.917371530445255e-05, "loss": 2.4273, "step": 6885 }, { "epoch": 0.06, "learning_rate": 9.917250041637014e-05, "loss": 2.4974, "step": 6890 }, { "epoch": 0.06, "learning_rate": 9.917128464326973e-05, "loss": 2.4528, "step": 6895 }, { "epoch": 0.06, "learning_rate": 9.917006798517321e-05, "loss": 2.4452, "step": 6900 }, { "epoch": 0.06, "learning_rate": 9.916885044210245e-05, "loss": 2.464, "step": 6905 }, { "epoch": 0.06, "learning_rate": 9.916763201407937e-05, "loss": 2.4348, "step": 6910 }, { "epoch": 0.06, "learning_rate": 9.916641270112592e-05, "loss": 2.4063, "step": 6915 }, { "epoch": 0.06, "learning_rate": 9.916519250326401e-05, "loss": 2.4378, "step": 6920 }, { "epoch": 0.06, "learning_rate": 9.916397142051565e-05, "loss": 2.5193, "step": 6925 }, { "epoch": 0.06, "learning_rate": 9.916274945290278e-05, "loss": 2.4689, "step": 6930 }, { "epoch": 0.06, "learning_rate": 9.916152660044739e-05, "loss": 2.3915, "step": 6935 }, { "epoch": 0.06, "learning_rate": 9.916030286317152e-05, "loss": 2.4533, "step": 6940 }, { "epoch": 0.06, "learning_rate": 9.915907824109717e-05, "loss": 2.4765, "step": 6945 }, { "epoch": 0.06, "learning_rate": 9.915785273424639e-05, "loss": 2.4432, "step": 6950 }, { "epoch": 0.06, "learning_rate": 9.915662634264123e-05, "loss": 2.5034, "step": 6955 }, { "epoch": 0.06, "learning_rate": 9.915539906630377e-05, "loss": 2.4625, "step": 6960 }, { "epoch": 0.06, "learning_rate": 9.91541709052561e-05, "loss": 2.3877, "step": 6965 }, { "epoch": 0.06, "learning_rate": 9.915294185952032e-05, "loss": 2.4048, "step": 6970 }, { "epoch": 0.06, "learning_rate": 9.915171192911856e-05, "loss": 2.429, "step": 6975 }, { "epoch": 0.06, "learning_rate": 9.915048111407295e-05, "loss": 2.478, "step": 6980 }, { "epoch": 0.06, "learning_rate": 9.914924941440561e-05, "loss": 2.4087, "step": 6985 }, { "epoch": 0.06, "learning_rate": 9.914801683013877e-05, "loss": 2.5054, "step": 6990 }, { "epoch": 0.06, "learning_rate": 9.914678336129458e-05, "loss": 2.4352, "step": 6995 }, { "epoch": 0.06, "learning_rate": 9.914554900789526e-05, "loss": 2.5306, "step": 7000 }, { "epoch": 0.06, "learning_rate": 9.914431376996299e-05, "loss": 2.4678, "step": 7005 }, { "epoch": 0.06, "learning_rate": 9.914307764752003e-05, "loss": 2.4653, "step": 7010 }, { "epoch": 0.06, "learning_rate": 9.91418406405886e-05, "loss": 2.4034, "step": 7015 }, { "epoch": 0.06, "learning_rate": 9.914060274919102e-05, "loss": 2.4762, "step": 7020 }, { "epoch": 0.06, "learning_rate": 9.913936397334951e-05, "loss": 2.4855, "step": 7025 }, { "epoch": 0.06, "learning_rate": 9.91381243130864e-05, "loss": 2.3946, "step": 7030 }, { "epoch": 0.06, "learning_rate": 9.913688376842398e-05, "loss": 2.3666, "step": 7035 }, { "epoch": 0.06, "learning_rate": 9.91356423393846e-05, "loss": 2.5104, "step": 7040 }, { "epoch": 0.06, "learning_rate": 9.91344000259906e-05, "loss": 2.4667, "step": 7045 }, { "epoch": 0.06, "learning_rate": 9.913315682826431e-05, "loss": 2.4587, "step": 7050 }, { "epoch": 0.06, "learning_rate": 9.913191274622815e-05, "loss": 2.4989, "step": 7055 }, { "epoch": 0.06, "learning_rate": 9.913066777990447e-05, "loss": 2.4174, "step": 7060 }, { "epoch": 0.06, "learning_rate": 9.912942192931571e-05, "loss": 2.4302, "step": 7065 }, { "epoch": 0.06, "learning_rate": 9.912817519448429e-05, "loss": 2.5652, "step": 7070 }, { "epoch": 0.06, "learning_rate": 9.912692757543263e-05, "loss": 2.3711, "step": 7075 }, { "epoch": 0.06, "learning_rate": 9.912567907218318e-05, "loss": 2.4035, "step": 7080 }, { "epoch": 0.06, "learning_rate": 9.912442968475843e-05, "loss": 2.5142, "step": 7085 }, { "epoch": 0.06, "learning_rate": 9.912317941318088e-05, "loss": 2.3797, "step": 7090 }, { "epoch": 0.06, "learning_rate": 9.912192825747299e-05, "loss": 2.4487, "step": 7095 }, { "epoch": 0.06, "learning_rate": 9.912067621765732e-05, "loss": 2.3873, "step": 7100 }, { "epoch": 0.06, "learning_rate": 9.911942329375638e-05, "loss": 2.3714, "step": 7105 }, { "epoch": 0.06, "learning_rate": 9.911816948579273e-05, "loss": 2.438, "step": 7110 }, { "epoch": 0.06, "learning_rate": 9.911691479378893e-05, "loss": 2.3829, "step": 7115 }, { "epoch": 0.06, "learning_rate": 9.911565921776756e-05, "loss": 2.4185, "step": 7120 }, { "epoch": 0.06, "learning_rate": 9.911440275775124e-05, "loss": 2.4248, "step": 7125 }, { "epoch": 0.06, "learning_rate": 9.911314541376256e-05, "loss": 2.4258, "step": 7130 }, { "epoch": 0.06, "learning_rate": 9.911188718582415e-05, "loss": 2.4473, "step": 7135 }, { "epoch": 0.06, "learning_rate": 9.911062807395868e-05, "loss": 2.477, "step": 7140 }, { "epoch": 0.06, "learning_rate": 9.910936807818878e-05, "loss": 2.4828, "step": 7145 }, { "epoch": 0.06, "learning_rate": 9.910810719853714e-05, "loss": 2.3367, "step": 7150 }, { "epoch": 0.06, "learning_rate": 9.910684543502648e-05, "loss": 2.4832, "step": 7155 }, { "epoch": 0.06, "learning_rate": 9.910558278767948e-05, "loss": 2.4422, "step": 7160 }, { "epoch": 0.06, "learning_rate": 9.910431925651885e-05, "loss": 2.3847, "step": 7165 }, { "epoch": 0.06, "learning_rate": 9.910305484156737e-05, "loss": 2.5173, "step": 7170 }, { "epoch": 0.06, "learning_rate": 9.910178954284778e-05, "loss": 2.4451, "step": 7175 }, { "epoch": 0.06, "learning_rate": 9.910052336038285e-05, "loss": 2.3867, "step": 7180 }, { "epoch": 0.06, "learning_rate": 9.909925629419539e-05, "loss": 2.4724, "step": 7185 }, { "epoch": 0.06, "learning_rate": 9.909798834430817e-05, "loss": 2.4375, "step": 7190 }, { "epoch": 0.06, "learning_rate": 9.909671951074402e-05, "loss": 2.3961, "step": 7195 }, { "epoch": 0.06, "learning_rate": 9.90954497935258e-05, "loss": 2.4542, "step": 7200 }, { "epoch": 0.06, "learning_rate": 9.909417919267635e-05, "loss": 2.4767, "step": 7205 }, { "epoch": 0.06, "learning_rate": 9.909290770821853e-05, "loss": 2.3785, "step": 7210 }, { "epoch": 0.06, "learning_rate": 9.909163534017522e-05, "loss": 2.4051, "step": 7215 }, { "epoch": 0.06, "learning_rate": 9.909036208856936e-05, "loss": 2.5206, "step": 7220 }, { "epoch": 0.06, "learning_rate": 9.908908795342383e-05, "loss": 2.4968, "step": 7225 }, { "epoch": 0.06, "learning_rate": 9.908781293476155e-05, "loss": 2.4324, "step": 7230 }, { "epoch": 0.06, "learning_rate": 9.90865370326055e-05, "loss": 2.4902, "step": 7235 }, { "epoch": 0.06, "learning_rate": 9.908526024697863e-05, "loss": 2.3838, "step": 7240 }, { "epoch": 0.06, "learning_rate": 9.908398257790393e-05, "loss": 2.4042, "step": 7245 }, { "epoch": 0.06, "learning_rate": 9.908270402540438e-05, "loss": 2.3776, "step": 7250 }, { "epoch": 0.06, "learning_rate": 9.9081424589503e-05, "loss": 2.4638, "step": 7255 }, { "epoch": 0.06, "learning_rate": 9.908014427022281e-05, "loss": 2.4695, "step": 7260 }, { "epoch": 0.06, "learning_rate": 9.907886306758687e-05, "loss": 2.5086, "step": 7265 }, { "epoch": 0.06, "learning_rate": 9.907758098161823e-05, "loss": 2.4267, "step": 7270 }, { "epoch": 0.06, "learning_rate": 9.907629801233996e-05, "loss": 2.3907, "step": 7275 }, { "epoch": 0.06, "learning_rate": 9.907501415977515e-05, "loss": 2.4039, "step": 7280 }, { "epoch": 0.06, "learning_rate": 9.907372942394692e-05, "loss": 2.448, "step": 7285 }, { "epoch": 0.06, "learning_rate": 9.907244380487839e-05, "loss": 2.4244, "step": 7290 }, { "epoch": 0.06, "learning_rate": 9.907115730259269e-05, "loss": 2.3829, "step": 7295 }, { "epoch": 0.06, "learning_rate": 9.906986991711299e-05, "loss": 2.4011, "step": 7300 }, { "epoch": 0.06, "learning_rate": 9.906858164846245e-05, "loss": 2.3544, "step": 7305 }, { "epoch": 0.06, "learning_rate": 9.906729249666424e-05, "loss": 2.407, "step": 7310 }, { "epoch": 0.06, "learning_rate": 9.906600246174157e-05, "loss": 2.4615, "step": 7315 }, { "epoch": 0.06, "learning_rate": 9.90647115437177e-05, "loss": 2.4483, "step": 7320 }, { "epoch": 0.06, "learning_rate": 9.906341974261582e-05, "loss": 2.3256, "step": 7325 }, { "epoch": 0.06, "learning_rate": 9.90621270584592e-05, "loss": 2.4272, "step": 7330 }, { "epoch": 0.06, "learning_rate": 9.906083349127108e-05, "loss": 2.4759, "step": 7335 }, { "epoch": 0.06, "learning_rate": 9.905953904107477e-05, "loss": 2.3644, "step": 7340 }, { "epoch": 0.06, "learning_rate": 9.905824370789356e-05, "loss": 2.3967, "step": 7345 }, { "epoch": 0.06, "learning_rate": 9.905694749175076e-05, "loss": 2.54, "step": 7350 }, { "epoch": 0.06, "learning_rate": 9.905565039266971e-05, "loss": 2.3771, "step": 7355 }, { "epoch": 0.06, "learning_rate": 9.905435241067374e-05, "loss": 2.4145, "step": 7360 }, { "epoch": 0.06, "learning_rate": 9.90530535457862e-05, "loss": 2.4152, "step": 7365 }, { "epoch": 0.06, "learning_rate": 9.905175379803052e-05, "loss": 2.4751, "step": 7370 }, { "epoch": 0.06, "learning_rate": 9.905045316743002e-05, "loss": 2.3973, "step": 7375 }, { "epoch": 0.06, "learning_rate": 9.904915165400816e-05, "loss": 2.3981, "step": 7380 }, { "epoch": 0.06, "learning_rate": 9.904784925778838e-05, "loss": 2.4148, "step": 7385 }, { "epoch": 0.06, "learning_rate": 9.904654597879406e-05, "loss": 2.4364, "step": 7390 }, { "epoch": 0.06, "learning_rate": 9.904524181704871e-05, "loss": 2.4864, "step": 7395 }, { "epoch": 0.06, "learning_rate": 9.904393677257578e-05, "loss": 2.4029, "step": 7400 }, { "epoch": 0.06, "learning_rate": 9.904263084539875e-05, "loss": 2.3669, "step": 7405 }, { "epoch": 0.06, "learning_rate": 9.904132403554113e-05, "loss": 2.4851, "step": 7410 }, { "epoch": 0.06, "learning_rate": 9.904001634302646e-05, "loss": 2.4353, "step": 7415 }, { "epoch": 0.06, "learning_rate": 9.903870776787826e-05, "loss": 2.4874, "step": 7420 }, { "epoch": 0.06, "learning_rate": 9.903739831012008e-05, "loss": 2.3323, "step": 7425 }, { "epoch": 0.06, "learning_rate": 9.90360879697755e-05, "loss": 2.4368, "step": 7430 }, { "epoch": 0.06, "learning_rate": 9.903477674686809e-05, "loss": 2.3406, "step": 7435 }, { "epoch": 0.06, "learning_rate": 9.903346464142147e-05, "loss": 2.4752, "step": 7440 }, { "epoch": 0.06, "learning_rate": 9.903215165345922e-05, "loss": 2.4248, "step": 7445 }, { "epoch": 0.06, "learning_rate": 9.903083778300502e-05, "loss": 2.4632, "step": 7450 }, { "epoch": 0.06, "learning_rate": 9.902952303008246e-05, "loss": 2.3812, "step": 7455 }, { "epoch": 0.06, "learning_rate": 9.902820739471524e-05, "loss": 2.4311, "step": 7460 }, { "epoch": 0.06, "learning_rate": 9.902689087692704e-05, "loss": 2.5028, "step": 7465 }, { "epoch": 0.06, "learning_rate": 9.902557347674154e-05, "loss": 2.4561, "step": 7470 }, { "epoch": 0.06, "learning_rate": 9.902425519418246e-05, "loss": 2.327, "step": 7475 }, { "epoch": 0.06, "learning_rate": 9.902293602927353e-05, "loss": 2.3737, "step": 7480 }, { "epoch": 0.06, "learning_rate": 9.902161598203847e-05, "loss": 2.4764, "step": 7485 }, { "epoch": 0.06, "learning_rate": 9.902029505250108e-05, "loss": 2.4503, "step": 7490 }, { "epoch": 0.06, "learning_rate": 9.90189732406851e-05, "loss": 2.4076, "step": 7495 }, { "epoch": 0.06, "learning_rate": 9.901765054661433e-05, "loss": 2.465, "step": 7500 }, { "epoch": 0.06, "learning_rate": 9.901632697031258e-05, "loss": 2.4436, "step": 7505 }, { "epoch": 0.06, "learning_rate": 9.901500251180367e-05, "loss": 2.4662, "step": 7510 }, { "epoch": 0.06, "learning_rate": 9.901367717111143e-05, "loss": 2.4085, "step": 7515 }, { "epoch": 0.06, "learning_rate": 9.901235094825972e-05, "loss": 2.4566, "step": 7520 }, { "epoch": 0.06, "learning_rate": 9.901102384327241e-05, "loss": 2.3983, "step": 7525 }, { "epoch": 0.06, "learning_rate": 9.90096958561734e-05, "loss": 2.4374, "step": 7530 }, { "epoch": 0.06, "learning_rate": 9.900836698698656e-05, "loss": 2.4255, "step": 7535 }, { "epoch": 0.06, "learning_rate": 9.900703723573583e-05, "loss": 2.4597, "step": 7540 }, { "epoch": 0.06, "learning_rate": 9.900570660244513e-05, "loss": 2.4153, "step": 7545 }, { "epoch": 0.06, "learning_rate": 9.900437508713842e-05, "loss": 2.4597, "step": 7550 }, { "epoch": 0.06, "learning_rate": 9.900304268983966e-05, "loss": 2.3328, "step": 7555 }, { "epoch": 0.06, "learning_rate": 9.900170941057286e-05, "loss": 2.4488, "step": 7560 }, { "epoch": 0.06, "learning_rate": 9.900037524936196e-05, "loss": 2.3786, "step": 7565 }, { "epoch": 0.06, "learning_rate": 9.899904020623101e-05, "loss": 2.4745, "step": 7570 }, { "epoch": 0.06, "learning_rate": 9.899770428120404e-05, "loss": 2.3663, "step": 7575 }, { "epoch": 0.06, "learning_rate": 9.899636747430505e-05, "loss": 2.4221, "step": 7580 }, { "epoch": 0.06, "learning_rate": 9.899502978555817e-05, "loss": 2.3673, "step": 7585 }, { "epoch": 0.06, "learning_rate": 9.899369121498743e-05, "loss": 2.4635, "step": 7590 }, { "epoch": 0.06, "learning_rate": 9.899235176261692e-05, "loss": 2.457, "step": 7595 }, { "epoch": 0.06, "learning_rate": 9.899101142847079e-05, "loss": 2.2306, "step": 7600 }, { "epoch": 0.06, "learning_rate": 9.89896702125731e-05, "loss": 2.3988, "step": 7605 }, { "epoch": 0.06, "learning_rate": 9.898832811494802e-05, "loss": 2.4048, "step": 7610 }, { "epoch": 0.06, "learning_rate": 9.898698513561974e-05, "loss": 2.3851, "step": 7615 }, { "epoch": 0.07, "learning_rate": 9.898564127461238e-05, "loss": 2.4035, "step": 7620 }, { "epoch": 0.07, "learning_rate": 9.898429653195016e-05, "loss": 2.3607, "step": 7625 }, { "epoch": 0.07, "learning_rate": 9.898295090765726e-05, "loss": 2.4102, "step": 7630 }, { "epoch": 0.07, "learning_rate": 9.898160440175791e-05, "loss": 2.4178, "step": 7635 }, { "epoch": 0.07, "learning_rate": 9.898025701427635e-05, "loss": 2.4656, "step": 7640 }, { "epoch": 0.07, "learning_rate": 9.89789087452368e-05, "loss": 2.4577, "step": 7645 }, { "epoch": 0.07, "learning_rate": 9.897755959466359e-05, "loss": 2.4219, "step": 7650 }, { "epoch": 0.07, "learning_rate": 9.897620956258093e-05, "loss": 2.4545, "step": 7655 }, { "epoch": 0.07, "learning_rate": 9.897485864901317e-05, "loss": 2.4926, "step": 7660 }, { "epoch": 0.07, "learning_rate": 9.897350685398461e-05, "loss": 2.3983, "step": 7665 }, { "epoch": 0.07, "learning_rate": 9.897215417751955e-05, "loss": 2.4432, "step": 7670 }, { "epoch": 0.07, "learning_rate": 9.897080061964238e-05, "loss": 2.3918, "step": 7675 }, { "epoch": 0.07, "learning_rate": 9.896944618037744e-05, "loss": 2.3926, "step": 7680 }, { "epoch": 0.07, "learning_rate": 9.89680908597491e-05, "loss": 2.4039, "step": 7685 }, { "epoch": 0.07, "learning_rate": 9.896673465778178e-05, "loss": 2.4328, "step": 7690 }, { "epoch": 0.07, "learning_rate": 9.896537757449986e-05, "loss": 2.4807, "step": 7695 }, { "epoch": 0.07, "learning_rate": 9.896401960992779e-05, "loss": 2.4525, "step": 7700 }, { "epoch": 0.07, "learning_rate": 9.896266076408997e-05, "loss": 2.487, "step": 7705 }, { "epoch": 0.07, "learning_rate": 9.896130103701093e-05, "loss": 2.4335, "step": 7710 }, { "epoch": 0.07, "learning_rate": 9.895994042871506e-05, "loss": 2.4126, "step": 7715 }, { "epoch": 0.07, "learning_rate": 9.89585789392269e-05, "loss": 2.4504, "step": 7720 }, { "epoch": 0.07, "learning_rate": 9.895721656857096e-05, "loss": 2.4006, "step": 7725 }, { "epoch": 0.07, "learning_rate": 9.895585331677171e-05, "loss": 2.425, "step": 7730 }, { "epoch": 0.07, "learning_rate": 9.895448918385373e-05, "loss": 2.3487, "step": 7735 }, { "epoch": 0.07, "learning_rate": 9.895312416984156e-05, "loss": 2.4082, "step": 7740 }, { "epoch": 0.07, "learning_rate": 9.895175827475978e-05, "loss": 2.4546, "step": 7745 }, { "epoch": 0.07, "learning_rate": 9.895039149863294e-05, "loss": 2.4241, "step": 7750 }, { "epoch": 0.07, "learning_rate": 9.894902384148566e-05, "loss": 2.3472, "step": 7755 }, { "epoch": 0.07, "learning_rate": 9.894765530334258e-05, "loss": 2.3834, "step": 7760 }, { "epoch": 0.07, "learning_rate": 9.894628588422829e-05, "loss": 2.461, "step": 7765 }, { "epoch": 0.07, "learning_rate": 9.894491558416745e-05, "loss": 2.4738, "step": 7770 }, { "epoch": 0.07, "learning_rate": 9.894354440318474e-05, "loss": 2.4082, "step": 7775 }, { "epoch": 0.07, "learning_rate": 9.894217234130483e-05, "loss": 2.3122, "step": 7780 }, { "epoch": 0.07, "learning_rate": 9.894079939855238e-05, "loss": 2.4654, "step": 7785 }, { "epoch": 0.07, "learning_rate": 9.893942557495217e-05, "loss": 2.4127, "step": 7790 }, { "epoch": 0.07, "learning_rate": 9.893805087052887e-05, "loss": 2.4879, "step": 7795 }, { "epoch": 0.07, "learning_rate": 9.893667528530724e-05, "loss": 2.4294, "step": 7800 }, { "epoch": 0.07, "learning_rate": 9.893529881931204e-05, "loss": 2.4142, "step": 7805 }, { "epoch": 0.07, "learning_rate": 9.893392147256803e-05, "loss": 2.4581, "step": 7810 }, { "epoch": 0.07, "learning_rate": 9.893254324510003e-05, "loss": 2.4802, "step": 7815 }, { "epoch": 0.07, "learning_rate": 9.893116413693282e-05, "loss": 2.4432, "step": 7820 }, { "epoch": 0.07, "learning_rate": 9.892978414809123e-05, "loss": 2.4889, "step": 7825 }, { "epoch": 0.07, "learning_rate": 9.89284032786001e-05, "loss": 2.4662, "step": 7830 }, { "epoch": 0.07, "learning_rate": 9.892702152848427e-05, "loss": 2.3678, "step": 7835 }, { "epoch": 0.07, "learning_rate": 9.892563889776863e-05, "loss": 2.3845, "step": 7840 }, { "epoch": 0.07, "learning_rate": 9.892425538647805e-05, "loss": 2.4136, "step": 7845 }, { "epoch": 0.07, "learning_rate": 9.892287099463744e-05, "loss": 2.369, "step": 7850 }, { "epoch": 0.07, "learning_rate": 9.892148572227169e-05, "loss": 2.3611, "step": 7855 }, { "epoch": 0.07, "learning_rate": 9.892009956940578e-05, "loss": 2.4691, "step": 7860 }, { "epoch": 0.07, "learning_rate": 9.891871253606462e-05, "loss": 2.4041, "step": 7865 }, { "epoch": 0.07, "learning_rate": 9.891732462227318e-05, "loss": 2.44, "step": 7870 }, { "epoch": 0.07, "learning_rate": 9.891593582805644e-05, "loss": 2.3848, "step": 7875 }, { "epoch": 0.07, "learning_rate": 9.891454615343943e-05, "loss": 2.4252, "step": 7880 }, { "epoch": 0.07, "learning_rate": 9.891315559844711e-05, "loss": 2.4575, "step": 7885 }, { "epoch": 0.07, "learning_rate": 9.891176416310454e-05, "loss": 2.3919, "step": 7890 }, { "epoch": 0.07, "learning_rate": 9.891037184743674e-05, "loss": 2.5117, "step": 7895 }, { "epoch": 0.07, "learning_rate": 9.890897865146879e-05, "loss": 2.3382, "step": 7900 }, { "epoch": 0.07, "learning_rate": 9.890758457522577e-05, "loss": 2.4209, "step": 7905 }, { "epoch": 0.07, "learning_rate": 9.890618961873276e-05, "loss": 2.4604, "step": 7910 }, { "epoch": 0.07, "learning_rate": 9.890479378201486e-05, "loss": 2.3736, "step": 7915 }, { "epoch": 0.07, "learning_rate": 9.890339706509719e-05, "loss": 2.4393, "step": 7920 }, { "epoch": 0.07, "learning_rate": 9.890199946800491e-05, "loss": 2.4002, "step": 7925 }, { "epoch": 0.07, "learning_rate": 9.890060099076316e-05, "loss": 2.4227, "step": 7930 }, { "epoch": 0.07, "learning_rate": 9.88992016333971e-05, "loss": 2.4849, "step": 7935 }, { "epoch": 0.07, "learning_rate": 9.889780139593194e-05, "loss": 2.4213, "step": 7940 }, { "epoch": 0.07, "learning_rate": 9.889640027839287e-05, "loss": 2.4331, "step": 7945 }, { "epoch": 0.07, "learning_rate": 9.889499828080511e-05, "loss": 2.4566, "step": 7950 }, { "epoch": 0.07, "learning_rate": 9.889359540319387e-05, "loss": 2.4716, "step": 7955 }, { "epoch": 0.07, "learning_rate": 9.889219164558443e-05, "loss": 2.4375, "step": 7960 }, { "epoch": 0.07, "learning_rate": 9.889078700800205e-05, "loss": 2.4669, "step": 7965 }, { "epoch": 0.07, "learning_rate": 9.8889381490472e-05, "loss": 2.3799, "step": 7970 }, { "epoch": 0.07, "learning_rate": 9.88879750930196e-05, "loss": 2.4905, "step": 7975 }, { "epoch": 0.07, "learning_rate": 9.888656781567012e-05, "loss": 2.4944, "step": 7980 }, { "epoch": 0.07, "learning_rate": 9.888515965844894e-05, "loss": 2.4555, "step": 7985 }, { "epoch": 0.07, "learning_rate": 9.888375062138136e-05, "loss": 2.4932, "step": 7990 }, { "epoch": 0.07, "learning_rate": 9.888234070449276e-05, "loss": 2.4366, "step": 7995 }, { "epoch": 0.07, "learning_rate": 9.888092990780851e-05, "loss": 2.4055, "step": 8000 }, { "epoch": 0.07, "learning_rate": 9.887951823135402e-05, "loss": 2.3995, "step": 8005 }, { "epoch": 0.07, "learning_rate": 9.887810567515467e-05, "loss": 2.5156, "step": 8010 }, { "epoch": 0.07, "learning_rate": 9.887669223923591e-05, "loss": 2.4214, "step": 8015 }, { "epoch": 0.07, "learning_rate": 9.887527792362317e-05, "loss": 2.4671, "step": 8020 }, { "epoch": 0.07, "learning_rate": 9.887386272834189e-05, "loss": 2.4883, "step": 8025 }, { "epoch": 0.07, "learning_rate": 9.887244665341756e-05, "loss": 2.4296, "step": 8030 }, { "epoch": 0.07, "learning_rate": 9.887102969887565e-05, "loss": 2.4865, "step": 8035 }, { "epoch": 0.07, "learning_rate": 9.886961186474169e-05, "loss": 2.4458, "step": 8040 }, { "epoch": 0.07, "learning_rate": 9.886819315104117e-05, "loss": 2.3901, "step": 8045 }, { "epoch": 0.07, "learning_rate": 9.886677355779963e-05, "loss": 2.3808, "step": 8050 }, { "epoch": 0.07, "learning_rate": 9.886535308504263e-05, "loss": 2.4549, "step": 8055 }, { "epoch": 0.07, "learning_rate": 9.886393173279574e-05, "loss": 2.3955, "step": 8060 }, { "epoch": 0.07, "learning_rate": 9.886250950108453e-05, "loss": 2.4327, "step": 8065 }, { "epoch": 0.07, "learning_rate": 9.886108638993458e-05, "loss": 2.3917, "step": 8070 }, { "epoch": 0.07, "learning_rate": 9.885966239937156e-05, "loss": 2.424, "step": 8075 }, { "epoch": 0.07, "learning_rate": 9.885823752942105e-05, "loss": 2.4148, "step": 8080 }, { "epoch": 0.07, "learning_rate": 9.88568117801087e-05, "loss": 2.4093, "step": 8085 }, { "epoch": 0.07, "learning_rate": 9.885538515146018e-05, "loss": 2.4202, "step": 8090 }, { "epoch": 0.07, "learning_rate": 9.885395764350118e-05, "loss": 2.3931, "step": 8095 }, { "epoch": 0.07, "learning_rate": 9.885252925625736e-05, "loss": 2.4386, "step": 8100 }, { "epoch": 0.07, "learning_rate": 9.885109998975447e-05, "loss": 2.3407, "step": 8105 }, { "epoch": 0.07, "learning_rate": 9.88496698440182e-05, "loss": 2.3846, "step": 8110 }, { "epoch": 0.07, "learning_rate": 9.88482388190743e-05, "loss": 2.3427, "step": 8115 }, { "epoch": 0.07, "learning_rate": 9.884680691494854e-05, "loss": 2.411, "step": 8120 }, { "epoch": 0.07, "learning_rate": 9.884537413166667e-05, "loss": 2.3473, "step": 8125 }, { "epoch": 0.07, "learning_rate": 9.884394046925449e-05, "loss": 2.4088, "step": 8130 }, { "epoch": 0.07, "learning_rate": 9.88425059277378e-05, "loss": 2.3433, "step": 8135 }, { "epoch": 0.07, "learning_rate": 9.884107050714241e-05, "loss": 2.4338, "step": 8140 }, { "epoch": 0.07, "learning_rate": 9.883963420749419e-05, "loss": 2.4612, "step": 8145 }, { "epoch": 0.07, "learning_rate": 9.883819702881895e-05, "loss": 2.3858, "step": 8150 }, { "epoch": 0.07, "learning_rate": 9.883675897114258e-05, "loss": 2.4073, "step": 8155 }, { "epoch": 0.07, "learning_rate": 9.883532003449094e-05, "loss": 2.415, "step": 8160 }, { "epoch": 0.07, "learning_rate": 9.883388021888996e-05, "loss": 2.4339, "step": 8165 }, { "epoch": 0.07, "learning_rate": 9.883243952436552e-05, "loss": 2.3772, "step": 8170 }, { "epoch": 0.07, "learning_rate": 9.883099795094358e-05, "loss": 2.4198, "step": 8175 }, { "epoch": 0.07, "learning_rate": 9.882955549865007e-05, "loss": 2.4842, "step": 8180 }, { "epoch": 0.07, "learning_rate": 9.882811216751095e-05, "loss": 2.3105, "step": 8185 }, { "epoch": 0.07, "learning_rate": 9.88266679575522e-05, "loss": 2.4285, "step": 8190 }, { "epoch": 0.07, "learning_rate": 9.882522286879982e-05, "loss": 2.4016, "step": 8195 }, { "epoch": 0.07, "learning_rate": 9.882377690127981e-05, "loss": 2.4077, "step": 8200 }, { "epoch": 0.07, "learning_rate": 9.882233005501823e-05, "loss": 2.5048, "step": 8205 }, { "epoch": 0.07, "learning_rate": 9.882088233004105e-05, "loss": 2.381, "step": 8210 }, { "epoch": 0.07, "learning_rate": 9.881943372637439e-05, "loss": 2.4484, "step": 8215 }, { "epoch": 0.07, "learning_rate": 9.88179842440443e-05, "loss": 2.4494, "step": 8220 }, { "epoch": 0.07, "learning_rate": 9.881653388307685e-05, "loss": 2.4292, "step": 8225 }, { "epoch": 0.07, "learning_rate": 9.881508264349817e-05, "loss": 2.3964, "step": 8230 }, { "epoch": 0.07, "learning_rate": 9.881363052533437e-05, "loss": 2.4401, "step": 8235 }, { "epoch": 0.07, "learning_rate": 9.881217752861158e-05, "loss": 2.3734, "step": 8240 }, { "epoch": 0.07, "learning_rate": 9.881072365335597e-05, "loss": 2.3745, "step": 8245 }, { "epoch": 0.07, "learning_rate": 9.88092688995937e-05, "loss": 2.4524, "step": 8250 }, { "epoch": 0.07, "learning_rate": 9.880781326735093e-05, "loss": 2.3812, "step": 8255 }, { "epoch": 0.07, "learning_rate": 9.880635675665388e-05, "loss": 2.3732, "step": 8260 }, { "epoch": 0.07, "learning_rate": 9.880489936752877e-05, "loss": 2.4464, "step": 8265 }, { "epoch": 0.07, "learning_rate": 9.880344110000182e-05, "loss": 2.3648, "step": 8270 }, { "epoch": 0.07, "learning_rate": 9.880198195409927e-05, "loss": 2.3914, "step": 8275 }, { "epoch": 0.07, "learning_rate": 9.88005219298474e-05, "loss": 2.4558, "step": 8280 }, { "epoch": 0.07, "learning_rate": 9.879906102727246e-05, "loss": 2.4848, "step": 8285 }, { "epoch": 0.07, "learning_rate": 9.879759924640077e-05, "loss": 2.4561, "step": 8290 }, { "epoch": 0.07, "learning_rate": 9.879613658725864e-05, "loss": 2.438, "step": 8295 }, { "epoch": 0.07, "learning_rate": 9.879467304987238e-05, "loss": 2.4498, "step": 8300 }, { "epoch": 0.07, "learning_rate": 9.879320863426834e-05, "loss": 2.4099, "step": 8305 }, { "epoch": 0.07, "learning_rate": 9.879174334047286e-05, "loss": 2.44, "step": 8310 }, { "epoch": 0.07, "learning_rate": 9.879027716851234e-05, "loss": 2.4806, "step": 8315 }, { "epoch": 0.07, "learning_rate": 9.878881011841314e-05, "loss": 2.4429, "step": 8320 }, { "epoch": 0.07, "learning_rate": 9.87873421902017e-05, "loss": 2.4553, "step": 8325 }, { "epoch": 0.07, "learning_rate": 9.878587338390442e-05, "loss": 2.3353, "step": 8330 }, { "epoch": 0.07, "learning_rate": 9.878440369954772e-05, "loss": 2.4289, "step": 8335 }, { "epoch": 0.07, "learning_rate": 9.878293313715807e-05, "loss": 2.4189, "step": 8340 }, { "epoch": 0.07, "learning_rate": 9.878146169676195e-05, "loss": 2.416, "step": 8345 }, { "epoch": 0.07, "learning_rate": 9.877998937838582e-05, "loss": 2.3731, "step": 8350 }, { "epoch": 0.07, "learning_rate": 9.877851618205619e-05, "loss": 2.4791, "step": 8355 }, { "epoch": 0.07, "learning_rate": 9.877704210779954e-05, "loss": 2.4169, "step": 8360 }, { "epoch": 0.07, "learning_rate": 9.877556715564247e-05, "loss": 2.4005, "step": 8365 }, { "epoch": 0.07, "learning_rate": 9.877409132561149e-05, "loss": 2.3851, "step": 8370 }, { "epoch": 0.07, "learning_rate": 9.877261461773315e-05, "loss": 2.4117, "step": 8375 }, { "epoch": 0.07, "learning_rate": 9.877113703203403e-05, "loss": 2.4876, "step": 8380 }, { "epoch": 0.07, "learning_rate": 9.876965856854074e-05, "loss": 2.412, "step": 8385 }, { "epoch": 0.07, "learning_rate": 9.87681792272799e-05, "loss": 2.3803, "step": 8390 }, { "epoch": 0.07, "learning_rate": 9.876669900827811e-05, "loss": 2.4114, "step": 8395 }, { "epoch": 0.07, "learning_rate": 9.876521791156201e-05, "loss": 2.3834, "step": 8400 }, { "epoch": 0.07, "learning_rate": 9.876373593715829e-05, "loss": 2.4193, "step": 8405 }, { "epoch": 0.07, "learning_rate": 9.876225308509357e-05, "loss": 2.4479, "step": 8410 }, { "epoch": 0.07, "learning_rate": 9.876076935539459e-05, "loss": 2.4037, "step": 8415 }, { "epoch": 0.07, "learning_rate": 9.875928474808803e-05, "loss": 2.3356, "step": 8420 }, { "epoch": 0.07, "learning_rate": 9.875779926320062e-05, "loss": 2.4212, "step": 8425 }, { "epoch": 0.07, "learning_rate": 9.875631290075907e-05, "loss": 2.4616, "step": 8430 }, { "epoch": 0.07, "learning_rate": 9.875482566079017e-05, "loss": 2.4363, "step": 8435 }, { "epoch": 0.07, "learning_rate": 9.875333754332067e-05, "loss": 2.4231, "step": 8440 }, { "epoch": 0.07, "learning_rate": 9.875184854837735e-05, "loss": 2.4989, "step": 8445 }, { "epoch": 0.07, "learning_rate": 9.875035867598701e-05, "loss": 2.3886, "step": 8450 }, { "epoch": 0.07, "learning_rate": 9.874886792617646e-05, "loss": 2.4394, "step": 8455 }, { "epoch": 0.07, "learning_rate": 9.874737629897255e-05, "loss": 2.4551, "step": 8460 }, { "epoch": 0.07, "learning_rate": 9.87458837944021e-05, "loss": 2.4052, "step": 8465 }, { "epoch": 0.07, "learning_rate": 9.874439041249201e-05, "loss": 2.3717, "step": 8470 }, { "epoch": 0.07, "learning_rate": 9.874289615326913e-05, "loss": 2.4055, "step": 8475 }, { "epoch": 0.07, "learning_rate": 9.874140101676035e-05, "loss": 2.3385, "step": 8480 }, { "epoch": 0.07, "learning_rate": 9.87399050029926e-05, "loss": 2.4112, "step": 8485 }, { "epoch": 0.07, "learning_rate": 9.873840811199277e-05, "loss": 2.4524, "step": 8490 }, { "epoch": 0.07, "learning_rate": 9.873691034378784e-05, "loss": 2.392, "step": 8495 }, { "epoch": 0.07, "learning_rate": 9.873541169840476e-05, "loss": 2.4074, "step": 8500 }, { "epoch": 0.07, "learning_rate": 9.873391217587051e-05, "loss": 2.4332, "step": 8505 }, { "epoch": 0.07, "learning_rate": 9.873241177621205e-05, "loss": 2.4682, "step": 8510 }, { "epoch": 0.07, "learning_rate": 9.87309104994564e-05, "loss": 2.4082, "step": 8515 }, { "epoch": 0.07, "learning_rate": 9.872940834563058e-05, "loss": 2.4075, "step": 8520 }, { "epoch": 0.07, "learning_rate": 9.872790531476164e-05, "loss": 2.3573, "step": 8525 }, { "epoch": 0.07, "learning_rate": 9.872640140687659e-05, "loss": 2.3431, "step": 8530 }, { "epoch": 0.07, "learning_rate": 9.872489662200255e-05, "loss": 2.4715, "step": 8535 }, { "epoch": 0.07, "learning_rate": 9.872339096016657e-05, "loss": 2.4436, "step": 8540 }, { "epoch": 0.07, "learning_rate": 9.872188442139576e-05, "loss": 2.4631, "step": 8545 }, { "epoch": 0.07, "learning_rate": 9.872037700571723e-05, "loss": 2.4276, "step": 8550 }, { "epoch": 0.07, "learning_rate": 9.871886871315812e-05, "loss": 2.423, "step": 8555 }, { "epoch": 0.07, "learning_rate": 9.871735954374556e-05, "loss": 2.4825, "step": 8560 }, { "epoch": 0.07, "learning_rate": 9.871584949750674e-05, "loss": 2.399, "step": 8565 }, { "epoch": 0.07, "learning_rate": 9.871433857446881e-05, "loss": 2.4072, "step": 8570 }, { "epoch": 0.07, "learning_rate": 9.871282677465899e-05, "loss": 2.4883, "step": 8575 }, { "epoch": 0.07, "learning_rate": 9.871131409810446e-05, "loss": 2.3092, "step": 8580 }, { "epoch": 0.07, "learning_rate": 9.870980054483247e-05, "loss": 2.403, "step": 8585 }, { "epoch": 0.07, "learning_rate": 9.870828611487024e-05, "loss": 2.4175, "step": 8590 }, { "epoch": 0.07, "learning_rate": 9.870677080824506e-05, "loss": 2.4541, "step": 8595 }, { "epoch": 0.07, "learning_rate": 9.870525462498417e-05, "loss": 2.3895, "step": 8600 }, { "epoch": 0.07, "learning_rate": 9.870373756511487e-05, "loss": 2.3935, "step": 8605 }, { "epoch": 0.07, "learning_rate": 9.870221962866446e-05, "loss": 2.3662, "step": 8610 }, { "epoch": 0.07, "learning_rate": 9.870070081566028e-05, "loss": 2.4289, "step": 8615 }, { "epoch": 0.07, "learning_rate": 9.869918112612964e-05, "loss": 2.4532, "step": 8620 }, { "epoch": 0.07, "learning_rate": 9.86976605600999e-05, "loss": 2.4139, "step": 8625 }, { "epoch": 0.07, "learning_rate": 9.869613911759843e-05, "loss": 2.4308, "step": 8630 }, { "epoch": 0.07, "learning_rate": 9.869461679865261e-05, "loss": 2.3695, "step": 8635 }, { "epoch": 0.07, "learning_rate": 9.869309360328987e-05, "loss": 2.3654, "step": 8640 }, { "epoch": 0.07, "learning_rate": 9.869156953153758e-05, "loss": 2.4002, "step": 8645 }, { "epoch": 0.07, "learning_rate": 9.869004458342317e-05, "loss": 2.4084, "step": 8650 }, { "epoch": 0.07, "learning_rate": 9.868851875897412e-05, "loss": 2.482, "step": 8655 }, { "epoch": 0.07, "learning_rate": 9.868699205821788e-05, "loss": 2.4479, "step": 8660 }, { "epoch": 0.07, "learning_rate": 9.868546448118192e-05, "loss": 2.4019, "step": 8665 }, { "epoch": 0.07, "learning_rate": 9.868393602789375e-05, "loss": 2.3979, "step": 8670 }, { "epoch": 0.07, "learning_rate": 9.868240669838085e-05, "loss": 2.419, "step": 8675 }, { "epoch": 0.07, "learning_rate": 9.868087649267077e-05, "loss": 2.4937, "step": 8680 }, { "epoch": 0.07, "learning_rate": 9.867934541079104e-05, "loss": 2.437, "step": 8685 }, { "epoch": 0.07, "learning_rate": 9.867781345276923e-05, "loss": 2.5001, "step": 8690 }, { "epoch": 0.07, "learning_rate": 9.867628061863289e-05, "loss": 2.3726, "step": 8695 }, { "epoch": 0.07, "learning_rate": 9.867474690840964e-05, "loss": 2.4097, "step": 8700 }, { "epoch": 0.07, "learning_rate": 9.867321232212705e-05, "loss": 2.4855, "step": 8705 }, { "epoch": 0.07, "learning_rate": 9.867167685981276e-05, "loss": 2.4638, "step": 8710 }, { "epoch": 0.07, "learning_rate": 9.867014052149441e-05, "loss": 2.4115, "step": 8715 }, { "epoch": 0.07, "learning_rate": 9.866860330719963e-05, "loss": 2.3774, "step": 8720 }, { "epoch": 0.07, "learning_rate": 9.86670652169561e-05, "loss": 2.3689, "step": 8725 }, { "epoch": 0.07, "learning_rate": 9.866552625079151e-05, "loss": 2.4859, "step": 8730 }, { "epoch": 0.07, "learning_rate": 9.866398640873356e-05, "loss": 2.5137, "step": 8735 }, { "epoch": 0.07, "learning_rate": 9.866244569080994e-05, "loss": 2.3271, "step": 8740 }, { "epoch": 0.07, "learning_rate": 9.866090409704839e-05, "loss": 2.4428, "step": 8745 }, { "epoch": 0.07, "learning_rate": 9.865936162747667e-05, "loss": 2.4511, "step": 8750 }, { "epoch": 0.07, "learning_rate": 9.865781828212254e-05, "loss": 2.4383, "step": 8755 }, { "epoch": 0.07, "learning_rate": 9.865627406101376e-05, "loss": 2.3523, "step": 8760 }, { "epoch": 0.07, "learning_rate": 9.865472896417813e-05, "loss": 2.3329, "step": 8765 }, { "epoch": 0.07, "learning_rate": 9.865318299164348e-05, "loss": 2.3857, "step": 8770 }, { "epoch": 0.07, "learning_rate": 9.865163614343761e-05, "loss": 2.4577, "step": 8775 }, { "epoch": 0.07, "learning_rate": 9.865008841958835e-05, "loss": 2.4279, "step": 8780 }, { "epoch": 0.07, "learning_rate": 9.864853982012361e-05, "loss": 2.3122, "step": 8785 }, { "epoch": 0.08, "learning_rate": 9.864699034507121e-05, "loss": 2.4146, "step": 8790 }, { "epoch": 0.08, "learning_rate": 9.864543999445905e-05, "loss": 2.3639, "step": 8795 }, { "epoch": 0.08, "learning_rate": 9.864388876831506e-05, "loss": 2.3702, "step": 8800 }, { "epoch": 0.08, "learning_rate": 9.86423366666671e-05, "loss": 2.3661, "step": 8805 }, { "epoch": 0.08, "learning_rate": 9.864078368954317e-05, "loss": 2.4172, "step": 8810 }, { "epoch": 0.08, "learning_rate": 9.863922983697118e-05, "loss": 2.331, "step": 8815 }, { "epoch": 0.08, "learning_rate": 9.863767510897912e-05, "loss": 2.4212, "step": 8820 }, { "epoch": 0.08, "learning_rate": 9.863611950559495e-05, "loss": 2.3837, "step": 8825 }, { "epoch": 0.08, "learning_rate": 9.86345630268467e-05, "loss": 2.3509, "step": 8830 }, { "epoch": 0.08, "learning_rate": 9.863300567276235e-05, "loss": 2.3557, "step": 8835 }, { "epoch": 0.08, "learning_rate": 9.863144744336994e-05, "loss": 2.259, "step": 8840 }, { "epoch": 0.08, "learning_rate": 9.862988833869753e-05, "loss": 2.4799, "step": 8845 }, { "epoch": 0.08, "learning_rate": 9.862832835877316e-05, "loss": 2.333, "step": 8850 }, { "epoch": 0.08, "learning_rate": 9.862676750362492e-05, "loss": 2.3488, "step": 8855 }, { "epoch": 0.08, "learning_rate": 9.862520577328091e-05, "loss": 2.424, "step": 8860 }, { "epoch": 0.08, "learning_rate": 9.862364316776921e-05, "loss": 2.463, "step": 8865 }, { "epoch": 0.08, "learning_rate": 9.862207968711798e-05, "loss": 2.31, "step": 8870 }, { "epoch": 0.08, "learning_rate": 9.862051533135535e-05, "loss": 2.3971, "step": 8875 }, { "epoch": 0.08, "learning_rate": 9.861895010050944e-05, "loss": 2.397, "step": 8880 }, { "epoch": 0.08, "learning_rate": 9.861738399460847e-05, "loss": 2.4032, "step": 8885 }, { "epoch": 0.08, "learning_rate": 9.86158170136806e-05, "loss": 2.4447, "step": 8890 }, { "epoch": 0.08, "learning_rate": 9.861424915775404e-05, "loss": 2.4132, "step": 8895 }, { "epoch": 0.08, "learning_rate": 9.861268042685701e-05, "loss": 2.4892, "step": 8900 }, { "epoch": 0.08, "learning_rate": 9.861111082101774e-05, "loss": 2.4604, "step": 8905 }, { "epoch": 0.08, "learning_rate": 9.860954034026448e-05, "loss": 2.4027, "step": 8910 }, { "epoch": 0.08, "learning_rate": 9.86079689846255e-05, "loss": 2.4565, "step": 8915 }, { "epoch": 0.08, "learning_rate": 9.860639675412909e-05, "loss": 2.343, "step": 8920 }, { "epoch": 0.08, "learning_rate": 9.860482364880352e-05, "loss": 2.3815, "step": 8925 }, { "epoch": 0.08, "learning_rate": 9.860324966867714e-05, "loss": 2.4533, "step": 8930 }, { "epoch": 0.08, "learning_rate": 9.860167481377825e-05, "loss": 2.4839, "step": 8935 }, { "epoch": 0.08, "learning_rate": 9.86000990841352e-05, "loss": 2.4231, "step": 8940 }, { "epoch": 0.08, "learning_rate": 9.859852247977634e-05, "loss": 2.4764, "step": 8945 }, { "epoch": 0.08, "learning_rate": 9.859694500073008e-05, "loss": 2.4513, "step": 8950 }, { "epoch": 0.08, "learning_rate": 9.85953666470248e-05, "loss": 2.3142, "step": 8955 }, { "epoch": 0.08, "learning_rate": 9.859378741868888e-05, "loss": 2.4136, "step": 8960 }, { "epoch": 0.08, "learning_rate": 9.859220731575077e-05, "loss": 2.4477, "step": 8965 }, { "epoch": 0.08, "learning_rate": 9.85906263382389e-05, "loss": 2.5068, "step": 8970 }, { "epoch": 0.08, "learning_rate": 9.858904448618173e-05, "loss": 2.4968, "step": 8975 }, { "epoch": 0.08, "learning_rate": 9.858746175960773e-05, "loss": 2.3768, "step": 8980 }, { "epoch": 0.08, "learning_rate": 9.858587815854538e-05, "loss": 2.4373, "step": 8985 }, { "epoch": 0.08, "learning_rate": 9.85842936830232e-05, "loss": 2.3975, "step": 8990 }, { "epoch": 0.08, "learning_rate": 9.858270833306969e-05, "loss": 2.461, "step": 8995 }, { "epoch": 0.08, "learning_rate": 9.858112210871337e-05, "loss": 2.4119, "step": 9000 }, { "epoch": 0.08, "learning_rate": 9.85795350099828e-05, "loss": 2.4247, "step": 9005 }, { "epoch": 0.08, "learning_rate": 9.857794703690657e-05, "loss": 2.424, "step": 9010 }, { "epoch": 0.08, "learning_rate": 9.857635818951325e-05, "loss": 2.4195, "step": 9015 }, { "epoch": 0.08, "learning_rate": 9.857476846783141e-05, "loss": 2.4407, "step": 9020 }, { "epoch": 0.08, "learning_rate": 9.857317787188968e-05, "loss": 2.4169, "step": 9025 }, { "epoch": 0.08, "learning_rate": 9.857158640171671e-05, "loss": 2.4894, "step": 9030 }, { "epoch": 0.08, "learning_rate": 9.85699940573411e-05, "loss": 2.4036, "step": 9035 }, { "epoch": 0.08, "learning_rate": 9.856840083879154e-05, "loss": 2.4256, "step": 9040 }, { "epoch": 0.08, "learning_rate": 9.85668067460967e-05, "loss": 2.4383, "step": 9045 }, { "epoch": 0.08, "learning_rate": 9.856521177928526e-05, "loss": 2.4345, "step": 9050 }, { "epoch": 0.08, "learning_rate": 9.856361593838595e-05, "loss": 2.3794, "step": 9055 }, { "epoch": 0.08, "learning_rate": 9.856201922342745e-05, "loss": 2.4084, "step": 9060 }, { "epoch": 0.08, "learning_rate": 9.856042163443855e-05, "loss": 2.4551, "step": 9065 }, { "epoch": 0.08, "learning_rate": 9.855882317144796e-05, "loss": 2.4343, "step": 9070 }, { "epoch": 0.08, "learning_rate": 9.855722383448447e-05, "loss": 2.4232, "step": 9075 }, { "epoch": 0.08, "learning_rate": 9.855562362357686e-05, "loss": 2.4714, "step": 9080 }, { "epoch": 0.08, "learning_rate": 9.855402253875395e-05, "loss": 2.3736, "step": 9085 }, { "epoch": 0.08, "learning_rate": 9.855242058004453e-05, "loss": 2.3906, "step": 9090 }, { "epoch": 0.08, "learning_rate": 9.855081774747745e-05, "loss": 2.3454, "step": 9095 }, { "epoch": 0.08, "learning_rate": 9.854921404108155e-05, "loss": 2.4022, "step": 9100 }, { "epoch": 0.08, "learning_rate": 9.854760946088568e-05, "loss": 2.3552, "step": 9105 }, { "epoch": 0.08, "learning_rate": 9.854600400691875e-05, "loss": 2.363, "step": 9110 }, { "epoch": 0.08, "learning_rate": 9.854439767920964e-05, "loss": 2.4585, "step": 9115 }, { "epoch": 0.08, "learning_rate": 9.854279047778725e-05, "loss": 2.4044, "step": 9120 }, { "epoch": 0.08, "learning_rate": 9.854118240268053e-05, "loss": 2.3944, "step": 9125 }, { "epoch": 0.08, "learning_rate": 9.85395734539184e-05, "loss": 2.4265, "step": 9130 }, { "epoch": 0.08, "learning_rate": 9.853796363152985e-05, "loss": 2.4972, "step": 9135 }, { "epoch": 0.08, "learning_rate": 9.85363529355438e-05, "loss": 2.4181, "step": 9140 }, { "epoch": 0.08, "learning_rate": 9.853474136598928e-05, "loss": 2.4345, "step": 9145 }, { "epoch": 0.08, "learning_rate": 9.85331289228953e-05, "loss": 2.3432, "step": 9150 }, { "epoch": 0.08, "learning_rate": 9.853151560629087e-05, "loss": 2.5044, "step": 9155 }, { "epoch": 0.08, "learning_rate": 9.852990141620502e-05, "loss": 2.4309, "step": 9160 }, { "epoch": 0.08, "learning_rate": 9.852828635266681e-05, "loss": 2.3844, "step": 9165 }, { "epoch": 0.08, "learning_rate": 9.85266704157053e-05, "loss": 2.4855, "step": 9170 }, { "epoch": 0.08, "learning_rate": 9.852505360534958e-05, "loss": 2.3058, "step": 9175 }, { "epoch": 0.08, "learning_rate": 9.852343592162876e-05, "loss": 2.3969, "step": 9180 }, { "epoch": 0.08, "learning_rate": 9.852181736457194e-05, "loss": 2.3465, "step": 9185 }, { "epoch": 0.08, "learning_rate": 9.852019793420826e-05, "loss": 2.3828, "step": 9190 }, { "epoch": 0.08, "learning_rate": 9.851857763056687e-05, "loss": 2.3689, "step": 9195 }, { "epoch": 0.08, "learning_rate": 9.851695645367691e-05, "loss": 2.4408, "step": 9200 }, { "epoch": 0.08, "learning_rate": 9.851533440356758e-05, "loss": 2.4081, "step": 9205 }, { "epoch": 0.08, "learning_rate": 9.851371148026806e-05, "loss": 2.4096, "step": 9210 }, { "epoch": 0.08, "learning_rate": 9.85120876838076e-05, "loss": 2.4195, "step": 9215 }, { "epoch": 0.08, "learning_rate": 9.851046301421536e-05, "loss": 2.2612, "step": 9220 }, { "epoch": 0.08, "learning_rate": 9.850883747152064e-05, "loss": 2.4315, "step": 9225 }, { "epoch": 0.08, "learning_rate": 9.850721105575265e-05, "loss": 2.4034, "step": 9230 }, { "epoch": 0.08, "learning_rate": 9.85055837669407e-05, "loss": 2.3757, "step": 9235 }, { "epoch": 0.08, "learning_rate": 9.850395560511406e-05, "loss": 2.3484, "step": 9240 }, { "epoch": 0.08, "learning_rate": 9.850232657030202e-05, "loss": 2.4346, "step": 9245 }, { "epoch": 0.08, "learning_rate": 9.850069666253394e-05, "loss": 2.5089, "step": 9250 }, { "epoch": 0.08, "learning_rate": 9.849906588183911e-05, "loss": 2.4767, "step": 9255 }, { "epoch": 0.08, "learning_rate": 9.849743422824692e-05, "loss": 2.4565, "step": 9260 }, { "epoch": 0.08, "learning_rate": 9.849580170178671e-05, "loss": 2.3877, "step": 9265 }, { "epoch": 0.08, "learning_rate": 9.849416830248788e-05, "loss": 2.4834, "step": 9270 }, { "epoch": 0.08, "learning_rate": 9.849253403037982e-05, "loss": 2.3768, "step": 9275 }, { "epoch": 0.08, "learning_rate": 9.849089888549195e-05, "loss": 2.4869, "step": 9280 }, { "epoch": 0.08, "learning_rate": 9.848926286785369e-05, "loss": 2.3716, "step": 9285 }, { "epoch": 0.08, "learning_rate": 9.848762597749448e-05, "loss": 2.3929, "step": 9290 }, { "epoch": 0.08, "learning_rate": 9.84859882144438e-05, "loss": 2.3654, "step": 9295 }, { "epoch": 0.08, "learning_rate": 9.848434957873112e-05, "loss": 2.3244, "step": 9300 }, { "epoch": 0.08, "learning_rate": 9.848271007038594e-05, "loss": 2.3968, "step": 9305 }, { "epoch": 0.08, "learning_rate": 9.848106968943773e-05, "loss": 2.4345, "step": 9310 }, { "epoch": 0.08, "learning_rate": 9.847942843591606e-05, "loss": 2.4329, "step": 9315 }, { "epoch": 0.08, "learning_rate": 9.847778630985046e-05, "loss": 2.3916, "step": 9320 }, { "epoch": 0.08, "learning_rate": 9.847614331127047e-05, "loss": 2.3958, "step": 9325 }, { "epoch": 0.08, "learning_rate": 9.847449944020567e-05, "loss": 2.4223, "step": 9330 }, { "epoch": 0.08, "learning_rate": 9.847285469668565e-05, "loss": 2.4301, "step": 9335 }, { "epoch": 0.08, "learning_rate": 9.847120908074e-05, "loss": 2.4076, "step": 9340 }, { "epoch": 0.08, "learning_rate": 9.846956259239835e-05, "loss": 2.3993, "step": 9345 }, { "epoch": 0.08, "learning_rate": 9.846791523169033e-05, "loss": 2.3927, "step": 9350 }, { "epoch": 0.08, "learning_rate": 9.846626699864558e-05, "loss": 2.5075, "step": 9355 }, { "epoch": 0.08, "learning_rate": 9.846461789329379e-05, "loss": 2.4377, "step": 9360 }, { "epoch": 0.08, "learning_rate": 9.846296791566463e-05, "loss": 2.4679, "step": 9365 }, { "epoch": 0.08, "learning_rate": 9.846131706578779e-05, "loss": 2.4114, "step": 9370 }, { "epoch": 0.08, "learning_rate": 9.845966534369297e-05, "loss": 2.4047, "step": 9375 }, { "epoch": 0.08, "learning_rate": 9.845801274940991e-05, "loss": 2.3903, "step": 9380 }, { "epoch": 0.08, "learning_rate": 9.845635928296837e-05, "loss": 2.4385, "step": 9385 }, { "epoch": 0.08, "learning_rate": 9.84547049443981e-05, "loss": 2.4373, "step": 9390 }, { "epoch": 0.08, "learning_rate": 9.845304973372887e-05, "loss": 2.3848, "step": 9395 }, { "epoch": 0.08, "learning_rate": 9.845139365099046e-05, "loss": 2.467, "step": 9400 }, { "epoch": 0.08, "learning_rate": 9.84497366962127e-05, "loss": 2.4361, "step": 9405 }, { "epoch": 0.08, "learning_rate": 9.84480788694254e-05, "loss": 2.348, "step": 9410 }, { "epoch": 0.08, "learning_rate": 9.84464201706584e-05, "loss": 2.399, "step": 9415 }, { "epoch": 0.08, "learning_rate": 9.844476059994154e-05, "loss": 2.4271, "step": 9420 }, { "epoch": 0.08, "learning_rate": 9.844310015730472e-05, "loss": 2.4205, "step": 9425 }, { "epoch": 0.08, "learning_rate": 9.84414388427778e-05, "loss": 2.4314, "step": 9430 }, { "epoch": 0.08, "learning_rate": 9.843977665639069e-05, "loss": 2.4216, "step": 9435 }, { "epoch": 0.08, "learning_rate": 9.84381135981733e-05, "loss": 2.3492, "step": 9440 }, { "epoch": 0.08, "learning_rate": 9.843644966815557e-05, "loss": 2.332, "step": 9445 }, { "epoch": 0.08, "learning_rate": 9.843478486636744e-05, "loss": 2.4725, "step": 9450 }, { "epoch": 0.08, "learning_rate": 9.843311919283889e-05, "loss": 2.4056, "step": 9455 }, { "epoch": 0.08, "learning_rate": 9.843145264759987e-05, "loss": 2.4054, "step": 9460 }, { "epoch": 0.08, "learning_rate": 9.842978523068041e-05, "loss": 2.4103, "step": 9465 }, { "epoch": 0.08, "learning_rate": 9.84281169421105e-05, "loss": 2.443, "step": 9470 }, { "epoch": 0.08, "learning_rate": 9.842644778192015e-05, "loss": 2.3653, "step": 9475 }, { "epoch": 0.08, "learning_rate": 9.842477775013943e-05, "loss": 2.3447, "step": 9480 }, { "epoch": 0.08, "learning_rate": 9.842310684679838e-05, "loss": 2.3892, "step": 9485 }, { "epoch": 0.08, "learning_rate": 9.84214350719271e-05, "loss": 2.3742, "step": 9490 }, { "epoch": 0.08, "learning_rate": 9.841976242555567e-05, "loss": 2.3711, "step": 9495 }, { "epoch": 0.08, "learning_rate": 9.841808890771416e-05, "loss": 2.4327, "step": 9500 }, { "epoch": 0.08, "learning_rate": 9.841641451843271e-05, "loss": 2.3818, "step": 9505 }, { "epoch": 0.08, "learning_rate": 9.841473925774147e-05, "loss": 2.4886, "step": 9510 }, { "epoch": 0.08, "learning_rate": 9.841306312567059e-05, "loss": 2.4359, "step": 9515 }, { "epoch": 0.08, "learning_rate": 9.841138612225023e-05, "loss": 2.4539, "step": 9520 }, { "epoch": 0.08, "learning_rate": 9.840970824751057e-05, "loss": 2.3473, "step": 9525 }, { "epoch": 0.08, "learning_rate": 9.840802950148181e-05, "loss": 2.4442, "step": 9530 }, { "epoch": 0.08, "learning_rate": 9.840634988419417e-05, "loss": 2.4352, "step": 9535 }, { "epoch": 0.08, "learning_rate": 9.840466939567787e-05, "loss": 2.3464, "step": 9540 }, { "epoch": 0.08, "learning_rate": 9.840298803596318e-05, "loss": 2.4787, "step": 9545 }, { "epoch": 0.08, "learning_rate": 9.840130580508034e-05, "loss": 2.3756, "step": 9550 }, { "epoch": 0.08, "learning_rate": 9.839962270305963e-05, "loss": 2.3638, "step": 9555 }, { "epoch": 0.08, "learning_rate": 9.839793872993133e-05, "loss": 2.3811, "step": 9560 }, { "epoch": 0.08, "learning_rate": 9.839625388572578e-05, "loss": 2.379, "step": 9565 }, { "epoch": 0.08, "learning_rate": 9.839456817047328e-05, "loss": 2.462, "step": 9570 }, { "epoch": 0.08, "learning_rate": 9.839288158420417e-05, "loss": 2.4068, "step": 9575 }, { "epoch": 0.08, "learning_rate": 9.839119412694882e-05, "loss": 2.4362, "step": 9580 }, { "epoch": 0.08, "learning_rate": 9.83895057987376e-05, "loss": 2.4151, "step": 9585 }, { "epoch": 0.08, "learning_rate": 9.838781659960089e-05, "loss": 2.4117, "step": 9590 }, { "epoch": 0.08, "learning_rate": 9.838612652956909e-05, "loss": 2.4417, "step": 9595 }, { "epoch": 0.08, "learning_rate": 9.838443558867262e-05, "loss": 2.3529, "step": 9600 }, { "epoch": 0.08, "learning_rate": 9.838274377694193e-05, "loss": 2.4548, "step": 9605 }, { "epoch": 0.08, "learning_rate": 9.838105109440742e-05, "loss": 2.4394, "step": 9610 }, { "epoch": 0.08, "learning_rate": 9.837935754109962e-05, "loss": 2.4666, "step": 9615 }, { "epoch": 0.08, "learning_rate": 9.837766311704897e-05, "loss": 2.4329, "step": 9620 }, { "epoch": 0.08, "learning_rate": 9.837596782228598e-05, "loss": 2.4928, "step": 9625 }, { "epoch": 0.08, "learning_rate": 9.837427165684116e-05, "loss": 2.4622, "step": 9630 }, { "epoch": 0.08, "learning_rate": 9.837257462074506e-05, "loss": 2.4059, "step": 9635 }, { "epoch": 0.08, "learning_rate": 9.837087671402817e-05, "loss": 2.4699, "step": 9640 }, { "epoch": 0.08, "learning_rate": 9.83691779367211e-05, "loss": 2.3735, "step": 9645 }, { "epoch": 0.08, "learning_rate": 9.836747828885439e-05, "loss": 2.3835, "step": 9650 }, { "epoch": 0.08, "learning_rate": 9.836577777045866e-05, "loss": 2.3826, "step": 9655 }, { "epoch": 0.08, "learning_rate": 9.836407638156451e-05, "loss": 2.4512, "step": 9660 }, { "epoch": 0.08, "learning_rate": 9.836237412220254e-05, "loss": 2.4068, "step": 9665 }, { "epoch": 0.08, "learning_rate": 9.83606709924034e-05, "loss": 2.4606, "step": 9670 }, { "epoch": 0.08, "learning_rate": 9.835896699219776e-05, "loss": 2.4084, "step": 9675 }, { "epoch": 0.08, "learning_rate": 9.835726212161628e-05, "loss": 2.3748, "step": 9680 }, { "epoch": 0.08, "learning_rate": 9.835555638068962e-05, "loss": 2.3853, "step": 9685 }, { "epoch": 0.08, "learning_rate": 9.835384976944853e-05, "loss": 2.3514, "step": 9690 }, { "epoch": 0.08, "learning_rate": 9.835214228792367e-05, "loss": 2.42, "step": 9695 }, { "epoch": 0.08, "learning_rate": 9.83504339361458e-05, "loss": 2.4839, "step": 9700 }, { "epoch": 0.08, "learning_rate": 9.834872471414567e-05, "loss": 2.3656, "step": 9705 }, { "epoch": 0.08, "learning_rate": 9.834701462195404e-05, "loss": 2.3974, "step": 9710 }, { "epoch": 0.08, "learning_rate": 9.834530365960169e-05, "loss": 2.4325, "step": 9715 }, { "epoch": 0.08, "learning_rate": 9.83435918271194e-05, "loss": 2.477, "step": 9720 }, { "epoch": 0.08, "learning_rate": 9.8341879124538e-05, "loss": 2.4264, "step": 9725 }, { "epoch": 0.08, "learning_rate": 9.83401655518883e-05, "loss": 2.3963, "step": 9730 }, { "epoch": 0.08, "learning_rate": 9.833845110920117e-05, "loss": 2.4699, "step": 9735 }, { "epoch": 0.08, "learning_rate": 9.833673579650742e-05, "loss": 2.3586, "step": 9740 }, { "epoch": 0.08, "learning_rate": 9.833501961383795e-05, "loss": 2.3931, "step": 9745 }, { "epoch": 0.08, "learning_rate": 9.833330256122366e-05, "loss": 2.3676, "step": 9750 }, { "epoch": 0.08, "learning_rate": 9.833158463869542e-05, "loss": 2.3813, "step": 9755 }, { "epoch": 0.08, "learning_rate": 9.832986584628418e-05, "loss": 2.4484, "step": 9760 }, { "epoch": 0.08, "learning_rate": 9.832814618402086e-05, "loss": 2.4588, "step": 9765 }, { "epoch": 0.08, "learning_rate": 9.832642565193643e-05, "loss": 2.4138, "step": 9770 }, { "epoch": 0.08, "learning_rate": 9.832470425006183e-05, "loss": 2.3947, "step": 9775 }, { "epoch": 0.08, "learning_rate": 9.832298197842807e-05, "loss": 2.3878, "step": 9780 }, { "epoch": 0.08, "learning_rate": 9.832125883706612e-05, "loss": 2.3224, "step": 9785 }, { "epoch": 0.08, "learning_rate": 9.831953482600699e-05, "loss": 2.4014, "step": 9790 }, { "epoch": 0.08, "learning_rate": 9.831780994528174e-05, "loss": 2.3978, "step": 9795 }, { "epoch": 0.08, "learning_rate": 9.831608419492139e-05, "loss": 2.4906, "step": 9800 }, { "epoch": 0.08, "learning_rate": 9.831435757495701e-05, "loss": 2.3836, "step": 9805 }, { "epoch": 0.08, "learning_rate": 9.831263008541969e-05, "loss": 2.4982, "step": 9810 }, { "epoch": 0.08, "learning_rate": 9.83109017263405e-05, "loss": 2.4399, "step": 9815 }, { "epoch": 0.08, "learning_rate": 9.830917249775055e-05, "loss": 2.4241, "step": 9820 }, { "epoch": 0.08, "learning_rate": 9.830744239968098e-05, "loss": 2.3771, "step": 9825 }, { "epoch": 0.08, "learning_rate": 9.830571143216291e-05, "loss": 2.4023, "step": 9830 }, { "epoch": 0.08, "learning_rate": 9.83039795952275e-05, "loss": 2.3819, "step": 9835 }, { "epoch": 0.08, "learning_rate": 9.830224688890592e-05, "loss": 2.3626, "step": 9840 }, { "epoch": 0.08, "learning_rate": 9.830051331322936e-05, "loss": 2.4206, "step": 9845 }, { "epoch": 0.08, "learning_rate": 9.829877886822903e-05, "loss": 2.5024, "step": 9850 }, { "epoch": 0.08, "learning_rate": 9.829704355393612e-05, "loss": 2.3816, "step": 9855 }, { "epoch": 0.08, "learning_rate": 9.829530737038187e-05, "loss": 2.4273, "step": 9860 }, { "epoch": 0.08, "learning_rate": 9.829357031759755e-05, "loss": 2.4008, "step": 9865 }, { "epoch": 0.08, "learning_rate": 9.829183239561442e-05, "loss": 2.4151, "step": 9870 }, { "epoch": 0.08, "learning_rate": 9.829009360446373e-05, "loss": 2.4656, "step": 9875 }, { "epoch": 0.08, "learning_rate": 9.828835394417679e-05, "loss": 2.429, "step": 9880 }, { "epoch": 0.08, "learning_rate": 9.828661341478494e-05, "loss": 2.3321, "step": 9885 }, { "epoch": 0.08, "learning_rate": 9.828487201631945e-05, "loss": 2.4118, "step": 9890 }, { "epoch": 0.08, "learning_rate": 9.82831297488117e-05, "loss": 2.4005, "step": 9895 }, { "epoch": 0.08, "learning_rate": 9.828138661229307e-05, "loss": 2.4196, "step": 9900 }, { "epoch": 0.08, "learning_rate": 9.827964260679487e-05, "loss": 2.425, "step": 9905 }, { "epoch": 0.08, "learning_rate": 9.827789773234855e-05, "loss": 2.3421, "step": 9910 }, { "epoch": 0.08, "learning_rate": 9.827615198898548e-05, "loss": 2.3268, "step": 9915 }, { "epoch": 0.08, "learning_rate": 9.827440537673709e-05, "loss": 2.3197, "step": 9920 }, { "epoch": 0.08, "learning_rate": 9.827265789563482e-05, "loss": 2.4328, "step": 9925 }, { "epoch": 0.08, "learning_rate": 9.82709095457101e-05, "loss": 2.4502, "step": 9930 }, { "epoch": 0.08, "learning_rate": 9.826916032699443e-05, "loss": 2.3115, "step": 9935 }, { "epoch": 0.08, "learning_rate": 9.826741023951926e-05, "loss": 2.4615, "step": 9940 }, { "epoch": 0.08, "learning_rate": 9.826565928331613e-05, "loss": 2.4452, "step": 9945 }, { "epoch": 0.08, "learning_rate": 9.82639074584165e-05, "loss": 2.402, "step": 9950 }, { "epoch": 0.08, "learning_rate": 9.826215476485194e-05, "loss": 2.385, "step": 9955 }, { "epoch": 0.08, "learning_rate": 9.826040120265398e-05, "loss": 2.4006, "step": 9960 }, { "epoch": 0.09, "learning_rate": 9.82586467718542e-05, "loss": 2.3845, "step": 9965 }, { "epoch": 0.09, "learning_rate": 9.825689147248416e-05, "loss": 2.3577, "step": 9970 }, { "epoch": 0.09, "learning_rate": 9.825513530457545e-05, "loss": 2.3747, "step": 9975 }, { "epoch": 0.09, "learning_rate": 9.825337826815968e-05, "loss": 2.3759, "step": 9980 }, { "epoch": 0.09, "learning_rate": 9.825162036326846e-05, "loss": 2.3724, "step": 9985 }, { "epoch": 0.09, "learning_rate": 9.824986158993346e-05, "loss": 2.3239, "step": 9990 }, { "epoch": 0.09, "learning_rate": 9.824810194818633e-05, "loss": 2.4368, "step": 9995 }, { "epoch": 0.09, "learning_rate": 9.824634143805872e-05, "loss": 2.3653, "step": 10000 }, { "epoch": 0.09, "learning_rate": 9.824458005958232e-05, "loss": 2.3414, "step": 10005 }, { "epoch": 0.09, "learning_rate": 9.824281781278883e-05, "loss": 2.3924, "step": 10010 }, { "epoch": 0.09, "learning_rate": 9.824105469771e-05, "loss": 2.3555, "step": 10015 }, { "epoch": 0.09, "learning_rate": 9.823929071437752e-05, "loss": 2.3626, "step": 10020 }, { "epoch": 0.09, "learning_rate": 9.823752586282316e-05, "loss": 2.4164, "step": 10025 }, { "epoch": 0.09, "learning_rate": 9.823576014307869e-05, "loss": 2.4409, "step": 10030 }, { "epoch": 0.09, "learning_rate": 9.823399355517587e-05, "loss": 2.3462, "step": 10035 }, { "epoch": 0.09, "learning_rate": 9.82322260991465e-05, "loss": 2.4297, "step": 10040 }, { "epoch": 0.09, "learning_rate": 9.823045777502242e-05, "loss": 2.4355, "step": 10045 }, { "epoch": 0.09, "learning_rate": 9.822868858283543e-05, "loss": 2.4331, "step": 10050 }, { "epoch": 0.09, "learning_rate": 9.822691852261736e-05, "loss": 2.4769, "step": 10055 }, { "epoch": 0.09, "learning_rate": 9.82251475944001e-05, "loss": 2.4278, "step": 10060 }, { "epoch": 0.09, "learning_rate": 9.822337579821547e-05, "loss": 2.4339, "step": 10065 }, { "epoch": 0.09, "learning_rate": 9.822160313409544e-05, "loss": 2.4749, "step": 10070 }, { "epoch": 0.09, "learning_rate": 9.821982960207186e-05, "loss": 2.3932, "step": 10075 }, { "epoch": 0.09, "learning_rate": 9.821805520217667e-05, "loss": 2.3901, "step": 10080 }, { "epoch": 0.09, "learning_rate": 9.821627993444178e-05, "loss": 2.481, "step": 10085 }, { "epoch": 0.09, "learning_rate": 9.821450379889916e-05, "loss": 2.423, "step": 10090 }, { "epoch": 0.09, "learning_rate": 9.821272679558079e-05, "loss": 2.3632, "step": 10095 }, { "epoch": 0.09, "learning_rate": 9.821094892451863e-05, "loss": 2.3663, "step": 10100 }, { "epoch": 0.09, "learning_rate": 9.82091701857447e-05, "loss": 2.4282, "step": 10105 }, { "epoch": 0.09, "learning_rate": 9.820739057929099e-05, "loss": 2.3914, "step": 10110 }, { "epoch": 0.09, "learning_rate": 9.820561010518957e-05, "loss": 2.3619, "step": 10115 }, { "epoch": 0.09, "learning_rate": 9.820382876347242e-05, "loss": 2.451, "step": 10120 }, { "epoch": 0.09, "learning_rate": 9.820204655417166e-05, "loss": 2.3712, "step": 10125 }, { "epoch": 0.09, "learning_rate": 9.820026347731934e-05, "loss": 2.4585, "step": 10130 }, { "epoch": 0.09, "learning_rate": 9.819847953294757e-05, "loss": 2.4282, "step": 10135 }, { "epoch": 0.09, "learning_rate": 9.819669472108842e-05, "loss": 2.4835, "step": 10140 }, { "epoch": 0.09, "learning_rate": 9.819490904177407e-05, "loss": 2.4081, "step": 10145 }, { "epoch": 0.09, "learning_rate": 9.81931224950366e-05, "loss": 2.342, "step": 10150 }, { "epoch": 0.09, "learning_rate": 9.81913350809082e-05, "loss": 2.4428, "step": 10155 }, { "epoch": 0.09, "learning_rate": 9.818954679942105e-05, "loss": 2.4185, "step": 10160 }, { "epoch": 0.09, "learning_rate": 9.81877576506073e-05, "loss": 2.4311, "step": 10165 }, { "epoch": 0.09, "learning_rate": 9.818596763449918e-05, "loss": 2.3462, "step": 10170 }, { "epoch": 0.09, "learning_rate": 9.81841767511289e-05, "loss": 2.3674, "step": 10175 }, { "epoch": 0.09, "learning_rate": 9.818238500052868e-05, "loss": 2.462, "step": 10180 }, { "epoch": 0.09, "learning_rate": 9.818059238273078e-05, "loss": 2.4777, "step": 10185 }, { "epoch": 0.09, "learning_rate": 9.817879889776746e-05, "loss": 2.3942, "step": 10190 }, { "epoch": 0.09, "learning_rate": 9.817700454567103e-05, "loss": 2.4256, "step": 10195 }, { "epoch": 0.09, "learning_rate": 9.817520932647373e-05, "loss": 2.4729, "step": 10200 }, { "epoch": 0.09, "learning_rate": 9.81734132402079e-05, "loss": 2.4011, "step": 10205 }, { "epoch": 0.09, "learning_rate": 9.817161628690587e-05, "loss": 2.5078, "step": 10210 }, { "epoch": 0.09, "learning_rate": 9.816981846659998e-05, "loss": 2.4086, "step": 10215 }, { "epoch": 0.09, "learning_rate": 9.816801977932257e-05, "loss": 2.467, "step": 10220 }, { "epoch": 0.09, "learning_rate": 9.816622022510604e-05, "loss": 2.432, "step": 10225 }, { "epoch": 0.09, "learning_rate": 9.816441980398277e-05, "loss": 2.4123, "step": 10230 }, { "epoch": 0.09, "learning_rate": 9.816261851598516e-05, "loss": 2.4132, "step": 10235 }, { "epoch": 0.09, "learning_rate": 9.816081636114563e-05, "loss": 2.4095, "step": 10240 }, { "epoch": 0.09, "learning_rate": 9.81590133394966e-05, "loss": 2.4939, "step": 10245 }, { "epoch": 0.09, "learning_rate": 9.815720945107054e-05, "loss": 2.4508, "step": 10250 }, { "epoch": 0.09, "learning_rate": 9.815540469589993e-05, "loss": 2.3902, "step": 10255 }, { "epoch": 0.09, "learning_rate": 9.815359907401723e-05, "loss": 2.4193, "step": 10260 }, { "epoch": 0.09, "learning_rate": 9.815179258545495e-05, "loss": 2.4257, "step": 10265 }, { "epoch": 0.09, "learning_rate": 9.814998523024558e-05, "loss": 2.4585, "step": 10270 }, { "epoch": 0.09, "learning_rate": 9.814817700842168e-05, "loss": 2.4463, "step": 10275 }, { "epoch": 0.09, "learning_rate": 9.814636792001579e-05, "loss": 2.4589, "step": 10280 }, { "epoch": 0.09, "learning_rate": 9.814455796506044e-05, "loss": 2.444, "step": 10285 }, { "epoch": 0.09, "learning_rate": 9.814274714358825e-05, "loss": 2.363, "step": 10290 }, { "epoch": 0.09, "learning_rate": 9.814093545563179e-05, "loss": 2.4256, "step": 10295 }, { "epoch": 0.09, "learning_rate": 9.813912290122364e-05, "loss": 2.4344, "step": 10300 }, { "epoch": 0.09, "learning_rate": 9.813730948039648e-05, "loss": 2.3614, "step": 10305 }, { "epoch": 0.09, "learning_rate": 9.813549519318291e-05, "loss": 2.42, "step": 10310 }, { "epoch": 0.09, "learning_rate": 9.813368003961558e-05, "loss": 2.4309, "step": 10315 }, { "epoch": 0.09, "learning_rate": 9.813186401972718e-05, "loss": 2.439, "step": 10320 }, { "epoch": 0.09, "learning_rate": 9.81300471335504e-05, "loss": 2.3553, "step": 10325 }, { "epoch": 0.09, "learning_rate": 9.812822938111792e-05, "loss": 2.3758, "step": 10330 }, { "epoch": 0.09, "learning_rate": 9.812641076246246e-05, "loss": 2.4925, "step": 10335 }, { "epoch": 0.09, "learning_rate": 9.812459127761675e-05, "loss": 2.4453, "step": 10340 }, { "epoch": 0.09, "learning_rate": 9.812277092661356e-05, "loss": 2.3895, "step": 10345 }, { "epoch": 0.09, "learning_rate": 9.812094970948562e-05, "loss": 2.3883, "step": 10350 }, { "epoch": 0.09, "learning_rate": 9.811912762626573e-05, "loss": 2.435, "step": 10355 }, { "epoch": 0.09, "learning_rate": 9.811730467698668e-05, "loss": 2.4878, "step": 10360 }, { "epoch": 0.09, "learning_rate": 9.811548086168128e-05, "loss": 2.401, "step": 10365 }, { "epoch": 0.09, "learning_rate": 9.811365618038236e-05, "loss": 2.3834, "step": 10370 }, { "epoch": 0.09, "learning_rate": 9.811183063312275e-05, "loss": 2.3878, "step": 10375 }, { "epoch": 0.09, "learning_rate": 9.811000421993531e-05, "loss": 2.3191, "step": 10380 }, { "epoch": 0.09, "learning_rate": 9.810817694085292e-05, "loss": 2.515, "step": 10385 }, { "epoch": 0.09, "learning_rate": 9.810634879590847e-05, "loss": 2.4043, "step": 10390 }, { "epoch": 0.09, "learning_rate": 9.810451978513484e-05, "loss": 2.4416, "step": 10395 }, { "epoch": 0.09, "learning_rate": 9.810268990856497e-05, "loss": 2.3808, "step": 10400 }, { "epoch": 0.09, "learning_rate": 9.81008591662318e-05, "loss": 2.4034, "step": 10405 }, { "epoch": 0.09, "learning_rate": 9.809902755816826e-05, "loss": 2.459, "step": 10410 }, { "epoch": 0.09, "learning_rate": 9.809719508440732e-05, "loss": 2.3776, "step": 10415 }, { "epoch": 0.09, "learning_rate": 9.809536174498197e-05, "loss": 2.5064, "step": 10420 }, { "epoch": 0.09, "learning_rate": 9.809352753992521e-05, "loss": 2.3902, "step": 10425 }, { "epoch": 0.09, "learning_rate": 9.809169246927004e-05, "loss": 2.3918, "step": 10430 }, { "epoch": 0.09, "learning_rate": 9.80898565330495e-05, "loss": 2.4285, "step": 10435 }, { "epoch": 0.09, "learning_rate": 9.808801973129662e-05, "loss": 2.4228, "step": 10440 }, { "epoch": 0.09, "learning_rate": 9.808618206404447e-05, "loss": 2.396, "step": 10445 }, { "epoch": 0.09, "learning_rate": 9.808434353132611e-05, "loss": 2.4522, "step": 10450 }, { "epoch": 0.09, "learning_rate": 9.808250413317467e-05, "loss": 2.4495, "step": 10455 }, { "epoch": 0.09, "learning_rate": 9.80806638696232e-05, "loss": 2.3976, "step": 10460 }, { "epoch": 0.09, "learning_rate": 9.807882274070486e-05, "loss": 2.4179, "step": 10465 }, { "epoch": 0.09, "learning_rate": 9.807698074645279e-05, "loss": 2.3727, "step": 10470 }, { "epoch": 0.09, "learning_rate": 9.80751378869001e-05, "loss": 2.3178, "step": 10475 }, { "epoch": 0.09, "learning_rate": 9.807329416208001e-05, "loss": 2.3935, "step": 10480 }, { "epoch": 0.09, "learning_rate": 9.807144957202567e-05, "loss": 2.3917, "step": 10485 }, { "epoch": 0.09, "learning_rate": 9.806960411677029e-05, "loss": 2.4291, "step": 10490 }, { "epoch": 0.09, "learning_rate": 9.80677577963471e-05, "loss": 2.4065, "step": 10495 }, { "epoch": 0.09, "learning_rate": 9.806591061078929e-05, "loss": 2.401, "step": 10500 }, { "epoch": 0.09, "learning_rate": 9.806406256013016e-05, "loss": 2.3505, "step": 10505 }, { "epoch": 0.09, "learning_rate": 9.806221364440292e-05, "loss": 2.4294, "step": 10510 }, { "epoch": 0.09, "learning_rate": 9.806036386364088e-05, "loss": 2.4142, "step": 10515 }, { "epoch": 0.09, "learning_rate": 9.805851321787732e-05, "loss": 2.461, "step": 10520 }, { "epoch": 0.09, "learning_rate": 9.805666170714556e-05, "loss": 2.3654, "step": 10525 }, { "epoch": 0.09, "learning_rate": 9.80548093314789e-05, "loss": 2.347, "step": 10530 }, { "epoch": 0.09, "learning_rate": 9.805295609091072e-05, "loss": 2.3486, "step": 10535 }, { "epoch": 0.09, "learning_rate": 9.805110198547433e-05, "loss": 2.4543, "step": 10540 }, { "epoch": 0.09, "learning_rate": 9.804924701520313e-05, "loss": 2.4428, "step": 10545 }, { "epoch": 0.09, "learning_rate": 9.804739118013049e-05, "loss": 2.3446, "step": 10550 }, { "epoch": 0.09, "learning_rate": 9.804553448028981e-05, "loss": 2.4107, "step": 10555 }, { "epoch": 0.09, "learning_rate": 9.804367691571453e-05, "loss": 2.3684, "step": 10560 }, { "epoch": 0.09, "learning_rate": 9.804181848643807e-05, "loss": 2.3825, "step": 10565 }, { "epoch": 0.09, "learning_rate": 9.803995919249387e-05, "loss": 2.3973, "step": 10570 }, { "epoch": 0.09, "learning_rate": 9.803809903391541e-05, "loss": 2.3753, "step": 10575 }, { "epoch": 0.09, "learning_rate": 9.803623801073616e-05, "loss": 2.4468, "step": 10580 }, { "epoch": 0.09, "learning_rate": 9.80343761229896e-05, "loss": 2.4038, "step": 10585 }, { "epoch": 0.09, "learning_rate": 9.803251337070928e-05, "loss": 2.3869, "step": 10590 }, { "epoch": 0.09, "learning_rate": 9.803064975392869e-05, "loss": 2.4341, "step": 10595 }, { "epoch": 0.09, "learning_rate": 9.802878527268138e-05, "loss": 2.3198, "step": 10600 }, { "epoch": 0.09, "learning_rate": 9.802691992700092e-05, "loss": 2.459, "step": 10605 }, { "epoch": 0.09, "learning_rate": 9.802505371692088e-05, "loss": 2.3765, "step": 10610 }, { "epoch": 0.09, "learning_rate": 9.802318664247482e-05, "loss": 2.3828, "step": 10615 }, { "epoch": 0.09, "learning_rate": 9.80213187036964e-05, "loss": 2.4289, "step": 10620 }, { "epoch": 0.09, "learning_rate": 9.801944990061919e-05, "loss": 2.3771, "step": 10625 }, { "epoch": 0.09, "learning_rate": 9.801758023327684e-05, "loss": 2.3056, "step": 10630 }, { "epoch": 0.09, "learning_rate": 9.801570970170301e-05, "loss": 2.4644, "step": 10635 }, { "epoch": 0.09, "learning_rate": 9.801383830593134e-05, "loss": 2.4054, "step": 10640 }, { "epoch": 0.09, "learning_rate": 9.801196604599557e-05, "loss": 2.4352, "step": 10645 }, { "epoch": 0.09, "learning_rate": 9.801009292192933e-05, "loss": 2.467, "step": 10650 }, { "epoch": 0.09, "learning_rate": 9.800821893376637e-05, "loss": 2.3653, "step": 10655 }, { "epoch": 0.09, "learning_rate": 9.80063440815404e-05, "loss": 2.4454, "step": 10660 }, { "epoch": 0.09, "learning_rate": 9.800446836528517e-05, "loss": 2.3492, "step": 10665 }, { "epoch": 0.09, "learning_rate": 9.800259178503446e-05, "loss": 2.3842, "step": 10670 }, { "epoch": 0.09, "learning_rate": 9.800071434082202e-05, "loss": 2.4617, "step": 10675 }, { "epoch": 0.09, "learning_rate": 9.799883603268165e-05, "loss": 2.3653, "step": 10680 }, { "epoch": 0.09, "learning_rate": 9.799695686064716e-05, "loss": 2.4022, "step": 10685 }, { "epoch": 0.09, "learning_rate": 9.799507682475237e-05, "loss": 2.3411, "step": 10690 }, { "epoch": 0.09, "learning_rate": 9.79931959250311e-05, "loss": 2.3976, "step": 10695 }, { "epoch": 0.09, "learning_rate": 9.799131416151724e-05, "loss": 2.4582, "step": 10700 }, { "epoch": 0.09, "learning_rate": 9.79894315342446e-05, "loss": 2.398, "step": 10705 }, { "epoch": 0.09, "learning_rate": 9.798754804324712e-05, "loss": 2.4019, "step": 10710 }, { "epoch": 0.09, "learning_rate": 9.798566368855868e-05, "loss": 2.4358, "step": 10715 }, { "epoch": 0.09, "learning_rate": 9.79837784702132e-05, "loss": 2.4188, "step": 10720 }, { "epoch": 0.09, "learning_rate": 9.79818923882446e-05, "loss": 2.3439, "step": 10725 }, { "epoch": 0.09, "learning_rate": 9.798000544268684e-05, "loss": 2.3754, "step": 10730 }, { "epoch": 0.09, "learning_rate": 9.797811763357385e-05, "loss": 2.4722, "step": 10735 }, { "epoch": 0.09, "learning_rate": 9.797622896093966e-05, "loss": 2.4108, "step": 10740 }, { "epoch": 0.09, "learning_rate": 9.79743394248182e-05, "loss": 2.4714, "step": 10745 }, { "epoch": 0.09, "learning_rate": 9.797244902524354e-05, "loss": 2.4609, "step": 10750 }, { "epoch": 0.09, "learning_rate": 9.797055776224966e-05, "loss": 2.4202, "step": 10755 }, { "epoch": 0.09, "learning_rate": 9.796866563587062e-05, "loss": 2.375, "step": 10760 }, { "epoch": 0.09, "learning_rate": 9.796677264614046e-05, "loss": 2.4769, "step": 10765 }, { "epoch": 0.09, "learning_rate": 9.796487879309327e-05, "loss": 2.4644, "step": 10770 }, { "epoch": 0.09, "learning_rate": 9.796298407676312e-05, "loss": 2.4071, "step": 10775 }, { "epoch": 0.09, "learning_rate": 9.79610884971841e-05, "loss": 2.3498, "step": 10780 }, { "epoch": 0.09, "learning_rate": 9.795919205439036e-05, "loss": 2.3887, "step": 10785 }, { "epoch": 0.09, "learning_rate": 9.795729474841603e-05, "loss": 2.2969, "step": 10790 }, { "epoch": 0.09, "learning_rate": 9.795539657929525e-05, "loss": 2.4139, "step": 10795 }, { "epoch": 0.09, "learning_rate": 9.795349754706216e-05, "loss": 2.4278, "step": 10800 }, { "epoch": 0.09, "learning_rate": 9.795159765175095e-05, "loss": 2.4459, "step": 10805 }, { "epoch": 0.09, "learning_rate": 9.794969689339584e-05, "loss": 2.3732, "step": 10810 }, { "epoch": 0.09, "learning_rate": 9.794779527203101e-05, "loss": 2.4506, "step": 10815 }, { "epoch": 0.09, "learning_rate": 9.794589278769071e-05, "loss": 2.3366, "step": 10820 }, { "epoch": 0.09, "learning_rate": 9.794398944040917e-05, "loss": 2.384, "step": 10825 }, { "epoch": 0.09, "learning_rate": 9.794208523022063e-05, "loss": 2.4425, "step": 10830 }, { "epoch": 0.09, "learning_rate": 9.79401801571594e-05, "loss": 2.3725, "step": 10835 }, { "epoch": 0.09, "learning_rate": 9.793827422125974e-05, "loss": 2.4678, "step": 10840 }, { "epoch": 0.09, "learning_rate": 9.793636742255597e-05, "loss": 2.4401, "step": 10845 }, { "epoch": 0.09, "learning_rate": 9.793445976108237e-05, "loss": 2.3202, "step": 10850 }, { "epoch": 0.09, "learning_rate": 9.793255123687332e-05, "loss": 2.325, "step": 10855 }, { "epoch": 0.09, "learning_rate": 9.793064184996317e-05, "loss": 2.4535, "step": 10860 }, { "epoch": 0.09, "learning_rate": 9.792873160038626e-05, "loss": 2.4553, "step": 10865 }, { "epoch": 0.09, "learning_rate": 9.792682048817699e-05, "loss": 2.4114, "step": 10870 }, { "epoch": 0.09, "learning_rate": 9.792490851336973e-05, "loss": 2.3613, "step": 10875 }, { "epoch": 0.09, "learning_rate": 9.792299567599891e-05, "loss": 2.4272, "step": 10880 }, { "epoch": 0.09, "learning_rate": 9.792108197609898e-05, "loss": 2.4223, "step": 10885 }, { "epoch": 0.09, "learning_rate": 9.791916741370434e-05, "loss": 2.4676, "step": 10890 }, { "epoch": 0.09, "learning_rate": 9.791725198884947e-05, "loss": 2.383, "step": 10895 }, { "epoch": 0.09, "learning_rate": 9.791533570156885e-05, "loss": 2.3604, "step": 10900 }, { "epoch": 0.09, "learning_rate": 9.791341855189697e-05, "loss": 2.4072, "step": 10905 }, { "epoch": 0.09, "learning_rate": 9.791150053986832e-05, "loss": 2.4687, "step": 10910 }, { "epoch": 0.09, "learning_rate": 9.790958166551743e-05, "loss": 2.3756, "step": 10915 }, { "epoch": 0.09, "learning_rate": 9.790766192887884e-05, "loss": 2.3514, "step": 10920 }, { "epoch": 0.09, "learning_rate": 9.79057413299871e-05, "loss": 2.4842, "step": 10925 }, { "epoch": 0.09, "learning_rate": 9.790381986887677e-05, "loss": 2.4168, "step": 10930 }, { "epoch": 0.09, "learning_rate": 9.790189754558244e-05, "loss": 2.4055, "step": 10935 }, { "epoch": 0.09, "learning_rate": 9.789997436013871e-05, "loss": 2.4316, "step": 10940 }, { "epoch": 0.09, "learning_rate": 9.789805031258018e-05, "loss": 2.4325, "step": 10945 }, { "epoch": 0.09, "learning_rate": 9.78961254029415e-05, "loss": 2.3801, "step": 10950 }, { "epoch": 0.09, "learning_rate": 9.78941996312573e-05, "loss": 2.3085, "step": 10955 }, { "epoch": 0.09, "learning_rate": 9.789227299756225e-05, "loss": 2.3581, "step": 10960 }, { "epoch": 0.09, "learning_rate": 9.789034550189103e-05, "loss": 2.3554, "step": 10965 }, { "epoch": 0.09, "learning_rate": 9.78884171442783e-05, "loss": 2.3805, "step": 10970 }, { "epoch": 0.09, "learning_rate": 9.78864879247588e-05, "loss": 2.4327, "step": 10975 }, { "epoch": 0.09, "learning_rate": 9.788455784336726e-05, "loss": 2.4285, "step": 10980 }, { "epoch": 0.09, "learning_rate": 9.788262690013838e-05, "loss": 2.3819, "step": 10985 }, { "epoch": 0.09, "learning_rate": 9.788069509510694e-05, "loss": 2.4143, "step": 10990 }, { "epoch": 0.09, "learning_rate": 9.787876242830769e-05, "loss": 2.3302, "step": 10995 }, { "epoch": 0.09, "learning_rate": 9.787682889977545e-05, "loss": 2.4706, "step": 11000 }, { "epoch": 0.09, "learning_rate": 9.787489450954499e-05, "loss": 2.4168, "step": 11005 }, { "epoch": 0.09, "learning_rate": 9.787295925765114e-05, "loss": 2.3806, "step": 11010 }, { "epoch": 0.09, "learning_rate": 9.78710231441287e-05, "loss": 2.3596, "step": 11015 }, { "epoch": 0.09, "learning_rate": 9.786908616901255e-05, "loss": 2.4313, "step": 11020 }, { "epoch": 0.09, "learning_rate": 9.786714833233756e-05, "loss": 2.408, "step": 11025 }, { "epoch": 0.09, "learning_rate": 9.786520963413859e-05, "loss": 2.3751, "step": 11030 }, { "epoch": 0.09, "learning_rate": 9.786327007445054e-05, "loss": 2.391, "step": 11035 }, { "epoch": 0.09, "learning_rate": 9.786132965330829e-05, "loss": 2.3451, "step": 11040 }, { "epoch": 0.09, "learning_rate": 9.78593883707468e-05, "loss": 2.3547, "step": 11045 }, { "epoch": 0.09, "learning_rate": 9.785744622680099e-05, "loss": 2.4247, "step": 11050 }, { "epoch": 0.09, "learning_rate": 9.785550322150582e-05, "loss": 2.4071, "step": 11055 }, { "epoch": 0.09, "learning_rate": 9.785355935489626e-05, "loss": 2.4031, "step": 11060 }, { "epoch": 0.09, "learning_rate": 9.785161462700731e-05, "loss": 2.3698, "step": 11065 }, { "epoch": 0.09, "learning_rate": 9.784966903787396e-05, "loss": 2.3748, "step": 11070 }, { "epoch": 0.09, "learning_rate": 9.784772258753123e-05, "loss": 2.383, "step": 11075 }, { "epoch": 0.09, "learning_rate": 9.784577527601415e-05, "loss": 2.3815, "step": 11080 }, { "epoch": 0.09, "learning_rate": 9.784382710335776e-05, "loss": 2.4137, "step": 11085 }, { "epoch": 0.09, "learning_rate": 9.784187806959712e-05, "loss": 2.4359, "step": 11090 }, { "epoch": 0.09, "learning_rate": 9.783992817476735e-05, "loss": 2.4018, "step": 11095 }, { "epoch": 0.09, "learning_rate": 9.78379774189035e-05, "loss": 2.3516, "step": 11100 }, { "epoch": 0.09, "learning_rate": 9.783602580204068e-05, "loss": 2.4437, "step": 11105 }, { "epoch": 0.09, "learning_rate": 9.783407332421406e-05, "loss": 2.4326, "step": 11110 }, { "epoch": 0.09, "learning_rate": 9.783211998545874e-05, "loss": 2.3954, "step": 11115 }, { "epoch": 0.09, "learning_rate": 9.783016578580987e-05, "loss": 2.4437, "step": 11120 }, { "epoch": 0.09, "learning_rate": 9.782821072530268e-05, "loss": 2.4106, "step": 11125 }, { "epoch": 0.09, "learning_rate": 9.78262548039723e-05, "loss": 2.3361, "step": 11130 }, { "epoch": 0.1, "learning_rate": 9.782429802185396e-05, "loss": 2.3984, "step": 11135 }, { "epoch": 0.1, "learning_rate": 9.782234037898285e-05, "loss": 2.4047, "step": 11140 }, { "epoch": 0.1, "learning_rate": 9.782038187539424e-05, "loss": 2.4451, "step": 11145 }, { "epoch": 0.1, "learning_rate": 9.781842251112337e-05, "loss": 2.3381, "step": 11150 }, { "epoch": 0.1, "learning_rate": 9.781646228620549e-05, "loss": 2.4263, "step": 11155 }, { "epoch": 0.1, "learning_rate": 9.781450120067589e-05, "loss": 2.4134, "step": 11160 }, { "epoch": 0.1, "learning_rate": 9.781253925456986e-05, "loss": 2.4047, "step": 11165 }, { "epoch": 0.1, "learning_rate": 9.781057644792273e-05, "loss": 2.3658, "step": 11170 }, { "epoch": 0.1, "learning_rate": 9.780861278076982e-05, "loss": 2.3463, "step": 11175 }, { "epoch": 0.1, "learning_rate": 9.780664825314647e-05, "loss": 2.3927, "step": 11180 }, { "epoch": 0.1, "learning_rate": 9.780468286508802e-05, "loss": 2.4236, "step": 11185 }, { "epoch": 0.1, "learning_rate": 9.780271661662986e-05, "loss": 2.4773, "step": 11190 }, { "epoch": 0.1, "learning_rate": 9.780074950780737e-05, "loss": 2.4443, "step": 11195 }, { "epoch": 0.1, "learning_rate": 9.779878153865598e-05, "loss": 2.3888, "step": 11200 }, { "epoch": 0.1, "learning_rate": 9.779681270921108e-05, "loss": 2.3845, "step": 11205 }, { "epoch": 0.1, "learning_rate": 9.779484301950813e-05, "loss": 2.3806, "step": 11210 }, { "epoch": 0.1, "learning_rate": 9.779287246958256e-05, "loss": 2.4612, "step": 11215 }, { "epoch": 0.1, "learning_rate": 9.779090105946985e-05, "loss": 2.4154, "step": 11220 }, { "epoch": 0.1, "learning_rate": 9.778892878920546e-05, "loss": 2.4301, "step": 11225 }, { "epoch": 0.1, "learning_rate": 9.778695565882494e-05, "loss": 2.4665, "step": 11230 }, { "epoch": 0.1, "learning_rate": 9.778498166836374e-05, "loss": 2.4192, "step": 11235 }, { "epoch": 0.1, "learning_rate": 9.778300681785743e-05, "loss": 2.3721, "step": 11240 }, { "epoch": 0.1, "learning_rate": 9.778103110734152e-05, "loss": 2.3562, "step": 11245 }, { "epoch": 0.1, "learning_rate": 9.777905453685161e-05, "loss": 2.4117, "step": 11250 }, { "epoch": 0.1, "learning_rate": 9.777707710642323e-05, "loss": 2.4536, "step": 11255 }, { "epoch": 0.1, "learning_rate": 9.777509881609202e-05, "loss": 2.3953, "step": 11260 }, { "epoch": 0.1, "learning_rate": 9.777311966589354e-05, "loss": 2.3965, "step": 11265 }, { "epoch": 0.1, "learning_rate": 9.777113965586345e-05, "loss": 2.2989, "step": 11270 }, { "epoch": 0.1, "learning_rate": 9.776915878603734e-05, "loss": 2.3762, "step": 11275 }, { "epoch": 0.1, "learning_rate": 9.776717705645091e-05, "loss": 2.4545, "step": 11280 }, { "epoch": 0.1, "learning_rate": 9.77651944671398e-05, "loss": 2.4738, "step": 11285 }, { "epoch": 0.1, "learning_rate": 9.77632110181397e-05, "loss": 2.4874, "step": 11290 }, { "epoch": 0.1, "learning_rate": 9.776122670948631e-05, "loss": 2.4561, "step": 11295 }, { "epoch": 0.1, "learning_rate": 9.775924154121534e-05, "loss": 2.4269, "step": 11300 }, { "epoch": 0.1, "learning_rate": 9.775725551336254e-05, "loss": 2.3665, "step": 11305 }, { "epoch": 0.1, "learning_rate": 9.775526862596361e-05, "loss": 2.3134, "step": 11310 }, { "epoch": 0.1, "learning_rate": 9.775328087905436e-05, "loss": 2.3946, "step": 11315 }, { "epoch": 0.1, "learning_rate": 9.775129227267052e-05, "loss": 2.3343, "step": 11320 }, { "epoch": 0.1, "learning_rate": 9.774930280684793e-05, "loss": 2.3837, "step": 11325 }, { "epoch": 0.1, "learning_rate": 9.774731248162236e-05, "loss": 2.3581, "step": 11330 }, { "epoch": 0.1, "learning_rate": 9.774532129702965e-05, "loss": 2.425, "step": 11335 }, { "epoch": 0.1, "learning_rate": 9.774332925310563e-05, "loss": 2.3756, "step": 11340 }, { "epoch": 0.1, "learning_rate": 9.774133634988615e-05, "loss": 2.3724, "step": 11345 }, { "epoch": 0.1, "learning_rate": 9.773934258740709e-05, "loss": 2.3571, "step": 11350 }, { "epoch": 0.1, "learning_rate": 9.773734796570434e-05, "loss": 2.4544, "step": 11355 }, { "epoch": 0.1, "learning_rate": 9.773535248481376e-05, "loss": 2.3982, "step": 11360 }, { "epoch": 0.1, "learning_rate": 9.77333561447713e-05, "loss": 2.3818, "step": 11365 }, { "epoch": 0.1, "learning_rate": 9.77313589456129e-05, "loss": 2.3687, "step": 11370 }, { "epoch": 0.1, "learning_rate": 9.772936088737448e-05, "loss": 2.3704, "step": 11375 }, { "epoch": 0.1, "learning_rate": 9.7727361970092e-05, "loss": 2.4009, "step": 11380 }, { "epoch": 0.1, "learning_rate": 9.772536219380146e-05, "loss": 2.3356, "step": 11385 }, { "epoch": 0.1, "learning_rate": 9.772336155853884e-05, "loss": 2.4133, "step": 11390 }, { "epoch": 0.1, "learning_rate": 9.772136006434015e-05, "loss": 2.2982, "step": 11395 }, { "epoch": 0.1, "learning_rate": 9.771935771124142e-05, "loss": 2.3398, "step": 11400 }, { "epoch": 0.1, "learning_rate": 9.771735449927867e-05, "loss": 2.4352, "step": 11405 }, { "epoch": 0.1, "learning_rate": 9.771535042848797e-05, "loss": 2.417, "step": 11410 }, { "epoch": 0.1, "learning_rate": 9.771334549890538e-05, "loss": 2.3529, "step": 11415 }, { "epoch": 0.1, "learning_rate": 9.771133971056698e-05, "loss": 2.3262, "step": 11420 }, { "epoch": 0.1, "learning_rate": 9.77093330635089e-05, "loss": 2.3769, "step": 11425 }, { "epoch": 0.1, "learning_rate": 9.770732555776723e-05, "loss": 2.412, "step": 11430 }, { "epoch": 0.1, "learning_rate": 9.77053171933781e-05, "loss": 2.3671, "step": 11435 }, { "epoch": 0.1, "learning_rate": 9.770330797037768e-05, "loss": 2.3549, "step": 11440 }, { "epoch": 0.1, "learning_rate": 9.770129788880212e-05, "loss": 2.4227, "step": 11445 }, { "epoch": 0.1, "learning_rate": 9.769928694868758e-05, "loss": 2.4697, "step": 11450 }, { "epoch": 0.1, "learning_rate": 9.769727515007027e-05, "loss": 2.3943, "step": 11455 }, { "epoch": 0.1, "learning_rate": 9.769526249298639e-05, "loss": 2.4019, "step": 11460 }, { "epoch": 0.1, "learning_rate": 9.76932489774722e-05, "loss": 2.5808, "step": 11465 }, { "epoch": 0.1, "learning_rate": 9.769123460356388e-05, "loss": 2.381, "step": 11470 }, { "epoch": 0.1, "learning_rate": 9.768921937129773e-05, "loss": 2.363, "step": 11475 }, { "epoch": 0.1, "learning_rate": 9.768720328071002e-05, "loss": 2.2513, "step": 11480 }, { "epoch": 0.1, "learning_rate": 9.768518633183702e-05, "loss": 2.3727, "step": 11485 }, { "epoch": 0.1, "learning_rate": 9.768316852471502e-05, "loss": 2.4225, "step": 11490 }, { "epoch": 0.1, "learning_rate": 9.768114985938037e-05, "loss": 2.3587, "step": 11495 }, { "epoch": 0.1, "learning_rate": 9.767913033586937e-05, "loss": 2.4098, "step": 11500 }, { "epoch": 0.1, "learning_rate": 9.76771099542184e-05, "loss": 2.3977, "step": 11505 }, { "epoch": 0.1, "learning_rate": 9.767508871446378e-05, "loss": 2.3953, "step": 11510 }, { "epoch": 0.1, "learning_rate": 9.767306661664193e-05, "loss": 2.3987, "step": 11515 }, { "epoch": 0.1, "learning_rate": 9.767104366078922e-05, "loss": 2.3532, "step": 11520 }, { "epoch": 0.1, "learning_rate": 9.766901984694207e-05, "loss": 2.5452, "step": 11525 }, { "epoch": 0.1, "learning_rate": 9.766699517513691e-05, "loss": 2.4169, "step": 11530 }, { "epoch": 0.1, "learning_rate": 9.766496964541018e-05, "loss": 2.4275, "step": 11535 }, { "epoch": 0.1, "learning_rate": 9.766294325779833e-05, "loss": 2.3433, "step": 11540 }, { "epoch": 0.1, "learning_rate": 9.766091601233781e-05, "loss": 2.4355, "step": 11545 }, { "epoch": 0.1, "learning_rate": 9.765888790906514e-05, "loss": 2.4072, "step": 11550 }, { "epoch": 0.1, "learning_rate": 9.765685894801681e-05, "loss": 2.2921, "step": 11555 }, { "epoch": 0.1, "learning_rate": 9.765482912922934e-05, "loss": 2.4155, "step": 11560 }, { "epoch": 0.1, "learning_rate": 9.765279845273926e-05, "loss": 2.3752, "step": 11565 }, { "epoch": 0.1, "learning_rate": 9.765076691858311e-05, "loss": 2.4217, "step": 11570 }, { "epoch": 0.1, "learning_rate": 9.764873452679748e-05, "loss": 2.3947, "step": 11575 }, { "epoch": 0.1, "learning_rate": 9.764670127741893e-05, "loss": 2.4193, "step": 11580 }, { "epoch": 0.1, "learning_rate": 9.764466717048405e-05, "loss": 2.3295, "step": 11585 }, { "epoch": 0.1, "learning_rate": 9.764263220602945e-05, "loss": 2.4335, "step": 11590 }, { "epoch": 0.1, "learning_rate": 9.764059638409179e-05, "loss": 2.3677, "step": 11595 }, { "epoch": 0.1, "learning_rate": 9.763855970470766e-05, "loss": 2.4452, "step": 11600 }, { "epoch": 0.1, "learning_rate": 9.763652216791375e-05, "loss": 2.3925, "step": 11605 }, { "epoch": 0.1, "learning_rate": 9.763448377374674e-05, "loss": 2.2618, "step": 11610 }, { "epoch": 0.1, "learning_rate": 9.763244452224328e-05, "loss": 2.4511, "step": 11615 }, { "epoch": 0.1, "learning_rate": 9.763040441344011e-05, "loss": 2.3449, "step": 11620 }, { "epoch": 0.1, "learning_rate": 9.762836344737392e-05, "loss": 2.4632, "step": 11625 }, { "epoch": 0.1, "learning_rate": 9.762632162408146e-05, "loss": 2.4197, "step": 11630 }, { "epoch": 0.1, "learning_rate": 9.762427894359947e-05, "loss": 2.411, "step": 11635 }, { "epoch": 0.1, "learning_rate": 9.762223540596474e-05, "loss": 2.3117, "step": 11640 }, { "epoch": 0.1, "learning_rate": 9.762019101121402e-05, "loss": 2.4135, "step": 11645 }, { "epoch": 0.1, "learning_rate": 9.761814575938411e-05, "loss": 2.3609, "step": 11650 }, { "epoch": 0.1, "learning_rate": 9.761609965051184e-05, "loss": 2.3933, "step": 11655 }, { "epoch": 0.1, "learning_rate": 9.7614052684634e-05, "loss": 2.3625, "step": 11660 }, { "epoch": 0.1, "learning_rate": 9.761200486178747e-05, "loss": 2.4432, "step": 11665 }, { "epoch": 0.1, "learning_rate": 9.760995618200909e-05, "loss": 2.339, "step": 11670 }, { "epoch": 0.1, "learning_rate": 9.760790664533574e-05, "loss": 2.4167, "step": 11675 }, { "epoch": 0.1, "learning_rate": 9.76058562518043e-05, "loss": 2.3345, "step": 11680 }, { "epoch": 0.1, "learning_rate": 9.760380500145168e-05, "loss": 2.4048, "step": 11685 }, { "epoch": 0.1, "learning_rate": 9.760175289431478e-05, "loss": 2.3931, "step": 11690 }, { "epoch": 0.1, "learning_rate": 9.759969993043056e-05, "loss": 2.4195, "step": 11695 }, { "epoch": 0.1, "learning_rate": 9.759764610983596e-05, "loss": 2.3647, "step": 11700 }, { "epoch": 0.1, "learning_rate": 9.759559143256794e-05, "loss": 2.3433, "step": 11705 }, { "epoch": 0.1, "learning_rate": 9.75935358986635e-05, "loss": 2.3721, "step": 11710 }, { "epoch": 0.1, "learning_rate": 9.759147950815959e-05, "loss": 2.4223, "step": 11715 }, { "epoch": 0.1, "learning_rate": 9.758942226109328e-05, "loss": 2.4304, "step": 11720 }, { "epoch": 0.1, "learning_rate": 9.758736415750156e-05, "loss": 2.4273, "step": 11725 }, { "epoch": 0.1, "learning_rate": 9.758530519742148e-05, "loss": 2.3456, "step": 11730 }, { "epoch": 0.1, "learning_rate": 9.75832453808901e-05, "loss": 2.3658, "step": 11735 }, { "epoch": 0.1, "learning_rate": 9.758118470794448e-05, "loss": 2.412, "step": 11740 }, { "epoch": 0.1, "learning_rate": 9.757912317862173e-05, "loss": 2.4181, "step": 11745 }, { "epoch": 0.1, "learning_rate": 9.757706079295894e-05, "loss": 2.3927, "step": 11750 }, { "epoch": 0.1, "learning_rate": 9.757499755099324e-05, "loss": 2.4534, "step": 11755 }, { "epoch": 0.1, "learning_rate": 9.757293345276176e-05, "loss": 2.4218, "step": 11760 }, { "epoch": 0.1, "learning_rate": 9.757086849830165e-05, "loss": 2.3092, "step": 11765 }, { "epoch": 0.1, "learning_rate": 9.756880268765007e-05, "loss": 2.4324, "step": 11770 }, { "epoch": 0.1, "learning_rate": 9.75667360208442e-05, "loss": 2.3982, "step": 11775 }, { "epoch": 0.1, "learning_rate": 9.756466849792125e-05, "loss": 2.3494, "step": 11780 }, { "epoch": 0.1, "learning_rate": 9.756260011891841e-05, "loss": 2.3362, "step": 11785 }, { "epoch": 0.1, "learning_rate": 9.756053088387294e-05, "loss": 2.4208, "step": 11790 }, { "epoch": 0.1, "learning_rate": 9.755846079282205e-05, "loss": 2.4142, "step": 11795 }, { "epoch": 0.1, "learning_rate": 9.7556389845803e-05, "loss": 2.4121, "step": 11800 }, { "epoch": 0.1, "learning_rate": 9.755431804285309e-05, "loss": 2.3244, "step": 11805 }, { "epoch": 0.1, "learning_rate": 9.755224538400958e-05, "loss": 2.3871, "step": 11810 }, { "epoch": 0.1, "learning_rate": 9.755017186930979e-05, "loss": 2.4176, "step": 11815 }, { "epoch": 0.1, "learning_rate": 9.754809749879106e-05, "loss": 2.3084, "step": 11820 }, { "epoch": 0.1, "learning_rate": 9.754602227249067e-05, "loss": 2.5251, "step": 11825 }, { "epoch": 0.1, "learning_rate": 9.754394619044602e-05, "loss": 2.3651, "step": 11830 }, { "epoch": 0.1, "learning_rate": 9.754186925269445e-05, "loss": 2.4608, "step": 11835 }, { "epoch": 0.1, "learning_rate": 9.753979145927334e-05, "loss": 2.3764, "step": 11840 }, { "epoch": 0.1, "learning_rate": 9.753771281022012e-05, "loss": 2.4069, "step": 11845 }, { "epoch": 0.1, "learning_rate": 9.753563330557216e-05, "loss": 2.4254, "step": 11850 }, { "epoch": 0.1, "learning_rate": 9.753355294536692e-05, "loss": 2.4702, "step": 11855 }, { "epoch": 0.1, "learning_rate": 9.753147172964181e-05, "loss": 2.4659, "step": 11860 }, { "epoch": 0.1, "learning_rate": 9.752938965843431e-05, "loss": 2.3413, "step": 11865 }, { "epoch": 0.1, "learning_rate": 9.75273067317819e-05, "loss": 2.3398, "step": 11870 }, { "epoch": 0.1, "learning_rate": 9.752522294972204e-05, "loss": 2.3833, "step": 11875 }, { "epoch": 0.1, "learning_rate": 9.752313831229228e-05, "loss": 2.4105, "step": 11880 }, { "epoch": 0.1, "learning_rate": 9.752105281953008e-05, "loss": 2.3763, "step": 11885 }, { "epoch": 0.1, "learning_rate": 9.751896647147303e-05, "loss": 2.3566, "step": 11890 }, { "epoch": 0.1, "learning_rate": 9.751687926815865e-05, "loss": 2.4784, "step": 11895 }, { "epoch": 0.1, "learning_rate": 9.751479120962453e-05, "loss": 2.3438, "step": 11900 }, { "epoch": 0.1, "learning_rate": 9.75127022959082e-05, "loss": 2.4113, "step": 11905 }, { "epoch": 0.1, "learning_rate": 9.751061252704733e-05, "loss": 2.4566, "step": 11910 }, { "epoch": 0.1, "learning_rate": 9.750852190307949e-05, "loss": 2.4216, "step": 11915 }, { "epoch": 0.1, "learning_rate": 9.75064304240423e-05, "loss": 2.3612, "step": 11920 }, { "epoch": 0.1, "learning_rate": 9.750433808997341e-05, "loss": 2.374, "step": 11925 }, { "epoch": 0.1, "learning_rate": 9.75022449009105e-05, "loss": 2.3836, "step": 11930 }, { "epoch": 0.1, "learning_rate": 9.750015085689121e-05, "loss": 2.4607, "step": 11935 }, { "epoch": 0.1, "learning_rate": 9.749805595795326e-05, "loss": 2.3857, "step": 11940 }, { "epoch": 0.1, "learning_rate": 9.749596020413434e-05, "loss": 2.3922, "step": 11945 }, { "epoch": 0.1, "learning_rate": 9.749386359547216e-05, "loss": 2.4611, "step": 11950 }, { "epoch": 0.1, "learning_rate": 9.749176613200448e-05, "loss": 2.3247, "step": 11955 }, { "epoch": 0.1, "learning_rate": 9.748966781376902e-05, "loss": 2.3905, "step": 11960 }, { "epoch": 0.1, "learning_rate": 9.748756864080358e-05, "loss": 2.4254, "step": 11965 }, { "epoch": 0.1, "learning_rate": 9.748546861314592e-05, "loss": 2.376, "step": 11970 }, { "epoch": 0.1, "learning_rate": 9.748336773083382e-05, "loss": 2.3367, "step": 11975 }, { "epoch": 0.1, "learning_rate": 9.748126599390514e-05, "loss": 2.3905, "step": 11980 }, { "epoch": 0.1, "learning_rate": 9.747916340239767e-05, "loss": 2.3988, "step": 11985 }, { "epoch": 0.1, "learning_rate": 9.747705995634925e-05, "loss": 2.4157, "step": 11990 }, { "epoch": 0.1, "learning_rate": 9.747495565579776e-05, "loss": 2.3097, "step": 11995 }, { "epoch": 0.1, "learning_rate": 9.747285050078108e-05, "loss": 2.3666, "step": 12000 }, { "epoch": 0.1, "learning_rate": 9.747074449133707e-05, "loss": 2.37, "step": 12005 }, { "epoch": 0.1, "learning_rate": 9.746863762750366e-05, "loss": 2.4268, "step": 12010 }, { "epoch": 0.1, "learning_rate": 9.746652990931875e-05, "loss": 2.4022, "step": 12015 }, { "epoch": 0.1, "learning_rate": 9.746442133682028e-05, "loss": 2.3044, "step": 12020 }, { "epoch": 0.1, "learning_rate": 9.746231191004621e-05, "loss": 2.4147, "step": 12025 }, { "epoch": 0.1, "learning_rate": 9.746020162903449e-05, "loss": 2.3337, "step": 12030 }, { "epoch": 0.1, "learning_rate": 9.745809049382313e-05, "loss": 2.4957, "step": 12035 }, { "epoch": 0.1, "learning_rate": 9.74559785044501e-05, "loss": 2.4158, "step": 12040 }, { "epoch": 0.1, "learning_rate": 9.745386566095342e-05, "loss": 2.4642, "step": 12045 }, { "epoch": 0.1, "learning_rate": 9.745175196337111e-05, "loss": 2.3692, "step": 12050 }, { "epoch": 0.1, "learning_rate": 9.744963741174124e-05, "loss": 2.3491, "step": 12055 }, { "epoch": 0.1, "learning_rate": 9.744752200610183e-05, "loss": 2.4183, "step": 12060 }, { "epoch": 0.1, "learning_rate": 9.7445405746491e-05, "loss": 2.3643, "step": 12065 }, { "epoch": 0.1, "learning_rate": 9.744328863294679e-05, "loss": 2.4393, "step": 12070 }, { "epoch": 0.1, "learning_rate": 9.744117066550731e-05, "loss": 2.4171, "step": 12075 }, { "epoch": 0.1, "learning_rate": 9.743905184421071e-05, "loss": 2.4852, "step": 12080 }, { "epoch": 0.1, "learning_rate": 9.743693216909512e-05, "loss": 2.4567, "step": 12085 }, { "epoch": 0.1, "learning_rate": 9.743481164019867e-05, "loss": 2.4456, "step": 12090 }, { "epoch": 0.1, "learning_rate": 9.743269025755955e-05, "loss": 2.387, "step": 12095 }, { "epoch": 0.1, "learning_rate": 9.743056802121591e-05, "loss": 2.385, "step": 12100 }, { "epoch": 0.1, "learning_rate": 9.742844493120598e-05, "loss": 2.3585, "step": 12105 }, { "epoch": 0.1, "learning_rate": 9.742632098756795e-05, "loss": 2.4183, "step": 12110 }, { "epoch": 0.1, "learning_rate": 9.742419619034005e-05, "loss": 2.3099, "step": 12115 }, { "epoch": 0.1, "learning_rate": 9.742207053956051e-05, "loss": 2.4335, "step": 12120 }, { "epoch": 0.1, "learning_rate": 9.741994403526764e-05, "loss": 2.3698, "step": 12125 }, { "epoch": 0.1, "learning_rate": 9.741781667749965e-05, "loss": 2.4408, "step": 12130 }, { "epoch": 0.1, "learning_rate": 9.741568846629487e-05, "loss": 2.3609, "step": 12135 }, { "epoch": 0.1, "learning_rate": 9.741355940169158e-05, "loss": 2.4496, "step": 12140 }, { "epoch": 0.1, "learning_rate": 9.741142948372812e-05, "loss": 2.457, "step": 12145 }, { "epoch": 0.1, "learning_rate": 9.74092987124428e-05, "loss": 2.345, "step": 12150 }, { "epoch": 0.1, "learning_rate": 9.740716708787398e-05, "loss": 2.3633, "step": 12155 }, { "epoch": 0.1, "learning_rate": 9.740503461006005e-05, "loss": 2.3681, "step": 12160 }, { "epoch": 0.1, "learning_rate": 9.740290127903937e-05, "loss": 2.3925, "step": 12165 }, { "epoch": 0.1, "learning_rate": 9.740076709485032e-05, "loss": 2.4228, "step": 12170 }, { "epoch": 0.1, "learning_rate": 9.739863205753133e-05, "loss": 2.3644, "step": 12175 }, { "epoch": 0.1, "learning_rate": 9.739649616712084e-05, "loss": 2.3573, "step": 12180 }, { "epoch": 0.1, "learning_rate": 9.739435942365727e-05, "loss": 2.4031, "step": 12185 }, { "epoch": 0.1, "learning_rate": 9.739222182717908e-05, "loss": 2.4066, "step": 12190 }, { "epoch": 0.1, "learning_rate": 9.739008337772476e-05, "loss": 2.3723, "step": 12195 }, { "epoch": 0.1, "learning_rate": 9.738794407533277e-05, "loss": 2.4568, "step": 12200 }, { "epoch": 0.1, "learning_rate": 9.738580392004164e-05, "loss": 2.3778, "step": 12205 }, { "epoch": 0.1, "learning_rate": 9.738366291188988e-05, "loss": 2.4806, "step": 12210 }, { "epoch": 0.1, "learning_rate": 9.738152105091602e-05, "loss": 2.4423, "step": 12215 }, { "epoch": 0.1, "learning_rate": 9.73793783371586e-05, "loss": 2.4579, "step": 12220 }, { "epoch": 0.1, "learning_rate": 9.737723477065622e-05, "loss": 2.3059, "step": 12225 }, { "epoch": 0.1, "learning_rate": 9.737509035144743e-05, "loss": 2.4032, "step": 12230 }, { "epoch": 0.1, "learning_rate": 9.737294507957082e-05, "loss": 2.3742, "step": 12235 }, { "epoch": 0.1, "learning_rate": 9.737079895506504e-05, "loss": 2.4314, "step": 12240 }, { "epoch": 0.1, "learning_rate": 9.736865197796868e-05, "loss": 2.417, "step": 12245 }, { "epoch": 0.1, "learning_rate": 9.736650414832038e-05, "loss": 2.3065, "step": 12250 }, { "epoch": 0.1, "learning_rate": 9.736435546615883e-05, "loss": 2.4428, "step": 12255 }, { "epoch": 0.1, "learning_rate": 9.736220593152268e-05, "loss": 2.3929, "step": 12260 }, { "epoch": 0.1, "learning_rate": 9.73600555444506e-05, "loss": 2.3698, "step": 12265 }, { "epoch": 0.1, "learning_rate": 9.735790430498136e-05, "loss": 2.3885, "step": 12270 }, { "epoch": 0.1, "learning_rate": 9.735575221315359e-05, "loss": 2.3887, "step": 12275 }, { "epoch": 0.1, "learning_rate": 9.735359926900608e-05, "loss": 2.3235, "step": 12280 }, { "epoch": 0.1, "learning_rate": 9.735144547257756e-05, "loss": 2.3873, "step": 12285 }, { "epoch": 0.1, "learning_rate": 9.73492908239068e-05, "loss": 2.4203, "step": 12290 }, { "epoch": 0.1, "learning_rate": 9.73471353230326e-05, "loss": 2.4234, "step": 12295 }, { "epoch": 0.1, "learning_rate": 9.734497896999372e-05, "loss": 2.3851, "step": 12300 }, { "epoch": 0.11, "learning_rate": 9.734282176482899e-05, "loss": 2.3548, "step": 12305 }, { "epoch": 0.11, "learning_rate": 9.734066370757722e-05, "loss": 2.4025, "step": 12310 }, { "epoch": 0.11, "learning_rate": 9.733850479827726e-05, "loss": 2.3913, "step": 12315 }, { "epoch": 0.11, "learning_rate": 9.7336345036968e-05, "loss": 2.349, "step": 12320 }, { "epoch": 0.11, "learning_rate": 9.733418442368825e-05, "loss": 2.4557, "step": 12325 }, { "epoch": 0.11, "learning_rate": 9.733202295847694e-05, "loss": 2.3597, "step": 12330 }, { "epoch": 0.11, "learning_rate": 9.732986064137296e-05, "loss": 2.3532, "step": 12335 }, { "epoch": 0.11, "learning_rate": 9.732769747241523e-05, "loss": 2.4773, "step": 12340 }, { "epoch": 0.11, "learning_rate": 9.732553345164268e-05, "loss": 2.3751, "step": 12345 }, { "epoch": 0.11, "learning_rate": 9.732336857909426e-05, "loss": 2.3412, "step": 12350 }, { "epoch": 0.11, "learning_rate": 9.732120285480894e-05, "loss": 2.3829, "step": 12355 }, { "epoch": 0.11, "learning_rate": 9.73190362788257e-05, "loss": 2.3424, "step": 12360 }, { "epoch": 0.11, "learning_rate": 9.731686885118352e-05, "loss": 2.303, "step": 12365 }, { "epoch": 0.11, "learning_rate": 9.731470057192141e-05, "loss": 2.3958, "step": 12370 }, { "epoch": 0.11, "learning_rate": 9.731253144107842e-05, "loss": 2.4041, "step": 12375 }, { "epoch": 0.11, "learning_rate": 9.731036145869354e-05, "loss": 2.3636, "step": 12380 }, { "epoch": 0.11, "learning_rate": 9.73081906248059e-05, "loss": 2.4057, "step": 12385 }, { "epoch": 0.11, "learning_rate": 9.73060189394545e-05, "loss": 2.3695, "step": 12390 }, { "epoch": 0.11, "learning_rate": 9.730384640267848e-05, "loss": 2.4641, "step": 12395 }, { "epoch": 0.11, "learning_rate": 9.730167301451691e-05, "loss": 2.4147, "step": 12400 }, { "epoch": 0.11, "learning_rate": 9.729949877500893e-05, "loss": 2.3165, "step": 12405 }, { "epoch": 0.11, "learning_rate": 9.729732368419363e-05, "loss": 2.3203, "step": 12410 }, { "epoch": 0.11, "learning_rate": 9.729514774211021e-05, "loss": 2.3699, "step": 12415 }, { "epoch": 0.11, "learning_rate": 9.729297094879779e-05, "loss": 2.4553, "step": 12420 }, { "epoch": 0.11, "learning_rate": 9.729079330429558e-05, "loss": 2.4315, "step": 12425 }, { "epoch": 0.11, "learning_rate": 9.728861480864278e-05, "loss": 2.3911, "step": 12430 }, { "epoch": 0.11, "learning_rate": 9.728643546187854e-05, "loss": 2.4099, "step": 12435 }, { "epoch": 0.11, "learning_rate": 9.728425526404216e-05, "loss": 2.4155, "step": 12440 }, { "epoch": 0.11, "learning_rate": 9.728207421517283e-05, "loss": 2.3899, "step": 12445 }, { "epoch": 0.11, "learning_rate": 9.727989231530983e-05, "loss": 2.4041, "step": 12450 }, { "epoch": 0.11, "learning_rate": 9.72777095644924e-05, "loss": 2.3881, "step": 12455 }, { "epoch": 0.11, "learning_rate": 9.727552596275986e-05, "loss": 2.3785, "step": 12460 }, { "epoch": 0.11, "learning_rate": 9.72733415101515e-05, "loss": 2.3872, "step": 12465 }, { "epoch": 0.11, "learning_rate": 9.727115620670664e-05, "loss": 2.4697, "step": 12470 }, { "epoch": 0.11, "learning_rate": 9.726897005246457e-05, "loss": 2.4176, "step": 12475 }, { "epoch": 0.11, "learning_rate": 9.72667830474647e-05, "loss": 2.3807, "step": 12480 }, { "epoch": 0.11, "learning_rate": 9.726459519174638e-05, "loss": 2.3613, "step": 12485 }, { "epoch": 0.11, "learning_rate": 9.726240648534894e-05, "loss": 2.4011, "step": 12490 }, { "epoch": 0.11, "learning_rate": 9.726021692831182e-05, "loss": 2.3627, "step": 12495 }, { "epoch": 0.11, "learning_rate": 9.725802652067439e-05, "loss": 2.4674, "step": 12500 }, { "epoch": 0.11, "learning_rate": 9.725583526247613e-05, "loss": 2.362, "step": 12505 }, { "epoch": 0.11, "learning_rate": 9.725364315375642e-05, "loss": 2.4027, "step": 12510 }, { "epoch": 0.11, "learning_rate": 9.725145019455475e-05, "loss": 2.4636, "step": 12515 }, { "epoch": 0.11, "learning_rate": 9.724925638491058e-05, "loss": 2.3447, "step": 12520 }, { "epoch": 0.11, "learning_rate": 9.724706172486339e-05, "loss": 2.3953, "step": 12525 }, { "epoch": 0.11, "learning_rate": 9.724486621445268e-05, "loss": 2.3608, "step": 12530 }, { "epoch": 0.11, "learning_rate": 9.724266985371797e-05, "loss": 2.4119, "step": 12535 }, { "epoch": 0.11, "learning_rate": 9.724047264269878e-05, "loss": 2.4032, "step": 12540 }, { "epoch": 0.11, "learning_rate": 9.723827458143468e-05, "loss": 2.4141, "step": 12545 }, { "epoch": 0.11, "learning_rate": 9.72360756699652e-05, "loss": 2.345, "step": 12550 }, { "epoch": 0.11, "learning_rate": 9.723387590832995e-05, "loss": 2.3297, "step": 12555 }, { "epoch": 0.11, "learning_rate": 9.723167529656849e-05, "loss": 2.3845, "step": 12560 }, { "epoch": 0.11, "learning_rate": 9.722947383472046e-05, "loss": 2.3617, "step": 12565 }, { "epoch": 0.11, "learning_rate": 9.722727152282543e-05, "loss": 2.4069, "step": 12570 }, { "epoch": 0.11, "learning_rate": 9.72250683609231e-05, "loss": 2.4428, "step": 12575 }, { "epoch": 0.11, "learning_rate": 9.722286434905308e-05, "loss": 2.4636, "step": 12580 }, { "epoch": 0.11, "learning_rate": 9.722065948725506e-05, "loss": 2.3899, "step": 12585 }, { "epoch": 0.11, "learning_rate": 9.721845377556872e-05, "loss": 2.3603, "step": 12590 }, { "epoch": 0.11, "learning_rate": 9.721624721403375e-05, "loss": 2.3351, "step": 12595 }, { "epoch": 0.11, "learning_rate": 9.721403980268987e-05, "loss": 2.4005, "step": 12600 }, { "epoch": 0.11, "learning_rate": 9.721183154157681e-05, "loss": 2.3725, "step": 12605 }, { "epoch": 0.11, "learning_rate": 9.72096224307343e-05, "loss": 2.3765, "step": 12610 }, { "epoch": 0.11, "learning_rate": 9.720741247020212e-05, "loss": 2.4806, "step": 12615 }, { "epoch": 0.11, "learning_rate": 9.720520166002006e-05, "loss": 2.3782, "step": 12620 }, { "epoch": 0.11, "learning_rate": 9.720299000022788e-05, "loss": 2.2709, "step": 12625 }, { "epoch": 0.11, "learning_rate": 9.72007774908654e-05, "loss": 2.4895, "step": 12630 }, { "epoch": 0.11, "learning_rate": 9.719856413197242e-05, "loss": 2.4197, "step": 12635 }, { "epoch": 0.11, "learning_rate": 9.71963499235888e-05, "loss": 2.4509, "step": 12640 }, { "epoch": 0.11, "learning_rate": 9.719413486575439e-05, "loss": 2.4317, "step": 12645 }, { "epoch": 0.11, "learning_rate": 9.719191895850906e-05, "loss": 2.4535, "step": 12650 }, { "epoch": 0.11, "learning_rate": 9.718970220189267e-05, "loss": 2.4426, "step": 12655 }, { "epoch": 0.11, "learning_rate": 9.718748459594513e-05, "loss": 2.4004, "step": 12660 }, { "epoch": 0.11, "learning_rate": 9.718526614070638e-05, "loss": 2.4372, "step": 12665 }, { "epoch": 0.11, "learning_rate": 9.718304683621631e-05, "loss": 2.3506, "step": 12670 }, { "epoch": 0.11, "learning_rate": 9.718082668251487e-05, "loss": 2.4017, "step": 12675 }, { "epoch": 0.11, "learning_rate": 9.717860567964203e-05, "loss": 2.3921, "step": 12680 }, { "epoch": 0.11, "learning_rate": 9.717638382763776e-05, "loss": 2.378, "step": 12685 }, { "epoch": 0.11, "learning_rate": 9.717416112654206e-05, "loss": 2.4554, "step": 12690 }, { "epoch": 0.11, "learning_rate": 9.717193757639491e-05, "loss": 2.382, "step": 12695 }, { "epoch": 0.11, "learning_rate": 9.716971317723636e-05, "loss": 2.359, "step": 12700 }, { "epoch": 0.11, "learning_rate": 9.716748792910642e-05, "loss": 2.3446, "step": 12705 }, { "epoch": 0.11, "learning_rate": 9.716526183204515e-05, "loss": 2.4019, "step": 12710 }, { "epoch": 0.11, "learning_rate": 9.716303488609262e-05, "loss": 2.394, "step": 12715 }, { "epoch": 0.11, "learning_rate": 9.716080709128891e-05, "loss": 2.3994, "step": 12720 }, { "epoch": 0.11, "learning_rate": 9.715857844767411e-05, "loss": 2.3943, "step": 12725 }, { "epoch": 0.11, "learning_rate": 9.715634895528833e-05, "loss": 2.4286, "step": 12730 }, { "epoch": 0.11, "learning_rate": 9.715411861417172e-05, "loss": 2.3686, "step": 12735 }, { "epoch": 0.11, "learning_rate": 9.715188742436439e-05, "loss": 2.3599, "step": 12740 }, { "epoch": 0.11, "learning_rate": 9.71496553859065e-05, "loss": 2.3802, "step": 12745 }, { "epoch": 0.11, "learning_rate": 9.714742249883825e-05, "loss": 2.3721, "step": 12750 }, { "epoch": 0.11, "learning_rate": 9.714518876319982e-05, "loss": 2.4534, "step": 12755 }, { "epoch": 0.11, "learning_rate": 9.714295417903139e-05, "loss": 2.3353, "step": 12760 }, { "epoch": 0.11, "learning_rate": 9.71407187463732e-05, "loss": 2.3345, "step": 12765 }, { "epoch": 0.11, "learning_rate": 9.71384824652655e-05, "loss": 2.3627, "step": 12770 }, { "epoch": 0.11, "learning_rate": 9.713624533574847e-05, "loss": 2.4245, "step": 12775 }, { "epoch": 0.11, "learning_rate": 9.713400735786247e-05, "loss": 2.4298, "step": 12780 }, { "epoch": 0.11, "learning_rate": 9.713176853164769e-05, "loss": 2.4287, "step": 12785 }, { "epoch": 0.11, "learning_rate": 9.71295288571445e-05, "loss": 2.4013, "step": 12790 }, { "epoch": 0.11, "learning_rate": 9.712728833439317e-05, "loss": 2.5279, "step": 12795 }, { "epoch": 0.11, "learning_rate": 9.712504696343401e-05, "loss": 2.3606, "step": 12800 }, { "epoch": 0.11, "learning_rate": 9.71228047443074e-05, "loss": 2.3308, "step": 12805 }, { "epoch": 0.11, "learning_rate": 9.712056167705368e-05, "loss": 2.3041, "step": 12810 }, { "epoch": 0.11, "learning_rate": 9.711831776171322e-05, "loss": 2.3993, "step": 12815 }, { "epoch": 0.11, "learning_rate": 9.71160729983264e-05, "loss": 2.339, "step": 12820 }, { "epoch": 0.11, "learning_rate": 9.711382738693363e-05, "loss": 2.3592, "step": 12825 }, { "epoch": 0.11, "learning_rate": 9.711158092757533e-05, "loss": 2.3283, "step": 12830 }, { "epoch": 0.11, "learning_rate": 9.710933362029192e-05, "loss": 2.3224, "step": 12835 }, { "epoch": 0.11, "learning_rate": 9.710708546512386e-05, "loss": 2.4141, "step": 12840 }, { "epoch": 0.11, "learning_rate": 9.710483646211161e-05, "loss": 2.5345, "step": 12845 }, { "epoch": 0.11, "learning_rate": 9.710258661129564e-05, "loss": 2.3791, "step": 12850 }, { "epoch": 0.11, "learning_rate": 9.710033591271645e-05, "loss": 2.3709, "step": 12855 }, { "epoch": 0.11, "learning_rate": 9.709808436641454e-05, "loss": 2.3314, "step": 12860 }, { "epoch": 0.11, "learning_rate": 9.709583197243046e-05, "loss": 2.3404, "step": 12865 }, { "epoch": 0.11, "learning_rate": 9.709357873080472e-05, "loss": 2.3735, "step": 12870 }, { "epoch": 0.11, "learning_rate": 9.709132464157788e-05, "loss": 2.4031, "step": 12875 }, { "epoch": 0.11, "learning_rate": 9.708906970479053e-05, "loss": 2.376, "step": 12880 }, { "epoch": 0.11, "learning_rate": 9.708681392048323e-05, "loss": 2.3494, "step": 12885 }, { "epoch": 0.11, "learning_rate": 9.708455728869659e-05, "loss": 2.4084, "step": 12890 }, { "epoch": 0.11, "learning_rate": 9.708229980947124e-05, "loss": 2.3907, "step": 12895 }, { "epoch": 0.11, "learning_rate": 9.708004148284777e-05, "loss": 2.3711, "step": 12900 }, { "epoch": 0.11, "learning_rate": 9.707778230886686e-05, "loss": 2.3636, "step": 12905 }, { "epoch": 0.11, "learning_rate": 9.707552228756918e-05, "loss": 2.3953, "step": 12910 }, { "epoch": 0.11, "learning_rate": 9.707326141899538e-05, "loss": 2.4558, "step": 12915 }, { "epoch": 0.11, "learning_rate": 9.707099970318615e-05, "loss": 2.3817, "step": 12920 }, { "epoch": 0.11, "learning_rate": 9.706873714018221e-05, "loss": 2.3614, "step": 12925 }, { "epoch": 0.11, "learning_rate": 9.706647373002429e-05, "loss": 2.4449, "step": 12930 }, { "epoch": 0.11, "learning_rate": 9.706420947275311e-05, "loss": 2.3176, "step": 12935 }, { "epoch": 0.11, "learning_rate": 9.706194436840943e-05, "loss": 2.3755, "step": 12940 }, { "epoch": 0.11, "learning_rate": 9.705967841703402e-05, "loss": 2.47, "step": 12945 }, { "epoch": 0.11, "learning_rate": 9.705741161866766e-05, "loss": 2.4536, "step": 12950 }, { "epoch": 0.11, "learning_rate": 9.705514397335116e-05, "loss": 2.3099, "step": 12955 }, { "epoch": 0.11, "learning_rate": 9.70528754811253e-05, "loss": 2.3952, "step": 12960 }, { "epoch": 0.11, "learning_rate": 9.705060614203094e-05, "loss": 2.34, "step": 12965 }, { "epoch": 0.11, "learning_rate": 9.704833595610893e-05, "loss": 2.3902, "step": 12970 }, { "epoch": 0.11, "learning_rate": 9.70460649234001e-05, "loss": 2.435, "step": 12975 }, { "epoch": 0.11, "learning_rate": 9.704379304394536e-05, "loss": 2.4075, "step": 12980 }, { "epoch": 0.11, "learning_rate": 9.704152031778556e-05, "loss": 2.3924, "step": 12985 }, { "epoch": 0.11, "learning_rate": 9.703924674496162e-05, "loss": 2.3442, "step": 12990 }, { "epoch": 0.11, "learning_rate": 9.703697232551448e-05, "loss": 2.4039, "step": 12995 }, { "epoch": 0.11, "learning_rate": 9.703469705948505e-05, "loss": 2.3002, "step": 13000 }, { "epoch": 0.11, "learning_rate": 9.703242094691429e-05, "loss": 2.3294, "step": 13005 }, { "epoch": 0.11, "learning_rate": 9.703014398784318e-05, "loss": 2.4036, "step": 13010 }, { "epoch": 0.11, "learning_rate": 9.702786618231267e-05, "loss": 2.3718, "step": 13015 }, { "epoch": 0.11, "learning_rate": 9.70255875303638e-05, "loss": 2.3609, "step": 13020 }, { "epoch": 0.11, "learning_rate": 9.702330803203754e-05, "loss": 2.3567, "step": 13025 }, { "epoch": 0.11, "learning_rate": 9.702102768737493e-05, "loss": 2.4428, "step": 13030 }, { "epoch": 0.11, "learning_rate": 9.701874649641702e-05, "loss": 2.4034, "step": 13035 }, { "epoch": 0.11, "learning_rate": 9.701646445920487e-05, "loss": 2.4076, "step": 13040 }, { "epoch": 0.11, "learning_rate": 9.701418157577953e-05, "loss": 2.4148, "step": 13045 }, { "epoch": 0.11, "learning_rate": 9.701189784618212e-05, "loss": 2.4045, "step": 13050 }, { "epoch": 0.11, "learning_rate": 9.700961327045371e-05, "loss": 2.4663, "step": 13055 }, { "epoch": 0.11, "learning_rate": 9.700732784863545e-05, "loss": 2.3903, "step": 13060 }, { "epoch": 0.11, "learning_rate": 9.700504158076845e-05, "loss": 2.3434, "step": 13065 }, { "epoch": 0.11, "learning_rate": 9.700275446689386e-05, "loss": 2.2877, "step": 13070 }, { "epoch": 0.11, "learning_rate": 9.700046650705288e-05, "loss": 2.4362, "step": 13075 }, { "epoch": 0.11, "learning_rate": 9.699817770128662e-05, "loss": 2.3402, "step": 13080 }, { "epoch": 0.11, "learning_rate": 9.699588804963635e-05, "loss": 2.4133, "step": 13085 }, { "epoch": 0.11, "learning_rate": 9.699359755214324e-05, "loss": 2.2366, "step": 13090 }, { "epoch": 0.11, "learning_rate": 9.699130620884851e-05, "loss": 2.3601, "step": 13095 }, { "epoch": 0.11, "learning_rate": 9.69890140197934e-05, "loss": 2.3654, "step": 13100 }, { "epoch": 0.11, "learning_rate": 9.69867209850192e-05, "loss": 2.3502, "step": 13105 }, { "epoch": 0.11, "learning_rate": 9.698442710456712e-05, "loss": 2.4216, "step": 13110 }, { "epoch": 0.11, "learning_rate": 9.698213237847851e-05, "loss": 2.389, "step": 13115 }, { "epoch": 0.11, "learning_rate": 9.697983680679463e-05, "loss": 2.4157, "step": 13120 }, { "epoch": 0.11, "learning_rate": 9.697754038955682e-05, "loss": 2.3533, "step": 13125 }, { "epoch": 0.11, "learning_rate": 9.697524312680639e-05, "loss": 2.3535, "step": 13130 }, { "epoch": 0.11, "learning_rate": 9.69729450185847e-05, "loss": 2.397, "step": 13135 }, { "epoch": 0.11, "learning_rate": 9.697064606493311e-05, "loss": 2.4615, "step": 13140 }, { "epoch": 0.11, "learning_rate": 9.696834626589299e-05, "loss": 2.3649, "step": 13145 }, { "epoch": 0.11, "learning_rate": 9.696604562150575e-05, "loss": 2.3741, "step": 13150 }, { "epoch": 0.11, "learning_rate": 9.696374413181277e-05, "loss": 2.3709, "step": 13155 }, { "epoch": 0.11, "learning_rate": 9.69614417968555e-05, "loss": 2.392, "step": 13160 }, { "epoch": 0.11, "learning_rate": 9.695913861667537e-05, "loss": 2.3964, "step": 13165 }, { "epoch": 0.11, "learning_rate": 9.695683459131382e-05, "loss": 2.3741, "step": 13170 }, { "epoch": 0.11, "learning_rate": 9.695452972081232e-05, "loss": 2.4157, "step": 13175 }, { "epoch": 0.11, "learning_rate": 9.695222400521237e-05, "loss": 2.3771, "step": 13180 }, { "epoch": 0.11, "learning_rate": 9.694991744455546e-05, "loss": 2.4221, "step": 13185 }, { "epoch": 0.11, "learning_rate": 9.69476100388831e-05, "loss": 2.4323, "step": 13190 }, { "epoch": 0.11, "learning_rate": 9.694530178823684e-05, "loss": 2.4093, "step": 13195 }, { "epoch": 0.11, "learning_rate": 9.694299269265819e-05, "loss": 2.3435, "step": 13200 }, { "epoch": 0.11, "learning_rate": 9.694068275218873e-05, "loss": 2.4002, "step": 13205 }, { "epoch": 0.11, "learning_rate": 9.693837196687004e-05, "loss": 2.369, "step": 13210 }, { "epoch": 0.11, "learning_rate": 9.69360603367437e-05, "loss": 2.4102, "step": 13215 }, { "epoch": 0.11, "learning_rate": 9.693374786185132e-05, "loss": 2.4214, "step": 13220 }, { "epoch": 0.11, "learning_rate": 9.693143454223451e-05, "loss": 2.3584, "step": 13225 }, { "epoch": 0.11, "learning_rate": 9.692912037793491e-05, "loss": 2.3168, "step": 13230 }, { "epoch": 0.11, "learning_rate": 9.692680536899419e-05, "loss": 2.2905, "step": 13235 }, { "epoch": 0.11, "learning_rate": 9.692448951545399e-05, "loss": 2.3836, "step": 13240 }, { "epoch": 0.11, "learning_rate": 9.692217281735601e-05, "loss": 2.3273, "step": 13245 }, { "epoch": 0.11, "learning_rate": 9.691985527474192e-05, "loss": 2.4513, "step": 13250 }, { "epoch": 0.11, "learning_rate": 9.691753688765347e-05, "loss": 2.367, "step": 13255 }, { "epoch": 0.11, "learning_rate": 9.691521765613236e-05, "loss": 2.3172, "step": 13260 }, { "epoch": 0.11, "learning_rate": 9.691289758022034e-05, "loss": 2.3492, "step": 13265 }, { "epoch": 0.11, "learning_rate": 9.691057665995917e-05, "loss": 2.4216, "step": 13270 }, { "epoch": 0.11, "learning_rate": 9.690825489539062e-05, "loss": 2.4268, "step": 13275 }, { "epoch": 0.11, "learning_rate": 9.690593228655646e-05, "loss": 2.4039, "step": 13280 }, { "epoch": 0.11, "learning_rate": 9.690360883349851e-05, "loss": 2.3982, "step": 13285 }, { "epoch": 0.11, "learning_rate": 9.690128453625861e-05, "loss": 2.362, "step": 13290 }, { "epoch": 0.11, "learning_rate": 9.689895939487856e-05, "loss": 2.4762, "step": 13295 }, { "epoch": 0.11, "learning_rate": 9.689663340940021e-05, "loss": 2.4168, "step": 13300 }, { "epoch": 0.11, "learning_rate": 9.689430657986543e-05, "loss": 2.448, "step": 13305 }, { "epoch": 0.11, "learning_rate": 9.689197890631612e-05, "loss": 2.4354, "step": 13310 }, { "epoch": 0.11, "learning_rate": 9.688965038879415e-05, "loss": 2.3881, "step": 13315 }, { "epoch": 0.11, "learning_rate": 9.688732102734141e-05, "loss": 2.4043, "step": 13320 }, { "epoch": 0.11, "learning_rate": 9.688499082199988e-05, "loss": 2.4083, "step": 13325 }, { "epoch": 0.11, "learning_rate": 9.688265977281146e-05, "loss": 2.4126, "step": 13330 }, { "epoch": 0.11, "learning_rate": 9.688032787981811e-05, "loss": 2.4186, "step": 13335 }, { "epoch": 0.11, "learning_rate": 9.68779951430618e-05, "loss": 2.3535, "step": 13340 }, { "epoch": 0.11, "learning_rate": 9.687566156258452e-05, "loss": 2.2934, "step": 13345 }, { "epoch": 0.11, "learning_rate": 9.687332713842828e-05, "loss": 2.3584, "step": 13350 }, { "epoch": 0.11, "learning_rate": 9.687099187063506e-05, "loss": 2.3461, "step": 13355 }, { "epoch": 0.11, "learning_rate": 9.686865575924693e-05, "loss": 2.3769, "step": 13360 }, { "epoch": 0.11, "learning_rate": 9.686631880430592e-05, "loss": 2.382, "step": 13365 }, { "epoch": 0.11, "learning_rate": 9.68639810058541e-05, "loss": 2.3237, "step": 13370 }, { "epoch": 0.11, "learning_rate": 9.686164236393352e-05, "loss": 2.3217, "step": 13375 }, { "epoch": 0.11, "learning_rate": 9.685930287858631e-05, "loss": 2.3239, "step": 13380 }, { "epoch": 0.11, "learning_rate": 9.685696254985454e-05, "loss": 2.4253, "step": 13385 }, { "epoch": 0.11, "learning_rate": 9.685462137778036e-05, "loss": 2.3039, "step": 13390 }, { "epoch": 0.11, "learning_rate": 9.685227936240589e-05, "loss": 2.4572, "step": 13395 }, { "epoch": 0.11, "learning_rate": 9.684993650377327e-05, "loss": 2.3893, "step": 13400 }, { "epoch": 0.11, "learning_rate": 9.68475928019247e-05, "loss": 2.3507, "step": 13405 }, { "epoch": 0.11, "learning_rate": 9.684524825690235e-05, "loss": 2.4037, "step": 13410 }, { "epoch": 0.11, "learning_rate": 9.684290286874843e-05, "loss": 2.4053, "step": 13415 }, { "epoch": 0.11, "learning_rate": 9.684055663750509e-05, "loss": 2.4483, "step": 13420 }, { "epoch": 0.11, "learning_rate": 9.683820956321464e-05, "loss": 2.3256, "step": 13425 }, { "epoch": 0.11, "learning_rate": 9.683586164591928e-05, "loss": 2.3384, "step": 13430 }, { "epoch": 0.11, "learning_rate": 9.683351288566128e-05, "loss": 2.4, "step": 13435 }, { "epoch": 0.11, "learning_rate": 9.683116328248291e-05, "loss": 2.5051, "step": 13440 }, { "epoch": 0.11, "learning_rate": 9.682881283642645e-05, "loss": 2.3355, "step": 13445 }, { "epoch": 0.11, "learning_rate": 9.682646154753423e-05, "loss": 2.3164, "step": 13450 }, { "epoch": 0.11, "learning_rate": 9.682410941584854e-05, "loss": 2.4507, "step": 13455 }, { "epoch": 0.11, "learning_rate": 9.682175644141172e-05, "loss": 2.3665, "step": 13460 }, { "epoch": 0.11, "learning_rate": 9.681940262426614e-05, "loss": 2.4426, "step": 13465 }, { "epoch": 0.11, "learning_rate": 9.681704796445415e-05, "loss": 2.3763, "step": 13470 }, { "epoch": 0.11, "learning_rate": 9.68146924620181e-05, "loss": 2.393, "step": 13475 }, { "epoch": 0.12, "learning_rate": 9.681233611700045e-05, "loss": 2.4174, "step": 13480 }, { "epoch": 0.12, "learning_rate": 9.680997892944357e-05, "loss": 2.3353, "step": 13485 }, { "epoch": 0.12, "learning_rate": 9.680762089938987e-05, "loss": 2.3722, "step": 13490 }, { "epoch": 0.12, "learning_rate": 9.680526202688183e-05, "loss": 2.3462, "step": 13495 }, { "epoch": 0.12, "learning_rate": 9.680290231196187e-05, "loss": 2.3165, "step": 13500 }, { "epoch": 0.12, "learning_rate": 9.680054175467248e-05, "loss": 2.3824, "step": 13505 }, { "epoch": 0.12, "learning_rate": 9.679818035505614e-05, "loss": 2.4258, "step": 13510 }, { "epoch": 0.12, "learning_rate": 9.679581811315537e-05, "loss": 2.3674, "step": 13515 }, { "epoch": 0.12, "learning_rate": 9.679345502901267e-05, "loss": 2.3361, "step": 13520 }, { "epoch": 0.12, "learning_rate": 9.679109110267055e-05, "loss": 2.3273, "step": 13525 }, { "epoch": 0.12, "learning_rate": 9.678872633417158e-05, "loss": 2.3746, "step": 13530 }, { "epoch": 0.12, "learning_rate": 9.678636072355833e-05, "loss": 2.4009, "step": 13535 }, { "epoch": 0.12, "learning_rate": 9.678399427087337e-05, "loss": 2.3958, "step": 13540 }, { "epoch": 0.12, "learning_rate": 9.678162697615928e-05, "loss": 2.4178, "step": 13545 }, { "epoch": 0.12, "learning_rate": 9.677925883945866e-05, "loss": 2.3478, "step": 13550 }, { "epoch": 0.12, "learning_rate": 9.677688986081417e-05, "loss": 2.3331, "step": 13555 }, { "epoch": 0.12, "learning_rate": 9.677452004026841e-05, "loss": 2.4411, "step": 13560 }, { "epoch": 0.12, "learning_rate": 9.677214937786407e-05, "loss": 2.3642, "step": 13565 }, { "epoch": 0.12, "learning_rate": 9.676977787364376e-05, "loss": 2.4223, "step": 13570 }, { "epoch": 0.12, "learning_rate": 9.676740552765023e-05, "loss": 2.4002, "step": 13575 }, { "epoch": 0.12, "learning_rate": 9.676503233992613e-05, "loss": 2.396, "step": 13580 }, { "epoch": 0.12, "learning_rate": 9.676265831051418e-05, "loss": 2.4062, "step": 13585 }, { "epoch": 0.12, "learning_rate": 9.676028343945713e-05, "loss": 2.3738, "step": 13590 }, { "epoch": 0.12, "learning_rate": 9.675790772679771e-05, "loss": 2.3977, "step": 13595 }, { "epoch": 0.12, "learning_rate": 9.675553117257868e-05, "loss": 2.3108, "step": 13600 }, { "epoch": 0.12, "learning_rate": 9.675315377684282e-05, "loss": 2.3736, "step": 13605 }, { "epoch": 0.12, "learning_rate": 9.67507755396329e-05, "loss": 2.3877, "step": 13610 }, { "epoch": 0.12, "learning_rate": 9.674839646099174e-05, "loss": 2.298, "step": 13615 }, { "epoch": 0.12, "learning_rate": 9.674601654096216e-05, "loss": 2.4301, "step": 13620 }, { "epoch": 0.12, "learning_rate": 9.674363577958698e-05, "loss": 2.4358, "step": 13625 }, { "epoch": 0.12, "learning_rate": 9.674125417690905e-05, "loss": 2.3642, "step": 13630 }, { "epoch": 0.12, "learning_rate": 9.673887173297127e-05, "loss": 2.297, "step": 13635 }, { "epoch": 0.12, "learning_rate": 9.673648844781647e-05, "loss": 2.4752, "step": 13640 }, { "epoch": 0.12, "learning_rate": 9.673410432148759e-05, "loss": 2.3753, "step": 13645 }, { "epoch": 0.12, "learning_rate": 9.673171935402751e-05, "loss": 2.2977, "step": 13650 }, { "epoch": 0.12, "learning_rate": 9.672933354547915e-05, "loss": 2.3783, "step": 13655 }, { "epoch": 0.12, "learning_rate": 9.672694689588548e-05, "loss": 2.3669, "step": 13660 }, { "epoch": 0.12, "learning_rate": 9.672455940528944e-05, "loss": 2.4619, "step": 13665 }, { "epoch": 0.12, "learning_rate": 9.6722171073734e-05, "loss": 2.3961, "step": 13670 }, { "epoch": 0.12, "learning_rate": 9.671978190126213e-05, "loss": 2.3946, "step": 13675 }, { "epoch": 0.12, "learning_rate": 9.671739188791687e-05, "loss": 2.3791, "step": 13680 }, { "epoch": 0.12, "learning_rate": 9.671500103374119e-05, "loss": 2.42, "step": 13685 }, { "epoch": 0.12, "learning_rate": 9.671260933877814e-05, "loss": 2.3223, "step": 13690 }, { "epoch": 0.12, "learning_rate": 9.671021680307079e-05, "loss": 2.3477, "step": 13695 }, { "epoch": 0.12, "learning_rate": 9.670782342666218e-05, "loss": 2.4114, "step": 13700 }, { "epoch": 0.12, "learning_rate": 9.67054292095954e-05, "loss": 2.3439, "step": 13705 }, { "epoch": 0.12, "learning_rate": 9.67030341519135e-05, "loss": 2.3816, "step": 13710 }, { "epoch": 0.12, "learning_rate": 9.670063825365963e-05, "loss": 2.4725, "step": 13715 }, { "epoch": 0.12, "learning_rate": 9.66982415148769e-05, "loss": 2.3729, "step": 13720 }, { "epoch": 0.12, "learning_rate": 9.669584393560844e-05, "loss": 2.3956, "step": 13725 }, { "epoch": 0.12, "learning_rate": 9.669344551589743e-05, "loss": 2.3648, "step": 13730 }, { "epoch": 0.12, "learning_rate": 9.6691046255787e-05, "loss": 2.4382, "step": 13735 }, { "epoch": 0.12, "learning_rate": 9.668864615532034e-05, "loss": 2.41, "step": 13740 }, { "epoch": 0.12, "learning_rate": 9.668624521454066e-05, "loss": 2.394, "step": 13745 }, { "epoch": 0.12, "learning_rate": 9.668384343349118e-05, "loss": 2.4054, "step": 13750 }, { "epoch": 0.12, "learning_rate": 9.668144081221509e-05, "loss": 2.3487, "step": 13755 }, { "epoch": 0.12, "learning_rate": 9.667903735075568e-05, "loss": 2.4053, "step": 13760 }, { "epoch": 0.12, "learning_rate": 9.667663304915617e-05, "loss": 2.4233, "step": 13765 }, { "epoch": 0.12, "learning_rate": 9.667422790745986e-05, "loss": 2.3079, "step": 13770 }, { "epoch": 0.12, "learning_rate": 9.667182192571003e-05, "loss": 2.3498, "step": 13775 }, { "epoch": 0.12, "learning_rate": 9.666941510394998e-05, "loss": 2.3727, "step": 13780 }, { "epoch": 0.12, "learning_rate": 9.666700744222303e-05, "loss": 2.4005, "step": 13785 }, { "epoch": 0.12, "learning_rate": 9.666459894057251e-05, "loss": 2.3454, "step": 13790 }, { "epoch": 0.12, "learning_rate": 9.666218959904177e-05, "loss": 2.3485, "step": 13795 }, { "epoch": 0.12, "learning_rate": 9.665977941767418e-05, "loss": 2.3844, "step": 13800 }, { "epoch": 0.12, "learning_rate": 9.665736839651312e-05, "loss": 2.3741, "step": 13805 }, { "epoch": 0.12, "learning_rate": 9.665495653560197e-05, "loss": 2.4492, "step": 13810 }, { "epoch": 0.12, "learning_rate": 9.665254383498415e-05, "loss": 2.4122, "step": 13815 }, { "epoch": 0.12, "learning_rate": 9.665013029470309e-05, "loss": 2.4136, "step": 13820 }, { "epoch": 0.12, "learning_rate": 9.664771591480222e-05, "loss": 2.2964, "step": 13825 }, { "epoch": 0.12, "learning_rate": 9.6645300695325e-05, "loss": 2.3782, "step": 13830 }, { "epoch": 0.12, "learning_rate": 9.66428846363149e-05, "loss": 2.4004, "step": 13835 }, { "epoch": 0.12, "learning_rate": 9.664046773781538e-05, "loss": 2.4044, "step": 13840 }, { "epoch": 0.12, "learning_rate": 9.663804999986999e-05, "loss": 2.3892, "step": 13845 }, { "epoch": 0.12, "learning_rate": 9.66356314225222e-05, "loss": 2.4054, "step": 13850 }, { "epoch": 0.12, "learning_rate": 9.663321200581555e-05, "loss": 2.4533, "step": 13855 }, { "epoch": 0.12, "learning_rate": 9.663079174979362e-05, "loss": 2.3034, "step": 13860 }, { "epoch": 0.12, "learning_rate": 9.662837065449991e-05, "loss": 2.3591, "step": 13865 }, { "epoch": 0.12, "learning_rate": 9.662594871997804e-05, "loss": 2.4161, "step": 13870 }, { "epoch": 0.12, "learning_rate": 9.662352594627159e-05, "loss": 2.3709, "step": 13875 }, { "epoch": 0.12, "learning_rate": 9.662110233342416e-05, "loss": 2.3825, "step": 13880 }, { "epoch": 0.12, "learning_rate": 9.661867788147939e-05, "loss": 2.3759, "step": 13885 }, { "epoch": 0.12, "learning_rate": 9.661625259048088e-05, "loss": 2.3598, "step": 13890 }, { "epoch": 0.12, "learning_rate": 9.66138264604723e-05, "loss": 2.356, "step": 13895 }, { "epoch": 0.12, "learning_rate": 9.661139949149734e-05, "loss": 2.3332, "step": 13900 }, { "epoch": 0.12, "learning_rate": 9.660897168359964e-05, "loss": 2.4655, "step": 13905 }, { "epoch": 0.12, "learning_rate": 9.660654303682291e-05, "loss": 2.3671, "step": 13910 }, { "epoch": 0.12, "learning_rate": 9.660411355121087e-05, "loss": 2.3187, "step": 13915 }, { "epoch": 0.12, "learning_rate": 9.660168322680725e-05, "loss": 2.3575, "step": 13920 }, { "epoch": 0.12, "learning_rate": 9.659925206365578e-05, "loss": 2.4518, "step": 13925 }, { "epoch": 0.12, "learning_rate": 9.659682006180021e-05, "loss": 2.3587, "step": 13930 }, { "epoch": 0.12, "learning_rate": 9.659438722128434e-05, "loss": 2.3739, "step": 13935 }, { "epoch": 0.12, "learning_rate": 9.659195354215193e-05, "loss": 2.4203, "step": 13940 }, { "epoch": 0.12, "learning_rate": 9.65895190244468e-05, "loss": 2.3984, "step": 13945 }, { "epoch": 0.12, "learning_rate": 9.658708366821275e-05, "loss": 2.3228, "step": 13950 }, { "epoch": 0.12, "learning_rate": 9.658464747349363e-05, "loss": 2.393, "step": 13955 }, { "epoch": 0.12, "learning_rate": 9.658221044033327e-05, "loss": 2.3751, "step": 13960 }, { "epoch": 0.12, "learning_rate": 9.657977256877553e-05, "loss": 2.407, "step": 13965 }, { "epoch": 0.12, "learning_rate": 9.657733385886431e-05, "loss": 2.3505, "step": 13970 }, { "epoch": 0.12, "learning_rate": 9.657489431064348e-05, "loss": 2.3693, "step": 13975 }, { "epoch": 0.12, "learning_rate": 9.657245392415697e-05, "loss": 2.3912, "step": 13980 }, { "epoch": 0.12, "learning_rate": 9.657001269944868e-05, "loss": 2.5087, "step": 13985 }, { "epoch": 0.12, "learning_rate": 9.656757063656255e-05, "loss": 2.4241, "step": 13990 }, { "epoch": 0.12, "learning_rate": 9.656512773554256e-05, "loss": 2.3472, "step": 13995 }, { "epoch": 0.12, "learning_rate": 9.656268399643264e-05, "loss": 2.3785, "step": 14000 }, { "epoch": 0.12, "learning_rate": 9.65602394192768e-05, "loss": 2.3637, "step": 14005 }, { "epoch": 0.12, "learning_rate": 9.655779400411902e-05, "loss": 2.4445, "step": 14010 }, { "epoch": 0.12, "learning_rate": 9.655534775100334e-05, "loss": 2.3199, "step": 14015 }, { "epoch": 0.12, "learning_rate": 9.655290065997376e-05, "loss": 2.4161, "step": 14020 }, { "epoch": 0.12, "learning_rate": 9.655045273107433e-05, "loss": 2.3719, "step": 14025 }, { "epoch": 0.12, "learning_rate": 9.654800396434912e-05, "loss": 2.3103, "step": 14030 }, { "epoch": 0.12, "learning_rate": 9.654555435984219e-05, "loss": 2.3216, "step": 14035 }, { "epoch": 0.12, "learning_rate": 9.654310391759764e-05, "loss": 2.4145, "step": 14040 }, { "epoch": 0.12, "learning_rate": 9.654065263765957e-05, "loss": 2.3467, "step": 14045 }, { "epoch": 0.12, "learning_rate": 9.653820052007208e-05, "loss": 2.2985, "step": 14050 }, { "epoch": 0.12, "learning_rate": 9.653574756487933e-05, "loss": 2.3742, "step": 14055 }, { "epoch": 0.12, "learning_rate": 9.653329377212546e-05, "loss": 2.3911, "step": 14060 }, { "epoch": 0.12, "learning_rate": 9.653083914185463e-05, "loss": 2.3472, "step": 14065 }, { "epoch": 0.12, "learning_rate": 9.652838367411103e-05, "loss": 2.4279, "step": 14070 }, { "epoch": 0.12, "learning_rate": 9.652592736893884e-05, "loss": 2.3533, "step": 14075 }, { "epoch": 0.12, "learning_rate": 9.652347022638228e-05, "loss": 2.4419, "step": 14080 }, { "epoch": 0.12, "learning_rate": 9.652101224648557e-05, "loss": 2.3991, "step": 14085 }, { "epoch": 0.12, "learning_rate": 9.651855342929294e-05, "loss": 2.2912, "step": 14090 }, { "epoch": 0.12, "learning_rate": 9.651609377484867e-05, "loss": 2.4204, "step": 14095 }, { "epoch": 0.12, "learning_rate": 9.6513633283197e-05, "loss": 2.4285, "step": 14100 }, { "epoch": 0.12, "learning_rate": 9.651117195438222e-05, "loss": 2.4175, "step": 14105 }, { "epoch": 0.12, "learning_rate": 9.650870978844866e-05, "loss": 2.386, "step": 14110 }, { "epoch": 0.12, "learning_rate": 9.650624678544061e-05, "loss": 2.3085, "step": 14115 }, { "epoch": 0.12, "learning_rate": 9.650378294540237e-05, "loss": 2.405, "step": 14120 }, { "epoch": 0.12, "learning_rate": 9.650131826837834e-05, "loss": 2.417, "step": 14125 }, { "epoch": 0.12, "learning_rate": 9.649885275441284e-05, "loss": 2.419, "step": 14130 }, { "epoch": 0.12, "learning_rate": 9.649638640355028e-05, "loss": 2.4744, "step": 14135 }, { "epoch": 0.12, "learning_rate": 9.649391921583501e-05, "loss": 2.3059, "step": 14140 }, { "epoch": 0.12, "learning_rate": 9.649145119131147e-05, "loss": 2.4495, "step": 14145 }, { "epoch": 0.12, "learning_rate": 9.648898233002406e-05, "loss": 2.3701, "step": 14150 }, { "epoch": 0.12, "learning_rate": 9.648651263201722e-05, "loss": 2.3479, "step": 14155 }, { "epoch": 0.12, "learning_rate": 9.648404209733542e-05, "loss": 2.3687, "step": 14160 }, { "epoch": 0.12, "learning_rate": 9.648157072602308e-05, "loss": 2.4092, "step": 14165 }, { "epoch": 0.12, "learning_rate": 9.647909851812471e-05, "loss": 2.3434, "step": 14170 }, { "epoch": 0.12, "learning_rate": 9.647662547368481e-05, "loss": 2.3644, "step": 14175 }, { "epoch": 0.12, "learning_rate": 9.647415159274789e-05, "loss": 2.4164, "step": 14180 }, { "epoch": 0.12, "learning_rate": 9.647167687535845e-05, "loss": 2.4079, "step": 14185 }, { "epoch": 0.12, "learning_rate": 9.646920132156105e-05, "loss": 2.3522, "step": 14190 }, { "epoch": 0.12, "learning_rate": 9.646672493140025e-05, "loss": 2.3604, "step": 14195 }, { "epoch": 0.12, "learning_rate": 9.646424770492062e-05, "loss": 2.3682, "step": 14200 }, { "epoch": 0.12, "learning_rate": 9.646176964216673e-05, "loss": 2.2929, "step": 14205 }, { "epoch": 0.12, "learning_rate": 9.645929074318321e-05, "loss": 2.3079, "step": 14210 }, { "epoch": 0.12, "learning_rate": 9.645681100801462e-05, "loss": 2.4282, "step": 14215 }, { "epoch": 0.12, "learning_rate": 9.645433043670566e-05, "loss": 2.3418, "step": 14220 }, { "epoch": 0.12, "learning_rate": 9.645184902930093e-05, "loss": 2.4258, "step": 14225 }, { "epoch": 0.12, "learning_rate": 9.64493667858451e-05, "loss": 2.3753, "step": 14230 }, { "epoch": 0.12, "learning_rate": 9.644688370638287e-05, "loss": 2.3839, "step": 14235 }, { "epoch": 0.12, "learning_rate": 9.64443997909589e-05, "loss": 2.429, "step": 14240 }, { "epoch": 0.12, "learning_rate": 9.64419150396179e-05, "loss": 2.4279, "step": 14245 }, { "epoch": 0.12, "learning_rate": 9.64394294524046e-05, "loss": 2.3777, "step": 14250 }, { "epoch": 0.12, "learning_rate": 9.643694302936374e-05, "loss": 2.2861, "step": 14255 }, { "epoch": 0.12, "learning_rate": 9.643445577054007e-05, "loss": 2.3868, "step": 14260 }, { "epoch": 0.12, "learning_rate": 9.643196767597835e-05, "loss": 2.3158, "step": 14265 }, { "epoch": 0.12, "learning_rate": 9.642947874572337e-05, "loss": 2.3901, "step": 14270 }, { "epoch": 0.12, "learning_rate": 9.642698897981991e-05, "loss": 2.3968, "step": 14275 }, { "epoch": 0.12, "learning_rate": 9.64244983783128e-05, "loss": 2.3795, "step": 14280 }, { "epoch": 0.12, "learning_rate": 9.642200694124685e-05, "loss": 2.3509, "step": 14285 }, { "epoch": 0.12, "learning_rate": 9.64195146686669e-05, "loss": 2.3399, "step": 14290 }, { "epoch": 0.12, "learning_rate": 9.641702156061783e-05, "loss": 2.3771, "step": 14295 }, { "epoch": 0.12, "learning_rate": 9.641452761714449e-05, "loss": 2.371, "step": 14300 }, { "epoch": 0.12, "learning_rate": 9.641203283829179e-05, "loss": 2.329, "step": 14305 }, { "epoch": 0.12, "learning_rate": 9.640953722410459e-05, "loss": 2.4105, "step": 14310 }, { "epoch": 0.12, "learning_rate": 9.640704077462786e-05, "loss": 2.2639, "step": 14315 }, { "epoch": 0.12, "learning_rate": 9.640454348990649e-05, "loss": 2.4248, "step": 14320 }, { "epoch": 0.12, "learning_rate": 9.640204536998543e-05, "loss": 2.4758, "step": 14325 }, { "epoch": 0.12, "learning_rate": 9.639954641490965e-05, "loss": 2.3408, "step": 14330 }, { "epoch": 0.12, "learning_rate": 9.639704662472415e-05, "loss": 2.3815, "step": 14335 }, { "epoch": 0.12, "learning_rate": 9.639454599947389e-05, "loss": 2.4389, "step": 14340 }, { "epoch": 0.12, "learning_rate": 9.639204453920389e-05, "loss": 2.3545, "step": 14345 }, { "epoch": 0.12, "learning_rate": 9.638954224395917e-05, "loss": 2.3761, "step": 14350 }, { "epoch": 0.12, "learning_rate": 9.638703911378475e-05, "loss": 2.4041, "step": 14355 }, { "epoch": 0.12, "learning_rate": 9.638453514872573e-05, "loss": 2.3781, "step": 14360 }, { "epoch": 0.12, "learning_rate": 9.638203034882712e-05, "loss": 2.3527, "step": 14365 }, { "epoch": 0.12, "learning_rate": 9.637952471413403e-05, "loss": 2.2995, "step": 14370 }, { "epoch": 0.12, "learning_rate": 9.637701824469157e-05, "loss": 2.3864, "step": 14375 }, { "epoch": 0.12, "learning_rate": 9.637451094054482e-05, "loss": 2.434, "step": 14380 }, { "epoch": 0.12, "learning_rate": 9.637200280173892e-05, "loss": 2.4379, "step": 14385 }, { "epoch": 0.12, "learning_rate": 9.636949382831903e-05, "loss": 2.3785, "step": 14390 }, { "epoch": 0.12, "learning_rate": 9.636698402033029e-05, "loss": 2.4888, "step": 14395 }, { "epoch": 0.12, "learning_rate": 9.636447337781786e-05, "loss": 2.3657, "step": 14400 }, { "epoch": 0.12, "learning_rate": 9.636196190082694e-05, "loss": 2.3291, "step": 14405 }, { "epoch": 0.12, "learning_rate": 9.635944958940275e-05, "loss": 2.295, "step": 14410 }, { "epoch": 0.12, "learning_rate": 9.63569364435905e-05, "loss": 2.3892, "step": 14415 }, { "epoch": 0.12, "learning_rate": 9.635442246343539e-05, "loss": 2.4138, "step": 14420 }, { "epoch": 0.12, "learning_rate": 9.635190764898269e-05, "loss": 2.265, "step": 14425 }, { "epoch": 0.12, "learning_rate": 9.634939200027768e-05, "loss": 2.4147, "step": 14430 }, { "epoch": 0.12, "learning_rate": 9.634687551736561e-05, "loss": 2.3433, "step": 14435 }, { "epoch": 0.12, "learning_rate": 9.634435820029179e-05, "loss": 2.4156, "step": 14440 }, { "epoch": 0.12, "learning_rate": 9.63418400491015e-05, "loss": 2.3626, "step": 14445 }, { "epoch": 0.12, "learning_rate": 9.633932106384009e-05, "loss": 2.3712, "step": 14450 }, { "epoch": 0.12, "learning_rate": 9.63368012445529e-05, "loss": 2.295, "step": 14455 }, { "epoch": 0.12, "learning_rate": 9.633428059128526e-05, "loss": 2.3767, "step": 14460 }, { "epoch": 0.12, "learning_rate": 9.633175910408255e-05, "loss": 2.3557, "step": 14465 }, { "epoch": 0.12, "learning_rate": 9.632923678299015e-05, "loss": 2.4493, "step": 14470 }, { "epoch": 0.12, "learning_rate": 9.632671362805347e-05, "loss": 2.4076, "step": 14475 }, { "epoch": 0.12, "learning_rate": 9.63241896393179e-05, "loss": 2.3884, "step": 14480 }, { "epoch": 0.12, "learning_rate": 9.632166481682887e-05, "loss": 2.4209, "step": 14485 }, { "epoch": 0.12, "learning_rate": 9.631913916063184e-05, "loss": 2.3381, "step": 14490 }, { "epoch": 0.12, "learning_rate": 9.631661267077226e-05, "loss": 2.3467, "step": 14495 }, { "epoch": 0.12, "learning_rate": 9.63140853472956e-05, "loss": 2.3809, "step": 14500 }, { "epoch": 0.12, "learning_rate": 9.631155719024733e-05, "loss": 2.3947, "step": 14505 }, { "epoch": 0.12, "learning_rate": 9.630902819967297e-05, "loss": 2.4375, "step": 14510 }, { "epoch": 0.12, "learning_rate": 9.630649837561806e-05, "loss": 2.3685, "step": 14515 }, { "epoch": 0.12, "learning_rate": 9.63039677181281e-05, "loss": 2.2637, "step": 14520 }, { "epoch": 0.12, "learning_rate": 9.630143622724863e-05, "loss": 2.3668, "step": 14525 }, { "epoch": 0.12, "learning_rate": 9.629890390302526e-05, "loss": 2.4053, "step": 14530 }, { "epoch": 0.12, "learning_rate": 9.629637074550351e-05, "loss": 2.3748, "step": 14535 }, { "epoch": 0.12, "learning_rate": 9.6293836754729e-05, "loss": 2.4202, "step": 14540 }, { "epoch": 0.12, "learning_rate": 9.629130193074735e-05, "loss": 2.4392, "step": 14545 }, { "epoch": 0.12, "learning_rate": 9.628876627360415e-05, "loss": 2.375, "step": 14550 }, { "epoch": 0.12, "learning_rate": 9.628622978334507e-05, "loss": 2.4224, "step": 14555 }, { "epoch": 0.12, "learning_rate": 9.628369246001575e-05, "loss": 2.4112, "step": 14560 }, { "epoch": 0.12, "learning_rate": 9.628115430366184e-05, "loss": 2.4334, "step": 14565 }, { "epoch": 0.12, "learning_rate": 9.627861531432905e-05, "loss": 2.4248, "step": 14570 }, { "epoch": 0.12, "learning_rate": 9.627607549206305e-05, "loss": 2.345, "step": 14575 }, { "epoch": 0.12, "learning_rate": 9.627353483690959e-05, "loss": 2.5167, "step": 14580 }, { "epoch": 0.12, "learning_rate": 9.627099334891437e-05, "loss": 2.3888, "step": 14585 }, { "epoch": 0.12, "learning_rate": 9.626845102812311e-05, "loss": 2.395, "step": 14590 }, { "epoch": 0.12, "learning_rate": 9.626590787458161e-05, "loss": 2.4611, "step": 14595 }, { "epoch": 0.12, "learning_rate": 9.626336388833564e-05, "loss": 2.3736, "step": 14600 }, { "epoch": 0.12, "learning_rate": 9.626081906943096e-05, "loss": 2.3846, "step": 14605 }, { "epoch": 0.12, "learning_rate": 9.625827341791338e-05, "loss": 2.4317, "step": 14610 }, { "epoch": 0.12, "learning_rate": 9.625572693382874e-05, "loss": 2.3315, "step": 14615 }, { "epoch": 0.12, "learning_rate": 9.625317961722284e-05, "loss": 2.447, "step": 14620 }, { "epoch": 0.12, "learning_rate": 9.625063146814155e-05, "loss": 2.4516, "step": 14625 }, { "epoch": 0.12, "learning_rate": 9.624808248663073e-05, "loss": 2.4384, "step": 14630 }, { "epoch": 0.12, "learning_rate": 9.624553267273624e-05, "loss": 2.3872, "step": 14635 }, { "epoch": 0.12, "learning_rate": 9.6242982026504e-05, "loss": 2.3677, "step": 14640 }, { "epoch": 0.12, "learning_rate": 9.624043054797988e-05, "loss": 2.355, "step": 14645 }, { "epoch": 0.13, "learning_rate": 9.623787823720982e-05, "loss": 2.4502, "step": 14650 }, { "epoch": 0.13, "learning_rate": 9.623532509423978e-05, "loss": 2.3284, "step": 14655 }, { "epoch": 0.13, "learning_rate": 9.623277111911569e-05, "loss": 2.2582, "step": 14660 }, { "epoch": 0.13, "learning_rate": 9.623021631188352e-05, "loss": 2.3864, "step": 14665 }, { "epoch": 0.13, "learning_rate": 9.622766067258924e-05, "loss": 2.3979, "step": 14670 }, { "epoch": 0.13, "learning_rate": 9.622510420127887e-05, "loss": 2.3773, "step": 14675 }, { "epoch": 0.13, "learning_rate": 9.622254689799839e-05, "loss": 2.3666, "step": 14680 }, { "epoch": 0.13, "learning_rate": 9.621998876279386e-05, "loss": 2.3618, "step": 14685 }, { "epoch": 0.13, "learning_rate": 9.621742979571131e-05, "loss": 2.3653, "step": 14690 }, { "epoch": 0.13, "learning_rate": 9.621486999679678e-05, "loss": 2.4052, "step": 14695 }, { "epoch": 0.13, "learning_rate": 9.621230936609637e-05, "loss": 2.3515, "step": 14700 }, { "epoch": 0.13, "learning_rate": 9.620974790365617e-05, "loss": 2.3849, "step": 14705 }, { "epoch": 0.13, "learning_rate": 9.620718560952225e-05, "loss": 2.4501, "step": 14710 }, { "epoch": 0.13, "learning_rate": 9.620462248374076e-05, "loss": 2.3863, "step": 14715 }, { "epoch": 0.13, "learning_rate": 9.62020585263578e-05, "loss": 2.3784, "step": 14720 }, { "epoch": 0.13, "learning_rate": 9.619949373741953e-05, "loss": 2.3394, "step": 14725 }, { "epoch": 0.13, "learning_rate": 9.619692811697212e-05, "loss": 2.426, "step": 14730 }, { "epoch": 0.13, "learning_rate": 9.619436166506173e-05, "loss": 2.3475, "step": 14735 }, { "epoch": 0.13, "learning_rate": 9.619179438173456e-05, "loss": 2.4079, "step": 14740 }, { "epoch": 0.13, "learning_rate": 9.618922626703684e-05, "loss": 2.381, "step": 14745 }, { "epoch": 0.13, "learning_rate": 9.618665732101475e-05, "loss": 2.3517, "step": 14750 }, { "epoch": 0.13, "learning_rate": 9.618408754371455e-05, "loss": 2.37, "step": 14755 }, { "epoch": 0.13, "learning_rate": 9.618151693518248e-05, "loss": 2.4528, "step": 14760 }, { "epoch": 0.13, "learning_rate": 9.617894549546483e-05, "loss": 2.342, "step": 14765 }, { "epoch": 0.13, "learning_rate": 9.617637322460786e-05, "loss": 2.3317, "step": 14770 }, { "epoch": 0.13, "learning_rate": 9.617380012265787e-05, "loss": 2.3691, "step": 14775 }, { "epoch": 0.13, "learning_rate": 9.617122618966117e-05, "loss": 2.3029, "step": 14780 }, { "epoch": 0.13, "learning_rate": 9.616865142566408e-05, "loss": 2.3203, "step": 14785 }, { "epoch": 0.13, "learning_rate": 9.616607583071295e-05, "loss": 2.3486, "step": 14790 }, { "epoch": 0.13, "learning_rate": 9.616349940485416e-05, "loss": 2.2637, "step": 14795 }, { "epoch": 0.13, "learning_rate": 9.616092214813403e-05, "loss": 2.3601, "step": 14800 }, { "epoch": 0.13, "learning_rate": 9.6158344060599e-05, "loss": 2.4694, "step": 14805 }, { "epoch": 0.13, "learning_rate": 9.615576514229543e-05, "loss": 2.4369, "step": 14810 }, { "epoch": 0.13, "learning_rate": 9.615318539326976e-05, "loss": 2.3813, "step": 14815 }, { "epoch": 0.13, "learning_rate": 9.61506048135684e-05, "loss": 2.3777, "step": 14820 }, { "epoch": 0.13, "learning_rate": 9.61480234032378e-05, "loss": 2.3858, "step": 14825 }, { "epoch": 0.13, "learning_rate": 9.614544116232444e-05, "loss": 2.3934, "step": 14830 }, { "epoch": 0.13, "learning_rate": 9.614285809087479e-05, "loss": 2.3885, "step": 14835 }, { "epoch": 0.13, "learning_rate": 9.614027418893533e-05, "loss": 2.332, "step": 14840 }, { "epoch": 0.13, "learning_rate": 9.613768945655258e-05, "loss": 2.3722, "step": 14845 }, { "epoch": 0.13, "learning_rate": 9.613510389377302e-05, "loss": 2.4066, "step": 14850 }, { "epoch": 0.13, "learning_rate": 9.613251750064324e-05, "loss": 2.3508, "step": 14855 }, { "epoch": 0.13, "learning_rate": 9.612993027720977e-05, "loss": 2.393, "step": 14860 }, { "epoch": 0.13, "learning_rate": 9.612734222351916e-05, "loss": 2.4235, "step": 14865 }, { "epoch": 0.13, "learning_rate": 9.612475333961801e-05, "loss": 2.3126, "step": 14870 }, { "epoch": 0.13, "learning_rate": 9.612216362555291e-05, "loss": 2.296, "step": 14875 }, { "epoch": 0.13, "learning_rate": 9.611957308137046e-05, "loss": 2.3585, "step": 14880 }, { "epoch": 0.13, "learning_rate": 9.611698170711729e-05, "loss": 2.4034, "step": 14885 }, { "epoch": 0.13, "learning_rate": 9.611438950284006e-05, "loss": 2.4075, "step": 14890 }, { "epoch": 0.13, "learning_rate": 9.611179646858541e-05, "loss": 2.4002, "step": 14895 }, { "epoch": 0.13, "learning_rate": 9.61092026044e-05, "loss": 2.3934, "step": 14900 }, { "epoch": 0.13, "learning_rate": 9.61066079103305e-05, "loss": 2.3331, "step": 14905 }, { "epoch": 0.13, "learning_rate": 9.610401238642367e-05, "loss": 2.3838, "step": 14910 }, { "epoch": 0.13, "learning_rate": 9.610141603272618e-05, "loss": 2.3818, "step": 14915 }, { "epoch": 0.13, "learning_rate": 9.609881884928475e-05, "loss": 2.3807, "step": 14920 }, { "epoch": 0.13, "learning_rate": 9.609622083614616e-05, "loss": 2.3712, "step": 14925 }, { "epoch": 0.13, "learning_rate": 9.609362199335716e-05, "loss": 2.3662, "step": 14930 }, { "epoch": 0.13, "learning_rate": 9.609102232096449e-05, "loss": 2.411, "step": 14935 }, { "epoch": 0.13, "learning_rate": 9.6088421819015e-05, "loss": 2.3217, "step": 14940 }, { "epoch": 0.13, "learning_rate": 9.608582048755543e-05, "loss": 2.416, "step": 14945 }, { "epoch": 0.13, "learning_rate": 9.608321832663265e-05, "loss": 2.4119, "step": 14950 }, { "epoch": 0.13, "learning_rate": 9.608061533629346e-05, "loss": 2.3808, "step": 14955 }, { "epoch": 0.13, "learning_rate": 9.607801151658475e-05, "loss": 2.3754, "step": 14960 }, { "epoch": 0.13, "learning_rate": 9.607540686755334e-05, "loss": 2.4264, "step": 14965 }, { "epoch": 0.13, "learning_rate": 9.607280138924613e-05, "loss": 2.3936, "step": 14970 }, { "epoch": 0.13, "learning_rate": 9.607019508171e-05, "loss": 2.2774, "step": 14975 }, { "epoch": 0.13, "learning_rate": 9.606758794499189e-05, "loss": 2.4042, "step": 14980 }, { "epoch": 0.13, "learning_rate": 9.60649799791387e-05, "loss": 2.3605, "step": 14985 }, { "epoch": 0.13, "learning_rate": 9.606237118419737e-05, "loss": 2.2979, "step": 14990 }, { "epoch": 0.13, "learning_rate": 9.605976156021484e-05, "loss": 2.4053, "step": 14995 }, { "epoch": 0.13, "learning_rate": 9.605715110723812e-05, "loss": 2.3236, "step": 15000 }, { "epoch": 0.13, "learning_rate": 9.605453982531416e-05, "loss": 2.4456, "step": 15005 }, { "epoch": 0.13, "learning_rate": 9.605192771448997e-05, "loss": 2.4214, "step": 15010 }, { "epoch": 0.13, "learning_rate": 9.604931477481254e-05, "loss": 2.4542, "step": 15015 }, { "epoch": 0.13, "learning_rate": 9.604670100632895e-05, "loss": 2.3634, "step": 15020 }, { "epoch": 0.13, "learning_rate": 9.604408640908619e-05, "loss": 2.3193, "step": 15025 }, { "epoch": 0.13, "learning_rate": 9.604147098313134e-05, "loss": 2.4158, "step": 15030 }, { "epoch": 0.13, "learning_rate": 9.603885472851148e-05, "loss": 2.337, "step": 15035 }, { "epoch": 0.13, "learning_rate": 9.60362376452737e-05, "loss": 2.3869, "step": 15040 }, { "epoch": 0.13, "learning_rate": 9.603361973346507e-05, "loss": 2.4022, "step": 15045 }, { "epoch": 0.13, "learning_rate": 9.603100099313276e-05, "loss": 2.3657, "step": 15050 }, { "epoch": 0.13, "learning_rate": 9.602838142432386e-05, "loss": 2.3415, "step": 15055 }, { "epoch": 0.13, "learning_rate": 9.602576102708554e-05, "loss": 2.3255, "step": 15060 }, { "epoch": 0.13, "learning_rate": 9.602313980146493e-05, "loss": 2.347, "step": 15065 }, { "epoch": 0.13, "learning_rate": 9.602051774750926e-05, "loss": 2.3423, "step": 15070 }, { "epoch": 0.13, "learning_rate": 9.60178948652657e-05, "loss": 2.4071, "step": 15075 }, { "epoch": 0.13, "learning_rate": 9.601527115478142e-05, "loss": 2.3903, "step": 15080 }, { "epoch": 0.13, "learning_rate": 9.601264661610368e-05, "loss": 2.4075, "step": 15085 }, { "epoch": 0.13, "learning_rate": 9.601002124927973e-05, "loss": 2.4153, "step": 15090 }, { "epoch": 0.13, "learning_rate": 9.600739505435679e-05, "loss": 2.4051, "step": 15095 }, { "epoch": 0.13, "learning_rate": 9.600476803138214e-05, "loss": 2.3962, "step": 15100 }, { "epoch": 0.13, "learning_rate": 9.600214018040307e-05, "loss": 2.372, "step": 15105 }, { "epoch": 0.13, "learning_rate": 9.599951150146686e-05, "loss": 2.463, "step": 15110 }, { "epoch": 0.13, "learning_rate": 9.599688199462082e-05, "loss": 2.3765, "step": 15115 }, { "epoch": 0.13, "learning_rate": 9.59942516599123e-05, "loss": 2.4001, "step": 15120 }, { "epoch": 0.13, "learning_rate": 9.599162049738863e-05, "loss": 2.3995, "step": 15125 }, { "epoch": 0.13, "learning_rate": 9.598898850709717e-05, "loss": 2.3468, "step": 15130 }, { "epoch": 0.13, "learning_rate": 9.598635568908527e-05, "loss": 2.3356, "step": 15135 }, { "epoch": 0.13, "learning_rate": 9.598372204340032e-05, "loss": 2.2688, "step": 15140 }, { "epoch": 0.13, "learning_rate": 9.598108757008974e-05, "loss": 2.2955, "step": 15145 }, { "epoch": 0.13, "learning_rate": 9.597845226920095e-05, "loss": 2.3743, "step": 15150 }, { "epoch": 0.13, "learning_rate": 9.597581614078137e-05, "loss": 2.4666, "step": 15155 }, { "epoch": 0.13, "learning_rate": 9.597317918487844e-05, "loss": 2.4215, "step": 15160 }, { "epoch": 0.13, "learning_rate": 9.597054140153961e-05, "loss": 2.3653, "step": 15165 }, { "epoch": 0.13, "learning_rate": 9.596790279081237e-05, "loss": 2.323, "step": 15170 }, { "epoch": 0.13, "learning_rate": 9.596526335274424e-05, "loss": 2.3323, "step": 15175 }, { "epoch": 0.13, "learning_rate": 9.596262308738267e-05, "loss": 2.3578, "step": 15180 }, { "epoch": 0.13, "learning_rate": 9.595998199477523e-05, "loss": 2.4073, "step": 15185 }, { "epoch": 0.13, "learning_rate": 9.595734007496941e-05, "loss": 2.4163, "step": 15190 }, { "epoch": 0.13, "learning_rate": 9.59546973280128e-05, "loss": 2.3632, "step": 15195 }, { "epoch": 0.13, "learning_rate": 9.595205375395291e-05, "loss": 2.3207, "step": 15200 }, { "epoch": 0.13, "learning_rate": 9.594940935283738e-05, "loss": 2.3112, "step": 15205 }, { "epoch": 0.13, "learning_rate": 9.594676412471377e-05, "loss": 2.332, "step": 15210 }, { "epoch": 0.13, "learning_rate": 9.59441180696297e-05, "loss": 2.4152, "step": 15215 }, { "epoch": 0.13, "learning_rate": 9.59414711876328e-05, "loss": 2.3606, "step": 15220 }, { "epoch": 0.13, "learning_rate": 9.59388234787707e-05, "loss": 2.3146, "step": 15225 }, { "epoch": 0.13, "learning_rate": 9.593617494309106e-05, "loss": 2.3751, "step": 15230 }, { "epoch": 0.13, "learning_rate": 9.593352558064155e-05, "loss": 2.4072, "step": 15235 }, { "epoch": 0.13, "learning_rate": 9.593087539146983e-05, "loss": 2.4305, "step": 15240 }, { "epoch": 0.13, "learning_rate": 9.592822437562364e-05, "loss": 2.3715, "step": 15245 }, { "epoch": 0.13, "learning_rate": 9.592557253315065e-05, "loss": 2.4057, "step": 15250 }, { "epoch": 0.13, "learning_rate": 9.592291986409862e-05, "loss": 2.4299, "step": 15255 }, { "epoch": 0.13, "learning_rate": 9.592026636851529e-05, "loss": 2.4047, "step": 15260 }, { "epoch": 0.13, "learning_rate": 9.59176120464484e-05, "loss": 2.3295, "step": 15265 }, { "epoch": 0.13, "learning_rate": 9.591495689794574e-05, "loss": 2.3798, "step": 15270 }, { "epoch": 0.13, "learning_rate": 9.59123009230551e-05, "loss": 2.4038, "step": 15275 }, { "epoch": 0.13, "learning_rate": 9.590964412182428e-05, "loss": 2.3991, "step": 15280 }, { "epoch": 0.13, "learning_rate": 9.590698649430108e-05, "loss": 2.382, "step": 15285 }, { "epoch": 0.13, "learning_rate": 9.590432804053336e-05, "loss": 2.3763, "step": 15290 }, { "epoch": 0.13, "learning_rate": 9.590166876056892e-05, "loss": 2.4247, "step": 15295 }, { "epoch": 0.13, "learning_rate": 9.589900865445569e-05, "loss": 2.3342, "step": 15300 }, { "epoch": 0.13, "learning_rate": 9.58963477222415e-05, "loss": 2.3049, "step": 15305 }, { "epoch": 0.13, "learning_rate": 9.589368596397426e-05, "loss": 2.4106, "step": 15310 }, { "epoch": 0.13, "learning_rate": 9.589102337970185e-05, "loss": 2.4354, "step": 15315 }, { "epoch": 0.13, "learning_rate": 9.588835996947225e-05, "loss": 2.412, "step": 15320 }, { "epoch": 0.13, "learning_rate": 9.588569573333335e-05, "loss": 2.4238, "step": 15325 }, { "epoch": 0.13, "learning_rate": 9.588303067133311e-05, "loss": 2.403, "step": 15330 }, { "epoch": 0.13, "learning_rate": 9.588036478351948e-05, "loss": 2.3334, "step": 15335 }, { "epoch": 0.13, "learning_rate": 9.587769806994047e-05, "loss": 2.3802, "step": 15340 }, { "epoch": 0.13, "learning_rate": 9.587503053064408e-05, "loss": 2.3428, "step": 15345 }, { "epoch": 0.13, "learning_rate": 9.58723621656783e-05, "loss": 2.3373, "step": 15350 }, { "epoch": 0.13, "learning_rate": 9.586969297509116e-05, "loss": 2.4066, "step": 15355 }, { "epoch": 0.13, "learning_rate": 9.586702295893069e-05, "loss": 2.3474, "step": 15360 }, { "epoch": 0.13, "learning_rate": 9.586435211724498e-05, "loss": 2.3624, "step": 15365 }, { "epoch": 0.13, "learning_rate": 9.586168045008206e-05, "loss": 2.4152, "step": 15370 }, { "epoch": 0.13, "learning_rate": 9.585900795749006e-05, "loss": 2.3721, "step": 15375 }, { "epoch": 0.13, "learning_rate": 9.585633463951704e-05, "loss": 2.4297, "step": 15380 }, { "epoch": 0.13, "learning_rate": 9.585366049621112e-05, "loss": 2.341, "step": 15385 }, { "epoch": 0.13, "learning_rate": 9.585098552762045e-05, "loss": 2.3458, "step": 15390 }, { "epoch": 0.13, "learning_rate": 9.584830973379316e-05, "loss": 2.4221, "step": 15395 }, { "epoch": 0.13, "learning_rate": 9.584563311477742e-05, "loss": 2.378, "step": 15400 }, { "epoch": 0.13, "learning_rate": 9.584295567062141e-05, "loss": 2.3376, "step": 15405 }, { "epoch": 0.13, "learning_rate": 9.584027740137329e-05, "loss": 2.4026, "step": 15410 }, { "epoch": 0.13, "learning_rate": 9.583759830708127e-05, "loss": 2.4169, "step": 15415 }, { "epoch": 0.13, "learning_rate": 9.58349183877936e-05, "loss": 2.3888, "step": 15420 }, { "epoch": 0.13, "learning_rate": 9.583223764355849e-05, "loss": 2.4204, "step": 15425 }, { "epoch": 0.13, "learning_rate": 9.58295560744242e-05, "loss": 2.3048, "step": 15430 }, { "epoch": 0.13, "learning_rate": 9.582687368043898e-05, "loss": 2.3105, "step": 15435 }, { "epoch": 0.13, "learning_rate": 9.582419046165113e-05, "loss": 2.4009, "step": 15440 }, { "epoch": 0.13, "learning_rate": 9.58215064181089e-05, "loss": 2.386, "step": 15445 }, { "epoch": 0.13, "learning_rate": 9.581882154986064e-05, "loss": 2.3185, "step": 15450 }, { "epoch": 0.13, "learning_rate": 9.581613585695465e-05, "loss": 2.3574, "step": 15455 }, { "epoch": 0.13, "learning_rate": 9.581344933943929e-05, "loss": 2.3802, "step": 15460 }, { "epoch": 0.13, "learning_rate": 9.581076199736289e-05, "loss": 2.3155, "step": 15465 }, { "epoch": 0.13, "learning_rate": 9.580807383077384e-05, "loss": 2.4388, "step": 15470 }, { "epoch": 0.13, "learning_rate": 9.58053848397205e-05, "loss": 2.4334, "step": 15475 }, { "epoch": 0.13, "learning_rate": 9.580269502425127e-05, "loss": 2.3408, "step": 15480 }, { "epoch": 0.13, "learning_rate": 9.580000438441458e-05, "loss": 2.3803, "step": 15485 }, { "epoch": 0.13, "learning_rate": 9.579731292025883e-05, "loss": 2.4641, "step": 15490 }, { "epoch": 0.13, "learning_rate": 9.579462063183249e-05, "loss": 2.3966, "step": 15495 }, { "epoch": 0.13, "learning_rate": 9.5791927519184e-05, "loss": 2.412, "step": 15500 }, { "epoch": 0.13, "learning_rate": 9.578923358236183e-05, "loss": 2.3459, "step": 15505 }, { "epoch": 0.13, "learning_rate": 9.578653882141447e-05, "loss": 2.3971, "step": 15510 }, { "epoch": 0.13, "learning_rate": 9.578384323639042e-05, "loss": 2.4284, "step": 15515 }, { "epoch": 0.13, "learning_rate": 9.57811468273382e-05, "loss": 2.3889, "step": 15520 }, { "epoch": 0.13, "learning_rate": 9.577844959430633e-05, "loss": 2.3034, "step": 15525 }, { "epoch": 0.13, "learning_rate": 9.577575153734337e-05, "loss": 2.4028, "step": 15530 }, { "epoch": 0.13, "learning_rate": 9.577305265649787e-05, "loss": 2.4323, "step": 15535 }, { "epoch": 0.13, "learning_rate": 9.577035295181842e-05, "loss": 2.3769, "step": 15540 }, { "epoch": 0.13, "learning_rate": 9.576765242335359e-05, "loss": 2.4751, "step": 15545 }, { "epoch": 0.13, "learning_rate": 9.5764951071152e-05, "loss": 2.3697, "step": 15550 }, { "epoch": 0.13, "learning_rate": 9.576224889526224e-05, "loss": 2.3361, "step": 15555 }, { "epoch": 0.13, "learning_rate": 9.5759545895733e-05, "loss": 2.3778, "step": 15560 }, { "epoch": 0.13, "learning_rate": 9.575684207261286e-05, "loss": 2.3741, "step": 15565 }, { "epoch": 0.13, "learning_rate": 9.575413742595053e-05, "loss": 2.4438, "step": 15570 }, { "epoch": 0.13, "learning_rate": 9.57514319557947e-05, "loss": 2.3074, "step": 15575 }, { "epoch": 0.13, "learning_rate": 9.574872566219402e-05, "loss": 2.455, "step": 15580 }, { "epoch": 0.13, "learning_rate": 9.574601854519723e-05, "loss": 2.3613, "step": 15585 }, { "epoch": 0.13, "learning_rate": 9.574331060485304e-05, "loss": 2.2587, "step": 15590 }, { "epoch": 0.13, "learning_rate": 9.57406018412102e-05, "loss": 2.2422, "step": 15595 }, { "epoch": 0.13, "learning_rate": 9.573789225431745e-05, "loss": 2.4214, "step": 15600 }, { "epoch": 0.13, "learning_rate": 9.573518184422356e-05, "loss": 2.4127, "step": 15605 }, { "epoch": 0.13, "learning_rate": 9.573247061097732e-05, "loss": 2.4652, "step": 15610 }, { "epoch": 0.13, "learning_rate": 9.572975855462754e-05, "loss": 2.3823, "step": 15615 }, { "epoch": 0.13, "learning_rate": 9.572704567522299e-05, "loss": 2.3468, "step": 15620 }, { "epoch": 0.13, "learning_rate": 9.572433197281251e-05, "loss": 2.3942, "step": 15625 }, { "epoch": 0.13, "learning_rate": 9.5721617447445e-05, "loss": 2.3575, "step": 15630 }, { "epoch": 0.13, "learning_rate": 9.571890209916924e-05, "loss": 2.3816, "step": 15635 }, { "epoch": 0.13, "learning_rate": 9.571618592803413e-05, "loss": 2.3679, "step": 15640 }, { "epoch": 0.13, "learning_rate": 9.571346893408856e-05, "loss": 2.3657, "step": 15645 }, { "epoch": 0.13, "learning_rate": 9.571075111738144e-05, "loss": 2.3619, "step": 15650 }, { "epoch": 0.13, "learning_rate": 9.570803247796167e-05, "loss": 2.4113, "step": 15655 }, { "epoch": 0.13, "learning_rate": 9.57053130158782e-05, "loss": 2.3573, "step": 15660 }, { "epoch": 0.13, "learning_rate": 9.570259273117995e-05, "loss": 2.372, "step": 15665 }, { "epoch": 0.13, "learning_rate": 9.56998716239159e-05, "loss": 2.3617, "step": 15670 }, { "epoch": 0.13, "learning_rate": 9.5697149694135e-05, "loss": 2.3594, "step": 15675 }, { "epoch": 0.13, "learning_rate": 9.569442694188626e-05, "loss": 2.454, "step": 15680 }, { "epoch": 0.13, "learning_rate": 9.56917033672187e-05, "loss": 2.3138, "step": 15685 }, { "epoch": 0.13, "learning_rate": 9.568897897018131e-05, "loss": 2.3336, "step": 15690 }, { "epoch": 0.13, "learning_rate": 9.568625375082313e-05, "loss": 2.3109, "step": 15695 }, { "epoch": 0.13, "learning_rate": 9.568352770919322e-05, "loss": 2.3493, "step": 15700 }, { "epoch": 0.13, "learning_rate": 9.568080084534065e-05, "loss": 2.4305, "step": 15705 }, { "epoch": 0.13, "learning_rate": 9.567807315931448e-05, "loss": 2.3277, "step": 15710 }, { "epoch": 0.13, "learning_rate": 9.56753446511638e-05, "loss": 2.4189, "step": 15715 }, { "epoch": 0.13, "learning_rate": 9.567261532093775e-05, "loss": 2.3971, "step": 15720 }, { "epoch": 0.13, "learning_rate": 9.56698851686854e-05, "loss": 2.2968, "step": 15725 }, { "epoch": 0.13, "learning_rate": 9.566715419445594e-05, "loss": 2.3065, "step": 15730 }, { "epoch": 0.13, "learning_rate": 9.566442239829852e-05, "loss": 2.3717, "step": 15735 }, { "epoch": 0.13, "learning_rate": 9.566168978026226e-05, "loss": 2.3573, "step": 15740 }, { "epoch": 0.13, "learning_rate": 9.565895634039638e-05, "loss": 2.4482, "step": 15745 }, { "epoch": 0.13, "learning_rate": 9.565622207875009e-05, "loss": 2.2979, "step": 15750 }, { "epoch": 0.13, "learning_rate": 9.565348699537256e-05, "loss": 2.3591, "step": 15755 }, { "epoch": 0.13, "learning_rate": 9.565075109031305e-05, "loss": 2.301, "step": 15760 }, { "epoch": 0.13, "learning_rate": 9.564801436362078e-05, "loss": 2.3919, "step": 15765 }, { "epoch": 0.13, "learning_rate": 9.564527681534503e-05, "loss": 2.3317, "step": 15770 }, { "epoch": 0.13, "learning_rate": 9.564253844553506e-05, "loss": 2.2735, "step": 15775 }, { "epoch": 0.13, "learning_rate": 9.563979925424014e-05, "loss": 2.4094, "step": 15780 }, { "epoch": 0.13, "learning_rate": 9.563705924150959e-05, "loss": 2.2847, "step": 15785 }, { "epoch": 0.13, "learning_rate": 9.563431840739271e-05, "loss": 2.3425, "step": 15790 }, { "epoch": 0.13, "learning_rate": 9.563157675193884e-05, "loss": 2.3299, "step": 15795 }, { "epoch": 0.13, "learning_rate": 9.562883427519733e-05, "loss": 2.3741, "step": 15800 }, { "epoch": 0.13, "learning_rate": 9.562609097721754e-05, "loss": 2.3158, "step": 15805 }, { "epoch": 0.13, "learning_rate": 9.562334685804882e-05, "loss": 2.3746, "step": 15810 }, { "epoch": 0.13, "learning_rate": 9.56206019177406e-05, "loss": 2.3249, "step": 15815 }, { "epoch": 0.13, "learning_rate": 9.561785615634225e-05, "loss": 2.3505, "step": 15820 }, { "epoch": 0.14, "learning_rate": 9.56151095739032e-05, "loss": 2.3482, "step": 15825 }, { "epoch": 0.14, "learning_rate": 9.561236217047288e-05, "loss": 2.3534, "step": 15830 }, { "epoch": 0.14, "learning_rate": 9.560961394610076e-05, "loss": 2.4138, "step": 15835 }, { "epoch": 0.14, "learning_rate": 9.560686490083626e-05, "loss": 2.4464, "step": 15840 }, { "epoch": 0.14, "learning_rate": 9.560411503472891e-05, "loss": 2.3021, "step": 15845 }, { "epoch": 0.14, "learning_rate": 9.560136434782816e-05, "loss": 2.466, "step": 15850 }, { "epoch": 0.14, "learning_rate": 9.559861284018354e-05, "loss": 2.3446, "step": 15855 }, { "epoch": 0.14, "learning_rate": 9.559586051184454e-05, "loss": 2.2842, "step": 15860 }, { "epoch": 0.14, "learning_rate": 9.559310736286075e-05, "loss": 2.3796, "step": 15865 }, { "epoch": 0.14, "learning_rate": 9.55903533932817e-05, "loss": 2.3651, "step": 15870 }, { "epoch": 0.14, "learning_rate": 9.558759860315694e-05, "loss": 2.3721, "step": 15875 }, { "epoch": 0.14, "learning_rate": 9.558484299253607e-05, "loss": 2.3766, "step": 15880 }, { "epoch": 0.14, "learning_rate": 9.558208656146868e-05, "loss": 2.3852, "step": 15885 }, { "epoch": 0.14, "learning_rate": 9.557932931000437e-05, "loss": 2.3226, "step": 15890 }, { "epoch": 0.14, "learning_rate": 9.55765712381928e-05, "loss": 2.4871, "step": 15895 }, { "epoch": 0.14, "learning_rate": 9.557381234608356e-05, "loss": 2.423, "step": 15900 }, { "epoch": 0.14, "learning_rate": 9.557105263372633e-05, "loss": 2.3465, "step": 15905 }, { "epoch": 0.14, "learning_rate": 9.55682921011708e-05, "loss": 2.3099, "step": 15910 }, { "epoch": 0.14, "learning_rate": 9.556553074846662e-05, "loss": 2.367, "step": 15915 }, { "epoch": 0.14, "learning_rate": 9.556276857566351e-05, "loss": 2.3462, "step": 15920 }, { "epoch": 0.14, "learning_rate": 9.556000558281118e-05, "loss": 2.4287, "step": 15925 }, { "epoch": 0.14, "learning_rate": 9.555724176995937e-05, "loss": 2.3548, "step": 15930 }, { "epoch": 0.14, "learning_rate": 9.55544771371578e-05, "loss": 2.3428, "step": 15935 }, { "epoch": 0.14, "learning_rate": 9.555171168445622e-05, "loss": 2.3627, "step": 15940 }, { "epoch": 0.14, "learning_rate": 9.554894541190446e-05, "loss": 2.3514, "step": 15945 }, { "epoch": 0.14, "learning_rate": 9.554617831955226e-05, "loss": 2.4192, "step": 15950 }, { "epoch": 0.14, "learning_rate": 9.554341040744943e-05, "loss": 2.393, "step": 15955 }, { "epoch": 0.14, "learning_rate": 9.554064167564579e-05, "loss": 2.4072, "step": 15960 }, { "epoch": 0.14, "learning_rate": 9.553787212419119e-05, "loss": 2.3881, "step": 15965 }, { "epoch": 0.14, "learning_rate": 9.553510175313544e-05, "loss": 2.3207, "step": 15970 }, { "epoch": 0.14, "learning_rate": 9.553233056252843e-05, "loss": 2.3823, "step": 15975 }, { "epoch": 0.14, "learning_rate": 9.552955855242004e-05, "loss": 2.4036, "step": 15980 }, { "epoch": 0.14, "learning_rate": 9.552678572286014e-05, "loss": 2.3194, "step": 15985 }, { "epoch": 0.14, "learning_rate": 9.552401207389866e-05, "loss": 2.3546, "step": 15990 }, { "epoch": 0.14, "learning_rate": 9.55212376055855e-05, "loss": 2.3956, "step": 15995 }, { "epoch": 0.14, "learning_rate": 9.551846231797061e-05, "loss": 2.3391, "step": 16000 }, { "epoch": 0.14, "learning_rate": 9.551568621110391e-05, "loss": 2.4515, "step": 16005 }, { "epoch": 0.14, "learning_rate": 9.551290928503543e-05, "loss": 2.4175, "step": 16010 }, { "epoch": 0.14, "learning_rate": 9.551013153981508e-05, "loss": 2.4038, "step": 16015 }, { "epoch": 0.14, "learning_rate": 9.550735297549289e-05, "loss": 2.2903, "step": 16020 }, { "epoch": 0.14, "learning_rate": 9.550457359211886e-05, "loss": 2.4047, "step": 16025 }, { "epoch": 0.14, "learning_rate": 9.550179338974302e-05, "loss": 2.407, "step": 16030 }, { "epoch": 0.14, "learning_rate": 9.549901236841539e-05, "loss": 2.2682, "step": 16035 }, { "epoch": 0.14, "learning_rate": 9.549623052818605e-05, "loss": 2.4094, "step": 16040 }, { "epoch": 0.14, "learning_rate": 9.549344786910506e-05, "loss": 2.4021, "step": 16045 }, { "epoch": 0.14, "learning_rate": 9.54906643912225e-05, "loss": 2.4832, "step": 16050 }, { "epoch": 0.14, "learning_rate": 9.548788009458846e-05, "loss": 2.2768, "step": 16055 }, { "epoch": 0.14, "learning_rate": 9.548509497925307e-05, "loss": 2.3646, "step": 16060 }, { "epoch": 0.14, "learning_rate": 9.548230904526643e-05, "loss": 2.3415, "step": 16065 }, { "epoch": 0.14, "learning_rate": 9.547952229267871e-05, "loss": 2.3512, "step": 16070 }, { "epoch": 0.14, "learning_rate": 9.547673472154006e-05, "loss": 2.3026, "step": 16075 }, { "epoch": 0.14, "learning_rate": 9.547394633190063e-05, "loss": 2.3728, "step": 16080 }, { "epoch": 0.14, "learning_rate": 9.547115712381065e-05, "loss": 2.4541, "step": 16085 }, { "epoch": 0.14, "learning_rate": 9.546836709732028e-05, "loss": 2.3792, "step": 16090 }, { "epoch": 0.14, "learning_rate": 9.546557625247974e-05, "loss": 2.3246, "step": 16095 }, { "epoch": 0.14, "learning_rate": 9.546278458933929e-05, "loss": 2.375, "step": 16100 }, { "epoch": 0.14, "learning_rate": 9.545999210794912e-05, "loss": 2.3415, "step": 16105 }, { "epoch": 0.14, "learning_rate": 9.545719880835955e-05, "loss": 2.3251, "step": 16110 }, { "epoch": 0.14, "learning_rate": 9.545440469062083e-05, "loss": 2.362, "step": 16115 }, { "epoch": 0.14, "learning_rate": 9.545160975478324e-05, "loss": 2.381, "step": 16120 }, { "epoch": 0.14, "learning_rate": 9.54488140008971e-05, "loss": 2.2871, "step": 16125 }, { "epoch": 0.14, "learning_rate": 9.544601742901271e-05, "loss": 2.3777, "step": 16130 }, { "epoch": 0.14, "learning_rate": 9.54432200391804e-05, "loss": 2.4189, "step": 16135 }, { "epoch": 0.14, "learning_rate": 9.544042183145056e-05, "loss": 2.4144, "step": 16140 }, { "epoch": 0.14, "learning_rate": 9.543762280587351e-05, "loss": 2.3506, "step": 16145 }, { "epoch": 0.14, "learning_rate": 9.543482296249964e-05, "loss": 2.4005, "step": 16150 }, { "epoch": 0.14, "learning_rate": 9.543202230137935e-05, "loss": 2.3677, "step": 16155 }, { "epoch": 0.14, "learning_rate": 9.542922082256303e-05, "loss": 2.4111, "step": 16160 }, { "epoch": 0.14, "learning_rate": 9.542641852610112e-05, "loss": 2.351, "step": 16165 }, { "epoch": 0.14, "learning_rate": 9.542361541204406e-05, "loss": 2.431, "step": 16170 }, { "epoch": 0.14, "learning_rate": 9.542081148044228e-05, "loss": 2.3134, "step": 16175 }, { "epoch": 0.14, "learning_rate": 9.541800673134626e-05, "loss": 2.3661, "step": 16180 }, { "epoch": 0.14, "learning_rate": 9.541520116480647e-05, "loss": 2.3632, "step": 16185 }, { "epoch": 0.14, "learning_rate": 9.541239478087342e-05, "loss": 2.3974, "step": 16190 }, { "epoch": 0.14, "learning_rate": 9.540958757959762e-05, "loss": 2.4063, "step": 16195 }, { "epoch": 0.14, "learning_rate": 9.540677956102957e-05, "loss": 2.3928, "step": 16200 }, { "epoch": 0.14, "learning_rate": 9.540397072521983e-05, "loss": 2.3838, "step": 16205 }, { "epoch": 0.14, "learning_rate": 9.540116107221895e-05, "loss": 2.3531, "step": 16210 }, { "epoch": 0.14, "learning_rate": 9.539835060207749e-05, "loss": 2.3367, "step": 16215 }, { "epoch": 0.14, "learning_rate": 9.539553931484605e-05, "loss": 2.3833, "step": 16220 }, { "epoch": 0.14, "learning_rate": 9.539272721057524e-05, "loss": 2.3507, "step": 16225 }, { "epoch": 0.14, "learning_rate": 9.538991428931563e-05, "loss": 2.4058, "step": 16230 }, { "epoch": 0.14, "learning_rate": 9.538710055111787e-05, "loss": 2.4943, "step": 16235 }, { "epoch": 0.14, "learning_rate": 9.538428599603261e-05, "loss": 2.3931, "step": 16240 }, { "epoch": 0.14, "learning_rate": 9.53814706241105e-05, "loss": 2.3692, "step": 16245 }, { "epoch": 0.14, "learning_rate": 9.537865443540221e-05, "loss": 2.3677, "step": 16250 }, { "epoch": 0.14, "learning_rate": 9.537583742995844e-05, "loss": 2.423, "step": 16255 }, { "epoch": 0.14, "learning_rate": 9.537301960782986e-05, "loss": 2.4195, "step": 16260 }, { "epoch": 0.14, "learning_rate": 9.537020096906721e-05, "loss": 2.407, "step": 16265 }, { "epoch": 0.14, "learning_rate": 9.536738151372122e-05, "loss": 2.2579, "step": 16270 }, { "epoch": 0.14, "learning_rate": 9.536456124184264e-05, "loss": 2.3815, "step": 16275 }, { "epoch": 0.14, "learning_rate": 9.53617401534822e-05, "loss": 2.3905, "step": 16280 }, { "epoch": 0.14, "learning_rate": 9.535891824869071e-05, "loss": 2.3465, "step": 16285 }, { "epoch": 0.14, "learning_rate": 9.535609552751895e-05, "loss": 2.3047, "step": 16290 }, { "epoch": 0.14, "learning_rate": 9.53532719900177e-05, "loss": 2.3762, "step": 16295 }, { "epoch": 0.14, "learning_rate": 9.535044763623781e-05, "loss": 2.3611, "step": 16300 }, { "epoch": 0.14, "learning_rate": 9.53476224662301e-05, "loss": 2.3354, "step": 16305 }, { "epoch": 0.14, "learning_rate": 9.534479648004541e-05, "loss": 2.3438, "step": 16310 }, { "epoch": 0.14, "learning_rate": 9.534196967773463e-05, "loss": 2.3843, "step": 16315 }, { "epoch": 0.14, "learning_rate": 9.53391420593486e-05, "loss": 2.4016, "step": 16320 }, { "epoch": 0.14, "learning_rate": 9.533631362493824e-05, "loss": 2.2717, "step": 16325 }, { "epoch": 0.14, "learning_rate": 9.533348437455445e-05, "loss": 2.4169, "step": 16330 }, { "epoch": 0.14, "learning_rate": 9.533065430824815e-05, "loss": 2.4468, "step": 16335 }, { "epoch": 0.14, "learning_rate": 9.532782342607027e-05, "loss": 2.3323, "step": 16340 }, { "epoch": 0.14, "learning_rate": 9.532499172807177e-05, "loss": 2.3319, "step": 16345 }, { "epoch": 0.14, "learning_rate": 9.532215921430361e-05, "loss": 2.4346, "step": 16350 }, { "epoch": 0.14, "learning_rate": 9.531932588481677e-05, "loss": 2.363, "step": 16355 }, { "epoch": 0.14, "learning_rate": 9.531649173966225e-05, "loss": 2.3374, "step": 16360 }, { "epoch": 0.14, "learning_rate": 9.531365677889105e-05, "loss": 2.44, "step": 16365 }, { "epoch": 0.14, "learning_rate": 9.531082100255422e-05, "loss": 2.3757, "step": 16370 }, { "epoch": 0.14, "learning_rate": 9.530798441070276e-05, "loss": 2.3706, "step": 16375 }, { "epoch": 0.14, "learning_rate": 9.530514700338776e-05, "loss": 2.3563, "step": 16380 }, { "epoch": 0.14, "learning_rate": 9.530230878066026e-05, "loss": 2.3282, "step": 16385 }, { "epoch": 0.14, "learning_rate": 9.529946974257136e-05, "loss": 2.3996, "step": 16390 }, { "epoch": 0.14, "learning_rate": 9.529662988917216e-05, "loss": 2.3543, "step": 16395 }, { "epoch": 0.14, "learning_rate": 9.529378922051375e-05, "loss": 2.3405, "step": 16400 }, { "epoch": 0.14, "learning_rate": 9.529094773664729e-05, "loss": 2.33, "step": 16405 }, { "epoch": 0.14, "learning_rate": 9.528810543762388e-05, "loss": 2.4333, "step": 16410 }, { "epoch": 0.14, "learning_rate": 9.52852623234947e-05, "loss": 2.4241, "step": 16415 }, { "epoch": 0.14, "learning_rate": 9.528241839431095e-05, "loss": 2.351, "step": 16420 }, { "epoch": 0.14, "learning_rate": 9.527957365012376e-05, "loss": 2.3909, "step": 16425 }, { "epoch": 0.14, "learning_rate": 9.527672809098438e-05, "loss": 2.4621, "step": 16430 }, { "epoch": 0.14, "learning_rate": 9.527388171694398e-05, "loss": 2.4247, "step": 16435 }, { "epoch": 0.14, "learning_rate": 9.527103452805381e-05, "loss": 2.4205, "step": 16440 }, { "epoch": 0.14, "learning_rate": 9.526818652436515e-05, "loss": 2.3695, "step": 16445 }, { "epoch": 0.14, "learning_rate": 9.52653377059292e-05, "loss": 2.3829, "step": 16450 }, { "epoch": 0.14, "learning_rate": 9.526248807279725e-05, "loss": 2.4017, "step": 16455 }, { "epoch": 0.14, "learning_rate": 9.525963762502062e-05, "loss": 2.3448, "step": 16460 }, { "epoch": 0.14, "learning_rate": 9.525678636265057e-05, "loss": 2.3561, "step": 16465 }, { "epoch": 0.14, "learning_rate": 9.525393428573846e-05, "loss": 2.3941, "step": 16470 }, { "epoch": 0.14, "learning_rate": 9.525108139433558e-05, "loss": 2.3952, "step": 16475 }, { "epoch": 0.14, "learning_rate": 9.524822768849331e-05, "loss": 2.3708, "step": 16480 }, { "epoch": 0.14, "learning_rate": 9.524537316826299e-05, "loss": 2.3916, "step": 16485 }, { "epoch": 0.14, "learning_rate": 9.524251783369602e-05, "loss": 2.3356, "step": 16490 }, { "epoch": 0.14, "learning_rate": 9.523966168484374e-05, "loss": 2.3841, "step": 16495 }, { "epoch": 0.14, "learning_rate": 9.523680472175764e-05, "loss": 2.4373, "step": 16500 }, { "epoch": 0.14, "learning_rate": 9.523394694448906e-05, "loss": 2.3356, "step": 16505 }, { "epoch": 0.14, "learning_rate": 9.523108835308948e-05, "loss": 2.3957, "step": 16510 }, { "epoch": 0.14, "learning_rate": 9.522822894761033e-05, "loss": 2.414, "step": 16515 }, { "epoch": 0.14, "learning_rate": 9.522536872810309e-05, "loss": 2.3113, "step": 16520 }, { "epoch": 0.14, "learning_rate": 9.522250769461922e-05, "loss": 2.4151, "step": 16525 }, { "epoch": 0.14, "learning_rate": 9.521964584721024e-05, "loss": 2.3049, "step": 16530 }, { "epoch": 0.14, "learning_rate": 9.521678318592761e-05, "loss": 2.3795, "step": 16535 }, { "epoch": 0.14, "learning_rate": 9.521391971082292e-05, "loss": 2.435, "step": 16540 }, { "epoch": 0.14, "learning_rate": 9.521105542194765e-05, "loss": 2.4014, "step": 16545 }, { "epoch": 0.14, "learning_rate": 9.520819031935338e-05, "loss": 2.3086, "step": 16550 }, { "epoch": 0.14, "learning_rate": 9.520532440309166e-05, "loss": 2.3816, "step": 16555 }, { "epoch": 0.14, "learning_rate": 9.520245767321409e-05, "loss": 2.4163, "step": 16560 }, { "epoch": 0.14, "learning_rate": 9.519959012977227e-05, "loss": 2.3816, "step": 16565 }, { "epoch": 0.14, "learning_rate": 9.51967217728178e-05, "loss": 2.2786, "step": 16570 }, { "epoch": 0.14, "learning_rate": 9.519385260240229e-05, "loss": 2.4444, "step": 16575 }, { "epoch": 0.14, "learning_rate": 9.51909826185774e-05, "loss": 2.4194, "step": 16580 }, { "epoch": 0.14, "learning_rate": 9.518811182139478e-05, "loss": 2.318, "step": 16585 }, { "epoch": 0.14, "learning_rate": 9.518524021090609e-05, "loss": 2.3556, "step": 16590 }, { "epoch": 0.14, "learning_rate": 9.518236778716303e-05, "loss": 2.4, "step": 16595 }, { "epoch": 0.14, "learning_rate": 9.517949455021728e-05, "loss": 2.3986, "step": 16600 }, { "epoch": 0.14, "learning_rate": 9.517662050012058e-05, "loss": 2.3155, "step": 16605 }, { "epoch": 0.14, "learning_rate": 9.517374563692463e-05, "loss": 2.4088, "step": 16610 }, { "epoch": 0.14, "learning_rate": 9.517086996068118e-05, "loss": 2.414, "step": 16615 }, { "epoch": 0.14, "learning_rate": 9.516799347144201e-05, "loss": 2.3799, "step": 16620 }, { "epoch": 0.14, "learning_rate": 9.516511616925887e-05, "loss": 2.3538, "step": 16625 }, { "epoch": 0.14, "learning_rate": 9.516223805418354e-05, "loss": 2.3756, "step": 16630 }, { "epoch": 0.14, "learning_rate": 9.515935912626783e-05, "loss": 2.3819, "step": 16635 }, { "epoch": 0.14, "learning_rate": 9.515647938556356e-05, "loss": 2.332, "step": 16640 }, { "epoch": 0.14, "learning_rate": 9.515359883212255e-05, "loss": 2.3797, "step": 16645 }, { "epoch": 0.14, "learning_rate": 9.515071746599666e-05, "loss": 2.4738, "step": 16650 }, { "epoch": 0.14, "learning_rate": 9.514783528723772e-05, "loss": 2.3264, "step": 16655 }, { "epoch": 0.14, "learning_rate": 9.514495229589765e-05, "loss": 2.3474, "step": 16660 }, { "epoch": 0.14, "learning_rate": 9.51420684920283e-05, "loss": 2.3955, "step": 16665 }, { "epoch": 0.14, "learning_rate": 9.513918387568159e-05, "loss": 2.4153, "step": 16670 }, { "epoch": 0.14, "learning_rate": 9.513629844690943e-05, "loss": 2.2553, "step": 16675 }, { "epoch": 0.14, "learning_rate": 9.513341220576377e-05, "loss": 2.3776, "step": 16680 }, { "epoch": 0.14, "learning_rate": 9.513052515229653e-05, "loss": 2.3604, "step": 16685 }, { "epoch": 0.14, "learning_rate": 9.512763728655969e-05, "loss": 2.3433, "step": 16690 }, { "epoch": 0.14, "learning_rate": 9.512474860860523e-05, "loss": 2.4177, "step": 16695 }, { "epoch": 0.14, "learning_rate": 9.512185911848512e-05, "loss": 2.3459, "step": 16700 }, { "epoch": 0.14, "learning_rate": 9.511896881625139e-05, "loss": 2.386, "step": 16705 }, { "epoch": 0.14, "learning_rate": 9.511607770195606e-05, "loss": 2.3631, "step": 16710 }, { "epoch": 0.14, "learning_rate": 9.511318577565114e-05, "loss": 2.3936, "step": 16715 }, { "epoch": 0.14, "learning_rate": 9.51102930373887e-05, "loss": 2.3677, "step": 16720 }, { "epoch": 0.14, "learning_rate": 9.51073994872208e-05, "loss": 2.3898, "step": 16725 }, { "epoch": 0.14, "learning_rate": 9.510450512519951e-05, "loss": 2.3869, "step": 16730 }, { "epoch": 0.14, "learning_rate": 9.510160995137693e-05, "loss": 2.415, "step": 16735 }, { "epoch": 0.14, "learning_rate": 9.509871396580518e-05, "loss": 2.3299, "step": 16740 }, { "epoch": 0.14, "learning_rate": 9.509581716853637e-05, "loss": 2.3862, "step": 16745 }, { "epoch": 0.14, "learning_rate": 9.509291955962262e-05, "loss": 2.3934, "step": 16750 }, { "epoch": 0.14, "learning_rate": 9.509002113911613e-05, "loss": 2.4121, "step": 16755 }, { "epoch": 0.14, "learning_rate": 9.508712190706903e-05, "loss": 2.4114, "step": 16760 }, { "epoch": 0.14, "learning_rate": 9.50842218635335e-05, "loss": 2.3821, "step": 16765 }, { "epoch": 0.14, "learning_rate": 9.508132100856173e-05, "loss": 2.3454, "step": 16770 }, { "epoch": 0.14, "learning_rate": 9.507841934220597e-05, "loss": 2.3264, "step": 16775 }, { "epoch": 0.14, "learning_rate": 9.50755168645184e-05, "loss": 2.4101, "step": 16780 }, { "epoch": 0.14, "learning_rate": 9.507261357555129e-05, "loss": 2.3536, "step": 16785 }, { "epoch": 0.14, "learning_rate": 9.506970947535688e-05, "loss": 2.3848, "step": 16790 }, { "epoch": 0.14, "learning_rate": 9.506680456398741e-05, "loss": 2.4085, "step": 16795 }, { "epoch": 0.14, "learning_rate": 9.506389884149525e-05, "loss": 2.3942, "step": 16800 }, { "epoch": 0.14, "learning_rate": 9.50609923079326e-05, "loss": 2.4049, "step": 16805 }, { "epoch": 0.14, "learning_rate": 9.505808496335183e-05, "loss": 2.2669, "step": 16810 }, { "epoch": 0.14, "learning_rate": 9.505517680780526e-05, "loss": 2.3545, "step": 16815 }, { "epoch": 0.14, "learning_rate": 9.505226784134521e-05, "loss": 2.3468, "step": 16820 }, { "epoch": 0.14, "learning_rate": 9.504935806402405e-05, "loss": 2.3197, "step": 16825 }, { "epoch": 0.14, "learning_rate": 9.504644747589415e-05, "loss": 2.4159, "step": 16830 }, { "epoch": 0.14, "learning_rate": 9.504353607700792e-05, "loss": 2.3522, "step": 16835 }, { "epoch": 0.14, "learning_rate": 9.50406238674177e-05, "loss": 2.3756, "step": 16840 }, { "epoch": 0.14, "learning_rate": 9.503771084717595e-05, "loss": 2.2679, "step": 16845 }, { "epoch": 0.14, "learning_rate": 9.50347970163351e-05, "loss": 2.4179, "step": 16850 }, { "epoch": 0.14, "learning_rate": 9.503188237494758e-05, "loss": 2.3867, "step": 16855 }, { "epoch": 0.14, "learning_rate": 9.502896692306584e-05, "loss": 2.3558, "step": 16860 }, { "epoch": 0.14, "learning_rate": 9.50260506607424e-05, "loss": 2.3684, "step": 16865 }, { "epoch": 0.14, "learning_rate": 9.502313358802968e-05, "loss": 2.4241, "step": 16870 }, { "epoch": 0.14, "learning_rate": 9.502021570498021e-05, "loss": 2.3312, "step": 16875 }, { "epoch": 0.14, "learning_rate": 9.501729701164652e-05, "loss": 2.3624, "step": 16880 }, { "epoch": 0.14, "learning_rate": 9.501437750808115e-05, "loss": 2.4006, "step": 16885 }, { "epoch": 0.14, "learning_rate": 9.501145719433662e-05, "loss": 2.3612, "step": 16890 }, { "epoch": 0.14, "learning_rate": 9.500853607046548e-05, "loss": 2.389, "step": 16895 }, { "epoch": 0.14, "learning_rate": 9.500561413652034e-05, "loss": 2.3788, "step": 16900 }, { "epoch": 0.14, "learning_rate": 9.500269139255377e-05, "loss": 2.3654, "step": 16905 }, { "epoch": 0.14, "learning_rate": 9.499976783861839e-05, "loss": 2.2816, "step": 16910 }, { "epoch": 0.14, "learning_rate": 9.499684347476678e-05, "loss": 2.4502, "step": 16915 }, { "epoch": 0.14, "learning_rate": 9.499391830105162e-05, "loss": 2.3909, "step": 16920 }, { "epoch": 0.14, "learning_rate": 9.499099231752554e-05, "loss": 2.2317, "step": 16925 }, { "epoch": 0.14, "learning_rate": 9.49880655242412e-05, "loss": 2.3139, "step": 16930 }, { "epoch": 0.14, "learning_rate": 9.498513792125126e-05, "loss": 2.4268, "step": 16935 }, { "epoch": 0.14, "learning_rate": 9.498220950860844e-05, "loss": 2.3224, "step": 16940 }, { "epoch": 0.14, "learning_rate": 9.497928028636545e-05, "loss": 2.3782, "step": 16945 }, { "epoch": 0.14, "learning_rate": 9.497635025457497e-05, "loss": 2.3233, "step": 16950 }, { "epoch": 0.14, "learning_rate": 9.497341941328977e-05, "loss": 2.3038, "step": 16955 }, { "epoch": 0.14, "learning_rate": 9.49704877625626e-05, "loss": 2.4553, "step": 16960 }, { "epoch": 0.14, "learning_rate": 9.496755530244622e-05, "loss": 2.3273, "step": 16965 }, { "epoch": 0.14, "learning_rate": 9.49646220329934e-05, "loss": 2.3386, "step": 16970 }, { "epoch": 0.14, "learning_rate": 9.496168795425693e-05, "loss": 2.3219, "step": 16975 }, { "epoch": 0.14, "learning_rate": 9.495875306628965e-05, "loss": 2.4085, "step": 16980 }, { "epoch": 0.14, "learning_rate": 9.495581736914433e-05, "loss": 2.4274, "step": 16985 }, { "epoch": 0.14, "learning_rate": 9.495288086287386e-05, "loss": 2.3227, "step": 16990 }, { "epoch": 0.15, "learning_rate": 9.494994354753106e-05, "loss": 2.4118, "step": 16995 }, { "epoch": 0.15, "learning_rate": 9.494700542316882e-05, "loss": 2.3689, "step": 17000 }, { "epoch": 0.15, "learning_rate": 9.494406648983998e-05, "loss": 2.3719, "step": 17005 }, { "epoch": 0.15, "learning_rate": 9.494112674759747e-05, "loss": 2.3463, "step": 17010 }, { "epoch": 0.15, "learning_rate": 9.493818619649421e-05, "loss": 2.3646, "step": 17015 }, { "epoch": 0.15, "learning_rate": 9.49352448365831e-05, "loss": 2.3976, "step": 17020 }, { "epoch": 0.15, "learning_rate": 9.493230266791707e-05, "loss": 2.3952, "step": 17025 }, { "epoch": 0.15, "learning_rate": 9.49293596905491e-05, "loss": 2.3316, "step": 17030 }, { "epoch": 0.15, "learning_rate": 9.492641590453215e-05, "loss": 2.386, "step": 17035 }, { "epoch": 0.15, "learning_rate": 9.49234713099192e-05, "loss": 2.4024, "step": 17040 }, { "epoch": 0.15, "learning_rate": 9.492052590676325e-05, "loss": 2.3943, "step": 17045 }, { "epoch": 0.15, "learning_rate": 9.491757969511732e-05, "loss": 2.4029, "step": 17050 }, { "epoch": 0.15, "learning_rate": 9.491463267503443e-05, "loss": 2.4344, "step": 17055 }, { "epoch": 0.15, "learning_rate": 9.491168484656761e-05, "loss": 2.3722, "step": 17060 }, { "epoch": 0.15, "learning_rate": 9.490873620976993e-05, "loss": 2.373, "step": 17065 }, { "epoch": 0.15, "learning_rate": 9.490578676469445e-05, "loss": 2.475, "step": 17070 }, { "epoch": 0.15, "learning_rate": 9.490283651139426e-05, "loss": 2.3237, "step": 17075 }, { "epoch": 0.15, "learning_rate": 9.489988544992245e-05, "loss": 2.3205, "step": 17080 }, { "epoch": 0.15, "learning_rate": 9.489693358033216e-05, "loss": 2.3807, "step": 17085 }, { "epoch": 0.15, "learning_rate": 9.48939809026765e-05, "loss": 2.3206, "step": 17090 }, { "epoch": 0.15, "learning_rate": 9.489102741700859e-05, "loss": 2.4568, "step": 17095 }, { "epoch": 0.15, "learning_rate": 9.488807312338163e-05, "loss": 2.3172, "step": 17100 }, { "epoch": 0.15, "learning_rate": 9.488511802184879e-05, "loss": 2.3484, "step": 17105 }, { "epoch": 0.15, "learning_rate": 9.488216211246321e-05, "loss": 2.3715, "step": 17110 }, { "epoch": 0.15, "learning_rate": 9.487920539527815e-05, "loss": 2.334, "step": 17115 }, { "epoch": 0.15, "learning_rate": 9.487624787034678e-05, "loss": 2.3475, "step": 17120 }, { "epoch": 0.15, "learning_rate": 9.487328953772234e-05, "loss": 2.5037, "step": 17125 }, { "epoch": 0.15, "learning_rate": 9.48703303974581e-05, "loss": 2.278, "step": 17130 }, { "epoch": 0.15, "learning_rate": 9.48673704496073e-05, "loss": 2.323, "step": 17135 }, { "epoch": 0.15, "learning_rate": 9.486440969422321e-05, "loss": 2.3155, "step": 17140 }, { "epoch": 0.15, "learning_rate": 9.486144813135913e-05, "loss": 2.4012, "step": 17145 }, { "epoch": 0.15, "learning_rate": 9.485848576106835e-05, "loss": 2.326, "step": 17150 }, { "epoch": 0.15, "learning_rate": 9.485552258340419e-05, "loss": 2.4049, "step": 17155 }, { "epoch": 0.15, "learning_rate": 9.485255859842e-05, "loss": 2.348, "step": 17160 }, { "epoch": 0.15, "learning_rate": 9.484959380616908e-05, "loss": 2.3917, "step": 17165 }, { "epoch": 0.15, "learning_rate": 9.484662820670486e-05, "loss": 2.4314, "step": 17170 }, { "epoch": 0.15, "learning_rate": 9.484366180008067e-05, "loss": 2.4165, "step": 17175 }, { "epoch": 0.15, "learning_rate": 9.48406945863499e-05, "loss": 2.4083, "step": 17180 }, { "epoch": 0.15, "learning_rate": 9.483772656556597e-05, "loss": 2.3949, "step": 17185 }, { "epoch": 0.15, "learning_rate": 9.48347577377823e-05, "loss": 2.4135, "step": 17190 }, { "epoch": 0.15, "learning_rate": 9.48317881030523e-05, "loss": 2.3498, "step": 17195 }, { "epoch": 0.15, "learning_rate": 9.482881766142943e-05, "loss": 2.3585, "step": 17200 }, { "epoch": 0.15, "learning_rate": 9.48258464129672e-05, "loss": 2.3749, "step": 17205 }, { "epoch": 0.15, "learning_rate": 9.4822874357719e-05, "loss": 2.2604, "step": 17210 }, { "epoch": 0.15, "learning_rate": 9.481990149573838e-05, "loss": 2.3492, "step": 17215 }, { "epoch": 0.15, "learning_rate": 9.481692782707883e-05, "loss": 2.3742, "step": 17220 }, { "epoch": 0.15, "learning_rate": 9.481395335179389e-05, "loss": 2.3681, "step": 17225 }, { "epoch": 0.15, "learning_rate": 9.481097806993706e-05, "loss": 2.3535, "step": 17230 }, { "epoch": 0.15, "learning_rate": 9.48080019815619e-05, "loss": 2.3815, "step": 17235 }, { "epoch": 0.15, "learning_rate": 9.4805025086722e-05, "loss": 2.3534, "step": 17240 }, { "epoch": 0.15, "learning_rate": 9.480204738547093e-05, "loss": 2.3835, "step": 17245 }, { "epoch": 0.15, "learning_rate": 9.479906887786227e-05, "loss": 2.3669, "step": 17250 }, { "epoch": 0.15, "learning_rate": 9.479608956394963e-05, "loss": 2.3734, "step": 17255 }, { "epoch": 0.15, "learning_rate": 9.479310944378662e-05, "loss": 2.3492, "step": 17260 }, { "epoch": 0.15, "learning_rate": 9.47901285174269e-05, "loss": 2.3662, "step": 17265 }, { "epoch": 0.15, "learning_rate": 9.478714678492413e-05, "loss": 2.3945, "step": 17270 }, { "epoch": 0.15, "learning_rate": 9.478416424633194e-05, "loss": 2.3553, "step": 17275 }, { "epoch": 0.15, "learning_rate": 9.478118090170404e-05, "loss": 2.3086, "step": 17280 }, { "epoch": 0.15, "learning_rate": 9.477819675109412e-05, "loss": 2.3643, "step": 17285 }, { "epoch": 0.15, "learning_rate": 9.477521179455588e-05, "loss": 2.3885, "step": 17290 }, { "epoch": 0.15, "learning_rate": 9.477222603214304e-05, "loss": 2.3008, "step": 17295 }, { "epoch": 0.15, "learning_rate": 9.476923946390934e-05, "loss": 2.4357, "step": 17300 }, { "epoch": 0.15, "learning_rate": 9.476625208990855e-05, "loss": 2.3806, "step": 17305 }, { "epoch": 0.15, "learning_rate": 9.476326391019444e-05, "loss": 2.3419, "step": 17310 }, { "epoch": 0.15, "learning_rate": 9.476027492482076e-05, "loss": 2.3941, "step": 17315 }, { "epoch": 0.15, "learning_rate": 9.475728513384133e-05, "loss": 2.3583, "step": 17320 }, { "epoch": 0.15, "learning_rate": 9.475429453730997e-05, "loss": 2.3751, "step": 17325 }, { "epoch": 0.15, "learning_rate": 9.475130313528047e-05, "loss": 2.3756, "step": 17330 }, { "epoch": 0.15, "learning_rate": 9.47483109278067e-05, "loss": 2.3206, "step": 17335 }, { "epoch": 0.15, "learning_rate": 9.474531791494251e-05, "loss": 2.329, "step": 17340 }, { "epoch": 0.15, "learning_rate": 9.474232409674178e-05, "loss": 2.4341, "step": 17345 }, { "epoch": 0.15, "learning_rate": 9.473932947325834e-05, "loss": 2.3642, "step": 17350 }, { "epoch": 0.15, "learning_rate": 9.473633404454616e-05, "loss": 2.3778, "step": 17355 }, { "epoch": 0.15, "learning_rate": 9.47333378106591e-05, "loss": 2.2773, "step": 17360 }, { "epoch": 0.15, "learning_rate": 9.473034077165111e-05, "loss": 2.2734, "step": 17365 }, { "epoch": 0.15, "learning_rate": 9.472734292757615e-05, "loss": 2.4001, "step": 17370 }, { "epoch": 0.15, "learning_rate": 9.472434427848812e-05, "loss": 2.3871, "step": 17375 }, { "epoch": 0.15, "learning_rate": 9.472134482444104e-05, "loss": 2.2886, "step": 17380 }, { "epoch": 0.15, "learning_rate": 9.471834456548888e-05, "loss": 2.3385, "step": 17385 }, { "epoch": 0.15, "learning_rate": 9.471534350168562e-05, "loss": 2.3768, "step": 17390 }, { "epoch": 0.15, "learning_rate": 9.471234163308532e-05, "loss": 2.4396, "step": 17395 }, { "epoch": 0.15, "learning_rate": 9.470933895974195e-05, "loss": 2.3916, "step": 17400 }, { "epoch": 0.15, "learning_rate": 9.470633548170959e-05, "loss": 2.3754, "step": 17405 }, { "epoch": 0.15, "learning_rate": 9.470333119904232e-05, "loss": 2.369, "step": 17410 }, { "epoch": 0.15, "learning_rate": 9.470032611179414e-05, "loss": 2.4119, "step": 17415 }, { "epoch": 0.15, "learning_rate": 9.469732022001921e-05, "loss": 2.4343, "step": 17420 }, { "epoch": 0.15, "learning_rate": 9.469431352377159e-05, "loss": 2.3807, "step": 17425 }, { "epoch": 0.15, "learning_rate": 9.469130602310538e-05, "loss": 2.3901, "step": 17430 }, { "epoch": 0.15, "learning_rate": 9.468829771807476e-05, "loss": 2.4665, "step": 17435 }, { "epoch": 0.15, "learning_rate": 9.468528860873384e-05, "loss": 2.3184, "step": 17440 }, { "epoch": 0.15, "learning_rate": 9.468227869513679e-05, "loss": 2.3873, "step": 17445 }, { "epoch": 0.15, "learning_rate": 9.467926797733777e-05, "loss": 2.3827, "step": 17450 }, { "epoch": 0.15, "learning_rate": 9.4676256455391e-05, "loss": 2.3871, "step": 17455 }, { "epoch": 0.15, "learning_rate": 9.467324412935064e-05, "loss": 2.3885, "step": 17460 }, { "epoch": 0.15, "learning_rate": 9.467023099927091e-05, "loss": 2.3762, "step": 17465 }, { "epoch": 0.15, "learning_rate": 9.466721706520608e-05, "loss": 2.4209, "step": 17470 }, { "epoch": 0.15, "learning_rate": 9.466420232721037e-05, "loss": 2.3873, "step": 17475 }, { "epoch": 0.15, "learning_rate": 9.466118678533804e-05, "loss": 2.3349, "step": 17480 }, { "epoch": 0.15, "learning_rate": 9.465817043964337e-05, "loss": 2.3942, "step": 17485 }, { "epoch": 0.15, "learning_rate": 9.465515329018065e-05, "loss": 2.3701, "step": 17490 }, { "epoch": 0.15, "learning_rate": 9.465213533700415e-05, "loss": 2.3549, "step": 17495 }, { "epoch": 0.15, "learning_rate": 9.464911658016824e-05, "loss": 2.415, "step": 17500 }, { "epoch": 0.15, "learning_rate": 9.464609701972723e-05, "loss": 2.3511, "step": 17505 }, { "epoch": 0.15, "learning_rate": 9.464307665573547e-05, "loss": 2.432, "step": 17510 }, { "epoch": 0.15, "learning_rate": 9.46400554882473e-05, "loss": 2.3874, "step": 17515 }, { "epoch": 0.15, "learning_rate": 9.463703351731712e-05, "loss": 2.459, "step": 17520 }, { "epoch": 0.15, "learning_rate": 9.46340107429993e-05, "loss": 2.4334, "step": 17525 }, { "epoch": 0.15, "learning_rate": 9.463098716534828e-05, "loss": 2.4031, "step": 17530 }, { "epoch": 0.15, "learning_rate": 9.462796278441846e-05, "loss": 2.4102, "step": 17535 }, { "epoch": 0.15, "learning_rate": 9.462493760026425e-05, "loss": 2.2223, "step": 17540 }, { "epoch": 0.15, "learning_rate": 9.462191161294012e-05, "loss": 2.4287, "step": 17545 }, { "epoch": 0.15, "learning_rate": 9.461888482250054e-05, "loss": 2.3911, "step": 17550 }, { "epoch": 0.15, "learning_rate": 9.461585722899997e-05, "loss": 2.338, "step": 17555 }, { "epoch": 0.15, "learning_rate": 9.461282883249292e-05, "loss": 2.383, "step": 17560 }, { "epoch": 0.15, "learning_rate": 9.460979963303388e-05, "loss": 2.4366, "step": 17565 }, { "epoch": 0.15, "learning_rate": 9.460676963067737e-05, "loss": 2.3252, "step": 17570 }, { "epoch": 0.15, "learning_rate": 9.460373882547792e-05, "loss": 2.3113, "step": 17575 }, { "epoch": 0.15, "learning_rate": 9.460070721749009e-05, "loss": 2.3625, "step": 17580 }, { "epoch": 0.15, "learning_rate": 9.459767480676845e-05, "loss": 2.3827, "step": 17585 }, { "epoch": 0.15, "learning_rate": 9.459464159336757e-05, "loss": 2.341, "step": 17590 }, { "epoch": 0.15, "learning_rate": 9.459160757734205e-05, "loss": 2.3505, "step": 17595 }, { "epoch": 0.15, "learning_rate": 9.458857275874646e-05, "loss": 2.3755, "step": 17600 }, { "epoch": 0.15, "learning_rate": 9.458553713763548e-05, "loss": 2.3164, "step": 17605 }, { "epoch": 0.15, "learning_rate": 9.458250071406371e-05, "loss": 2.3979, "step": 17610 }, { "epoch": 0.15, "learning_rate": 9.457946348808579e-05, "loss": 2.3875, "step": 17615 }, { "epoch": 0.15, "learning_rate": 9.457642545975643e-05, "loss": 2.3493, "step": 17620 }, { "epoch": 0.15, "learning_rate": 9.457338662913027e-05, "loss": 2.4208, "step": 17625 }, { "epoch": 0.15, "learning_rate": 9.457034699626199e-05, "loss": 2.3179, "step": 17630 }, { "epoch": 0.15, "learning_rate": 9.456730656120636e-05, "loss": 2.3649, "step": 17635 }, { "epoch": 0.15, "learning_rate": 9.456426532401803e-05, "loss": 2.3794, "step": 17640 }, { "epoch": 0.15, "learning_rate": 9.456122328475179e-05, "loss": 2.3943, "step": 17645 }, { "epoch": 0.15, "learning_rate": 9.455818044346238e-05, "loss": 2.3461, "step": 17650 }, { "epoch": 0.15, "learning_rate": 9.455513680020454e-05, "loss": 2.3855, "step": 17655 }, { "epoch": 0.15, "learning_rate": 9.455209235503308e-05, "loss": 2.3498, "step": 17660 }, { "epoch": 0.15, "learning_rate": 9.454904710800278e-05, "loss": 2.4332, "step": 17665 }, { "epoch": 0.15, "learning_rate": 9.454600105916846e-05, "loss": 2.4355, "step": 17670 }, { "epoch": 0.15, "learning_rate": 9.454295420858493e-05, "loss": 2.3872, "step": 17675 }, { "epoch": 0.15, "learning_rate": 9.453990655630702e-05, "loss": 2.3538, "step": 17680 }, { "epoch": 0.15, "learning_rate": 9.453685810238962e-05, "loss": 2.3709, "step": 17685 }, { "epoch": 0.15, "learning_rate": 9.453380884688756e-05, "loss": 2.2957, "step": 17690 }, { "epoch": 0.15, "learning_rate": 9.453075878985573e-05, "loss": 2.4267, "step": 17695 }, { "epoch": 0.15, "learning_rate": 9.452770793134904e-05, "loss": 2.4624, "step": 17700 }, { "epoch": 0.15, "learning_rate": 9.452465627142238e-05, "loss": 2.4279, "step": 17705 }, { "epoch": 0.15, "learning_rate": 9.452160381013069e-05, "loss": 2.4024, "step": 17710 }, { "epoch": 0.15, "learning_rate": 9.45185505475289e-05, "loss": 2.3799, "step": 17715 }, { "epoch": 0.15, "learning_rate": 9.451549648367198e-05, "loss": 2.4494, "step": 17720 }, { "epoch": 0.15, "learning_rate": 9.451244161861487e-05, "loss": 2.3337, "step": 17725 }, { "epoch": 0.15, "learning_rate": 9.450938595241257e-05, "loss": 2.4449, "step": 17730 }, { "epoch": 0.15, "learning_rate": 9.450632948512007e-05, "loss": 2.3681, "step": 17735 }, { "epoch": 0.15, "learning_rate": 9.450327221679239e-05, "loss": 2.3297, "step": 17740 }, { "epoch": 0.15, "learning_rate": 9.450021414748454e-05, "loss": 2.3598, "step": 17745 }, { "epoch": 0.15, "learning_rate": 9.449715527725159e-05, "loss": 2.2852, "step": 17750 }, { "epoch": 0.15, "learning_rate": 9.449409560614855e-05, "loss": 2.3972, "step": 17755 }, { "epoch": 0.15, "learning_rate": 9.449103513423053e-05, "loss": 2.348, "step": 17760 }, { "epoch": 0.15, "learning_rate": 9.448797386155258e-05, "loss": 2.2946, "step": 17765 }, { "epoch": 0.15, "learning_rate": 9.448491178816981e-05, "loss": 2.365, "step": 17770 }, { "epoch": 0.15, "learning_rate": 9.448184891413736e-05, "loss": 2.3289, "step": 17775 }, { "epoch": 0.15, "learning_rate": 9.447878523951031e-05, "loss": 2.3924, "step": 17780 }, { "epoch": 0.15, "learning_rate": 9.447572076434382e-05, "loss": 2.2749, "step": 17785 }, { "epoch": 0.15, "learning_rate": 9.447265548869307e-05, "loss": 2.3792, "step": 17790 }, { "epoch": 0.15, "learning_rate": 9.446958941261316e-05, "loss": 2.363, "step": 17795 }, { "epoch": 0.15, "learning_rate": 9.446652253615936e-05, "loss": 2.34, "step": 17800 }, { "epoch": 0.15, "learning_rate": 9.446345485938683e-05, "loss": 2.3121, "step": 17805 }, { "epoch": 0.15, "learning_rate": 9.446038638235076e-05, "loss": 2.3839, "step": 17810 }, { "epoch": 0.15, "learning_rate": 9.445731710510641e-05, "loss": 2.4279, "step": 17815 }, { "epoch": 0.15, "learning_rate": 9.445424702770903e-05, "loss": 2.3483, "step": 17820 }, { "epoch": 0.15, "learning_rate": 9.445117615021382e-05, "loss": 2.3566, "step": 17825 }, { "epoch": 0.15, "learning_rate": 9.444810447267609e-05, "loss": 2.3227, "step": 17830 }, { "epoch": 0.15, "learning_rate": 9.444503199515114e-05, "loss": 2.4219, "step": 17835 }, { "epoch": 0.15, "learning_rate": 9.444195871769425e-05, "loss": 2.3621, "step": 17840 }, { "epoch": 0.15, "learning_rate": 9.443888464036073e-05, "loss": 2.3666, "step": 17845 }, { "epoch": 0.15, "learning_rate": 9.44358097632059e-05, "loss": 2.3334, "step": 17850 }, { "epoch": 0.15, "learning_rate": 9.443273408628512e-05, "loss": 2.3671, "step": 17855 }, { "epoch": 0.15, "learning_rate": 9.442965760965374e-05, "loss": 2.4096, "step": 17860 }, { "epoch": 0.15, "learning_rate": 9.442658033336714e-05, "loss": 2.3718, "step": 17865 }, { "epoch": 0.15, "learning_rate": 9.44235022574807e-05, "loss": 2.3719, "step": 17870 }, { "epoch": 0.15, "learning_rate": 9.44204233820498e-05, "loss": 2.4222, "step": 17875 }, { "epoch": 0.15, "learning_rate": 9.44173437071299e-05, "loss": 2.3656, "step": 17880 }, { "epoch": 0.15, "learning_rate": 9.441426323277638e-05, "loss": 2.3859, "step": 17885 }, { "epoch": 0.15, "learning_rate": 9.44111819590447e-05, "loss": 2.3324, "step": 17890 }, { "epoch": 0.15, "learning_rate": 9.440809988599033e-05, "loss": 2.4552, "step": 17895 }, { "epoch": 0.15, "learning_rate": 9.440501701366873e-05, "loss": 2.3525, "step": 17900 }, { "epoch": 0.15, "learning_rate": 9.44019333421354e-05, "loss": 2.3311, "step": 17905 }, { "epoch": 0.15, "learning_rate": 9.43988488714458e-05, "loss": 2.2893, "step": 17910 }, { "epoch": 0.15, "learning_rate": 9.439576360165552e-05, "loss": 2.3403, "step": 17915 }, { "epoch": 0.15, "learning_rate": 9.439267753282002e-05, "loss": 2.4036, "step": 17920 }, { "epoch": 0.15, "learning_rate": 9.438959066499487e-05, "loss": 2.3821, "step": 17925 }, { "epoch": 0.15, "learning_rate": 9.438650299823562e-05, "loss": 2.3403, "step": 17930 }, { "epoch": 0.15, "learning_rate": 9.438341453259784e-05, "loss": 2.2645, "step": 17935 }, { "epoch": 0.15, "learning_rate": 9.438032526813713e-05, "loss": 2.3492, "step": 17940 }, { "epoch": 0.15, "learning_rate": 9.43772352049091e-05, "loss": 2.3473, "step": 17945 }, { "epoch": 0.15, "learning_rate": 9.437414434296937e-05, "loss": 2.3547, "step": 17950 }, { "epoch": 0.15, "learning_rate": 9.437105268237351e-05, "loss": 2.418, "step": 17955 }, { "epoch": 0.15, "learning_rate": 9.436796022317724e-05, "loss": 2.3814, "step": 17960 }, { "epoch": 0.15, "learning_rate": 9.436486696543617e-05, "loss": 2.3776, "step": 17965 }, { "epoch": 0.15, "learning_rate": 9.4361772909206e-05, "loss": 2.4216, "step": 17970 }, { "epoch": 0.15, "learning_rate": 9.43586780545424e-05, "loss": 2.2731, "step": 17975 }, { "epoch": 0.15, "learning_rate": 9.435558240150106e-05, "loss": 2.2716, "step": 17980 }, { "epoch": 0.15, "learning_rate": 9.435248595013775e-05, "loss": 2.3459, "step": 17985 }, { "epoch": 0.15, "learning_rate": 9.434938870050814e-05, "loss": 2.3098, "step": 17990 }, { "epoch": 0.15, "learning_rate": 9.434629065266801e-05, "loss": 2.3751, "step": 17995 }, { "epoch": 0.15, "learning_rate": 9.43431918066731e-05, "loss": 2.3887, "step": 18000 }, { "epoch": 0.15, "learning_rate": 9.434009216257921e-05, "loss": 2.3669, "step": 18005 }, { "epoch": 0.15, "learning_rate": 9.433699172044211e-05, "loss": 2.378, "step": 18010 }, { "epoch": 0.15, "learning_rate": 9.43338904803176e-05, "loss": 2.3275, "step": 18015 }, { "epoch": 0.15, "learning_rate": 9.433078844226148e-05, "loss": 2.3347, "step": 18020 }, { "epoch": 0.15, "learning_rate": 9.432768560632962e-05, "loss": 2.306, "step": 18025 }, { "epoch": 0.15, "learning_rate": 9.432458197257786e-05, "loss": 2.3785, "step": 18030 }, { "epoch": 0.15, "learning_rate": 9.432147754106204e-05, "loss": 2.2999, "step": 18035 }, { "epoch": 0.15, "learning_rate": 9.431837231183804e-05, "loss": 2.3578, "step": 18040 }, { "epoch": 0.15, "learning_rate": 9.431526628496174e-05, "loss": 2.4178, "step": 18045 }, { "epoch": 0.15, "learning_rate": 9.431215946048908e-05, "loss": 2.3583, "step": 18050 }, { "epoch": 0.15, "learning_rate": 9.430905183847593e-05, "loss": 2.3032, "step": 18055 }, { "epoch": 0.15, "learning_rate": 9.430594341897825e-05, "loss": 2.3553, "step": 18060 }, { "epoch": 0.15, "learning_rate": 9.430283420205197e-05, "loss": 2.393, "step": 18065 }, { "epoch": 0.15, "learning_rate": 9.429972418775306e-05, "loss": 2.3141, "step": 18070 }, { "epoch": 0.15, "learning_rate": 9.42966133761375e-05, "loss": 2.3759, "step": 18075 }, { "epoch": 0.15, "learning_rate": 9.429350176726127e-05, "loss": 2.3496, "step": 18080 }, { "epoch": 0.15, "learning_rate": 9.429038936118038e-05, "loss": 2.3309, "step": 18085 }, { "epoch": 0.15, "learning_rate": 9.428727615795084e-05, "loss": 2.373, "step": 18090 }, { "epoch": 0.15, "learning_rate": 9.428416215762868e-05, "loss": 2.3964, "step": 18095 }, { "epoch": 0.15, "learning_rate": 9.428104736026998e-05, "loss": 2.4359, "step": 18100 }, { "epoch": 0.15, "learning_rate": 9.427793176593073e-05, "loss": 2.3906, "step": 18105 }, { "epoch": 0.15, "learning_rate": 9.427481537466708e-05, "loss": 2.317, "step": 18110 }, { "epoch": 0.15, "learning_rate": 9.427169818653508e-05, "loss": 2.3394, "step": 18115 }, { "epoch": 0.15, "learning_rate": 9.426858020159085e-05, "loss": 2.2853, "step": 18120 }, { "epoch": 0.15, "learning_rate": 9.42654614198905e-05, "loss": 2.3808, "step": 18125 }, { "epoch": 0.15, "learning_rate": 9.426234184149015e-05, "loss": 2.407, "step": 18130 }, { "epoch": 0.15, "learning_rate": 9.425922146644596e-05, "loss": 2.3464, "step": 18135 }, { "epoch": 0.15, "learning_rate": 9.425610029481411e-05, "loss": 2.3793, "step": 18140 }, { "epoch": 0.15, "learning_rate": 9.425297832665075e-05, "loss": 2.3371, "step": 18145 }, { "epoch": 0.15, "learning_rate": 9.424985556201206e-05, "loss": 2.3872, "step": 18150 }, { "epoch": 0.15, "learning_rate": 9.424673200095427e-05, "loss": 2.4191, "step": 18155 }, { "epoch": 0.15, "learning_rate": 9.424360764353359e-05, "loss": 2.3378, "step": 18160 }, { "epoch": 0.16, "learning_rate": 9.424048248980625e-05, "loss": 2.4075, "step": 18165 }, { "epoch": 0.16, "learning_rate": 9.423735653982852e-05, "loss": 2.4001, "step": 18170 }, { "epoch": 0.16, "learning_rate": 9.423422979365662e-05, "loss": 2.4203, "step": 18175 }, { "epoch": 0.16, "learning_rate": 9.423110225134685e-05, "loss": 2.3588, "step": 18180 }, { "epoch": 0.16, "learning_rate": 9.422797391295551e-05, "loss": 2.3372, "step": 18185 }, { "epoch": 0.16, "learning_rate": 9.422484477853887e-05, "loss": 2.3302, "step": 18190 }, { "epoch": 0.16, "learning_rate": 9.422171484815328e-05, "loss": 2.3251, "step": 18195 }, { "epoch": 0.16, "learning_rate": 9.421858412185506e-05, "loss": 2.2952, "step": 18200 }, { "epoch": 0.16, "learning_rate": 9.421545259970057e-05, "loss": 2.2922, "step": 18205 }, { "epoch": 0.16, "learning_rate": 9.421232028174616e-05, "loss": 2.4019, "step": 18210 }, { "epoch": 0.16, "learning_rate": 9.420918716804821e-05, "loss": 2.3408, "step": 18215 }, { "epoch": 0.16, "learning_rate": 9.420605325866312e-05, "loss": 2.3353, "step": 18220 }, { "epoch": 0.16, "learning_rate": 9.420291855364726e-05, "loss": 2.3077, "step": 18225 }, { "epoch": 0.16, "learning_rate": 9.41997830530571e-05, "loss": 2.339, "step": 18230 }, { "epoch": 0.16, "learning_rate": 9.419664675694904e-05, "loss": 2.3584, "step": 18235 }, { "epoch": 0.16, "learning_rate": 9.419350966537952e-05, "loss": 2.358, "step": 18240 }, { "epoch": 0.16, "learning_rate": 9.419037177840502e-05, "loss": 2.3605, "step": 18245 }, { "epoch": 0.16, "learning_rate": 9.418723309608204e-05, "loss": 2.4084, "step": 18250 }, { "epoch": 0.16, "learning_rate": 9.418409361846701e-05, "loss": 2.2729, "step": 18255 }, { "epoch": 0.16, "learning_rate": 9.418095334561649e-05, "loss": 2.4056, "step": 18260 }, { "epoch": 0.16, "learning_rate": 9.417781227758698e-05, "loss": 2.3712, "step": 18265 }, { "epoch": 0.16, "learning_rate": 9.417467041443501e-05, "loss": 2.3816, "step": 18270 }, { "epoch": 0.16, "learning_rate": 9.417152775621712e-05, "loss": 2.4432, "step": 18275 }, { "epoch": 0.16, "learning_rate": 9.416838430298989e-05, "loss": 2.3264, "step": 18280 }, { "epoch": 0.16, "learning_rate": 9.416524005480988e-05, "loss": 2.3266, "step": 18285 }, { "epoch": 0.16, "learning_rate": 9.416209501173372e-05, "loss": 2.3665, "step": 18290 }, { "epoch": 0.16, "learning_rate": 9.415894917381796e-05, "loss": 2.3422, "step": 18295 }, { "epoch": 0.16, "learning_rate": 9.415580254111925e-05, "loss": 2.3472, "step": 18300 }, { "epoch": 0.16, "learning_rate": 9.415265511369422e-05, "loss": 2.3475, "step": 18305 }, { "epoch": 0.16, "learning_rate": 9.414950689159952e-05, "loss": 2.3124, "step": 18310 }, { "epoch": 0.16, "learning_rate": 9.41463578748918e-05, "loss": 2.3593, "step": 18315 }, { "epoch": 0.16, "learning_rate": 9.414320806362775e-05, "loss": 2.4198, "step": 18320 }, { "epoch": 0.16, "learning_rate": 9.414005745786406e-05, "loss": 2.3957, "step": 18325 }, { "epoch": 0.16, "learning_rate": 9.413690605765743e-05, "loss": 2.3581, "step": 18330 }, { "epoch": 0.16, "learning_rate": 9.413375386306459e-05, "loss": 2.3826, "step": 18335 }, { "epoch": 0.16, "learning_rate": 9.413060087414225e-05, "loss": 2.3311, "step": 18340 }, { "epoch": 0.16, "learning_rate": 9.412744709094718e-05, "loss": 2.3343, "step": 18345 }, { "epoch": 0.16, "learning_rate": 9.412429251353615e-05, "loss": 2.3189, "step": 18350 }, { "epoch": 0.16, "learning_rate": 9.41211371419659e-05, "loss": 2.3902, "step": 18355 }, { "epoch": 0.16, "learning_rate": 9.411798097629327e-05, "loss": 2.4389, "step": 18360 }, { "epoch": 0.16, "learning_rate": 9.411482401657503e-05, "loss": 2.3333, "step": 18365 }, { "epoch": 0.16, "learning_rate": 9.4111666262868e-05, "loss": 2.3843, "step": 18370 }, { "epoch": 0.16, "learning_rate": 9.410850771522904e-05, "loss": 2.1674, "step": 18375 }, { "epoch": 0.16, "learning_rate": 9.410534837371499e-05, "loss": 2.3392, "step": 18380 }, { "epoch": 0.16, "learning_rate": 9.410218823838269e-05, "loss": 2.3411, "step": 18385 }, { "epoch": 0.16, "learning_rate": 9.409902730928901e-05, "loss": 2.38, "step": 18390 }, { "epoch": 0.16, "learning_rate": 9.409586558649088e-05, "loss": 2.2825, "step": 18395 }, { "epoch": 0.16, "learning_rate": 9.409270307004521e-05, "loss": 2.289, "step": 18400 }, { "epoch": 0.16, "learning_rate": 9.408953976000886e-05, "loss": 2.3259, "step": 18405 }, { "epoch": 0.16, "learning_rate": 9.408637565643882e-05, "loss": 2.398, "step": 18410 }, { "epoch": 0.16, "learning_rate": 9.408321075939202e-05, "loss": 2.4515, "step": 18415 }, { "epoch": 0.16, "learning_rate": 9.408004506892543e-05, "loss": 2.428, "step": 18420 }, { "epoch": 0.16, "learning_rate": 9.407687858509602e-05, "loss": 2.2944, "step": 18425 }, { "epoch": 0.16, "learning_rate": 9.407371130796077e-05, "loss": 2.3371, "step": 18430 }, { "epoch": 0.16, "learning_rate": 9.407054323757669e-05, "loss": 2.3988, "step": 18435 }, { "epoch": 0.16, "learning_rate": 9.406737437400081e-05, "loss": 2.3483, "step": 18440 }, { "epoch": 0.16, "learning_rate": 9.406420471729016e-05, "loss": 2.3916, "step": 18445 }, { "epoch": 0.16, "learning_rate": 9.406103426750179e-05, "loss": 2.38, "step": 18450 }, { "epoch": 0.16, "learning_rate": 9.405786302469278e-05, "loss": 2.3447, "step": 18455 }, { "epoch": 0.16, "learning_rate": 9.405469098892015e-05, "loss": 2.2569, "step": 18460 }, { "epoch": 0.16, "learning_rate": 9.405151816024104e-05, "loss": 2.3965, "step": 18465 }, { "epoch": 0.16, "learning_rate": 9.404834453871256e-05, "loss": 2.3619, "step": 18470 }, { "epoch": 0.16, "learning_rate": 9.40451701243918e-05, "loss": 2.3201, "step": 18475 }, { "epoch": 0.16, "learning_rate": 9.404199491733591e-05, "loss": 2.3686, "step": 18480 }, { "epoch": 0.16, "learning_rate": 9.403881891760202e-05, "loss": 2.3382, "step": 18485 }, { "epoch": 0.16, "learning_rate": 9.403564212524732e-05, "loss": 2.3889, "step": 18490 }, { "epoch": 0.16, "learning_rate": 9.403246454032898e-05, "loss": 2.3141, "step": 18495 }, { "epoch": 0.16, "learning_rate": 9.402928616290418e-05, "loss": 2.2875, "step": 18500 }, { "epoch": 0.16, "learning_rate": 9.402610699303013e-05, "loss": 2.3755, "step": 18505 }, { "epoch": 0.16, "learning_rate": 9.402292703076404e-05, "loss": 2.3333, "step": 18510 }, { "epoch": 0.16, "learning_rate": 9.401974627616316e-05, "loss": 2.4582, "step": 18515 }, { "epoch": 0.16, "learning_rate": 9.401656472928473e-05, "loss": 2.3239, "step": 18520 }, { "epoch": 0.16, "learning_rate": 9.401338239018601e-05, "loss": 2.3964, "step": 18525 }, { "epoch": 0.16, "learning_rate": 9.401019925892429e-05, "loss": 2.3545, "step": 18530 }, { "epoch": 0.16, "learning_rate": 9.400701533555685e-05, "loss": 2.3809, "step": 18535 }, { "epoch": 0.16, "learning_rate": 9.400383062014097e-05, "loss": 2.3596, "step": 18540 }, { "epoch": 0.16, "learning_rate": 9.400064511273402e-05, "loss": 2.3475, "step": 18545 }, { "epoch": 0.16, "learning_rate": 9.39974588133933e-05, "loss": 2.3899, "step": 18550 }, { "epoch": 0.16, "learning_rate": 9.399427172217617e-05, "loss": 2.3669, "step": 18555 }, { "epoch": 0.16, "learning_rate": 9.399108383913998e-05, "loss": 2.3253, "step": 18560 }, { "epoch": 0.16, "learning_rate": 9.398789516434213e-05, "loss": 2.2871, "step": 18565 }, { "epoch": 0.16, "learning_rate": 9.398470569783997e-05, "loss": 2.3149, "step": 18570 }, { "epoch": 0.16, "learning_rate": 9.398151543969095e-05, "loss": 2.2773, "step": 18575 }, { "epoch": 0.16, "learning_rate": 9.397832438995245e-05, "loss": 2.3994, "step": 18580 }, { "epoch": 0.16, "learning_rate": 9.397513254868193e-05, "loss": 2.369, "step": 18585 }, { "epoch": 0.16, "learning_rate": 9.397193991593684e-05, "loss": 2.3402, "step": 18590 }, { "epoch": 0.16, "learning_rate": 9.396874649177462e-05, "loss": 2.3482, "step": 18595 }, { "epoch": 0.16, "learning_rate": 9.396555227625276e-05, "loss": 2.3522, "step": 18600 }, { "epoch": 0.16, "learning_rate": 9.396235726942874e-05, "loss": 2.3122, "step": 18605 }, { "epoch": 0.16, "learning_rate": 9.395916147136009e-05, "loss": 2.3975, "step": 18610 }, { "epoch": 0.16, "learning_rate": 9.39559648821043e-05, "loss": 2.3846, "step": 18615 }, { "epoch": 0.16, "learning_rate": 9.39527675017189e-05, "loss": 2.2663, "step": 18620 }, { "epoch": 0.16, "learning_rate": 9.394956933026146e-05, "loss": 2.3696, "step": 18625 }, { "epoch": 0.16, "learning_rate": 9.394637036778952e-05, "loss": 2.3875, "step": 18630 }, { "epoch": 0.16, "learning_rate": 9.394317061436068e-05, "loss": 2.4225, "step": 18635 }, { "epoch": 0.16, "learning_rate": 9.393997007003252e-05, "loss": 2.4342, "step": 18640 }, { "epoch": 0.16, "learning_rate": 9.393676873486265e-05, "loss": 2.3304, "step": 18645 }, { "epoch": 0.16, "learning_rate": 9.393356660890866e-05, "loss": 2.3464, "step": 18650 }, { "epoch": 0.16, "learning_rate": 9.39303636922282e-05, "loss": 2.3177, "step": 18655 }, { "epoch": 0.16, "learning_rate": 9.392715998487894e-05, "loss": 2.3683, "step": 18660 }, { "epoch": 0.16, "learning_rate": 9.392395548691851e-05, "loss": 2.4023, "step": 18665 }, { "epoch": 0.16, "learning_rate": 9.39207501984046e-05, "loss": 2.2998, "step": 18670 }, { "epoch": 0.16, "learning_rate": 9.391754411939489e-05, "loss": 2.4086, "step": 18675 }, { "epoch": 0.16, "learning_rate": 9.39143372499471e-05, "loss": 2.3699, "step": 18680 }, { "epoch": 0.16, "learning_rate": 9.391112959011891e-05, "loss": 2.3945, "step": 18685 }, { "epoch": 0.16, "learning_rate": 9.39079211399681e-05, "loss": 2.3947, "step": 18690 }, { "epoch": 0.16, "learning_rate": 9.390471189955238e-05, "loss": 2.2963, "step": 18695 }, { "epoch": 0.16, "learning_rate": 9.390150186892955e-05, "loss": 2.3641, "step": 18700 }, { "epoch": 0.16, "learning_rate": 9.389829104815735e-05, "loss": 2.3638, "step": 18705 }, { "epoch": 0.16, "learning_rate": 9.389507943729357e-05, "loss": 2.3749, "step": 18710 }, { "epoch": 0.16, "learning_rate": 9.389186703639603e-05, "loss": 2.3291, "step": 18715 }, { "epoch": 0.16, "learning_rate": 9.388865384552254e-05, "loss": 2.3946, "step": 18720 }, { "epoch": 0.16, "learning_rate": 9.388543986473096e-05, "loss": 2.3868, "step": 18725 }, { "epoch": 0.16, "learning_rate": 9.388222509407907e-05, "loss": 2.3543, "step": 18730 }, { "epoch": 0.16, "learning_rate": 9.387900953362479e-05, "loss": 2.3601, "step": 18735 }, { "epoch": 0.16, "learning_rate": 9.387579318342597e-05, "loss": 2.3491, "step": 18740 }, { "epoch": 0.16, "learning_rate": 9.387257604354049e-05, "loss": 2.3426, "step": 18745 }, { "epoch": 0.16, "learning_rate": 9.386935811402626e-05, "loss": 2.3349, "step": 18750 }, { "epoch": 0.16, "learning_rate": 9.386613939494123e-05, "loss": 2.2854, "step": 18755 }, { "epoch": 0.16, "learning_rate": 9.386291988634328e-05, "loss": 2.352, "step": 18760 }, { "epoch": 0.16, "learning_rate": 9.385969958829037e-05, "loss": 2.3601, "step": 18765 }, { "epoch": 0.16, "learning_rate": 9.385647850084049e-05, "loss": 2.3731, "step": 18770 }, { "epoch": 0.16, "learning_rate": 9.385325662405158e-05, "loss": 2.3579, "step": 18775 }, { "epoch": 0.16, "learning_rate": 9.385003395798165e-05, "loss": 2.4047, "step": 18780 }, { "epoch": 0.16, "learning_rate": 9.384681050268868e-05, "loss": 2.3713, "step": 18785 }, { "epoch": 0.16, "learning_rate": 9.384358625823073e-05, "loss": 2.3212, "step": 18790 }, { "epoch": 0.16, "learning_rate": 9.384036122466578e-05, "loss": 2.2859, "step": 18795 }, { "epoch": 0.16, "learning_rate": 9.383713540205188e-05, "loss": 2.4009, "step": 18800 }, { "epoch": 0.16, "learning_rate": 9.38339087904471e-05, "loss": 2.3744, "step": 18805 }, { "epoch": 0.16, "learning_rate": 9.383068138990953e-05, "loss": 2.3653, "step": 18810 }, { "epoch": 0.16, "learning_rate": 9.382745320049727e-05, "loss": 2.3733, "step": 18815 }, { "epoch": 0.16, "learning_rate": 9.382422422226836e-05, "loss": 2.3473, "step": 18820 }, { "epoch": 0.16, "learning_rate": 9.382099445528096e-05, "loss": 2.3772, "step": 18825 }, { "epoch": 0.16, "learning_rate": 9.381776389959319e-05, "loss": 2.3186, "step": 18830 }, { "epoch": 0.16, "learning_rate": 9.38145325552632e-05, "loss": 2.346, "step": 18835 }, { "epoch": 0.16, "learning_rate": 9.381130042234916e-05, "loss": 2.4563, "step": 18840 }, { "epoch": 0.16, "learning_rate": 9.380806750090921e-05, "loss": 2.3483, "step": 18845 }, { "epoch": 0.16, "learning_rate": 9.380483379100156e-05, "loss": 2.4088, "step": 18850 }, { "epoch": 0.16, "learning_rate": 9.38015992926844e-05, "loss": 2.377, "step": 18855 }, { "epoch": 0.16, "learning_rate": 9.379836400601595e-05, "loss": 2.3083, "step": 18860 }, { "epoch": 0.16, "learning_rate": 9.379512793105444e-05, "loss": 2.2634, "step": 18865 }, { "epoch": 0.16, "learning_rate": 9.379189106785811e-05, "loss": 2.4081, "step": 18870 }, { "epoch": 0.16, "learning_rate": 9.378865341648524e-05, "loss": 2.4102, "step": 18875 }, { "epoch": 0.16, "learning_rate": 9.378541497699406e-05, "loss": 2.422, "step": 18880 }, { "epoch": 0.16, "learning_rate": 9.37821757494429e-05, "loss": 2.2562, "step": 18885 }, { "epoch": 0.16, "learning_rate": 9.377893573389003e-05, "loss": 2.4032, "step": 18890 }, { "epoch": 0.16, "learning_rate": 9.377569493039378e-05, "loss": 2.3603, "step": 18895 }, { "epoch": 0.16, "learning_rate": 9.377245333901247e-05, "loss": 2.3657, "step": 18900 }, { "epoch": 0.16, "learning_rate": 9.376921095980444e-05, "loss": 2.3985, "step": 18905 }, { "epoch": 0.16, "learning_rate": 9.376596779282806e-05, "loss": 2.3295, "step": 18910 }, { "epoch": 0.16, "learning_rate": 9.37627238381417e-05, "loss": 2.3663, "step": 18915 }, { "epoch": 0.16, "learning_rate": 9.375947909580374e-05, "loss": 2.4117, "step": 18920 }, { "epoch": 0.16, "learning_rate": 9.375623356587256e-05, "loss": 2.4234, "step": 18925 }, { "epoch": 0.16, "learning_rate": 9.375298724840661e-05, "loss": 2.323, "step": 18930 }, { "epoch": 0.16, "learning_rate": 9.37497401434643e-05, "loss": 2.4144, "step": 18935 }, { "epoch": 0.16, "learning_rate": 9.374649225110406e-05, "loss": 2.363, "step": 18940 }, { "epoch": 0.16, "learning_rate": 9.374324357138438e-05, "loss": 2.4211, "step": 18945 }, { "epoch": 0.16, "learning_rate": 9.37399941043637e-05, "loss": 2.3425, "step": 18950 }, { "epoch": 0.16, "learning_rate": 9.373674385010052e-05, "loss": 2.3747, "step": 18955 }, { "epoch": 0.16, "learning_rate": 9.373349280865333e-05, "loss": 2.4256, "step": 18960 }, { "epoch": 0.16, "learning_rate": 9.373024098008066e-05, "loss": 2.3946, "step": 18965 }, { "epoch": 0.16, "learning_rate": 9.372698836444101e-05, "loss": 2.26, "step": 18970 }, { "epoch": 0.16, "learning_rate": 9.372373496179292e-05, "loss": 2.4099, "step": 18975 }, { "epoch": 0.16, "learning_rate": 9.372048077219497e-05, "loss": 2.3738, "step": 18980 }, { "epoch": 0.16, "learning_rate": 9.371722579570574e-05, "loss": 2.3743, "step": 18985 }, { "epoch": 0.16, "learning_rate": 9.371397003238378e-05, "loss": 2.3219, "step": 18990 }, { "epoch": 0.16, "learning_rate": 9.37107134822877e-05, "loss": 2.3741, "step": 18995 }, { "epoch": 0.16, "learning_rate": 9.370745614547613e-05, "loss": 2.3228, "step": 19000 }, { "epoch": 0.16, "learning_rate": 9.370419802200767e-05, "loss": 2.2782, "step": 19005 }, { "epoch": 0.16, "learning_rate": 9.370093911194096e-05, "loss": 2.305, "step": 19010 }, { "epoch": 0.16, "learning_rate": 9.369767941533468e-05, "loss": 2.3994, "step": 19015 }, { "epoch": 0.16, "learning_rate": 9.369441893224748e-05, "loss": 2.3587, "step": 19020 }, { "epoch": 0.16, "learning_rate": 9.369115766273804e-05, "loss": 2.3989, "step": 19025 }, { "epoch": 0.16, "learning_rate": 9.368789560686508e-05, "loss": 2.396, "step": 19030 }, { "epoch": 0.16, "learning_rate": 9.368463276468728e-05, "loss": 2.3983, "step": 19035 }, { "epoch": 0.16, "learning_rate": 9.36813691362634e-05, "loss": 2.2886, "step": 19040 }, { "epoch": 0.16, "learning_rate": 9.367810472165215e-05, "loss": 2.3791, "step": 19045 }, { "epoch": 0.16, "learning_rate": 9.36748395209123e-05, "loss": 2.2886, "step": 19050 }, { "epoch": 0.16, "learning_rate": 9.367157353410261e-05, "loss": 2.3605, "step": 19055 }, { "epoch": 0.16, "learning_rate": 9.366830676128185e-05, "loss": 2.4218, "step": 19060 }, { "epoch": 0.16, "learning_rate": 9.366503920250884e-05, "loss": 2.336, "step": 19065 }, { "epoch": 0.16, "learning_rate": 9.366177085784238e-05, "loss": 2.4541, "step": 19070 }, { "epoch": 0.16, "learning_rate": 9.36585017273413e-05, "loss": 2.3948, "step": 19075 }, { "epoch": 0.16, "learning_rate": 9.365523181106444e-05, "loss": 2.363, "step": 19080 }, { "epoch": 0.16, "learning_rate": 9.365196110907064e-05, "loss": 2.4633, "step": 19085 }, { "epoch": 0.16, "learning_rate": 9.364868962141876e-05, "loss": 2.3309, "step": 19090 }, { "epoch": 0.16, "learning_rate": 9.36454173481677e-05, "loss": 2.2746, "step": 19095 }, { "epoch": 0.16, "learning_rate": 9.364214428937637e-05, "loss": 2.4062, "step": 19100 }, { "epoch": 0.16, "learning_rate": 9.363887044510364e-05, "loss": 2.4421, "step": 19105 }, { "epoch": 0.16, "learning_rate": 9.363559581540844e-05, "loss": 2.3244, "step": 19110 }, { "epoch": 0.16, "learning_rate": 9.363232040034975e-05, "loss": 2.3182, "step": 19115 }, { "epoch": 0.16, "learning_rate": 9.362904419998647e-05, "loss": 2.3584, "step": 19120 }, { "epoch": 0.16, "learning_rate": 9.362576721437758e-05, "loss": 2.4011, "step": 19125 }, { "epoch": 0.16, "learning_rate": 9.362248944358209e-05, "loss": 2.3715, "step": 19130 }, { "epoch": 0.16, "learning_rate": 9.361921088765895e-05, "loss": 2.4251, "step": 19135 }, { "epoch": 0.16, "learning_rate": 9.361593154666721e-05, "loss": 2.3736, "step": 19140 }, { "epoch": 0.16, "learning_rate": 9.361265142066585e-05, "loss": 2.4121, "step": 19145 }, { "epoch": 0.16, "learning_rate": 9.360937050971395e-05, "loss": 2.3693, "step": 19150 }, { "epoch": 0.16, "learning_rate": 9.360608881387052e-05, "loss": 2.398, "step": 19155 }, { "epoch": 0.16, "learning_rate": 9.360280633319465e-05, "loss": 2.3797, "step": 19160 }, { "epoch": 0.16, "learning_rate": 9.359952306774542e-05, "loss": 2.3934, "step": 19165 }, { "epoch": 0.16, "learning_rate": 9.35962390175819e-05, "loss": 2.3878, "step": 19170 }, { "epoch": 0.16, "learning_rate": 9.359295418276322e-05, "loss": 2.2943, "step": 19175 }, { "epoch": 0.16, "learning_rate": 9.35896685633485e-05, "loss": 2.3676, "step": 19180 }, { "epoch": 0.16, "learning_rate": 9.358638215939686e-05, "loss": 2.3643, "step": 19185 }, { "epoch": 0.16, "learning_rate": 9.358309497096744e-05, "loss": 2.3259, "step": 19190 }, { "epoch": 0.16, "learning_rate": 9.357980699811946e-05, "loss": 2.3371, "step": 19195 }, { "epoch": 0.16, "learning_rate": 9.357651824091203e-05, "loss": 2.3367, "step": 19200 }, { "epoch": 0.16, "learning_rate": 9.357322869940439e-05, "loss": 2.2836, "step": 19205 }, { "epoch": 0.16, "learning_rate": 9.356993837365571e-05, "loss": 2.422, "step": 19210 }, { "epoch": 0.16, "learning_rate": 9.356664726372523e-05, "loss": 2.3546, "step": 19215 }, { "epoch": 0.16, "learning_rate": 9.35633553696722e-05, "loss": 2.3302, "step": 19220 }, { "epoch": 0.16, "learning_rate": 9.356006269155584e-05, "loss": 2.3998, "step": 19225 }, { "epoch": 0.16, "learning_rate": 9.355676922943541e-05, "loss": 2.3907, "step": 19230 }, { "epoch": 0.16, "learning_rate": 9.355347498337023e-05, "loss": 2.4286, "step": 19235 }, { "epoch": 0.16, "learning_rate": 9.355017995341953e-05, "loss": 2.3593, "step": 19240 }, { "epoch": 0.16, "learning_rate": 9.354688413964266e-05, "loss": 2.2967, "step": 19245 }, { "epoch": 0.16, "learning_rate": 9.354358754209891e-05, "loss": 2.427, "step": 19250 }, { "epoch": 0.16, "learning_rate": 9.354029016084762e-05, "loss": 2.3635, "step": 19255 }, { "epoch": 0.16, "learning_rate": 9.353699199594816e-05, "loss": 2.331, "step": 19260 }, { "epoch": 0.16, "learning_rate": 9.353369304745988e-05, "loss": 2.3288, "step": 19265 }, { "epoch": 0.16, "learning_rate": 9.353039331544213e-05, "loss": 2.2634, "step": 19270 }, { "epoch": 0.16, "learning_rate": 9.352709279995431e-05, "loss": 2.465, "step": 19275 }, { "epoch": 0.16, "learning_rate": 9.352379150105585e-05, "loss": 2.3191, "step": 19280 }, { "epoch": 0.16, "learning_rate": 9.352048941880614e-05, "loss": 2.3852, "step": 19285 }, { "epoch": 0.16, "learning_rate": 9.351718655326462e-05, "loss": 2.4288, "step": 19290 }, { "epoch": 0.16, "learning_rate": 9.351388290449074e-05, "loss": 2.344, "step": 19295 }, { "epoch": 0.16, "learning_rate": 9.351057847254397e-05, "loss": 2.4031, "step": 19300 }, { "epoch": 0.16, "learning_rate": 9.350727325748376e-05, "loss": 2.3515, "step": 19305 }, { "epoch": 0.16, "learning_rate": 9.350396725936961e-05, "loss": 2.3661, "step": 19310 }, { "epoch": 0.16, "learning_rate": 9.350066047826103e-05, "loss": 2.3401, "step": 19315 }, { "epoch": 0.16, "learning_rate": 9.34973529142175e-05, "loss": 2.3395, "step": 19320 }, { "epoch": 0.16, "learning_rate": 9.34940445672986e-05, "loss": 2.3952, "step": 19325 }, { "epoch": 0.16, "learning_rate": 9.349073543756384e-05, "loss": 2.3322, "step": 19330 }, { "epoch": 0.16, "learning_rate": 9.348742552507279e-05, "loss": 2.4109, "step": 19335 }, { "epoch": 0.17, "learning_rate": 9.348411482988504e-05, "loss": 2.3703, "step": 19340 }, { "epoch": 0.17, "learning_rate": 9.348080335206013e-05, "loss": 2.4091, "step": 19345 }, { "epoch": 0.17, "learning_rate": 9.347749109165771e-05, "loss": 2.3622, "step": 19350 }, { "epoch": 0.17, "learning_rate": 9.347417804873737e-05, "loss": 2.4817, "step": 19355 }, { "epoch": 0.17, "learning_rate": 9.347086422335875e-05, "loss": 2.3669, "step": 19360 }, { "epoch": 0.17, "learning_rate": 9.346754961558149e-05, "loss": 2.3752, "step": 19365 }, { "epoch": 0.17, "learning_rate": 9.346423422546522e-05, "loss": 2.3669, "step": 19370 }, { "epoch": 0.17, "learning_rate": 9.346091805306964e-05, "loss": 2.4368, "step": 19375 }, { "epoch": 0.17, "learning_rate": 9.345760109845446e-05, "loss": 2.4697, "step": 19380 }, { "epoch": 0.17, "learning_rate": 9.345428336167931e-05, "loss": 2.3433, "step": 19385 }, { "epoch": 0.17, "learning_rate": 9.345096484280398e-05, "loss": 2.3255, "step": 19390 }, { "epoch": 0.17, "learning_rate": 9.344764554188813e-05, "loss": 2.4262, "step": 19395 }, { "epoch": 0.17, "learning_rate": 9.344432545899155e-05, "loss": 2.4219, "step": 19400 }, { "epoch": 0.17, "learning_rate": 9.344100459417397e-05, "loss": 2.3167, "step": 19405 }, { "epoch": 0.17, "learning_rate": 9.343768294749518e-05, "loss": 2.3877, "step": 19410 }, { "epoch": 0.17, "learning_rate": 9.343436051901492e-05, "loss": 2.3392, "step": 19415 }, { "epoch": 0.17, "learning_rate": 9.343103730879305e-05, "loss": 2.268, "step": 19420 }, { "epoch": 0.17, "learning_rate": 9.342771331688933e-05, "loss": 2.3053, "step": 19425 }, { "epoch": 0.17, "learning_rate": 9.342438854336361e-05, "loss": 2.452, "step": 19430 }, { "epoch": 0.17, "learning_rate": 9.342106298827575e-05, "loss": 2.3954, "step": 19435 }, { "epoch": 0.17, "learning_rate": 9.341773665168556e-05, "loss": 2.3211, "step": 19440 }, { "epoch": 0.17, "learning_rate": 9.341440953365293e-05, "loss": 2.4079, "step": 19445 }, { "epoch": 0.17, "learning_rate": 9.341108163423776e-05, "loss": 2.3666, "step": 19450 }, { "epoch": 0.17, "learning_rate": 9.34077529534999e-05, "loss": 2.3854, "step": 19455 }, { "epoch": 0.17, "learning_rate": 9.340442349149929e-05, "loss": 2.3224, "step": 19460 }, { "epoch": 0.17, "learning_rate": 9.340109324829587e-05, "loss": 2.322, "step": 19465 }, { "epoch": 0.17, "learning_rate": 9.339776222394955e-05, "loss": 2.2796, "step": 19470 }, { "epoch": 0.17, "learning_rate": 9.339443041852029e-05, "loss": 2.443, "step": 19475 }, { "epoch": 0.17, "learning_rate": 9.339109783206808e-05, "loss": 2.4022, "step": 19480 }, { "epoch": 0.17, "learning_rate": 9.338776446465285e-05, "loss": 2.3415, "step": 19485 }, { "epoch": 0.17, "learning_rate": 9.338443031633465e-05, "loss": 2.3891, "step": 19490 }, { "epoch": 0.17, "learning_rate": 9.338109538717345e-05, "loss": 2.4164, "step": 19495 }, { "epoch": 0.17, "learning_rate": 9.337775967722931e-05, "loss": 2.3305, "step": 19500 }, { "epoch": 0.17, "learning_rate": 9.337442318656221e-05, "loss": 2.3905, "step": 19505 }, { "epoch": 0.17, "learning_rate": 9.337108591523224e-05, "loss": 2.3551, "step": 19510 }, { "epoch": 0.17, "learning_rate": 9.336774786329949e-05, "loss": 2.3254, "step": 19515 }, { "epoch": 0.17, "learning_rate": 9.336440903082398e-05, "loss": 2.3041, "step": 19520 }, { "epoch": 0.17, "learning_rate": 9.336106941786584e-05, "loss": 2.3341, "step": 19525 }, { "epoch": 0.17, "learning_rate": 9.335772902448517e-05, "loss": 2.395, "step": 19530 }, { "epoch": 0.17, "learning_rate": 9.335438785074208e-05, "loss": 2.3904, "step": 19535 }, { "epoch": 0.17, "learning_rate": 9.335104589669674e-05, "loss": 2.279, "step": 19540 }, { "epoch": 0.17, "learning_rate": 9.334770316240927e-05, "loss": 2.2607, "step": 19545 }, { "epoch": 0.17, "learning_rate": 9.334435964793981e-05, "loss": 2.3706, "step": 19550 }, { "epoch": 0.17, "learning_rate": 9.334101535334858e-05, "loss": 2.3909, "step": 19555 }, { "epoch": 0.17, "learning_rate": 9.333767027869576e-05, "loss": 2.3713, "step": 19560 }, { "epoch": 0.17, "learning_rate": 9.333432442404156e-05, "loss": 2.3851, "step": 19565 }, { "epoch": 0.17, "learning_rate": 9.333097778944617e-05, "loss": 2.4448, "step": 19570 }, { "epoch": 0.17, "learning_rate": 9.332763037496987e-05, "loss": 2.3452, "step": 19575 }, { "epoch": 0.17, "learning_rate": 9.332428218067287e-05, "loss": 2.2924, "step": 19580 }, { "epoch": 0.17, "learning_rate": 9.332093320661545e-05, "loss": 2.4283, "step": 19585 }, { "epoch": 0.17, "learning_rate": 9.331758345285787e-05, "loss": 2.3081, "step": 19590 }, { "epoch": 0.17, "learning_rate": 9.331423291946043e-05, "loss": 2.4177, "step": 19595 }, { "epoch": 0.17, "learning_rate": 9.331088160648344e-05, "loss": 2.3781, "step": 19600 }, { "epoch": 0.17, "learning_rate": 9.33075295139872e-05, "loss": 2.3759, "step": 19605 }, { "epoch": 0.17, "learning_rate": 9.330417664203206e-05, "loss": 2.3731, "step": 19610 }, { "epoch": 0.17, "learning_rate": 9.330082299067838e-05, "loss": 2.3076, "step": 19615 }, { "epoch": 0.17, "learning_rate": 9.329746855998646e-05, "loss": 2.4549, "step": 19620 }, { "epoch": 0.17, "learning_rate": 9.329411335001671e-05, "loss": 2.3296, "step": 19625 }, { "epoch": 0.17, "learning_rate": 9.329075736082955e-05, "loss": 2.3912, "step": 19630 }, { "epoch": 0.17, "learning_rate": 9.328740059248535e-05, "loss": 2.3141, "step": 19635 }, { "epoch": 0.17, "learning_rate": 9.328404304504451e-05, "loss": 2.3614, "step": 19640 }, { "epoch": 0.17, "learning_rate": 9.328068471856748e-05, "loss": 2.3535, "step": 19645 }, { "epoch": 0.17, "learning_rate": 9.327732561311471e-05, "loss": 2.3395, "step": 19650 }, { "epoch": 0.17, "learning_rate": 9.327396572874665e-05, "loss": 2.4723, "step": 19655 }, { "epoch": 0.17, "learning_rate": 9.327060506552376e-05, "loss": 2.3208, "step": 19660 }, { "epoch": 0.17, "learning_rate": 9.326724362350654e-05, "loss": 2.3647, "step": 19665 }, { "epoch": 0.17, "learning_rate": 9.326388140275549e-05, "loss": 2.398, "step": 19670 }, { "epoch": 0.17, "learning_rate": 9.326051840333112e-05, "loss": 2.3394, "step": 19675 }, { "epoch": 0.17, "learning_rate": 9.325715462529397e-05, "loss": 2.3384, "step": 19680 }, { "epoch": 0.17, "learning_rate": 9.325379006870456e-05, "loss": 2.367, "step": 19685 }, { "epoch": 0.17, "learning_rate": 9.325042473362345e-05, "loss": 2.3196, "step": 19690 }, { "epoch": 0.17, "learning_rate": 9.324705862011123e-05, "loss": 2.3624, "step": 19695 }, { "epoch": 0.17, "learning_rate": 9.324369172822846e-05, "loss": 2.3655, "step": 19700 }, { "epoch": 0.17, "learning_rate": 9.324032405803577e-05, "loss": 2.3491, "step": 19705 }, { "epoch": 0.17, "learning_rate": 9.323695560959373e-05, "loss": 2.3312, "step": 19710 }, { "epoch": 0.17, "learning_rate": 9.3233586382963e-05, "loss": 2.4449, "step": 19715 }, { "epoch": 0.17, "learning_rate": 9.323021637820421e-05, "loss": 2.2996, "step": 19720 }, { "epoch": 0.17, "learning_rate": 9.322684559537801e-05, "loss": 2.3985, "step": 19725 }, { "epoch": 0.17, "learning_rate": 9.322347403454507e-05, "loss": 2.3817, "step": 19730 }, { "epoch": 0.17, "learning_rate": 9.322010169576607e-05, "loss": 2.4523, "step": 19735 }, { "epoch": 0.17, "learning_rate": 9.321672857910171e-05, "loss": 2.3076, "step": 19740 }, { "epoch": 0.17, "learning_rate": 9.32133546846127e-05, "loss": 2.3515, "step": 19745 }, { "epoch": 0.17, "learning_rate": 9.320998001235974e-05, "loss": 2.4039, "step": 19750 }, { "epoch": 0.17, "learning_rate": 9.320660456240363e-05, "loss": 2.4118, "step": 19755 }, { "epoch": 0.17, "learning_rate": 9.320322833480507e-05, "loss": 2.3645, "step": 19760 }, { "epoch": 0.17, "learning_rate": 9.319985132962482e-05, "loss": 2.4225, "step": 19765 }, { "epoch": 0.17, "learning_rate": 9.319647354692369e-05, "loss": 2.3492, "step": 19770 }, { "epoch": 0.17, "learning_rate": 9.319309498676246e-05, "loss": 2.3989, "step": 19775 }, { "epoch": 0.17, "learning_rate": 9.318971564920196e-05, "loss": 2.324, "step": 19780 }, { "epoch": 0.17, "learning_rate": 9.318633553430298e-05, "loss": 2.323, "step": 19785 }, { "epoch": 0.17, "learning_rate": 9.318295464212637e-05, "loss": 2.3972, "step": 19790 }, { "epoch": 0.17, "learning_rate": 9.317957297273298e-05, "loss": 2.2489, "step": 19795 }, { "epoch": 0.17, "learning_rate": 9.317619052618367e-05, "loss": 2.3402, "step": 19800 }, { "epoch": 0.17, "learning_rate": 9.317280730253932e-05, "loss": 2.3334, "step": 19805 }, { "epoch": 0.17, "learning_rate": 9.316942330186084e-05, "loss": 2.4096, "step": 19810 }, { "epoch": 0.17, "learning_rate": 9.316603852420911e-05, "loss": 2.3102, "step": 19815 }, { "epoch": 0.17, "learning_rate": 9.316265296964506e-05, "loss": 2.3559, "step": 19820 }, { "epoch": 0.17, "learning_rate": 9.315926663822962e-05, "loss": 2.3659, "step": 19825 }, { "epoch": 0.17, "learning_rate": 9.315587953002373e-05, "loss": 2.289, "step": 19830 }, { "epoch": 0.17, "learning_rate": 9.315249164508839e-05, "loss": 2.3473, "step": 19835 }, { "epoch": 0.17, "learning_rate": 9.314910298348453e-05, "loss": 2.3121, "step": 19840 }, { "epoch": 0.17, "learning_rate": 9.314571354527318e-05, "loss": 2.3988, "step": 19845 }, { "epoch": 0.17, "learning_rate": 9.314232333051531e-05, "loss": 2.3496, "step": 19850 }, { "epoch": 0.17, "learning_rate": 9.313893233927195e-05, "loss": 2.4554, "step": 19855 }, { "epoch": 0.17, "learning_rate": 9.313554057160414e-05, "loss": 2.3621, "step": 19860 }, { "epoch": 0.17, "learning_rate": 9.313214802757294e-05, "loss": 2.3159, "step": 19865 }, { "epoch": 0.17, "learning_rate": 9.312875470723934e-05, "loss": 2.2892, "step": 19870 }, { "epoch": 0.17, "learning_rate": 9.31253606106645e-05, "loss": 2.3656, "step": 19875 }, { "epoch": 0.17, "learning_rate": 9.312196573790946e-05, "loss": 2.3176, "step": 19880 }, { "epoch": 0.17, "learning_rate": 9.311857008903533e-05, "loss": 2.3165, "step": 19885 }, { "epoch": 0.17, "learning_rate": 9.311517366410323e-05, "loss": 2.3688, "step": 19890 }, { "epoch": 0.17, "learning_rate": 9.311177646317428e-05, "loss": 2.3499, "step": 19895 }, { "epoch": 0.17, "learning_rate": 9.310837848630964e-05, "loss": 2.4078, "step": 19900 }, { "epoch": 0.17, "learning_rate": 9.310497973357046e-05, "loss": 2.3298, "step": 19905 }, { "epoch": 0.17, "learning_rate": 9.310158020501789e-05, "loss": 2.3438, "step": 19910 }, { "epoch": 0.17, "learning_rate": 9.309817990071315e-05, "loss": 2.3461, "step": 19915 }, { "epoch": 0.17, "learning_rate": 9.309477882071743e-05, "loss": 2.3757, "step": 19920 }, { "epoch": 0.17, "learning_rate": 9.309137696509193e-05, "loss": 2.3502, "step": 19925 }, { "epoch": 0.17, "learning_rate": 9.30879743338979e-05, "loss": 2.3012, "step": 19930 }, { "epoch": 0.17, "learning_rate": 9.308457092719656e-05, "loss": 2.2983, "step": 19935 }, { "epoch": 0.17, "learning_rate": 9.308116674504916e-05, "loss": 2.3919, "step": 19940 }, { "epoch": 0.17, "learning_rate": 9.3077761787517e-05, "loss": 2.3392, "step": 19945 }, { "epoch": 0.17, "learning_rate": 9.307435605466134e-05, "loss": 2.3419, "step": 19950 }, { "epoch": 0.17, "learning_rate": 9.307094954654347e-05, "loss": 2.3061, "step": 19955 }, { "epoch": 0.17, "learning_rate": 9.306754226322473e-05, "loss": 2.4317, "step": 19960 }, { "epoch": 0.17, "learning_rate": 9.306413420476643e-05, "loss": 2.2926, "step": 19965 }, { "epoch": 0.17, "learning_rate": 9.30607253712299e-05, "loss": 2.3523, "step": 19970 }, { "epoch": 0.17, "learning_rate": 9.305731576267649e-05, "loss": 2.3415, "step": 19975 }, { "epoch": 0.17, "learning_rate": 9.305390537916758e-05, "loss": 2.3438, "step": 19980 }, { "epoch": 0.17, "learning_rate": 9.305049422076454e-05, "loss": 2.3721, "step": 19985 }, { "epoch": 0.17, "learning_rate": 9.30470822875288e-05, "loss": 2.3363, "step": 19990 }, { "epoch": 0.17, "learning_rate": 9.304366957952173e-05, "loss": 2.2917, "step": 19995 }, { "epoch": 0.17, "learning_rate": 9.304025609680476e-05, "loss": 2.3107, "step": 20000 }, { "epoch": 0.17, "learning_rate": 9.303684183943935e-05, "loss": 2.3624, "step": 20005 }, { "epoch": 0.17, "learning_rate": 9.30334268074869e-05, "loss": 2.3563, "step": 20010 }, { "epoch": 0.17, "learning_rate": 9.303001100100892e-05, "loss": 2.4141, "step": 20015 }, { "epoch": 0.17, "learning_rate": 9.302659442006689e-05, "loss": 2.3519, "step": 20020 }, { "epoch": 0.17, "learning_rate": 9.302317706472228e-05, "loss": 2.361, "step": 20025 }, { "epoch": 0.17, "learning_rate": 9.301975893503659e-05, "loss": 2.4109, "step": 20030 }, { "epoch": 0.17, "learning_rate": 9.301634003107135e-05, "loss": 2.4106, "step": 20035 }, { "epoch": 0.17, "learning_rate": 9.301292035288811e-05, "loss": 2.3984, "step": 20040 }, { "epoch": 0.17, "learning_rate": 9.300949990054841e-05, "loss": 2.3452, "step": 20045 }, { "epoch": 0.17, "learning_rate": 9.300607867411381e-05, "loss": 2.3307, "step": 20050 }, { "epoch": 0.17, "learning_rate": 9.300265667364587e-05, "loss": 2.3636, "step": 20055 }, { "epoch": 0.17, "learning_rate": 9.29992338992062e-05, "loss": 2.338, "step": 20060 }, { "epoch": 0.17, "learning_rate": 9.29958103508564e-05, "loss": 2.2759, "step": 20065 }, { "epoch": 0.17, "learning_rate": 9.29923860286581e-05, "loss": 2.3389, "step": 20070 }, { "epoch": 0.17, "learning_rate": 9.29889609326729e-05, "loss": 2.3922, "step": 20075 }, { "epoch": 0.17, "learning_rate": 9.298553506296246e-05, "loss": 2.3214, "step": 20080 }, { "epoch": 0.17, "learning_rate": 9.298210841958845e-05, "loss": 2.2781, "step": 20085 }, { "epoch": 0.17, "learning_rate": 9.297868100261253e-05, "loss": 2.3294, "step": 20090 }, { "epoch": 0.17, "learning_rate": 9.297525281209641e-05, "loss": 2.4247, "step": 20095 }, { "epoch": 0.17, "learning_rate": 9.297182384810177e-05, "loss": 2.307, "step": 20100 }, { "epoch": 0.17, "learning_rate": 9.296839411069031e-05, "loss": 2.3844, "step": 20105 }, { "epoch": 0.17, "learning_rate": 9.29649635999238e-05, "loss": 2.3262, "step": 20110 }, { "epoch": 0.17, "learning_rate": 9.296153231586396e-05, "loss": 2.3591, "step": 20115 }, { "epoch": 0.17, "learning_rate": 9.295810025857255e-05, "loss": 2.429, "step": 20120 }, { "epoch": 0.17, "learning_rate": 9.295466742811135e-05, "loss": 2.3915, "step": 20125 }, { "epoch": 0.17, "learning_rate": 9.295123382454211e-05, "loss": 2.311, "step": 20130 }, { "epoch": 0.17, "learning_rate": 9.294779944792667e-05, "loss": 2.309, "step": 20135 }, { "epoch": 0.17, "learning_rate": 9.294436429832683e-05, "loss": 2.2957, "step": 20140 }, { "epoch": 0.17, "learning_rate": 9.294092837580442e-05, "loss": 2.4598, "step": 20145 }, { "epoch": 0.17, "learning_rate": 9.293749168042125e-05, "loss": 2.4171, "step": 20150 }, { "epoch": 0.17, "learning_rate": 9.293405421223922e-05, "loss": 2.3642, "step": 20155 }, { "epoch": 0.17, "learning_rate": 9.293061597132015e-05, "loss": 2.3373, "step": 20160 }, { "epoch": 0.17, "learning_rate": 9.292717695772599e-05, "loss": 2.4546, "step": 20165 }, { "epoch": 0.17, "learning_rate": 9.292373717151856e-05, "loss": 2.3984, "step": 20170 }, { "epoch": 0.17, "learning_rate": 9.292029661275982e-05, "loss": 2.445, "step": 20175 }, { "epoch": 0.17, "learning_rate": 9.29168552815117e-05, "loss": 2.365, "step": 20180 }, { "epoch": 0.17, "learning_rate": 9.291341317783608e-05, "loss": 2.383, "step": 20185 }, { "epoch": 0.17, "learning_rate": 9.290997030179498e-05, "loss": 2.2836, "step": 20190 }, { "epoch": 0.17, "learning_rate": 9.290652665345032e-05, "loss": 2.3962, "step": 20195 }, { "epoch": 0.17, "learning_rate": 9.290308223286409e-05, "loss": 2.3648, "step": 20200 }, { "epoch": 0.17, "learning_rate": 9.289963704009829e-05, "loss": 2.4236, "step": 20205 }, { "epoch": 0.17, "learning_rate": 9.289619107521495e-05, "loss": 2.3909, "step": 20210 }, { "epoch": 0.17, "learning_rate": 9.289274433827602e-05, "loss": 2.399, "step": 20215 }, { "epoch": 0.17, "learning_rate": 9.288929682934361e-05, "loss": 2.3335, "step": 20220 }, { "epoch": 0.17, "learning_rate": 9.288584854847975e-05, "loss": 2.3853, "step": 20225 }, { "epoch": 0.17, "learning_rate": 9.288239949574648e-05, "loss": 2.3403, "step": 20230 }, { "epoch": 0.17, "learning_rate": 9.287894967120589e-05, "loss": 2.3464, "step": 20235 }, { "epoch": 0.17, "learning_rate": 9.287549907492008e-05, "loss": 2.4749, "step": 20240 }, { "epoch": 0.17, "learning_rate": 9.287204770695114e-05, "loss": 2.3955, "step": 20245 }, { "epoch": 0.17, "learning_rate": 9.28685955673612e-05, "loss": 2.3551, "step": 20250 }, { "epoch": 0.17, "learning_rate": 9.286514265621238e-05, "loss": 2.4056, "step": 20255 }, { "epoch": 0.17, "learning_rate": 9.286168897356683e-05, "loss": 2.3712, "step": 20260 }, { "epoch": 0.17, "learning_rate": 9.285823451948671e-05, "loss": 2.2873, "step": 20265 }, { "epoch": 0.17, "learning_rate": 9.285477929403421e-05, "loss": 2.3967, "step": 20270 }, { "epoch": 0.17, "learning_rate": 9.28513232972715e-05, "loss": 2.3543, "step": 20275 }, { "epoch": 0.17, "learning_rate": 9.284786652926078e-05, "loss": 2.3415, "step": 20280 }, { "epoch": 0.17, "learning_rate": 9.284440899006429e-05, "loss": 2.384, "step": 20285 }, { "epoch": 0.17, "learning_rate": 9.284095067974424e-05, "loss": 2.3156, "step": 20290 }, { "epoch": 0.17, "learning_rate": 9.283749159836285e-05, "loss": 2.3593, "step": 20295 }, { "epoch": 0.17, "learning_rate": 9.283403174598244e-05, "loss": 2.3378, "step": 20300 }, { "epoch": 0.17, "learning_rate": 9.283057112266522e-05, "loss": 2.3233, "step": 20305 }, { "epoch": 0.17, "learning_rate": 9.282710972847351e-05, "loss": 2.3439, "step": 20310 }, { "epoch": 0.17, "learning_rate": 9.282364756346959e-05, "loss": 2.3718, "step": 20315 }, { "epoch": 0.17, "learning_rate": 9.28201846277158e-05, "loss": 2.3487, "step": 20320 }, { "epoch": 0.17, "learning_rate": 9.281672092127442e-05, "loss": 2.2314, "step": 20325 }, { "epoch": 0.17, "learning_rate": 9.281325644420784e-05, "loss": 2.381, "step": 20330 }, { "epoch": 0.17, "learning_rate": 9.280979119657839e-05, "loss": 2.372, "step": 20335 }, { "epoch": 0.17, "learning_rate": 9.280632517844842e-05, "loss": 2.2052, "step": 20340 }, { "epoch": 0.17, "learning_rate": 9.280285838988036e-05, "loss": 2.4442, "step": 20345 }, { "epoch": 0.17, "learning_rate": 9.279939083093659e-05, "loss": 2.3825, "step": 20350 }, { "epoch": 0.17, "learning_rate": 9.279592250167948e-05, "loss": 2.3802, "step": 20355 }, { "epoch": 0.17, "learning_rate": 9.27924534021715e-05, "loss": 2.3595, "step": 20360 }, { "epoch": 0.17, "learning_rate": 9.278898353247507e-05, "loss": 2.3294, "step": 20365 }, { "epoch": 0.17, "learning_rate": 9.278551289265262e-05, "loss": 2.3953, "step": 20370 }, { "epoch": 0.17, "learning_rate": 9.278204148276666e-05, "loss": 2.3689, "step": 20375 }, { "epoch": 0.17, "learning_rate": 9.277856930287964e-05, "loss": 2.4141, "step": 20380 }, { "epoch": 0.17, "learning_rate": 9.277509635305408e-05, "loss": 2.3783, "step": 20385 }, { "epoch": 0.17, "learning_rate": 9.277162263335245e-05, "loss": 2.4269, "step": 20390 }, { "epoch": 0.17, "learning_rate": 9.27681481438373e-05, "loss": 2.332, "step": 20395 }, { "epoch": 0.17, "learning_rate": 9.276467288457114e-05, "loss": 2.362, "step": 20400 }, { "epoch": 0.17, "learning_rate": 9.276119685561653e-05, "loss": 2.356, "step": 20405 }, { "epoch": 0.17, "learning_rate": 9.275772005703603e-05, "loss": 2.3821, "step": 20410 }, { "epoch": 0.17, "learning_rate": 9.275424248889223e-05, "loss": 2.3409, "step": 20415 }, { "epoch": 0.17, "learning_rate": 9.275076415124771e-05, "loss": 2.3688, "step": 20420 }, { "epoch": 0.17, "learning_rate": 9.274728504416508e-05, "loss": 2.3514, "step": 20425 }, { "epoch": 0.17, "learning_rate": 9.274380516770694e-05, "loss": 2.3387, "step": 20430 }, { "epoch": 0.17, "learning_rate": 9.274032452193593e-05, "loss": 2.4286, "step": 20435 }, { "epoch": 0.17, "learning_rate": 9.27368431069147e-05, "loss": 2.3648, "step": 20440 }, { "epoch": 0.17, "learning_rate": 9.273336092270593e-05, "loss": 2.4084, "step": 20445 }, { "epoch": 0.17, "learning_rate": 9.272987796937225e-05, "loss": 2.359, "step": 20450 }, { "epoch": 0.17, "learning_rate": 9.272639424697637e-05, "loss": 2.3077, "step": 20455 }, { "epoch": 0.17, "learning_rate": 9.2722909755581e-05, "loss": 2.3615, "step": 20460 }, { "epoch": 0.17, "learning_rate": 9.271942449524883e-05, "loss": 2.3995, "step": 20465 }, { "epoch": 0.17, "learning_rate": 9.271593846604261e-05, "loss": 2.3637, "step": 20470 }, { "epoch": 0.17, "learning_rate": 9.271245166802507e-05, "loss": 2.3427, "step": 20475 }, { "epoch": 0.17, "learning_rate": 9.270896410125897e-05, "loss": 2.3742, "step": 20480 }, { "epoch": 0.17, "learning_rate": 9.270547576580708e-05, "loss": 2.458, "step": 20485 }, { "epoch": 0.17, "learning_rate": 9.27019866617322e-05, "loss": 2.3654, "step": 20490 }, { "epoch": 0.17, "learning_rate": 9.26984967890971e-05, "loss": 2.357, "step": 20495 }, { "epoch": 0.17, "learning_rate": 9.26950061479646e-05, "loss": 2.4227, "step": 20500 }, { "epoch": 0.17, "learning_rate": 9.269151473839755e-05, "loss": 2.2614, "step": 20505 }, { "epoch": 0.18, "learning_rate": 9.268802256045874e-05, "loss": 2.4058, "step": 20510 }, { "epoch": 0.18, "learning_rate": 9.268452961421107e-05, "loss": 2.3867, "step": 20515 }, { "epoch": 0.18, "learning_rate": 9.268103589971738e-05, "loss": 2.3303, "step": 20520 }, { "epoch": 0.18, "learning_rate": 9.267754141704058e-05, "loss": 2.3762, "step": 20525 }, { "epoch": 0.18, "learning_rate": 9.267404616624352e-05, "loss": 2.3727, "step": 20530 }, { "epoch": 0.18, "learning_rate": 9.267055014738913e-05, "loss": 2.3628, "step": 20535 }, { "epoch": 0.18, "learning_rate": 9.266705336054034e-05, "loss": 2.3395, "step": 20540 }, { "epoch": 0.18, "learning_rate": 9.266355580576008e-05, "loss": 2.3766, "step": 20545 }, { "epoch": 0.18, "learning_rate": 9.266005748311131e-05, "loss": 2.3335, "step": 20550 }, { "epoch": 0.18, "learning_rate": 9.265655839265697e-05, "loss": 2.4785, "step": 20555 }, { "epoch": 0.18, "learning_rate": 9.265305853446004e-05, "loss": 2.3435, "step": 20560 }, { "epoch": 0.18, "learning_rate": 9.264955790858355e-05, "loss": 2.4117, "step": 20565 }, { "epoch": 0.18, "learning_rate": 9.264605651509047e-05, "loss": 2.4017, "step": 20570 }, { "epoch": 0.18, "learning_rate": 9.264255435404381e-05, "loss": 2.2807, "step": 20575 }, { "epoch": 0.18, "learning_rate": 9.263905142550664e-05, "loss": 2.4151, "step": 20580 }, { "epoch": 0.18, "learning_rate": 9.263554772954198e-05, "loss": 2.3298, "step": 20585 }, { "epoch": 0.18, "learning_rate": 9.263204326621288e-05, "loss": 2.2719, "step": 20590 }, { "epoch": 0.18, "learning_rate": 9.262853803558244e-05, "loss": 2.4503, "step": 20595 }, { "epoch": 0.18, "learning_rate": 9.262503203771374e-05, "loss": 2.337, "step": 20600 }, { "epoch": 0.18, "learning_rate": 9.262152527266989e-05, "loss": 2.2983, "step": 20605 }, { "epoch": 0.18, "learning_rate": 9.261801774051397e-05, "loss": 2.4471, "step": 20610 }, { "epoch": 0.18, "learning_rate": 9.261450944130916e-05, "loss": 2.3442, "step": 20615 }, { "epoch": 0.18, "learning_rate": 9.261100037511857e-05, "loss": 2.3228, "step": 20620 }, { "epoch": 0.18, "learning_rate": 9.260749054200535e-05, "loss": 2.3671, "step": 20625 }, { "epoch": 0.18, "learning_rate": 9.260397994203269e-05, "loss": 2.3229, "step": 20630 }, { "epoch": 0.18, "learning_rate": 9.260046857526378e-05, "loss": 2.3465, "step": 20635 }, { "epoch": 0.18, "learning_rate": 9.25969564417618e-05, "loss": 2.3025, "step": 20640 }, { "epoch": 0.18, "learning_rate": 9.259344354158997e-05, "loss": 2.3923, "step": 20645 }, { "epoch": 0.18, "learning_rate": 9.258992987481153e-05, "loss": 2.3573, "step": 20650 }, { "epoch": 0.18, "learning_rate": 9.258641544148969e-05, "loss": 2.4365, "step": 20655 }, { "epoch": 0.18, "learning_rate": 9.258290024168773e-05, "loss": 2.4183, "step": 20660 }, { "epoch": 0.18, "learning_rate": 9.25793842754689e-05, "loss": 2.4005, "step": 20665 }, { "epoch": 0.18, "learning_rate": 9.25758675428965e-05, "loss": 2.3474, "step": 20670 }, { "epoch": 0.18, "learning_rate": 9.25723500440338e-05, "loss": 2.4358, "step": 20675 }, { "epoch": 0.18, "learning_rate": 9.256883177894413e-05, "loss": 2.4459, "step": 20680 }, { "epoch": 0.18, "learning_rate": 9.25653127476908e-05, "loss": 2.3367, "step": 20685 }, { "epoch": 0.18, "learning_rate": 9.256179295033716e-05, "loss": 2.3666, "step": 20690 }, { "epoch": 0.18, "learning_rate": 9.255827238694654e-05, "loss": 2.3587, "step": 20695 }, { "epoch": 0.18, "learning_rate": 9.255475105758232e-05, "loss": 2.3465, "step": 20700 }, { "epoch": 0.18, "learning_rate": 9.255122896230788e-05, "loss": 2.3898, "step": 20705 }, { "epoch": 0.18, "learning_rate": 9.254770610118659e-05, "loss": 2.4395, "step": 20710 }, { "epoch": 0.18, "learning_rate": 9.254418247428189e-05, "loss": 2.451, "step": 20715 }, { "epoch": 0.18, "learning_rate": 9.254065808165717e-05, "loss": 2.3247, "step": 20720 }, { "epoch": 0.18, "learning_rate": 9.253713292337586e-05, "loss": 2.3193, "step": 20725 }, { "epoch": 0.18, "learning_rate": 9.253360699950142e-05, "loss": 2.3178, "step": 20730 }, { "epoch": 0.18, "learning_rate": 9.253008031009731e-05, "loss": 2.3856, "step": 20735 }, { "epoch": 0.18, "learning_rate": 9.252655285522701e-05, "loss": 2.4224, "step": 20740 }, { "epoch": 0.18, "learning_rate": 9.2523024634954e-05, "loss": 2.3282, "step": 20745 }, { "epoch": 0.18, "learning_rate": 9.251949564934177e-05, "loss": 2.386, "step": 20750 }, { "epoch": 0.18, "learning_rate": 9.251596589845386e-05, "loss": 2.349, "step": 20755 }, { "epoch": 0.18, "learning_rate": 9.251243538235378e-05, "loss": 2.3454, "step": 20760 }, { "epoch": 0.18, "learning_rate": 9.250890410110509e-05, "loss": 2.3498, "step": 20765 }, { "epoch": 0.18, "learning_rate": 9.250537205477132e-05, "loss": 2.3524, "step": 20770 }, { "epoch": 0.18, "learning_rate": 9.250183924341608e-05, "loss": 2.4274, "step": 20775 }, { "epoch": 0.18, "learning_rate": 9.249830566710291e-05, "loss": 2.3389, "step": 20780 }, { "epoch": 0.18, "learning_rate": 9.249477132589545e-05, "loss": 2.3215, "step": 20785 }, { "epoch": 0.18, "learning_rate": 9.249123621985727e-05, "loss": 2.3823, "step": 20790 }, { "epoch": 0.18, "learning_rate": 9.248770034905204e-05, "loss": 2.3618, "step": 20795 }, { "epoch": 0.18, "learning_rate": 9.248416371354336e-05, "loss": 2.3783, "step": 20800 }, { "epoch": 0.18, "learning_rate": 9.248062631339491e-05, "loss": 2.3435, "step": 20805 }, { "epoch": 0.18, "learning_rate": 9.247708814867035e-05, "loss": 2.3536, "step": 20810 }, { "epoch": 0.18, "learning_rate": 9.247354921943334e-05, "loss": 2.3726, "step": 20815 }, { "epoch": 0.18, "learning_rate": 9.247000952574761e-05, "loss": 2.4622, "step": 20820 }, { "epoch": 0.18, "learning_rate": 9.246646906767684e-05, "loss": 2.3891, "step": 20825 }, { "epoch": 0.18, "learning_rate": 9.246292784528476e-05, "loss": 2.3639, "step": 20830 }, { "epoch": 0.18, "learning_rate": 9.245938585863511e-05, "loss": 2.3218, "step": 20835 }, { "epoch": 0.18, "learning_rate": 9.245584310779165e-05, "loss": 2.3252, "step": 20840 }, { "epoch": 0.18, "learning_rate": 9.245229959281813e-05, "loss": 2.3909, "step": 20845 }, { "epoch": 0.18, "learning_rate": 9.244875531377833e-05, "loss": 2.3512, "step": 20850 }, { "epoch": 0.18, "learning_rate": 9.2445210270736e-05, "loss": 2.3416, "step": 20855 }, { "epoch": 0.18, "learning_rate": 9.244166446375503e-05, "loss": 2.4316, "step": 20860 }, { "epoch": 0.18, "learning_rate": 9.243811789289916e-05, "loss": 2.3403, "step": 20865 }, { "epoch": 0.18, "learning_rate": 9.243457055823228e-05, "loss": 2.3123, "step": 20870 }, { "epoch": 0.18, "learning_rate": 9.24310224598182e-05, "loss": 2.3494, "step": 20875 }, { "epoch": 0.18, "learning_rate": 9.242747359772077e-05, "loss": 2.4112, "step": 20880 }, { "epoch": 0.18, "learning_rate": 9.24239239720039e-05, "loss": 2.3282, "step": 20885 }, { "epoch": 0.18, "learning_rate": 9.242037358273145e-05, "loss": 2.4182, "step": 20890 }, { "epoch": 0.18, "learning_rate": 9.241682242996734e-05, "loss": 2.3801, "step": 20895 }, { "epoch": 0.18, "learning_rate": 9.241327051377547e-05, "loss": 2.3331, "step": 20900 }, { "epoch": 0.18, "learning_rate": 9.240971783421976e-05, "loss": 2.4257, "step": 20905 }, { "epoch": 0.18, "learning_rate": 9.240616439136419e-05, "loss": 2.3892, "step": 20910 }, { "epoch": 0.18, "learning_rate": 9.240261018527267e-05, "loss": 2.3641, "step": 20915 }, { "epoch": 0.18, "learning_rate": 9.23990552160092e-05, "loss": 2.3367, "step": 20920 }, { "epoch": 0.18, "learning_rate": 9.239549948363774e-05, "loss": 2.3117, "step": 20925 }, { "epoch": 0.18, "learning_rate": 9.239194298822231e-05, "loss": 2.3588, "step": 20930 }, { "epoch": 0.18, "learning_rate": 9.238838572982691e-05, "loss": 2.3854, "step": 20935 }, { "epoch": 0.18, "learning_rate": 9.238482770851557e-05, "loss": 2.3643, "step": 20940 }, { "epoch": 0.18, "learning_rate": 9.23812689243523e-05, "loss": 2.3306, "step": 20945 }, { "epoch": 0.18, "learning_rate": 9.23777093774012e-05, "loss": 2.4022, "step": 20950 }, { "epoch": 0.18, "learning_rate": 9.23741490677263e-05, "loss": 2.4206, "step": 20955 }, { "epoch": 0.18, "learning_rate": 9.237058799539167e-05, "loss": 2.4055, "step": 20960 }, { "epoch": 0.18, "learning_rate": 9.236702616046144e-05, "loss": 2.4082, "step": 20965 }, { "epoch": 0.18, "learning_rate": 9.23634635629997e-05, "loss": 2.334, "step": 20970 }, { "epoch": 0.18, "learning_rate": 9.235990020307058e-05, "loss": 2.377, "step": 20975 }, { "epoch": 0.18, "learning_rate": 9.235633608073818e-05, "loss": 2.3388, "step": 20980 }, { "epoch": 0.18, "learning_rate": 9.23527711960667e-05, "loss": 2.3165, "step": 20985 }, { "epoch": 0.18, "learning_rate": 9.234920554912024e-05, "loss": 2.3579, "step": 20990 }, { "epoch": 0.18, "learning_rate": 9.234563913996301e-05, "loss": 2.3657, "step": 20995 }, { "epoch": 0.18, "learning_rate": 9.234207196865923e-05, "loss": 2.3277, "step": 21000 }, { "epoch": 0.18, "learning_rate": 9.233850403527304e-05, "loss": 2.3248, "step": 21005 }, { "epoch": 0.18, "learning_rate": 9.23349353398687e-05, "loss": 2.2894, "step": 21010 }, { "epoch": 0.18, "learning_rate": 9.233136588251041e-05, "loss": 2.4131, "step": 21015 }, { "epoch": 0.18, "learning_rate": 9.232779566326246e-05, "loss": 2.3814, "step": 21020 }, { "epoch": 0.18, "learning_rate": 9.232422468218907e-05, "loss": 2.4023, "step": 21025 }, { "epoch": 0.18, "learning_rate": 9.23206529393545e-05, "loss": 2.3276, "step": 21030 }, { "epoch": 0.18, "learning_rate": 9.231708043482307e-05, "loss": 2.4289, "step": 21035 }, { "epoch": 0.18, "learning_rate": 9.231350716865905e-05, "loss": 2.2666, "step": 21040 }, { "epoch": 0.18, "learning_rate": 9.230993314092678e-05, "loss": 2.3246, "step": 21045 }, { "epoch": 0.18, "learning_rate": 9.230635835169057e-05, "loss": 2.3415, "step": 21050 }, { "epoch": 0.18, "learning_rate": 9.230278280101476e-05, "loss": 2.4184, "step": 21055 }, { "epoch": 0.18, "learning_rate": 9.229920648896371e-05, "loss": 2.3432, "step": 21060 }, { "epoch": 0.18, "learning_rate": 9.229562941560177e-05, "loss": 2.3634, "step": 21065 }, { "epoch": 0.18, "learning_rate": 9.229205158099335e-05, "loss": 2.36, "step": 21070 }, { "epoch": 0.18, "learning_rate": 9.228847298520282e-05, "loss": 2.2966, "step": 21075 }, { "epoch": 0.18, "learning_rate": 9.22848936282946e-05, "loss": 2.381, "step": 21080 }, { "epoch": 0.18, "learning_rate": 9.228131351033311e-05, "loss": 2.3526, "step": 21085 }, { "epoch": 0.18, "learning_rate": 9.227773263138278e-05, "loss": 2.3015, "step": 21090 }, { "epoch": 0.18, "learning_rate": 9.227415099150807e-05, "loss": 2.3243, "step": 21095 }, { "epoch": 0.18, "learning_rate": 9.227056859077343e-05, "loss": 2.3166, "step": 21100 }, { "epoch": 0.18, "learning_rate": 9.226698542924335e-05, "loss": 2.3529, "step": 21105 }, { "epoch": 0.18, "learning_rate": 9.226340150698232e-05, "loss": 2.3344, "step": 21110 }, { "epoch": 0.18, "learning_rate": 9.225981682405482e-05, "loss": 2.3436, "step": 21115 }, { "epoch": 0.18, "learning_rate": 9.225623138052541e-05, "loss": 2.376, "step": 21120 }, { "epoch": 0.18, "learning_rate": 9.225264517645859e-05, "loss": 2.3559, "step": 21125 }, { "epoch": 0.18, "learning_rate": 9.22490582119189e-05, "loss": 2.4037, "step": 21130 }, { "epoch": 0.18, "learning_rate": 9.224547048697092e-05, "loss": 2.3344, "step": 21135 }, { "epoch": 0.18, "learning_rate": 9.224188200167923e-05, "loss": 2.3223, "step": 21140 }, { "epoch": 0.18, "learning_rate": 9.22382927561084e-05, "loss": 2.3791, "step": 21145 }, { "epoch": 0.18, "learning_rate": 9.223470275032302e-05, "loss": 2.3571, "step": 21150 }, { "epoch": 0.18, "learning_rate": 9.223111198438772e-05, "loss": 2.3784, "step": 21155 }, { "epoch": 0.18, "learning_rate": 9.222752045836713e-05, "loss": 2.338, "step": 21160 }, { "epoch": 0.18, "learning_rate": 9.222392817232588e-05, "loss": 2.3144, "step": 21165 }, { "epoch": 0.18, "learning_rate": 9.222033512632863e-05, "loss": 2.4228, "step": 21170 }, { "epoch": 0.18, "learning_rate": 9.221674132044005e-05, "loss": 2.3699, "step": 21175 }, { "epoch": 0.18, "learning_rate": 9.22131467547248e-05, "loss": 2.358, "step": 21180 }, { "epoch": 0.18, "learning_rate": 9.220955142924763e-05, "loss": 2.3161, "step": 21185 }, { "epoch": 0.18, "learning_rate": 9.22059553440732e-05, "loss": 2.3781, "step": 21190 }, { "epoch": 0.18, "learning_rate": 9.220235849926624e-05, "loss": 2.3727, "step": 21195 }, { "epoch": 0.18, "learning_rate": 9.219876089489151e-05, "loss": 2.3702, "step": 21200 }, { "epoch": 0.18, "learning_rate": 9.219516253101373e-05, "loss": 2.3835, "step": 21205 }, { "epoch": 0.18, "learning_rate": 9.21915634076977e-05, "loss": 2.3801, "step": 21210 }, { "epoch": 0.18, "learning_rate": 9.218796352500816e-05, "loss": 2.3867, "step": 21215 }, { "epoch": 0.18, "learning_rate": 9.218436288300993e-05, "loss": 2.3439, "step": 21220 }, { "epoch": 0.18, "learning_rate": 9.21807614817678e-05, "loss": 2.4061, "step": 21225 }, { "epoch": 0.18, "learning_rate": 9.21771593213466e-05, "loss": 2.4186, "step": 21230 }, { "epoch": 0.18, "learning_rate": 9.217355640181114e-05, "loss": 2.3252, "step": 21235 }, { "epoch": 0.18, "learning_rate": 9.21699527232263e-05, "loss": 2.4093, "step": 21240 }, { "epoch": 0.18, "learning_rate": 9.216634828565692e-05, "loss": 2.3098, "step": 21245 }, { "epoch": 0.18, "learning_rate": 9.216274308916785e-05, "loss": 2.2911, "step": 21250 }, { "epoch": 0.18, "learning_rate": 9.215913713382403e-05, "loss": 2.333, "step": 21255 }, { "epoch": 0.18, "learning_rate": 9.215553041969034e-05, "loss": 2.3329, "step": 21260 }, { "epoch": 0.18, "learning_rate": 9.215192294683166e-05, "loss": 2.375, "step": 21265 }, { "epoch": 0.18, "learning_rate": 9.214831471531296e-05, "loss": 2.3741, "step": 21270 }, { "epoch": 0.18, "learning_rate": 9.214470572519918e-05, "loss": 2.3562, "step": 21275 }, { "epoch": 0.18, "learning_rate": 9.214109597655525e-05, "loss": 2.3327, "step": 21280 }, { "epoch": 0.18, "learning_rate": 9.213748546944614e-05, "loss": 2.3804, "step": 21285 }, { "epoch": 0.18, "learning_rate": 9.213387420393687e-05, "loss": 2.3624, "step": 21290 }, { "epoch": 0.18, "learning_rate": 9.21302621800924e-05, "loss": 2.314, "step": 21295 }, { "epoch": 0.18, "learning_rate": 9.212664939797775e-05, "loss": 2.3387, "step": 21300 }, { "epoch": 0.18, "learning_rate": 9.212303585765793e-05, "loss": 2.2927, "step": 21305 }, { "epoch": 0.18, "learning_rate": 9.211942155919802e-05, "loss": 2.4014, "step": 21310 }, { "epoch": 0.18, "learning_rate": 9.211580650266303e-05, "loss": 2.4115, "step": 21315 }, { "epoch": 0.18, "learning_rate": 9.211219068811805e-05, "loss": 2.3899, "step": 21320 }, { "epoch": 0.18, "learning_rate": 9.210857411562813e-05, "loss": 2.3651, "step": 21325 }, { "epoch": 0.18, "learning_rate": 9.210495678525839e-05, "loss": 2.4052, "step": 21330 }, { "epoch": 0.18, "learning_rate": 9.210133869707392e-05, "loss": 2.3343, "step": 21335 }, { "epoch": 0.18, "learning_rate": 9.209771985113985e-05, "loss": 2.3627, "step": 21340 }, { "epoch": 0.18, "learning_rate": 9.209410024752129e-05, "loss": 2.3882, "step": 21345 }, { "epoch": 0.18, "learning_rate": 9.209047988628342e-05, "loss": 2.2892, "step": 21350 }, { "epoch": 0.18, "learning_rate": 9.208685876749136e-05, "loss": 2.38, "step": 21355 }, { "epoch": 0.18, "learning_rate": 9.208323689121032e-05, "loss": 2.3057, "step": 21360 }, { "epoch": 0.18, "learning_rate": 9.207961425750548e-05, "loss": 2.3011, "step": 21365 }, { "epoch": 0.18, "learning_rate": 9.207599086644201e-05, "loss": 2.3622, "step": 21370 }, { "epoch": 0.18, "learning_rate": 9.207236671808517e-05, "loss": 2.3695, "step": 21375 }, { "epoch": 0.18, "learning_rate": 9.206874181250018e-05, "loss": 2.3473, "step": 21380 }, { "epoch": 0.18, "learning_rate": 9.206511614975224e-05, "loss": 2.3935, "step": 21385 }, { "epoch": 0.18, "learning_rate": 9.206148972990665e-05, "loss": 2.4027, "step": 21390 }, { "epoch": 0.18, "learning_rate": 9.205786255302867e-05, "loss": 2.4048, "step": 21395 }, { "epoch": 0.18, "learning_rate": 9.205423461918356e-05, "loss": 2.3494, "step": 21400 }, { "epoch": 0.18, "learning_rate": 9.205060592843665e-05, "loss": 2.2761, "step": 21405 }, { "epoch": 0.18, "learning_rate": 9.204697648085321e-05, "loss": 2.2487, "step": 21410 }, { "epoch": 0.18, "learning_rate": 9.204334627649862e-05, "loss": 2.3245, "step": 21415 }, { "epoch": 0.18, "learning_rate": 9.203971531543815e-05, "loss": 2.3003, "step": 21420 }, { "epoch": 0.18, "learning_rate": 9.203608359773721e-05, "loss": 2.3624, "step": 21425 }, { "epoch": 0.18, "learning_rate": 9.203245112346113e-05, "loss": 2.3573, "step": 21430 }, { "epoch": 0.18, "learning_rate": 9.20288178926753e-05, "loss": 2.4153, "step": 21435 }, { "epoch": 0.18, "learning_rate": 9.20251839054451e-05, "loss": 2.3086, "step": 21440 }, { "epoch": 0.18, "learning_rate": 9.202154916183597e-05, "loss": 2.4015, "step": 21445 }, { "epoch": 0.18, "learning_rate": 9.201791366191327e-05, "loss": 2.3352, "step": 21450 }, { "epoch": 0.18, "learning_rate": 9.201427740574249e-05, "loss": 2.2776, "step": 21455 }, { "epoch": 0.18, "learning_rate": 9.201064039338904e-05, "loss": 2.3536, "step": 21460 }, { "epoch": 0.18, "learning_rate": 9.200700262491839e-05, "loss": 2.3213, "step": 21465 }, { "epoch": 0.18, "learning_rate": 9.200336410039603e-05, "loss": 2.3917, "step": 21470 }, { "epoch": 0.18, "learning_rate": 9.199972481988742e-05, "loss": 2.3494, "step": 21475 }, { "epoch": 0.18, "learning_rate": 9.199608478345806e-05, "loss": 2.2506, "step": 21480 }, { "epoch": 0.18, "learning_rate": 9.199244399117351e-05, "loss": 2.2636, "step": 21485 }, { "epoch": 0.18, "learning_rate": 9.198880244309925e-05, "loss": 2.3487, "step": 21490 }, { "epoch": 0.18, "learning_rate": 9.198516013930083e-05, "loss": 2.3335, "step": 21495 }, { "epoch": 0.18, "learning_rate": 9.198151707984381e-05, "loss": 2.3776, "step": 21500 }, { "epoch": 0.18, "learning_rate": 9.197787326479377e-05, "loss": 2.3393, "step": 21505 }, { "epoch": 0.18, "learning_rate": 9.197422869421629e-05, "loss": 2.305, "step": 21510 }, { "epoch": 0.18, "learning_rate": 9.197058336817694e-05, "loss": 2.3636, "step": 21515 }, { "epoch": 0.18, "learning_rate": 9.196693728674135e-05, "loss": 2.4193, "step": 21520 }, { "epoch": 0.18, "learning_rate": 9.196329044997516e-05, "loss": 2.2793, "step": 21525 }, { "epoch": 0.18, "learning_rate": 9.195964285794397e-05, "loss": 2.2904, "step": 21530 }, { "epoch": 0.18, "learning_rate": 9.195599451071344e-05, "loss": 2.3431, "step": 21535 }, { "epoch": 0.18, "learning_rate": 9.195234540834926e-05, "loss": 2.267, "step": 21540 }, { "epoch": 0.18, "learning_rate": 9.194869555091707e-05, "loss": 2.2676, "step": 21545 }, { "epoch": 0.18, "learning_rate": 9.19450449384826e-05, "loss": 2.3295, "step": 21550 }, { "epoch": 0.18, "learning_rate": 9.194139357111153e-05, "loss": 2.355, "step": 21555 }, { "epoch": 0.18, "learning_rate": 9.193774144886957e-05, "loss": 2.4097, "step": 21560 }, { "epoch": 0.18, "learning_rate": 9.193408857182247e-05, "loss": 2.338, "step": 21565 }, { "epoch": 0.18, "learning_rate": 9.193043494003597e-05, "loss": 2.4007, "step": 21570 }, { "epoch": 0.18, "learning_rate": 9.192678055357582e-05, "loss": 2.4127, "step": 21575 }, { "epoch": 0.18, "learning_rate": 9.192312541250783e-05, "loss": 2.3452, "step": 21580 }, { "epoch": 0.18, "learning_rate": 9.191946951689773e-05, "loss": 2.4465, "step": 21585 }, { "epoch": 0.18, "learning_rate": 9.191581286681134e-05, "loss": 2.3437, "step": 21590 }, { "epoch": 0.18, "learning_rate": 9.191215546231451e-05, "loss": 2.3051, "step": 21595 }, { "epoch": 0.18, "learning_rate": 9.190849730347301e-05, "loss": 2.2882, "step": 21600 }, { "epoch": 0.18, "learning_rate": 9.190483839035271e-05, "loss": 2.2902, "step": 21605 }, { "epoch": 0.18, "learning_rate": 9.190117872301947e-05, "loss": 2.4003, "step": 21610 }, { "epoch": 0.18, "learning_rate": 9.189751830153914e-05, "loss": 2.3422, "step": 21615 }, { "epoch": 0.18, "learning_rate": 9.189385712597762e-05, "loss": 2.3082, "step": 21620 }, { "epoch": 0.18, "learning_rate": 9.189019519640078e-05, "loss": 2.2868, "step": 21625 }, { "epoch": 0.18, "learning_rate": 9.188653251287456e-05, "loss": 2.3485, "step": 21630 }, { "epoch": 0.18, "learning_rate": 9.188286907546486e-05, "loss": 2.35, "step": 21635 }, { "epoch": 0.18, "learning_rate": 9.187920488423762e-05, "loss": 2.3475, "step": 21640 }, { "epoch": 0.18, "learning_rate": 9.187553993925877e-05, "loss": 2.4363, "step": 21645 }, { "epoch": 0.18, "learning_rate": 9.187187424059431e-05, "loss": 2.293, "step": 21650 }, { "epoch": 0.18, "learning_rate": 9.18682077883102e-05, "loss": 2.3309, "step": 21655 }, { "epoch": 0.18, "learning_rate": 9.186454058247242e-05, "loss": 2.4409, "step": 21660 }, { "epoch": 0.18, "learning_rate": 9.186087262314698e-05, "loss": 2.3077, "step": 21665 }, { "epoch": 0.18, "learning_rate": 9.185720391039989e-05, "loss": 2.3228, "step": 21670 }, { "epoch": 0.18, "learning_rate": 9.18535344442972e-05, "loss": 2.3799, "step": 21675 }, { "epoch": 0.19, "learning_rate": 9.184986422490493e-05, "loss": 2.3333, "step": 21680 }, { "epoch": 0.19, "learning_rate": 9.184619325228916e-05, "loss": 2.4257, "step": 21685 }, { "epoch": 0.19, "learning_rate": 9.184252152651594e-05, "loss": 2.3177, "step": 21690 }, { "epoch": 0.19, "learning_rate": 9.183884904765137e-05, "loss": 2.4602, "step": 21695 }, { "epoch": 0.19, "learning_rate": 9.183517581576153e-05, "loss": 2.2879, "step": 21700 }, { "epoch": 0.19, "learning_rate": 9.183150183091255e-05, "loss": 2.3514, "step": 21705 }, { "epoch": 0.19, "learning_rate": 9.182782709317058e-05, "loss": 2.4189, "step": 21710 }, { "epoch": 0.19, "learning_rate": 9.18241516026017e-05, "loss": 2.3839, "step": 21715 }, { "epoch": 0.19, "learning_rate": 9.182047535927207e-05, "loss": 2.4167, "step": 21720 }, { "epoch": 0.19, "learning_rate": 9.18167983632479e-05, "loss": 2.2442, "step": 21725 }, { "epoch": 0.19, "learning_rate": 9.181312061459535e-05, "loss": 2.3551, "step": 21730 }, { "epoch": 0.19, "learning_rate": 9.18094421133806e-05, "loss": 2.3978, "step": 21735 }, { "epoch": 0.19, "learning_rate": 9.180576285966986e-05, "loss": 2.3812, "step": 21740 }, { "epoch": 0.19, "learning_rate": 9.180208285352938e-05, "loss": 2.2745, "step": 21745 }, { "epoch": 0.19, "learning_rate": 9.179840209502534e-05, "loss": 2.3931, "step": 21750 }, { "epoch": 0.19, "learning_rate": 9.179472058422403e-05, "loss": 2.3993, "step": 21755 }, { "epoch": 0.19, "learning_rate": 9.17910383211917e-05, "loss": 2.3283, "step": 21760 }, { "epoch": 0.19, "learning_rate": 9.178735530599461e-05, "loss": 2.3234, "step": 21765 }, { "epoch": 0.19, "learning_rate": 9.178367153869906e-05, "loss": 2.3536, "step": 21770 }, { "epoch": 0.19, "learning_rate": 9.177998701937136e-05, "loss": 2.3279, "step": 21775 }, { "epoch": 0.19, "learning_rate": 9.17763017480778e-05, "loss": 2.3546, "step": 21780 }, { "epoch": 0.19, "learning_rate": 9.177261572488474e-05, "loss": 2.4014, "step": 21785 }, { "epoch": 0.19, "learning_rate": 9.176892894985849e-05, "loss": 2.4004, "step": 21790 }, { "epoch": 0.19, "learning_rate": 9.176524142306542e-05, "loss": 2.3347, "step": 21795 }, { "epoch": 0.19, "learning_rate": 9.176155314457191e-05, "loss": 2.3054, "step": 21800 }, { "epoch": 0.19, "learning_rate": 9.175786411444433e-05, "loss": 2.3986, "step": 21805 }, { "epoch": 0.19, "learning_rate": 9.175417433274907e-05, "loss": 2.384, "step": 21810 }, { "epoch": 0.19, "learning_rate": 9.175048379955255e-05, "loss": 2.2822, "step": 21815 }, { "epoch": 0.19, "learning_rate": 9.17467925149212e-05, "loss": 2.2977, "step": 21820 }, { "epoch": 0.19, "learning_rate": 9.174310047892143e-05, "loss": 2.331, "step": 21825 }, { "epoch": 0.19, "learning_rate": 9.173940769161973e-05, "loss": 2.4014, "step": 21830 }, { "epoch": 0.19, "learning_rate": 9.173571415308252e-05, "loss": 2.3479, "step": 21835 }, { "epoch": 0.19, "learning_rate": 9.17320198633763e-05, "loss": 2.3938, "step": 21840 }, { "epoch": 0.19, "learning_rate": 9.172832482256757e-05, "loss": 2.2761, "step": 21845 }, { "epoch": 0.19, "learning_rate": 9.172462903072282e-05, "loss": 2.3781, "step": 21850 }, { "epoch": 0.19, "learning_rate": 9.172093248790857e-05, "loss": 2.3199, "step": 21855 }, { "epoch": 0.19, "learning_rate": 9.171723519419134e-05, "loss": 2.2469, "step": 21860 }, { "epoch": 0.19, "learning_rate": 9.17135371496377e-05, "loss": 2.3533, "step": 21865 }, { "epoch": 0.19, "learning_rate": 9.170983835431419e-05, "loss": 2.4031, "step": 21870 }, { "epoch": 0.19, "learning_rate": 9.17061388082874e-05, "loss": 2.2909, "step": 21875 }, { "epoch": 0.19, "learning_rate": 9.170243851162387e-05, "loss": 2.3694, "step": 21880 }, { "epoch": 0.19, "learning_rate": 9.169873746439026e-05, "loss": 2.2943, "step": 21885 }, { "epoch": 0.19, "learning_rate": 9.169503566665314e-05, "loss": 2.3839, "step": 21890 }, { "epoch": 0.19, "learning_rate": 9.169133311847914e-05, "loss": 2.4204, "step": 21895 }, { "epoch": 0.19, "learning_rate": 9.168762981993493e-05, "loss": 2.3838, "step": 21900 }, { "epoch": 0.19, "learning_rate": 9.168392577108713e-05, "loss": 2.3428, "step": 21905 }, { "epoch": 0.19, "learning_rate": 9.168022097200242e-05, "loss": 2.3804, "step": 21910 }, { "epoch": 0.19, "learning_rate": 9.167651542274747e-05, "loss": 2.2928, "step": 21915 }, { "epoch": 0.19, "learning_rate": 9.167280912338898e-05, "loss": 2.331, "step": 21920 }, { "epoch": 0.19, "learning_rate": 9.166910207399367e-05, "loss": 2.365, "step": 21925 }, { "epoch": 0.19, "learning_rate": 9.166539427462823e-05, "loss": 2.2838, "step": 21930 }, { "epoch": 0.19, "learning_rate": 9.166168572535943e-05, "loss": 2.3123, "step": 21935 }, { "epoch": 0.19, "learning_rate": 9.165797642625399e-05, "loss": 2.3604, "step": 21940 }, { "epoch": 0.19, "learning_rate": 9.165426637737868e-05, "loss": 2.4332, "step": 21945 }, { "epoch": 0.19, "learning_rate": 9.165055557880027e-05, "loss": 2.3671, "step": 21950 }, { "epoch": 0.19, "learning_rate": 9.164684403058557e-05, "loss": 2.3302, "step": 21955 }, { "epoch": 0.19, "learning_rate": 9.164313173280132e-05, "loss": 2.4327, "step": 21960 }, { "epoch": 0.19, "learning_rate": 9.163941868551442e-05, "loss": 2.3724, "step": 21965 }, { "epoch": 0.19, "learning_rate": 9.163570488879164e-05, "loss": 2.303, "step": 21970 }, { "epoch": 0.19, "learning_rate": 9.163199034269985e-05, "loss": 2.3399, "step": 21975 }, { "epoch": 0.19, "learning_rate": 9.162827504730586e-05, "loss": 2.314, "step": 21980 }, { "epoch": 0.19, "learning_rate": 9.16245590026766e-05, "loss": 2.3989, "step": 21985 }, { "epoch": 0.19, "learning_rate": 9.162084220887892e-05, "loss": 2.3788, "step": 21990 }, { "epoch": 0.19, "learning_rate": 9.161712466597972e-05, "loss": 2.3802, "step": 21995 }, { "epoch": 0.19, "learning_rate": 9.161340637404591e-05, "loss": 2.3199, "step": 22000 }, { "epoch": 0.19, "learning_rate": 9.160968733314442e-05, "loss": 2.4275, "step": 22005 }, { "epoch": 0.19, "learning_rate": 9.160596754334215e-05, "loss": 2.3849, "step": 22010 }, { "epoch": 0.19, "learning_rate": 9.16022470047061e-05, "loss": 2.2715, "step": 22015 }, { "epoch": 0.19, "learning_rate": 9.15985257173032e-05, "loss": 2.3985, "step": 22020 }, { "epoch": 0.19, "learning_rate": 9.159480368120044e-05, "loss": 2.4131, "step": 22025 }, { "epoch": 0.19, "learning_rate": 9.15910808964648e-05, "loss": 2.3463, "step": 22030 }, { "epoch": 0.19, "learning_rate": 9.15873573631633e-05, "loss": 2.3558, "step": 22035 }, { "epoch": 0.19, "learning_rate": 9.158363308136295e-05, "loss": 2.3608, "step": 22040 }, { "epoch": 0.19, "learning_rate": 9.157990805113077e-05, "loss": 2.3279, "step": 22045 }, { "epoch": 0.19, "learning_rate": 9.157618227253382e-05, "loss": 2.2958, "step": 22050 }, { "epoch": 0.19, "learning_rate": 9.157245574563915e-05, "loss": 2.3707, "step": 22055 }, { "epoch": 0.19, "learning_rate": 9.156872847051383e-05, "loss": 2.4097, "step": 22060 }, { "epoch": 0.19, "learning_rate": 9.156500044722493e-05, "loss": 2.3815, "step": 22065 }, { "epoch": 0.19, "learning_rate": 9.156127167583958e-05, "loss": 2.3006, "step": 22070 }, { "epoch": 0.19, "learning_rate": 9.155754215642487e-05, "loss": 2.3629, "step": 22075 }, { "epoch": 0.19, "learning_rate": 9.155381188904793e-05, "loss": 2.2533, "step": 22080 }, { "epoch": 0.19, "learning_rate": 9.155008087377587e-05, "loss": 2.3577, "step": 22085 }, { "epoch": 0.19, "learning_rate": 9.15463491106759e-05, "loss": 2.4436, "step": 22090 }, { "epoch": 0.19, "learning_rate": 9.154261659981515e-05, "loss": 2.3425, "step": 22095 }, { "epoch": 0.19, "learning_rate": 9.153888334126079e-05, "loss": 2.3555, "step": 22100 }, { "epoch": 0.19, "learning_rate": 9.153514933508005e-05, "loss": 2.4199, "step": 22105 }, { "epoch": 0.19, "learning_rate": 9.153141458134008e-05, "loss": 2.3374, "step": 22110 }, { "epoch": 0.19, "learning_rate": 9.152767908010814e-05, "loss": 2.2633, "step": 22115 }, { "epoch": 0.19, "learning_rate": 9.152394283145145e-05, "loss": 2.3234, "step": 22120 }, { "epoch": 0.19, "learning_rate": 9.152020583543727e-05, "loss": 2.3456, "step": 22125 }, { "epoch": 0.19, "learning_rate": 9.151646809213284e-05, "loss": 2.4035, "step": 22130 }, { "epoch": 0.19, "learning_rate": 9.151272960160542e-05, "loss": 2.3114, "step": 22135 }, { "epoch": 0.19, "learning_rate": 9.150899036392233e-05, "loss": 2.4099, "step": 22140 }, { "epoch": 0.19, "learning_rate": 9.150525037915086e-05, "loss": 2.379, "step": 22145 }, { "epoch": 0.19, "learning_rate": 9.150150964735831e-05, "loss": 2.2102, "step": 22150 }, { "epoch": 0.19, "learning_rate": 9.149776816861202e-05, "loss": 2.3274, "step": 22155 }, { "epoch": 0.19, "learning_rate": 9.149402594297932e-05, "loss": 2.3942, "step": 22160 }, { "epoch": 0.19, "learning_rate": 9.149028297052758e-05, "loss": 2.3564, "step": 22165 }, { "epoch": 0.19, "learning_rate": 9.148653925132413e-05, "loss": 2.3664, "step": 22170 }, { "epoch": 0.19, "learning_rate": 9.14827947854364e-05, "loss": 2.348, "step": 22175 }, { "epoch": 0.19, "learning_rate": 9.147904957293175e-05, "loss": 2.2872, "step": 22180 }, { "epoch": 0.19, "learning_rate": 9.14753036138776e-05, "loss": 2.3011, "step": 22185 }, { "epoch": 0.19, "learning_rate": 9.147155690834136e-05, "loss": 2.3568, "step": 22190 }, { "epoch": 0.19, "learning_rate": 9.146780945639048e-05, "loss": 2.4169, "step": 22195 }, { "epoch": 0.19, "learning_rate": 9.146406125809238e-05, "loss": 2.3059, "step": 22200 }, { "epoch": 0.19, "learning_rate": 9.146031231351455e-05, "loss": 2.3574, "step": 22205 }, { "epoch": 0.19, "learning_rate": 9.145656262272446e-05, "loss": 2.4421, "step": 22210 }, { "epoch": 0.19, "learning_rate": 9.145281218578959e-05, "loss": 2.3968, "step": 22215 }, { "epoch": 0.19, "learning_rate": 9.144906100277744e-05, "loss": 2.3637, "step": 22220 }, { "epoch": 0.19, "learning_rate": 9.144530907375552e-05, "loss": 2.2803, "step": 22225 }, { "epoch": 0.19, "learning_rate": 9.144155639879137e-05, "loss": 2.3432, "step": 22230 }, { "epoch": 0.19, "learning_rate": 9.143780297795255e-05, "loss": 2.2768, "step": 22235 }, { "epoch": 0.19, "learning_rate": 9.143404881130656e-05, "loss": 2.3997, "step": 22240 }, { "epoch": 0.19, "learning_rate": 9.143029389892101e-05, "loss": 2.3717, "step": 22245 }, { "epoch": 0.19, "learning_rate": 9.142653824086347e-05, "loss": 2.314, "step": 22250 }, { "epoch": 0.19, "learning_rate": 9.142278183720154e-05, "loss": 2.3912, "step": 22255 }, { "epoch": 0.19, "learning_rate": 9.141902468800284e-05, "loss": 2.4111, "step": 22260 }, { "epoch": 0.19, "learning_rate": 9.141526679333496e-05, "loss": 2.3213, "step": 22265 }, { "epoch": 0.19, "learning_rate": 9.141150815326557e-05, "loss": 2.2919, "step": 22270 }, { "epoch": 0.19, "learning_rate": 9.140774876786229e-05, "loss": 2.3751, "step": 22275 }, { "epoch": 0.19, "learning_rate": 9.14039886371928e-05, "loss": 2.392, "step": 22280 }, { "epoch": 0.19, "learning_rate": 9.140022776132476e-05, "loss": 2.3228, "step": 22285 }, { "epoch": 0.19, "learning_rate": 9.139646614032587e-05, "loss": 2.3999, "step": 22290 }, { "epoch": 0.19, "learning_rate": 9.139270377426385e-05, "loss": 2.3189, "step": 22295 }, { "epoch": 0.19, "learning_rate": 9.138894066320639e-05, "loss": 2.3783, "step": 22300 }, { "epoch": 0.19, "learning_rate": 9.13851768072212e-05, "loss": 2.2713, "step": 22305 }, { "epoch": 0.19, "learning_rate": 9.138141220637609e-05, "loss": 2.4006, "step": 22310 }, { "epoch": 0.19, "learning_rate": 9.137764686073875e-05, "loss": 2.3038, "step": 22315 }, { "epoch": 0.19, "learning_rate": 9.137388077037698e-05, "loss": 2.3047, "step": 22320 }, { "epoch": 0.19, "learning_rate": 9.137011393535857e-05, "loss": 2.2736, "step": 22325 }, { "epoch": 0.19, "learning_rate": 9.13663463557513e-05, "loss": 2.3621, "step": 22330 }, { "epoch": 0.19, "learning_rate": 9.136257803162298e-05, "loss": 2.3986, "step": 22335 }, { "epoch": 0.19, "learning_rate": 9.135880896304145e-05, "loss": 2.419, "step": 22340 }, { "epoch": 0.19, "learning_rate": 9.135503915007453e-05, "loss": 2.3712, "step": 22345 }, { "epoch": 0.19, "learning_rate": 9.135126859279006e-05, "loss": 2.3162, "step": 22350 }, { "epoch": 0.19, "learning_rate": 9.134749729125594e-05, "loss": 2.2819, "step": 22355 }, { "epoch": 0.19, "learning_rate": 9.134372524554e-05, "loss": 2.3786, "step": 22360 }, { "epoch": 0.19, "learning_rate": 9.133995245571018e-05, "loss": 2.4057, "step": 22365 }, { "epoch": 0.19, "learning_rate": 9.133617892183435e-05, "loss": 2.4258, "step": 22370 }, { "epoch": 0.19, "learning_rate": 9.133240464398043e-05, "loss": 2.3518, "step": 22375 }, { "epoch": 0.19, "learning_rate": 9.132862962221636e-05, "loss": 2.3359, "step": 22380 }, { "epoch": 0.19, "learning_rate": 9.132485385661007e-05, "loss": 2.3755, "step": 22385 }, { "epoch": 0.19, "learning_rate": 9.132107734722952e-05, "loss": 2.3486, "step": 22390 }, { "epoch": 0.19, "learning_rate": 9.13173000941427e-05, "loss": 2.4154, "step": 22395 }, { "epoch": 0.19, "learning_rate": 9.13135220974176e-05, "loss": 2.3309, "step": 22400 }, { "epoch": 0.19, "learning_rate": 9.130974335712217e-05, "loss": 2.3843, "step": 22405 }, { "epoch": 0.19, "learning_rate": 9.130596387332445e-05, "loss": 2.3669, "step": 22410 }, { "epoch": 0.19, "learning_rate": 9.130218364609246e-05, "loss": 2.3351, "step": 22415 }, { "epoch": 0.19, "learning_rate": 9.129840267549426e-05, "loss": 2.2975, "step": 22420 }, { "epoch": 0.19, "learning_rate": 9.129462096159787e-05, "loss": 2.2897, "step": 22425 }, { "epoch": 0.19, "learning_rate": 9.129083850447137e-05, "loss": 2.2591, "step": 22430 }, { "epoch": 0.19, "learning_rate": 9.128705530418282e-05, "loss": 2.3849, "step": 22435 }, { "epoch": 0.19, "learning_rate": 9.128327136080033e-05, "loss": 2.3339, "step": 22440 }, { "epoch": 0.19, "learning_rate": 9.127948667439201e-05, "loss": 2.4488, "step": 22445 }, { "epoch": 0.19, "learning_rate": 9.127570124502595e-05, "loss": 2.4535, "step": 22450 }, { "epoch": 0.19, "learning_rate": 9.12719150727703e-05, "loss": 2.3679, "step": 22455 }, { "epoch": 0.19, "learning_rate": 9.12681281576932e-05, "loss": 2.346, "step": 22460 }, { "epoch": 0.19, "learning_rate": 9.126434049986281e-05, "loss": 2.331, "step": 22465 }, { "epoch": 0.19, "learning_rate": 9.12605520993473e-05, "loss": 2.273, "step": 22470 }, { "epoch": 0.19, "learning_rate": 9.125676295621486e-05, "loss": 2.3186, "step": 22475 }, { "epoch": 0.19, "learning_rate": 9.125297307053367e-05, "loss": 2.3277, "step": 22480 }, { "epoch": 0.19, "learning_rate": 9.124918244237195e-05, "loss": 2.376, "step": 22485 }, { "epoch": 0.19, "learning_rate": 9.124539107179795e-05, "loss": 2.2261, "step": 22490 }, { "epoch": 0.19, "learning_rate": 9.124159895887987e-05, "loss": 2.3806, "step": 22495 }, { "epoch": 0.19, "learning_rate": 9.123780610368598e-05, "loss": 2.3902, "step": 22500 }, { "epoch": 0.19, "learning_rate": 9.123401250628454e-05, "loss": 2.3436, "step": 22505 }, { "epoch": 0.19, "learning_rate": 9.123021816674383e-05, "loss": 2.3584, "step": 22510 }, { "epoch": 0.19, "learning_rate": 9.122642308513214e-05, "loss": 2.3094, "step": 22515 }, { "epoch": 0.19, "learning_rate": 9.122262726151778e-05, "loss": 2.4148, "step": 22520 }, { "epoch": 0.19, "learning_rate": 9.121883069596906e-05, "loss": 2.3779, "step": 22525 }, { "epoch": 0.19, "learning_rate": 9.121503338855433e-05, "loss": 2.3666, "step": 22530 }, { "epoch": 0.19, "learning_rate": 9.12112353393419e-05, "loss": 2.3838, "step": 22535 }, { "epoch": 0.19, "learning_rate": 9.120743654840015e-05, "loss": 2.4085, "step": 22540 }, { "epoch": 0.19, "learning_rate": 9.120363701579747e-05, "loss": 2.2891, "step": 22545 }, { "epoch": 0.19, "learning_rate": 9.119983674160221e-05, "loss": 2.2673, "step": 22550 }, { "epoch": 0.19, "learning_rate": 9.11960357258828e-05, "loss": 2.3386, "step": 22555 }, { "epoch": 0.19, "learning_rate": 9.119223396870763e-05, "loss": 2.3269, "step": 22560 }, { "epoch": 0.19, "learning_rate": 9.11884314701451e-05, "loss": 2.4126, "step": 22565 }, { "epoch": 0.19, "learning_rate": 9.118462823026371e-05, "loss": 2.2346, "step": 22570 }, { "epoch": 0.19, "learning_rate": 9.118082424913186e-05, "loss": 2.3686, "step": 22575 }, { "epoch": 0.19, "learning_rate": 9.117701952681805e-05, "loss": 2.3411, "step": 22580 }, { "epoch": 0.19, "learning_rate": 9.117321406339073e-05, "loss": 2.3602, "step": 22585 }, { "epoch": 0.19, "learning_rate": 9.116940785891841e-05, "loss": 2.4408, "step": 22590 }, { "epoch": 0.19, "learning_rate": 9.116560091346959e-05, "loss": 2.4442, "step": 22595 }, { "epoch": 0.19, "learning_rate": 9.11617932271128e-05, "loss": 2.2914, "step": 22600 }, { "epoch": 0.19, "learning_rate": 9.115798479991654e-05, "loss": 2.3942, "step": 22605 }, { "epoch": 0.19, "learning_rate": 9.115417563194937e-05, "loss": 2.3467, "step": 22610 }, { "epoch": 0.19, "learning_rate": 9.115036572327986e-05, "loss": 2.3572, "step": 22615 }, { "epoch": 0.19, "learning_rate": 9.11465550739766e-05, "loss": 2.4224, "step": 22620 }, { "epoch": 0.19, "learning_rate": 9.114274368410811e-05, "loss": 2.3343, "step": 22625 }, { "epoch": 0.19, "learning_rate": 9.113893155374305e-05, "loss": 2.3074, "step": 22630 }, { "epoch": 0.19, "learning_rate": 9.113511868295e-05, "loss": 2.3651, "step": 22635 }, { "epoch": 0.19, "learning_rate": 9.11313050717976e-05, "loss": 2.3889, "step": 22640 }, { "epoch": 0.19, "learning_rate": 9.112749072035447e-05, "loss": 2.434, "step": 22645 }, { "epoch": 0.19, "learning_rate": 9.112367562868928e-05, "loss": 2.3429, "step": 22650 }, { "epoch": 0.19, "learning_rate": 9.11198597968707e-05, "loss": 2.3463, "step": 22655 }, { "epoch": 0.19, "learning_rate": 9.111604322496739e-05, "loss": 2.275, "step": 22660 }, { "epoch": 0.19, "learning_rate": 9.111222591304804e-05, "loss": 2.3106, "step": 22665 }, { "epoch": 0.19, "learning_rate": 9.110840786118136e-05, "loss": 2.2361, "step": 22670 }, { "epoch": 0.19, "learning_rate": 9.110458906943608e-05, "loss": 2.2877, "step": 22675 }, { "epoch": 0.19, "learning_rate": 9.110076953788092e-05, "loss": 2.4383, "step": 22680 }, { "epoch": 0.19, "learning_rate": 9.109694926658463e-05, "loss": 2.2596, "step": 22685 }, { "epoch": 0.19, "learning_rate": 9.109312825561598e-05, "loss": 2.3414, "step": 22690 }, { "epoch": 0.19, "learning_rate": 9.10893065050437e-05, "loss": 2.314, "step": 22695 }, { "epoch": 0.19, "learning_rate": 9.108548401493662e-05, "loss": 2.3149, "step": 22700 }, { "epoch": 0.19, "learning_rate": 9.108166078536351e-05, "loss": 2.3604, "step": 22705 }, { "epoch": 0.19, "learning_rate": 9.10778368163932e-05, "loss": 2.3297, "step": 22710 }, { "epoch": 0.19, "learning_rate": 9.107401210809449e-05, "loss": 2.417, "step": 22715 }, { "epoch": 0.19, "learning_rate": 9.107018666053626e-05, "loss": 2.3158, "step": 22720 }, { "epoch": 0.19, "learning_rate": 9.106636047378732e-05, "loss": 2.3881, "step": 22725 }, { "epoch": 0.19, "learning_rate": 9.106253354791654e-05, "loss": 2.3291, "step": 22730 }, { "epoch": 0.19, "learning_rate": 9.105870588299284e-05, "loss": 2.3863, "step": 22735 }, { "epoch": 0.19, "learning_rate": 9.105487747908505e-05, "loss": 2.3644, "step": 22740 }, { "epoch": 0.19, "learning_rate": 9.105104833626211e-05, "loss": 2.3542, "step": 22745 }, { "epoch": 0.19, "learning_rate": 9.104721845459294e-05, "loss": 2.3699, "step": 22750 }, { "epoch": 0.19, "learning_rate": 9.104338783414646e-05, "loss": 2.3169, "step": 22755 }, { "epoch": 0.19, "learning_rate": 9.103955647499161e-05, "loss": 2.3052, "step": 22760 }, { "epoch": 0.19, "learning_rate": 9.103572437719736e-05, "loss": 2.3269, "step": 22765 }, { "epoch": 0.19, "learning_rate": 9.103189154083266e-05, "loss": 2.3204, "step": 22770 }, { "epoch": 0.19, "learning_rate": 9.102805796596652e-05, "loss": 2.3679, "step": 22775 }, { "epoch": 0.19, "learning_rate": 9.102422365266793e-05, "loss": 2.3111, "step": 22780 }, { "epoch": 0.19, "learning_rate": 9.10203886010059e-05, "loss": 2.3508, "step": 22785 }, { "epoch": 0.19, "learning_rate": 9.101655281104944e-05, "loss": 2.3285, "step": 22790 }, { "epoch": 0.19, "learning_rate": 9.101271628286762e-05, "loss": 2.2934, "step": 22795 }, { "epoch": 0.19, "learning_rate": 9.100887901652945e-05, "loss": 2.3936, "step": 22800 }, { "epoch": 0.19, "learning_rate": 9.100504101210403e-05, "loss": 2.3293, "step": 22805 }, { "epoch": 0.19, "learning_rate": 9.100120226966042e-05, "loss": 2.3623, "step": 22810 }, { "epoch": 0.19, "learning_rate": 9.09973627892677e-05, "loss": 2.3, "step": 22815 }, { "epoch": 0.19, "learning_rate": 9.099352257099501e-05, "loss": 2.3649, "step": 22820 }, { "epoch": 0.19, "learning_rate": 9.098968161491141e-05, "loss": 2.3487, "step": 22825 }, { "epoch": 0.19, "learning_rate": 9.098583992108609e-05, "loss": 2.3649, "step": 22830 }, { "epoch": 0.19, "learning_rate": 9.098199748958815e-05, "loss": 2.3426, "step": 22835 }, { "epoch": 0.19, "learning_rate": 9.097815432048678e-05, "loss": 2.4159, "step": 22840 }, { "epoch": 0.19, "learning_rate": 9.097431041385113e-05, "loss": 2.3362, "step": 22845 }, { "epoch": 0.19, "learning_rate": 9.097046576975038e-05, "loss": 2.408, "step": 22850 }, { "epoch": 0.2, "learning_rate": 9.096662038825375e-05, "loss": 2.3477, "step": 22855 }, { "epoch": 0.2, "learning_rate": 9.096277426943042e-05, "loss": 2.3268, "step": 22860 }, { "epoch": 0.2, "learning_rate": 9.095892741334964e-05, "loss": 2.378, "step": 22865 }, { "epoch": 0.2, "learning_rate": 9.095507982008063e-05, "loss": 2.3211, "step": 22870 }, { "epoch": 0.2, "learning_rate": 9.095123148969264e-05, "loss": 2.3392, "step": 22875 }, { "epoch": 0.2, "learning_rate": 9.094738242225494e-05, "loss": 2.3525, "step": 22880 }, { "epoch": 0.2, "learning_rate": 9.09435326178368e-05, "loss": 2.3861, "step": 22885 }, { "epoch": 0.2, "learning_rate": 9.093968207650752e-05, "loss": 2.2953, "step": 22890 }, { "epoch": 0.2, "learning_rate": 9.09358307983364e-05, "loss": 2.3194, "step": 22895 }, { "epoch": 0.2, "learning_rate": 9.093197878339274e-05, "loss": 2.3987, "step": 22900 }, { "epoch": 0.2, "learning_rate": 9.092812603174589e-05, "loss": 2.3386, "step": 22905 }, { "epoch": 0.2, "learning_rate": 9.09242725434652e-05, "loss": 2.2967, "step": 22910 }, { "epoch": 0.2, "learning_rate": 9.092041831862e-05, "loss": 2.4124, "step": 22915 }, { "epoch": 0.2, "learning_rate": 9.091656335727966e-05, "loss": 2.3702, "step": 22920 }, { "epoch": 0.2, "learning_rate": 9.091270765951359e-05, "loss": 2.3425, "step": 22925 }, { "epoch": 0.2, "learning_rate": 9.090885122539115e-05, "loss": 2.3978, "step": 22930 }, { "epoch": 0.2, "learning_rate": 9.090499405498178e-05, "loss": 2.3814, "step": 22935 }, { "epoch": 0.2, "learning_rate": 9.09011361483549e-05, "loss": 2.3601, "step": 22940 }, { "epoch": 0.2, "learning_rate": 9.089727750557991e-05, "loss": 2.3173, "step": 22945 }, { "epoch": 0.2, "learning_rate": 9.08934181267263e-05, "loss": 2.4242, "step": 22950 }, { "epoch": 0.2, "learning_rate": 9.088955801186351e-05, "loss": 2.3354, "step": 22955 }, { "epoch": 0.2, "learning_rate": 9.088569716106104e-05, "loss": 2.3538, "step": 22960 }, { "epoch": 0.2, "learning_rate": 9.088183557438834e-05, "loss": 2.3855, "step": 22965 }, { "epoch": 0.2, "learning_rate": 9.087797325191494e-05, "loss": 2.3882, "step": 22970 }, { "epoch": 0.2, "learning_rate": 9.087411019371034e-05, "loss": 2.3591, "step": 22975 }, { "epoch": 0.2, "learning_rate": 9.087024639984407e-05, "loss": 2.3396, "step": 22980 }, { "epoch": 0.2, "learning_rate": 9.08663818703857e-05, "loss": 2.4431, "step": 22985 }, { "epoch": 0.2, "learning_rate": 9.086251660540475e-05, "loss": 2.3241, "step": 22990 }, { "epoch": 0.2, "learning_rate": 9.085865060497078e-05, "loss": 2.4122, "step": 22995 }, { "epoch": 0.2, "learning_rate": 9.08547838691534e-05, "loss": 2.343, "step": 23000 }, { "epoch": 0.2, "learning_rate": 9.085091639802222e-05, "loss": 2.3244, "step": 23005 }, { "epoch": 0.2, "learning_rate": 9.084704819164679e-05, "loss": 2.3464, "step": 23010 }, { "epoch": 0.2, "learning_rate": 9.084317925009678e-05, "loss": 2.3784, "step": 23015 }, { "epoch": 0.2, "learning_rate": 9.08393095734418e-05, "loss": 2.3126, "step": 23020 }, { "epoch": 0.2, "learning_rate": 9.08354391617515e-05, "loss": 2.3166, "step": 23025 }, { "epoch": 0.2, "learning_rate": 9.083156801509554e-05, "loss": 2.3132, "step": 23030 }, { "epoch": 0.2, "learning_rate": 9.082769613354362e-05, "loss": 2.3923, "step": 23035 }, { "epoch": 0.2, "learning_rate": 9.082382351716538e-05, "loss": 2.4303, "step": 23040 }, { "epoch": 0.2, "learning_rate": 9.081995016603057e-05, "loss": 2.3175, "step": 23045 }, { "epoch": 0.2, "learning_rate": 9.081607608020888e-05, "loss": 2.2134, "step": 23050 }, { "epoch": 0.2, "learning_rate": 9.081220125977001e-05, "loss": 2.3621, "step": 23055 }, { "epoch": 0.2, "learning_rate": 9.080832570478374e-05, "loss": 2.4259, "step": 23060 }, { "epoch": 0.2, "learning_rate": 9.080444941531983e-05, "loss": 2.3258, "step": 23065 }, { "epoch": 0.2, "learning_rate": 9.0800572391448e-05, "loss": 2.3108, "step": 23070 }, { "epoch": 0.2, "learning_rate": 9.079669463323807e-05, "loss": 2.3817, "step": 23075 }, { "epoch": 0.2, "learning_rate": 9.079281614075981e-05, "loss": 2.3281, "step": 23080 }, { "epoch": 0.2, "learning_rate": 9.078893691408303e-05, "loss": 2.3395, "step": 23085 }, { "epoch": 0.2, "learning_rate": 9.078505695327755e-05, "loss": 2.3382, "step": 23090 }, { "epoch": 0.2, "learning_rate": 9.078117625841323e-05, "loss": 2.3397, "step": 23095 }, { "epoch": 0.2, "learning_rate": 9.077729482955987e-05, "loss": 2.351, "step": 23100 }, { "epoch": 0.2, "learning_rate": 9.077341266678734e-05, "loss": 2.3633, "step": 23105 }, { "epoch": 0.2, "learning_rate": 9.076952977016555e-05, "loss": 2.3449, "step": 23110 }, { "epoch": 0.2, "learning_rate": 9.076564613976434e-05, "loss": 2.3224, "step": 23115 }, { "epoch": 0.2, "learning_rate": 9.076176177565363e-05, "loss": 2.4321, "step": 23120 }, { "epoch": 0.2, "learning_rate": 9.075787667790333e-05, "loss": 2.4091, "step": 23125 }, { "epoch": 0.2, "learning_rate": 9.075399084658336e-05, "loss": 2.3557, "step": 23130 }, { "epoch": 0.2, "learning_rate": 9.075010428176365e-05, "loss": 2.3285, "step": 23135 }, { "epoch": 0.2, "learning_rate": 9.074621698351418e-05, "loss": 2.3218, "step": 23140 }, { "epoch": 0.2, "learning_rate": 9.074232895190489e-05, "loss": 2.3235, "step": 23145 }, { "epoch": 0.2, "learning_rate": 9.073844018700574e-05, "loss": 2.3798, "step": 23150 }, { "epoch": 0.2, "learning_rate": 9.073455068888679e-05, "loss": 2.3127, "step": 23155 }, { "epoch": 0.2, "learning_rate": 9.073066045761798e-05, "loss": 2.3605, "step": 23160 }, { "epoch": 0.2, "learning_rate": 9.072676949326933e-05, "loss": 2.3245, "step": 23165 }, { "epoch": 0.2, "learning_rate": 9.07228777959109e-05, "loss": 2.2976, "step": 23170 }, { "epoch": 0.2, "learning_rate": 9.071898536561272e-05, "loss": 2.2582, "step": 23175 }, { "epoch": 0.2, "learning_rate": 9.071509220244484e-05, "loss": 2.3846, "step": 23180 }, { "epoch": 0.2, "learning_rate": 9.071119830647735e-05, "loss": 2.3818, "step": 23185 }, { "epoch": 0.2, "learning_rate": 9.070730367778031e-05, "loss": 2.4317, "step": 23190 }, { "epoch": 0.2, "learning_rate": 9.070340831642383e-05, "loss": 2.2481, "step": 23195 }, { "epoch": 0.2, "learning_rate": 9.069951222247802e-05, "loss": 2.4165, "step": 23200 }, { "epoch": 0.2, "learning_rate": 9.0695615396013e-05, "loss": 2.379, "step": 23205 }, { "epoch": 0.2, "learning_rate": 9.069171783709892e-05, "loss": 2.3902, "step": 23210 }, { "epoch": 0.2, "learning_rate": 9.068781954580587e-05, "loss": 2.3805, "step": 23215 }, { "epoch": 0.2, "learning_rate": 9.068392052220409e-05, "loss": 2.3963, "step": 23220 }, { "epoch": 0.2, "learning_rate": 9.068002076636373e-05, "loss": 2.3136, "step": 23225 }, { "epoch": 0.2, "learning_rate": 9.067612027835495e-05, "loss": 2.343, "step": 23230 }, { "epoch": 0.2, "learning_rate": 9.067221905824798e-05, "loss": 2.3674, "step": 23235 }, { "epoch": 0.2, "learning_rate": 9.066831710611304e-05, "loss": 2.3292, "step": 23240 }, { "epoch": 0.2, "learning_rate": 9.066441442202031e-05, "loss": 2.408, "step": 23245 }, { "epoch": 0.2, "learning_rate": 9.066051100604011e-05, "loss": 2.3497, "step": 23250 }, { "epoch": 0.2, "learning_rate": 9.065660685824262e-05, "loss": 2.2631, "step": 23255 }, { "epoch": 0.2, "learning_rate": 9.065270197869816e-05, "loss": 2.3547, "step": 23260 }, { "epoch": 0.2, "learning_rate": 9.064879636747698e-05, "loss": 2.3236, "step": 23265 }, { "epoch": 0.2, "learning_rate": 9.06448900246494e-05, "loss": 2.3638, "step": 23270 }, { "epoch": 0.2, "learning_rate": 9.06409829502857e-05, "loss": 2.2802, "step": 23275 }, { "epoch": 0.2, "learning_rate": 9.063707514445622e-05, "loss": 2.3653, "step": 23280 }, { "epoch": 0.2, "learning_rate": 9.063316660723128e-05, "loss": 2.3338, "step": 23285 }, { "epoch": 0.2, "learning_rate": 9.062925733868124e-05, "loss": 2.3874, "step": 23290 }, { "epoch": 0.2, "learning_rate": 9.062534733887645e-05, "loss": 2.3121, "step": 23295 }, { "epoch": 0.2, "learning_rate": 9.062143660788727e-05, "loss": 2.2827, "step": 23300 }, { "epoch": 0.2, "learning_rate": 9.061752514578412e-05, "loss": 2.3888, "step": 23305 }, { "epoch": 0.2, "learning_rate": 9.061361295263737e-05, "loss": 2.3882, "step": 23310 }, { "epoch": 0.2, "learning_rate": 9.060970002851747e-05, "loss": 2.3772, "step": 23315 }, { "epoch": 0.2, "learning_rate": 9.06057863734948e-05, "loss": 2.3265, "step": 23320 }, { "epoch": 0.2, "learning_rate": 9.06018719876398e-05, "loss": 2.4715, "step": 23325 }, { "epoch": 0.2, "learning_rate": 9.059795687102297e-05, "loss": 2.3052, "step": 23330 }, { "epoch": 0.2, "learning_rate": 9.059404102371473e-05, "loss": 2.3714, "step": 23335 }, { "epoch": 0.2, "learning_rate": 9.05901244457856e-05, "loss": 2.4077, "step": 23340 }, { "epoch": 0.2, "learning_rate": 9.058620713730602e-05, "loss": 2.3639, "step": 23345 }, { "epoch": 0.2, "learning_rate": 9.058228909834653e-05, "loss": 2.2573, "step": 23350 }, { "epoch": 0.2, "learning_rate": 9.057837032897763e-05, "loss": 2.391, "step": 23355 }, { "epoch": 0.2, "learning_rate": 9.057445082926988e-05, "loss": 2.3669, "step": 23360 }, { "epoch": 0.2, "learning_rate": 9.057053059929379e-05, "loss": 2.3665, "step": 23365 }, { "epoch": 0.2, "learning_rate": 9.056660963911992e-05, "loss": 2.3804, "step": 23370 }, { "epoch": 0.2, "learning_rate": 9.056268794881886e-05, "loss": 2.3365, "step": 23375 }, { "epoch": 0.2, "learning_rate": 9.055876552846119e-05, "loss": 2.4101, "step": 23380 }, { "epoch": 0.2, "learning_rate": 9.055484237811748e-05, "loss": 2.2751, "step": 23385 }, { "epoch": 0.2, "learning_rate": 9.055091849785838e-05, "loss": 2.2713, "step": 23390 }, { "epoch": 0.2, "learning_rate": 9.05469938877545e-05, "loss": 2.409, "step": 23395 }, { "epoch": 0.2, "learning_rate": 9.054306854787644e-05, "loss": 2.3702, "step": 23400 }, { "epoch": 0.2, "learning_rate": 9.053914247829492e-05, "loss": 2.3222, "step": 23405 }, { "epoch": 0.2, "learning_rate": 9.053521567908052e-05, "loss": 2.299, "step": 23410 }, { "epoch": 0.2, "learning_rate": 9.053128815030398e-05, "loss": 2.4127, "step": 23415 }, { "epoch": 0.2, "learning_rate": 9.052735989203595e-05, "loss": 2.3414, "step": 23420 }, { "epoch": 0.2, "learning_rate": 9.052343090434716e-05, "loss": 2.4119, "step": 23425 }, { "epoch": 0.2, "learning_rate": 9.051950118730832e-05, "loss": 2.3836, "step": 23430 }, { "epoch": 0.2, "learning_rate": 9.051557074099012e-05, "loss": 2.3471, "step": 23435 }, { "epoch": 0.2, "learning_rate": 9.051163956546336e-05, "loss": 2.3792, "step": 23440 }, { "epoch": 0.2, "learning_rate": 9.050770766079874e-05, "loss": 2.4227, "step": 23445 }, { "epoch": 0.2, "learning_rate": 9.050377502706708e-05, "loss": 2.2794, "step": 23450 }, { "epoch": 0.2, "learning_rate": 9.049984166433911e-05, "loss": 2.3581, "step": 23455 }, { "epoch": 0.2, "learning_rate": 9.049590757268566e-05, "loss": 2.3366, "step": 23460 }, { "epoch": 0.2, "learning_rate": 9.049197275217751e-05, "loss": 2.4155, "step": 23465 }, { "epoch": 0.2, "learning_rate": 9.04880372028855e-05, "loss": 2.3327, "step": 23470 }, { "epoch": 0.2, "learning_rate": 9.048410092488046e-05, "loss": 2.3307, "step": 23475 }, { "epoch": 0.2, "learning_rate": 9.048016391823322e-05, "loss": 2.4106, "step": 23480 }, { "epoch": 0.2, "learning_rate": 9.047622618301465e-05, "loss": 2.4286, "step": 23485 }, { "epoch": 0.2, "learning_rate": 9.047228771929564e-05, "loss": 2.3908, "step": 23490 }, { "epoch": 0.2, "learning_rate": 9.046834852714705e-05, "loss": 2.3934, "step": 23495 }, { "epoch": 0.2, "learning_rate": 9.046440860663978e-05, "loss": 2.3253, "step": 23500 }, { "epoch": 0.2, "learning_rate": 9.046046795784475e-05, "loss": 2.3157, "step": 23505 }, { "epoch": 0.2, "learning_rate": 9.04565265808329e-05, "loss": 2.3059, "step": 23510 }, { "epoch": 0.2, "learning_rate": 9.045258447567513e-05, "loss": 2.327, "step": 23515 }, { "epoch": 0.2, "learning_rate": 9.044864164244242e-05, "loss": 2.3204, "step": 23520 }, { "epoch": 0.2, "learning_rate": 9.044469808120572e-05, "loss": 2.3078, "step": 23525 }, { "epoch": 0.2, "learning_rate": 9.044075379203603e-05, "loss": 2.2848, "step": 23530 }, { "epoch": 0.2, "learning_rate": 9.043680877500431e-05, "loss": 2.3303, "step": 23535 }, { "epoch": 0.2, "learning_rate": 9.043286303018157e-05, "loss": 2.403, "step": 23540 }, { "epoch": 0.2, "learning_rate": 9.042891655763885e-05, "loss": 2.3028, "step": 23545 }, { "epoch": 0.2, "learning_rate": 9.042496935744715e-05, "loss": 2.326, "step": 23550 }, { "epoch": 0.2, "learning_rate": 9.042102142967754e-05, "loss": 2.408, "step": 23555 }, { "epoch": 0.2, "learning_rate": 9.041707277440103e-05, "loss": 2.2486, "step": 23560 }, { "epoch": 0.2, "learning_rate": 9.041312339168874e-05, "loss": 2.3359, "step": 23565 }, { "epoch": 0.2, "learning_rate": 9.040917328161174e-05, "loss": 2.3864, "step": 23570 }, { "epoch": 0.2, "learning_rate": 9.040522244424111e-05, "loss": 2.3866, "step": 23575 }, { "epoch": 0.2, "learning_rate": 9.040127087964795e-05, "loss": 2.3451, "step": 23580 }, { "epoch": 0.2, "learning_rate": 9.039731858790342e-05, "loss": 2.367, "step": 23585 }, { "epoch": 0.2, "learning_rate": 9.039336556907863e-05, "loss": 2.4076, "step": 23590 }, { "epoch": 0.2, "learning_rate": 9.038941182324471e-05, "loss": 2.3395, "step": 23595 }, { "epoch": 0.2, "learning_rate": 9.038545735047284e-05, "loss": 2.35, "step": 23600 }, { "epoch": 0.2, "learning_rate": 9.03815021508342e-05, "loss": 2.3696, "step": 23605 }, { "epoch": 0.2, "learning_rate": 9.037754622439996e-05, "loss": 2.4099, "step": 23610 }, { "epoch": 0.2, "learning_rate": 9.037358957124134e-05, "loss": 2.3629, "step": 23615 }, { "epoch": 0.2, "learning_rate": 9.036963219142954e-05, "loss": 2.4035, "step": 23620 }, { "epoch": 0.2, "learning_rate": 9.036567408503576e-05, "loss": 2.3797, "step": 23625 }, { "epoch": 0.2, "learning_rate": 9.036171525213128e-05, "loss": 2.4056, "step": 23630 }, { "epoch": 0.2, "learning_rate": 9.035775569278735e-05, "loss": 2.3793, "step": 23635 }, { "epoch": 0.2, "learning_rate": 9.03537954070752e-05, "loss": 2.3288, "step": 23640 }, { "epoch": 0.2, "learning_rate": 9.034983439506614e-05, "loss": 2.3389, "step": 23645 }, { "epoch": 0.2, "learning_rate": 9.034587265683147e-05, "loss": 2.3988, "step": 23650 }, { "epoch": 0.2, "learning_rate": 9.034191019244245e-05, "loss": 2.3241, "step": 23655 }, { "epoch": 0.2, "learning_rate": 9.033794700197045e-05, "loss": 2.3398, "step": 23660 }, { "epoch": 0.2, "learning_rate": 9.033398308548675e-05, "loss": 2.342, "step": 23665 }, { "epoch": 0.2, "learning_rate": 9.033001844306272e-05, "loss": 2.2998, "step": 23670 }, { "epoch": 0.2, "learning_rate": 9.03260530747697e-05, "loss": 2.2835, "step": 23675 }, { "epoch": 0.2, "learning_rate": 9.03220869806791e-05, "loss": 2.3022, "step": 23680 }, { "epoch": 0.2, "learning_rate": 9.031812016086227e-05, "loss": 2.3247, "step": 23685 }, { "epoch": 0.2, "learning_rate": 9.031415261539061e-05, "loss": 2.3367, "step": 23690 }, { "epoch": 0.2, "learning_rate": 9.031018434433554e-05, "loss": 2.3882, "step": 23695 }, { "epoch": 0.2, "learning_rate": 9.030621534776847e-05, "loss": 2.3406, "step": 23700 }, { "epoch": 0.2, "learning_rate": 9.030224562576082e-05, "loss": 2.3628, "step": 23705 }, { "epoch": 0.2, "learning_rate": 9.029827517838406e-05, "loss": 2.3613, "step": 23710 }, { "epoch": 0.2, "learning_rate": 9.029430400570966e-05, "loss": 2.3497, "step": 23715 }, { "epoch": 0.2, "learning_rate": 9.029033210780906e-05, "loss": 2.3276, "step": 23720 }, { "epoch": 0.2, "learning_rate": 9.028635948475378e-05, "loss": 2.3578, "step": 23725 }, { "epoch": 0.2, "learning_rate": 9.02823861366153e-05, "loss": 2.4138, "step": 23730 }, { "epoch": 0.2, "learning_rate": 9.027841206346514e-05, "loss": 2.3265, "step": 23735 }, { "epoch": 0.2, "learning_rate": 9.027443726537484e-05, "loss": 2.2094, "step": 23740 }, { "epoch": 0.2, "learning_rate": 9.027046174241592e-05, "loss": 2.3957, "step": 23745 }, { "epoch": 0.2, "learning_rate": 9.026648549465994e-05, "loss": 2.3736, "step": 23750 }, { "epoch": 0.2, "learning_rate": 9.026250852217845e-05, "loss": 2.3164, "step": 23755 }, { "epoch": 0.2, "learning_rate": 9.025853082504308e-05, "loss": 2.3366, "step": 23760 }, { "epoch": 0.2, "learning_rate": 9.025455240332536e-05, "loss": 2.3279, "step": 23765 }, { "epoch": 0.2, "learning_rate": 9.025057325709691e-05, "loss": 2.3358, "step": 23770 }, { "epoch": 0.2, "learning_rate": 9.024659338642936e-05, "loss": 2.2883, "step": 23775 }, { "epoch": 0.2, "learning_rate": 9.024261279139435e-05, "loss": 2.2912, "step": 23780 }, { "epoch": 0.2, "learning_rate": 9.023863147206351e-05, "loss": 2.4055, "step": 23785 }, { "epoch": 0.2, "learning_rate": 9.023464942850849e-05, "loss": 2.3535, "step": 23790 }, { "epoch": 0.2, "learning_rate": 9.023066666080095e-05, "loss": 2.3378, "step": 23795 }, { "epoch": 0.2, "learning_rate": 9.022668316901261e-05, "loss": 2.2997, "step": 23800 }, { "epoch": 0.2, "learning_rate": 9.022269895321516e-05, "loss": 2.3422, "step": 23805 }, { "epoch": 0.2, "learning_rate": 9.021871401348028e-05, "loss": 2.3628, "step": 23810 }, { "epoch": 0.2, "learning_rate": 9.021472834987969e-05, "loss": 2.2751, "step": 23815 }, { "epoch": 0.2, "learning_rate": 9.021074196248516e-05, "loss": 2.3568, "step": 23820 }, { "epoch": 0.2, "learning_rate": 9.020675485136842e-05, "loss": 2.3606, "step": 23825 }, { "epoch": 0.2, "learning_rate": 9.020276701660122e-05, "loss": 2.4086, "step": 23830 }, { "epoch": 0.2, "learning_rate": 9.019877845825536e-05, "loss": 2.3877, "step": 23835 }, { "epoch": 0.2, "learning_rate": 9.01947891764026e-05, "loss": 2.28, "step": 23840 }, { "epoch": 0.2, "learning_rate": 9.019079917111474e-05, "loss": 2.3671, "step": 23845 }, { "epoch": 0.2, "learning_rate": 9.018680844246363e-05, "loss": 2.2851, "step": 23850 }, { "epoch": 0.2, "learning_rate": 9.018281699052105e-05, "loss": 2.3627, "step": 23855 }, { "epoch": 0.2, "learning_rate": 9.017882481535887e-05, "loss": 2.3659, "step": 23860 }, { "epoch": 0.2, "learning_rate": 9.017483191704892e-05, "loss": 2.4276, "step": 23865 }, { "epoch": 0.2, "learning_rate": 9.017083829566308e-05, "loss": 2.3843, "step": 23870 }, { "epoch": 0.2, "learning_rate": 9.016684395127324e-05, "loss": 2.3693, "step": 23875 }, { "epoch": 0.2, "learning_rate": 9.016284888395126e-05, "loss": 2.3834, "step": 23880 }, { "epoch": 0.2, "learning_rate": 9.015885309376907e-05, "loss": 2.2773, "step": 23885 }, { "epoch": 0.2, "learning_rate": 9.015485658079857e-05, "loss": 2.4106, "step": 23890 }, { "epoch": 0.2, "learning_rate": 9.01508593451117e-05, "loss": 2.2982, "step": 23895 }, { "epoch": 0.2, "learning_rate": 9.014686138678039e-05, "loss": 2.3119, "step": 23900 }, { "epoch": 0.2, "learning_rate": 9.014286270587662e-05, "loss": 2.3525, "step": 23905 }, { "epoch": 0.2, "learning_rate": 9.013886330247234e-05, "loss": 2.3379, "step": 23910 }, { "epoch": 0.2, "learning_rate": 9.013486317663955e-05, "loss": 2.2523, "step": 23915 }, { "epoch": 0.2, "learning_rate": 9.013086232845022e-05, "loss": 2.365, "step": 23920 }, { "epoch": 0.2, "learning_rate": 9.012686075797637e-05, "loss": 2.3371, "step": 23925 }, { "epoch": 0.2, "learning_rate": 9.012285846529003e-05, "loss": 2.3872, "step": 23930 }, { "epoch": 0.2, "learning_rate": 9.011885545046321e-05, "loss": 2.2782, "step": 23935 }, { "epoch": 0.2, "learning_rate": 9.0114851713568e-05, "loss": 2.3209, "step": 23940 }, { "epoch": 0.2, "learning_rate": 9.011084725467643e-05, "loss": 2.2416, "step": 23945 }, { "epoch": 0.2, "learning_rate": 9.010684207386056e-05, "loss": 2.3162, "step": 23950 }, { "epoch": 0.2, "learning_rate": 9.01028361711925e-05, "loss": 2.3334, "step": 23955 }, { "epoch": 0.2, "learning_rate": 9.009882954674433e-05, "loss": 2.3314, "step": 23960 }, { "epoch": 0.2, "learning_rate": 9.009482220058821e-05, "loss": 2.3394, "step": 23965 }, { "epoch": 0.2, "learning_rate": 9.009081413279621e-05, "loss": 2.4082, "step": 23970 }, { "epoch": 0.2, "learning_rate": 9.008680534344047e-05, "loss": 2.3318, "step": 23975 }, { "epoch": 0.2, "learning_rate": 9.008279583259318e-05, "loss": 2.3341, "step": 23980 }, { "epoch": 0.2, "learning_rate": 9.007878560032648e-05, "loss": 2.3371, "step": 23985 }, { "epoch": 0.2, "learning_rate": 9.007477464671256e-05, "loss": 2.3339, "step": 23990 }, { "epoch": 0.2, "learning_rate": 9.007076297182359e-05, "loss": 2.3232, "step": 23995 }, { "epoch": 0.2, "learning_rate": 9.006675057573178e-05, "loss": 2.3211, "step": 24000 }, { "epoch": 0.2, "learning_rate": 9.006273745850934e-05, "loss": 2.322, "step": 24005 }, { "epoch": 0.2, "learning_rate": 9.005872362022854e-05, "loss": 2.3038, "step": 24010 }, { "epoch": 0.2, "learning_rate": 9.005470906096156e-05, "loss": 2.3369, "step": 24015 }, { "epoch": 0.2, "learning_rate": 9.00506937807807e-05, "loss": 2.3481, "step": 24020 }, { "epoch": 0.21, "learning_rate": 9.004667777975822e-05, "loss": 2.2981, "step": 24025 }, { "epoch": 0.21, "learning_rate": 9.004266105796637e-05, "loss": 2.3703, "step": 24030 }, { "epoch": 0.21, "learning_rate": 9.003864361547749e-05, "loss": 2.3017, "step": 24035 }, { "epoch": 0.21, "learning_rate": 9.003462545236385e-05, "loss": 2.3136, "step": 24040 }, { "epoch": 0.21, "learning_rate": 9.003060656869781e-05, "loss": 2.384, "step": 24045 }, { "epoch": 0.21, "learning_rate": 9.002658696455167e-05, "loss": 2.4593, "step": 24050 }, { "epoch": 0.21, "learning_rate": 9.002256663999775e-05, "loss": 2.3827, "step": 24055 }, { "epoch": 0.21, "learning_rate": 9.001854559510847e-05, "loss": 2.3062, "step": 24060 }, { "epoch": 0.21, "learning_rate": 9.001452382995617e-05, "loss": 2.3644, "step": 24065 }, { "epoch": 0.21, "learning_rate": 9.001050134461324e-05, "loss": 2.2345, "step": 24070 }, { "epoch": 0.21, "learning_rate": 9.000647813915208e-05, "loss": 2.4356, "step": 24075 }, { "epoch": 0.21, "learning_rate": 9.000245421364509e-05, "loss": 2.3192, "step": 24080 }, { "epoch": 0.21, "learning_rate": 8.99984295681647e-05, "loss": 2.417, "step": 24085 }, { "epoch": 0.21, "learning_rate": 8.999440420278335e-05, "loss": 2.3926, "step": 24090 }, { "epoch": 0.21, "learning_rate": 8.999037811757348e-05, "loss": 2.4023, "step": 24095 }, { "epoch": 0.21, "learning_rate": 8.998635131260757e-05, "loss": 2.3408, "step": 24100 }, { "epoch": 0.21, "learning_rate": 8.998232378795808e-05, "loss": 2.3771, "step": 24105 }, { "epoch": 0.21, "learning_rate": 8.99782955436975e-05, "loss": 2.368, "step": 24110 }, { "epoch": 0.21, "learning_rate": 8.997426657989832e-05, "loss": 2.3914, "step": 24115 }, { "epoch": 0.21, "learning_rate": 8.997023689663308e-05, "loss": 2.3352, "step": 24120 }, { "epoch": 0.21, "learning_rate": 8.99662064939743e-05, "loss": 2.337, "step": 24125 }, { "epoch": 0.21, "learning_rate": 8.996217537199452e-05, "loss": 2.3742, "step": 24130 }, { "epoch": 0.21, "learning_rate": 8.995814353076627e-05, "loss": 2.4176, "step": 24135 }, { "epoch": 0.21, "learning_rate": 8.995411097036214e-05, "loss": 2.3353, "step": 24140 }, { "epoch": 0.21, "learning_rate": 8.99500776908547e-05, "loss": 2.3661, "step": 24145 }, { "epoch": 0.21, "learning_rate": 8.994604369231657e-05, "loss": 2.3999, "step": 24150 }, { "epoch": 0.21, "learning_rate": 8.99420089748203e-05, "loss": 2.2771, "step": 24155 }, { "epoch": 0.21, "learning_rate": 8.993797353843856e-05, "loss": 2.3813, "step": 24160 }, { "epoch": 0.21, "learning_rate": 8.993393738324394e-05, "loss": 2.3816, "step": 24165 }, { "epoch": 0.21, "learning_rate": 8.99299005093091e-05, "loss": 2.3422, "step": 24170 }, { "epoch": 0.21, "learning_rate": 8.992586291670671e-05, "loss": 2.3853, "step": 24175 }, { "epoch": 0.21, "learning_rate": 8.992182460550943e-05, "loss": 2.2961, "step": 24180 }, { "epoch": 0.21, "learning_rate": 8.991778557578994e-05, "loss": 2.3235, "step": 24185 }, { "epoch": 0.21, "learning_rate": 8.991374582762093e-05, "loss": 2.3312, "step": 24190 }, { "epoch": 0.21, "learning_rate": 8.99097053610751e-05, "loss": 2.4255, "step": 24195 }, { "epoch": 0.21, "learning_rate": 8.990566417622521e-05, "loss": 2.3522, "step": 24200 }, { "epoch": 0.21, "learning_rate": 8.990162227314396e-05, "loss": 2.4004, "step": 24205 }, { "epoch": 0.21, "learning_rate": 8.989757965190411e-05, "loss": 2.3816, "step": 24210 }, { "epoch": 0.21, "learning_rate": 8.989353631257841e-05, "loss": 2.2889, "step": 24215 }, { "epoch": 0.21, "learning_rate": 8.988949225523964e-05, "loss": 2.42, "step": 24220 }, { "epoch": 0.21, "learning_rate": 8.98854474799606e-05, "loss": 2.3019, "step": 24225 }, { "epoch": 0.21, "learning_rate": 8.988140198681406e-05, "loss": 2.3579, "step": 24230 }, { "epoch": 0.21, "learning_rate": 8.987735577587285e-05, "loss": 2.3252, "step": 24235 }, { "epoch": 0.21, "learning_rate": 8.98733088472098e-05, "loss": 2.3584, "step": 24240 }, { "epoch": 0.21, "learning_rate": 8.986926120089772e-05, "loss": 2.3208, "step": 24245 }, { "epoch": 0.21, "learning_rate": 8.986521283700949e-05, "loss": 2.2907, "step": 24250 }, { "epoch": 0.21, "learning_rate": 8.986116375561795e-05, "loss": 2.3708, "step": 24255 }, { "epoch": 0.21, "learning_rate": 8.985711395679602e-05, "loss": 2.3086, "step": 24260 }, { "epoch": 0.21, "learning_rate": 8.985306344061652e-05, "loss": 2.2565, "step": 24265 }, { "epoch": 0.21, "learning_rate": 8.98490122071524e-05, "loss": 2.3002, "step": 24270 }, { "epoch": 0.21, "learning_rate": 8.984496025647658e-05, "loss": 2.2888, "step": 24275 }, { "epoch": 0.21, "learning_rate": 8.984090758866196e-05, "loss": 2.2568, "step": 24280 }, { "epoch": 0.21, "learning_rate": 8.983685420378149e-05, "loss": 2.3093, "step": 24285 }, { "epoch": 0.21, "learning_rate": 8.983280010190815e-05, "loss": 2.3128, "step": 24290 }, { "epoch": 0.21, "learning_rate": 8.982874528311487e-05, "loss": 2.4153, "step": 24295 }, { "epoch": 0.21, "learning_rate": 8.982468974747464e-05, "loss": 2.3742, "step": 24300 }, { "epoch": 0.21, "learning_rate": 8.982063349506045e-05, "loss": 2.356, "step": 24305 }, { "epoch": 0.21, "learning_rate": 8.981657652594533e-05, "loss": 2.3201, "step": 24310 }, { "epoch": 0.21, "learning_rate": 8.981251884020226e-05, "loss": 2.3247, "step": 24315 }, { "epoch": 0.21, "learning_rate": 8.98084604379043e-05, "loss": 2.3613, "step": 24320 }, { "epoch": 0.21, "learning_rate": 8.980440131912448e-05, "loss": 2.3394, "step": 24325 }, { "epoch": 0.21, "learning_rate": 8.980034148393588e-05, "loss": 2.3115, "step": 24330 }, { "epoch": 0.21, "learning_rate": 8.979628093241154e-05, "loss": 2.3146, "step": 24335 }, { "epoch": 0.21, "learning_rate": 8.979221966462455e-05, "loss": 2.3514, "step": 24340 }, { "epoch": 0.21, "learning_rate": 8.978815768064801e-05, "loss": 2.338, "step": 24345 }, { "epoch": 0.21, "learning_rate": 8.978409498055504e-05, "loss": 2.3475, "step": 24350 }, { "epoch": 0.21, "learning_rate": 8.978003156441875e-05, "loss": 2.3526, "step": 24355 }, { "epoch": 0.21, "learning_rate": 8.977596743231225e-05, "loss": 2.3654, "step": 24360 }, { "epoch": 0.21, "learning_rate": 8.977190258430874e-05, "loss": 2.3446, "step": 24365 }, { "epoch": 0.21, "learning_rate": 8.976783702048132e-05, "loss": 2.3394, "step": 24370 }, { "epoch": 0.21, "learning_rate": 8.976377074090323e-05, "loss": 2.3689, "step": 24375 }, { "epoch": 0.21, "learning_rate": 8.97597037456476e-05, "loss": 2.4033, "step": 24380 }, { "epoch": 0.21, "learning_rate": 8.975563603478766e-05, "loss": 2.2984, "step": 24385 }, { "epoch": 0.21, "learning_rate": 8.97515676083966e-05, "loss": 2.3107, "step": 24390 }, { "epoch": 0.21, "learning_rate": 8.974749846654767e-05, "loss": 2.2726, "step": 24395 }, { "epoch": 0.21, "learning_rate": 8.974342860931408e-05, "loss": 2.4237, "step": 24400 }, { "epoch": 0.21, "learning_rate": 8.97393580367691e-05, "loss": 2.3007, "step": 24405 }, { "epoch": 0.21, "learning_rate": 8.973528674898597e-05, "loss": 2.2752, "step": 24410 }, { "epoch": 0.21, "learning_rate": 8.973121474603801e-05, "loss": 2.2927, "step": 24415 }, { "epoch": 0.21, "learning_rate": 8.972714202799846e-05, "loss": 2.3879, "step": 24420 }, { "epoch": 0.21, "learning_rate": 8.972306859494064e-05, "loss": 2.3422, "step": 24425 }, { "epoch": 0.21, "learning_rate": 8.971899444693788e-05, "loss": 2.3581, "step": 24430 }, { "epoch": 0.21, "learning_rate": 8.971491958406348e-05, "loss": 2.3438, "step": 24435 }, { "epoch": 0.21, "learning_rate": 8.97108440063908e-05, "loss": 2.4168, "step": 24440 }, { "epoch": 0.21, "learning_rate": 8.97067677139932e-05, "loss": 2.3388, "step": 24445 }, { "epoch": 0.21, "learning_rate": 8.970269070694401e-05, "loss": 2.3201, "step": 24450 }, { "epoch": 0.21, "learning_rate": 8.969861298531666e-05, "loss": 2.3146, "step": 24455 }, { "epoch": 0.21, "learning_rate": 8.969453454918451e-05, "loss": 2.3978, "step": 24460 }, { "epoch": 0.21, "learning_rate": 8.969045539862096e-05, "loss": 2.334, "step": 24465 }, { "epoch": 0.21, "learning_rate": 8.968637553369943e-05, "loss": 2.2911, "step": 24470 }, { "epoch": 0.21, "learning_rate": 8.968229495449336e-05, "loss": 2.3069, "step": 24475 }, { "epoch": 0.21, "learning_rate": 8.967821366107621e-05, "loss": 2.3534, "step": 24480 }, { "epoch": 0.21, "learning_rate": 8.96741316535214e-05, "loss": 2.3578, "step": 24485 }, { "epoch": 0.21, "learning_rate": 8.967004893190242e-05, "loss": 2.3853, "step": 24490 }, { "epoch": 0.21, "learning_rate": 8.966596549629274e-05, "loss": 2.2835, "step": 24495 }, { "epoch": 0.21, "learning_rate": 8.966188134676588e-05, "loss": 2.3803, "step": 24500 }, { "epoch": 0.21, "learning_rate": 8.965779648339531e-05, "loss": 2.3786, "step": 24505 }, { "epoch": 0.21, "learning_rate": 8.965371090625458e-05, "loss": 2.3652, "step": 24510 }, { "epoch": 0.21, "learning_rate": 8.96496246154172e-05, "loss": 2.3466, "step": 24515 }, { "epoch": 0.21, "learning_rate": 8.964553761095674e-05, "loss": 2.3875, "step": 24520 }, { "epoch": 0.21, "learning_rate": 8.964144989294674e-05, "loss": 2.3604, "step": 24525 }, { "epoch": 0.21, "learning_rate": 8.963736146146079e-05, "loss": 2.4032, "step": 24530 }, { "epoch": 0.21, "learning_rate": 8.963327231657246e-05, "loss": 2.3353, "step": 24535 }, { "epoch": 0.21, "learning_rate": 8.962918245835534e-05, "loss": 2.3139, "step": 24540 }, { "epoch": 0.21, "learning_rate": 8.962509188688307e-05, "loss": 2.3332, "step": 24545 }, { "epoch": 0.21, "learning_rate": 8.962100060222925e-05, "loss": 2.4022, "step": 24550 }, { "epoch": 0.21, "learning_rate": 8.96169086044675e-05, "loss": 2.356, "step": 24555 }, { "epoch": 0.21, "learning_rate": 8.961281589367152e-05, "loss": 2.3334, "step": 24560 }, { "epoch": 0.21, "learning_rate": 8.960872246991492e-05, "loss": 2.3878, "step": 24565 }, { "epoch": 0.21, "learning_rate": 8.96046283332714e-05, "loss": 2.3077, "step": 24570 }, { "epoch": 0.21, "learning_rate": 8.960053348381466e-05, "loss": 2.3922, "step": 24575 }, { "epoch": 0.21, "learning_rate": 8.959643792161835e-05, "loss": 2.2164, "step": 24580 }, { "epoch": 0.21, "learning_rate": 8.959234164675623e-05, "loss": 2.3109, "step": 24585 }, { "epoch": 0.21, "learning_rate": 8.958824465930201e-05, "loss": 2.4006, "step": 24590 }, { "epoch": 0.21, "learning_rate": 8.958414695932943e-05, "loss": 2.3239, "step": 24595 }, { "epoch": 0.21, "learning_rate": 8.958004854691224e-05, "loss": 2.2841, "step": 24600 }, { "epoch": 0.21, "learning_rate": 8.957594942212421e-05, "loss": 2.361, "step": 24605 }, { "epoch": 0.21, "learning_rate": 8.95718495850391e-05, "loss": 2.2891, "step": 24610 }, { "epoch": 0.21, "learning_rate": 8.956774903573072e-05, "loss": 2.367, "step": 24615 }, { "epoch": 0.21, "learning_rate": 8.956364777427286e-05, "loss": 2.3407, "step": 24620 }, { "epoch": 0.21, "learning_rate": 8.955954580073935e-05, "loss": 2.3668, "step": 24625 }, { "epoch": 0.21, "learning_rate": 8.955544311520401e-05, "loss": 2.3042, "step": 24630 }, { "epoch": 0.21, "learning_rate": 8.955133971774066e-05, "loss": 2.3921, "step": 24635 }, { "epoch": 0.21, "learning_rate": 8.954723560842318e-05, "loss": 2.4666, "step": 24640 }, { "epoch": 0.21, "learning_rate": 8.954313078732543e-05, "loss": 2.2823, "step": 24645 }, { "epoch": 0.21, "learning_rate": 8.95390252545213e-05, "loss": 2.442, "step": 24650 }, { "epoch": 0.21, "learning_rate": 8.953491901008467e-05, "loss": 2.3621, "step": 24655 }, { "epoch": 0.21, "learning_rate": 8.953081205408944e-05, "loss": 2.3933, "step": 24660 }, { "epoch": 0.21, "learning_rate": 8.952670438660953e-05, "loss": 2.3545, "step": 24665 }, { "epoch": 0.21, "learning_rate": 8.952259600771889e-05, "loss": 2.3393, "step": 24670 }, { "epoch": 0.21, "learning_rate": 8.951848691749143e-05, "loss": 2.4028, "step": 24675 }, { "epoch": 0.21, "learning_rate": 8.951437711600113e-05, "loss": 2.2431, "step": 24680 }, { "epoch": 0.21, "learning_rate": 8.951026660332195e-05, "loss": 2.447, "step": 24685 }, { "epoch": 0.21, "learning_rate": 8.95061553795279e-05, "loss": 2.3398, "step": 24690 }, { "epoch": 0.21, "learning_rate": 8.950204344469292e-05, "loss": 2.3472, "step": 24695 }, { "epoch": 0.21, "learning_rate": 8.949793079889109e-05, "loss": 2.395, "step": 24700 }, { "epoch": 0.21, "learning_rate": 8.949381744219636e-05, "loss": 2.3677, "step": 24705 }, { "epoch": 0.21, "learning_rate": 8.948970337468278e-05, "loss": 2.3282, "step": 24710 }, { "epoch": 0.21, "learning_rate": 8.948558859642444e-05, "loss": 2.3059, "step": 24715 }, { "epoch": 0.21, "learning_rate": 8.948147310749535e-05, "loss": 2.3004, "step": 24720 }, { "epoch": 0.21, "learning_rate": 8.94773569079696e-05, "loss": 2.3106, "step": 24725 }, { "epoch": 0.21, "learning_rate": 8.947323999792126e-05, "loss": 2.4144, "step": 24730 }, { "epoch": 0.21, "learning_rate": 8.946912237742446e-05, "loss": 2.319, "step": 24735 }, { "epoch": 0.21, "learning_rate": 8.946500404655328e-05, "loss": 2.3837, "step": 24740 }, { "epoch": 0.21, "learning_rate": 8.946088500538186e-05, "loss": 2.3351, "step": 24745 }, { "epoch": 0.21, "learning_rate": 8.945676525398432e-05, "loss": 2.3599, "step": 24750 }, { "epoch": 0.21, "learning_rate": 8.945264479243481e-05, "loss": 2.3432, "step": 24755 }, { "epoch": 0.21, "learning_rate": 8.944852362080751e-05, "loss": 2.3844, "step": 24760 }, { "epoch": 0.21, "learning_rate": 8.944440173917657e-05, "loss": 2.3771, "step": 24765 }, { "epoch": 0.21, "learning_rate": 8.944027914761621e-05, "loss": 2.3985, "step": 24770 }, { "epoch": 0.21, "learning_rate": 8.943615584620057e-05, "loss": 2.3224, "step": 24775 }, { "epoch": 0.21, "learning_rate": 8.943203183500393e-05, "loss": 2.3566, "step": 24780 }, { "epoch": 0.21, "learning_rate": 8.942790711410048e-05, "loss": 2.3783, "step": 24785 }, { "epoch": 0.21, "learning_rate": 8.942378168356445e-05, "loss": 2.3937, "step": 24790 }, { "epoch": 0.21, "learning_rate": 8.94196555434701e-05, "loss": 2.3014, "step": 24795 }, { "epoch": 0.21, "learning_rate": 8.941552869389171e-05, "loss": 2.3652, "step": 24800 }, { "epoch": 0.21, "learning_rate": 8.941140113490352e-05, "loss": 2.4895, "step": 24805 }, { "epoch": 0.21, "learning_rate": 8.940727286657986e-05, "loss": 2.3148, "step": 24810 }, { "epoch": 0.21, "learning_rate": 8.9403143888995e-05, "loss": 2.3521, "step": 24815 }, { "epoch": 0.21, "learning_rate": 8.939901420222328e-05, "loss": 2.2964, "step": 24820 }, { "epoch": 0.21, "learning_rate": 8.939488380633899e-05, "loss": 2.3126, "step": 24825 }, { "epoch": 0.21, "learning_rate": 8.93907527014165e-05, "loss": 2.3639, "step": 24830 }, { "epoch": 0.21, "learning_rate": 8.938662088753017e-05, "loss": 2.3585, "step": 24835 }, { "epoch": 0.21, "learning_rate": 8.938248836475434e-05, "loss": 2.2965, "step": 24840 }, { "epoch": 0.21, "learning_rate": 8.937835513316339e-05, "loss": 2.3225, "step": 24845 }, { "epoch": 0.21, "learning_rate": 8.937422119283174e-05, "loss": 2.3137, "step": 24850 }, { "epoch": 0.21, "learning_rate": 8.937008654383375e-05, "loss": 2.3832, "step": 24855 }, { "epoch": 0.21, "learning_rate": 8.936595118624387e-05, "loss": 2.3361, "step": 24860 }, { "epoch": 0.21, "learning_rate": 8.936181512013652e-05, "loss": 2.4152, "step": 24865 }, { "epoch": 0.21, "learning_rate": 8.935767834558614e-05, "loss": 2.3048, "step": 24870 }, { "epoch": 0.21, "learning_rate": 8.935354086266719e-05, "loss": 2.2542, "step": 24875 }, { "epoch": 0.21, "learning_rate": 8.934940267145412e-05, "loss": 2.2768, "step": 24880 }, { "epoch": 0.21, "learning_rate": 8.934526377202144e-05, "loss": 2.333, "step": 24885 }, { "epoch": 0.21, "learning_rate": 8.934112416444362e-05, "loss": 2.3903, "step": 24890 }, { "epoch": 0.21, "learning_rate": 8.933698384879516e-05, "loss": 2.3436, "step": 24895 }, { "epoch": 0.21, "learning_rate": 8.93328428251506e-05, "loss": 2.3748, "step": 24900 }, { "epoch": 0.21, "learning_rate": 8.932870109358444e-05, "loss": 2.3344, "step": 24905 }, { "epoch": 0.21, "learning_rate": 8.932455865417126e-05, "loss": 2.3704, "step": 24910 }, { "epoch": 0.21, "learning_rate": 8.932041550698561e-05, "loss": 2.2775, "step": 24915 }, { "epoch": 0.21, "learning_rate": 8.931627165210204e-05, "loss": 2.3021, "step": 24920 }, { "epoch": 0.21, "learning_rate": 8.931212708959516e-05, "loss": 2.3351, "step": 24925 }, { "epoch": 0.21, "learning_rate": 8.930798181953952e-05, "loss": 2.2691, "step": 24930 }, { "epoch": 0.21, "learning_rate": 8.930383584200976e-05, "loss": 2.4087, "step": 24935 }, { "epoch": 0.21, "learning_rate": 8.92996891570805e-05, "loss": 2.3529, "step": 24940 }, { "epoch": 0.21, "learning_rate": 8.929554176482638e-05, "loss": 2.3226, "step": 24945 }, { "epoch": 0.21, "learning_rate": 8.929139366532202e-05, "loss": 2.3286, "step": 24950 }, { "epoch": 0.21, "learning_rate": 8.928724485864208e-05, "loss": 2.3827, "step": 24955 }, { "epoch": 0.21, "learning_rate": 8.928309534486126e-05, "loss": 2.371, "step": 24960 }, { "epoch": 0.21, "learning_rate": 8.927894512405422e-05, "loss": 2.3841, "step": 24965 }, { "epoch": 0.21, "learning_rate": 8.927479419629567e-05, "loss": 2.3825, "step": 24970 }, { "epoch": 0.21, "learning_rate": 8.927064256166031e-05, "loss": 2.3091, "step": 24975 }, { "epoch": 0.21, "learning_rate": 8.926649022022288e-05, "loss": 2.3703, "step": 24980 }, { "epoch": 0.21, "learning_rate": 8.926233717205807e-05, "loss": 2.334, "step": 24985 }, { "epoch": 0.21, "learning_rate": 8.925818341724068e-05, "loss": 2.2891, "step": 24990 }, { "epoch": 0.21, "learning_rate": 8.925402895584545e-05, "loss": 2.3471, "step": 24995 }, { "epoch": 0.21, "learning_rate": 8.924987378794713e-05, "loss": 2.3759, "step": 25000 }, { "epoch": 0.21, "learning_rate": 8.924571791362055e-05, "loss": 2.337, "step": 25005 }, { "epoch": 0.21, "learning_rate": 8.924156133294047e-05, "loss": 2.4122, "step": 25010 }, { "epoch": 0.21, "learning_rate": 8.92374040459817e-05, "loss": 2.2733, "step": 25015 }, { "epoch": 0.21, "learning_rate": 8.923324605281912e-05, "loss": 2.3078, "step": 25020 }, { "epoch": 0.21, "learning_rate": 8.92290873535275e-05, "loss": 2.3628, "step": 25025 }, { "epoch": 0.21, "learning_rate": 8.922492794818171e-05, "loss": 2.2928, "step": 25030 }, { "epoch": 0.21, "learning_rate": 8.922076783685664e-05, "loss": 2.3283, "step": 25035 }, { "epoch": 0.21, "learning_rate": 8.921660701962712e-05, "loss": 2.3512, "step": 25040 }, { "epoch": 0.21, "learning_rate": 8.921244549656806e-05, "loss": 2.353, "step": 25045 }, { "epoch": 0.21, "learning_rate": 8.920828326775438e-05, "loss": 2.3914, "step": 25050 }, { "epoch": 0.21, "learning_rate": 8.920412033326096e-05, "loss": 2.2797, "step": 25055 }, { "epoch": 0.21, "learning_rate": 8.919995669316274e-05, "loss": 2.2777, "step": 25060 }, { "epoch": 0.21, "learning_rate": 8.919579234753465e-05, "loss": 2.3913, "step": 25065 }, { "epoch": 0.21, "learning_rate": 8.919162729645165e-05, "loss": 2.3704, "step": 25070 }, { "epoch": 0.21, "learning_rate": 8.91874615399887e-05, "loss": 2.3268, "step": 25075 }, { "epoch": 0.21, "learning_rate": 8.918329507822077e-05, "loss": 2.3723, "step": 25080 }, { "epoch": 0.21, "learning_rate": 8.917912791122287e-05, "loss": 2.329, "step": 25085 }, { "epoch": 0.21, "learning_rate": 8.917496003906998e-05, "loss": 2.3835, "step": 25090 }, { "epoch": 0.21, "learning_rate": 8.917079146183711e-05, "loss": 2.2699, "step": 25095 }, { "epoch": 0.21, "learning_rate": 8.916662217959931e-05, "loss": 2.3509, "step": 25100 }, { "epoch": 0.21, "learning_rate": 8.916245219243161e-05, "loss": 2.3359, "step": 25105 }, { "epoch": 0.21, "learning_rate": 8.915828150040906e-05, "loss": 2.3425, "step": 25110 }, { "epoch": 0.21, "learning_rate": 8.915411010360673e-05, "loss": 2.3143, "step": 25115 }, { "epoch": 0.21, "learning_rate": 8.914993800209968e-05, "loss": 2.2658, "step": 25120 }, { "epoch": 0.21, "learning_rate": 8.914576519596302e-05, "loss": 2.401, "step": 25125 }, { "epoch": 0.21, "learning_rate": 8.914159168527184e-05, "loss": 2.3768, "step": 25130 }, { "epoch": 0.21, "learning_rate": 8.913741747010126e-05, "loss": 2.376, "step": 25135 }, { "epoch": 0.21, "learning_rate": 8.913324255052642e-05, "loss": 2.4491, "step": 25140 }, { "epoch": 0.21, "learning_rate": 8.912906692662247e-05, "loss": 2.3684, "step": 25145 }, { "epoch": 0.21, "learning_rate": 8.912489059846452e-05, "loss": 2.3269, "step": 25150 }, { "epoch": 0.21, "learning_rate": 8.912071356612776e-05, "loss": 2.3607, "step": 25155 }, { "epoch": 0.21, "learning_rate": 8.91165358296874e-05, "loss": 2.3665, "step": 25160 }, { "epoch": 0.21, "learning_rate": 8.911235738921857e-05, "loss": 2.3025, "step": 25165 }, { "epoch": 0.21, "learning_rate": 8.910817824479654e-05, "loss": 2.3157, "step": 25170 }, { "epoch": 0.21, "learning_rate": 8.910399839649646e-05, "loss": 2.3808, "step": 25175 }, { "epoch": 0.21, "learning_rate": 8.909981784439363e-05, "loss": 2.3508, "step": 25180 }, { "epoch": 0.21, "learning_rate": 8.909563658856324e-05, "loss": 2.3493, "step": 25185 }, { "epoch": 0.21, "learning_rate": 8.909145462908056e-05, "loss": 2.3065, "step": 25190 }, { "epoch": 0.21, "learning_rate": 8.908727196602087e-05, "loss": 2.3663, "step": 25195 }, { "epoch": 0.22, "learning_rate": 8.908308859945943e-05, "loss": 2.3445, "step": 25200 }, { "epoch": 0.22, "learning_rate": 8.907890452947156e-05, "loss": 2.3012, "step": 25205 }, { "epoch": 0.22, "learning_rate": 8.907471975613255e-05, "loss": 2.3844, "step": 25210 }, { "epoch": 0.22, "learning_rate": 8.907053427951771e-05, "loss": 2.4541, "step": 25215 }, { "epoch": 0.22, "learning_rate": 8.906634809970237e-05, "loss": 2.4159, "step": 25220 }, { "epoch": 0.22, "learning_rate": 8.90621612167619e-05, "loss": 2.3816, "step": 25225 }, { "epoch": 0.22, "learning_rate": 8.905797363077164e-05, "loss": 2.4352, "step": 25230 }, { "epoch": 0.22, "learning_rate": 8.905378534180696e-05, "loss": 2.3262, "step": 25235 }, { "epoch": 0.22, "learning_rate": 8.904959634994323e-05, "loss": 2.3712, "step": 25240 }, { "epoch": 0.22, "learning_rate": 8.904540665525587e-05, "loss": 2.3511, "step": 25245 }, { "epoch": 0.22, "learning_rate": 8.904121625782028e-05, "loss": 2.4094, "step": 25250 }, { "epoch": 0.22, "learning_rate": 8.903702515771185e-05, "loss": 2.3684, "step": 25255 }, { "epoch": 0.22, "learning_rate": 8.903283335500605e-05, "loss": 2.3434, "step": 25260 }, { "epoch": 0.22, "learning_rate": 8.90286408497783e-05, "loss": 2.3322, "step": 25265 }, { "epoch": 0.22, "learning_rate": 8.902444764210407e-05, "loss": 2.283, "step": 25270 }, { "epoch": 0.22, "learning_rate": 8.902025373205884e-05, "loss": 2.3353, "step": 25275 }, { "epoch": 0.22, "learning_rate": 8.901605911971806e-05, "loss": 2.3562, "step": 25280 }, { "epoch": 0.22, "learning_rate": 8.901186380515726e-05, "loss": 2.3957, "step": 25285 }, { "epoch": 0.22, "learning_rate": 8.900766778845193e-05, "loss": 2.3359, "step": 25290 }, { "epoch": 0.22, "learning_rate": 8.900347106967761e-05, "loss": 2.3241, "step": 25295 }, { "epoch": 0.22, "learning_rate": 8.899927364890981e-05, "loss": 2.3582, "step": 25300 }, { "epoch": 0.22, "learning_rate": 8.899507552622408e-05, "loss": 2.3649, "step": 25305 }, { "epoch": 0.22, "learning_rate": 8.8990876701696e-05, "loss": 2.3464, "step": 25310 }, { "epoch": 0.22, "learning_rate": 8.89866771754011e-05, "loss": 2.3206, "step": 25315 }, { "epoch": 0.22, "learning_rate": 8.898247694741499e-05, "loss": 2.3928, "step": 25320 }, { "epoch": 0.22, "learning_rate": 8.89782760178133e-05, "loss": 2.3912, "step": 25325 }, { "epoch": 0.22, "learning_rate": 8.897407438667158e-05, "loss": 2.349, "step": 25330 }, { "epoch": 0.22, "learning_rate": 8.896987205406548e-05, "loss": 2.3339, "step": 25335 }, { "epoch": 0.22, "learning_rate": 8.896566902007064e-05, "loss": 2.4058, "step": 25340 }, { "epoch": 0.22, "learning_rate": 8.89614652847627e-05, "loss": 2.3658, "step": 25345 }, { "epoch": 0.22, "learning_rate": 8.895726084821732e-05, "loss": 2.347, "step": 25350 }, { "epoch": 0.22, "learning_rate": 8.895305571051015e-05, "loss": 2.348, "step": 25355 }, { "epoch": 0.22, "learning_rate": 8.894884987171692e-05, "loss": 2.3382, "step": 25360 }, { "epoch": 0.22, "learning_rate": 8.89446433319133e-05, "loss": 2.3166, "step": 25365 }, { "epoch": 0.22, "learning_rate": 8.8940436091175e-05, "loss": 2.4251, "step": 25370 }, { "epoch": 0.22, "learning_rate": 8.893622814957774e-05, "loss": 2.2616, "step": 25375 }, { "epoch": 0.22, "learning_rate": 8.893201950719727e-05, "loss": 2.3731, "step": 25380 }, { "epoch": 0.22, "learning_rate": 8.892781016410934e-05, "loss": 2.2922, "step": 25385 }, { "epoch": 0.22, "learning_rate": 8.892360012038969e-05, "loss": 2.3257, "step": 25390 }, { "epoch": 0.22, "learning_rate": 8.891938937611411e-05, "loss": 2.4353, "step": 25395 }, { "epoch": 0.22, "learning_rate": 8.891517793135838e-05, "loss": 2.4655, "step": 25400 }, { "epoch": 0.22, "learning_rate": 8.89109657861983e-05, "loss": 2.3162, "step": 25405 }, { "epoch": 0.22, "learning_rate": 8.890675294070968e-05, "loss": 2.3359, "step": 25410 }, { "epoch": 0.22, "learning_rate": 8.890253939496834e-05, "loss": 2.3651, "step": 25415 }, { "epoch": 0.22, "learning_rate": 8.889832514905013e-05, "loss": 2.4211, "step": 25420 }, { "epoch": 0.22, "learning_rate": 8.889411020303088e-05, "loss": 2.354, "step": 25425 }, { "epoch": 0.22, "learning_rate": 8.888989455698648e-05, "loss": 2.3803, "step": 25430 }, { "epoch": 0.22, "learning_rate": 8.888567821099276e-05, "loss": 2.2658, "step": 25435 }, { "epoch": 0.22, "learning_rate": 8.888146116512565e-05, "loss": 2.2996, "step": 25440 }, { "epoch": 0.22, "learning_rate": 8.887724341946103e-05, "loss": 2.3748, "step": 25445 }, { "epoch": 0.22, "learning_rate": 8.887302497407481e-05, "loss": 2.3599, "step": 25450 }, { "epoch": 0.22, "learning_rate": 8.886880582904292e-05, "loss": 2.2928, "step": 25455 }, { "epoch": 0.22, "learning_rate": 8.886458598444129e-05, "loss": 2.2481, "step": 25460 }, { "epoch": 0.22, "learning_rate": 8.886036544034588e-05, "loss": 2.352, "step": 25465 }, { "epoch": 0.22, "learning_rate": 8.885614419683265e-05, "loss": 2.2615, "step": 25470 }, { "epoch": 0.22, "learning_rate": 8.885192225397757e-05, "loss": 2.3717, "step": 25475 }, { "epoch": 0.22, "learning_rate": 8.884769961185662e-05, "loss": 2.2886, "step": 25480 }, { "epoch": 0.22, "learning_rate": 8.884347627054582e-05, "loss": 2.3815, "step": 25485 }, { "epoch": 0.22, "learning_rate": 8.883925223012117e-05, "loss": 2.364, "step": 25490 }, { "epoch": 0.22, "learning_rate": 8.88350274906587e-05, "loss": 2.3174, "step": 25495 }, { "epoch": 0.22, "learning_rate": 8.883080205223444e-05, "loss": 2.2911, "step": 25500 }, { "epoch": 0.22, "learning_rate": 8.882657591492445e-05, "loss": 2.3141, "step": 25505 }, { "epoch": 0.22, "learning_rate": 8.88223490788048e-05, "loss": 2.3208, "step": 25510 }, { "epoch": 0.22, "learning_rate": 8.881812154395156e-05, "loss": 2.3669, "step": 25515 }, { "epoch": 0.22, "learning_rate": 8.881389331044079e-05, "loss": 2.2627, "step": 25520 }, { "epoch": 0.22, "learning_rate": 8.880966437834861e-05, "loss": 2.322, "step": 25525 }, { "epoch": 0.22, "learning_rate": 8.880543474775116e-05, "loss": 2.3929, "step": 25530 }, { "epoch": 0.22, "learning_rate": 8.880120441872452e-05, "loss": 2.3727, "step": 25535 }, { "epoch": 0.22, "learning_rate": 8.879697339134487e-05, "loss": 2.3366, "step": 25540 }, { "epoch": 0.22, "learning_rate": 8.879274166568834e-05, "loss": 2.4199, "step": 25545 }, { "epoch": 0.22, "learning_rate": 8.878850924183108e-05, "loss": 2.3786, "step": 25550 }, { "epoch": 0.22, "learning_rate": 8.87842761198493e-05, "loss": 2.2771, "step": 25555 }, { "epoch": 0.22, "learning_rate": 8.878004229981915e-05, "loss": 2.3357, "step": 25560 }, { "epoch": 0.22, "learning_rate": 8.877580778181686e-05, "loss": 2.3823, "step": 25565 }, { "epoch": 0.22, "learning_rate": 8.877157256591866e-05, "loss": 2.4203, "step": 25570 }, { "epoch": 0.22, "learning_rate": 8.876733665220072e-05, "loss": 2.3905, "step": 25575 }, { "epoch": 0.22, "learning_rate": 8.876310004073933e-05, "loss": 2.32, "step": 25580 }, { "epoch": 0.22, "learning_rate": 8.875886273161071e-05, "loss": 2.3703, "step": 25585 }, { "epoch": 0.22, "learning_rate": 8.875462472489115e-05, "loss": 2.3775, "step": 25590 }, { "epoch": 0.22, "learning_rate": 8.87503860206569e-05, "loss": 2.3513, "step": 25595 }, { "epoch": 0.22, "learning_rate": 8.874614661898425e-05, "loss": 2.2836, "step": 25600 }, { "epoch": 0.22, "learning_rate": 8.874190651994954e-05, "loss": 2.3914, "step": 25605 }, { "epoch": 0.22, "learning_rate": 8.873766572362906e-05, "loss": 2.3037, "step": 25610 }, { "epoch": 0.22, "learning_rate": 8.873342423009912e-05, "loss": 2.3969, "step": 25615 }, { "epoch": 0.22, "learning_rate": 8.87291820394361e-05, "loss": 2.3858, "step": 25620 }, { "epoch": 0.22, "learning_rate": 8.872493915171629e-05, "loss": 2.3875, "step": 25625 }, { "epoch": 0.22, "learning_rate": 8.872069556701611e-05, "loss": 2.3602, "step": 25630 }, { "epoch": 0.22, "learning_rate": 8.871645128541192e-05, "loss": 2.3187, "step": 25635 }, { "epoch": 0.22, "learning_rate": 8.87122063069801e-05, "loss": 2.3637, "step": 25640 }, { "epoch": 0.22, "learning_rate": 8.870796063179707e-05, "loss": 2.2983, "step": 25645 }, { "epoch": 0.22, "learning_rate": 8.870371425993922e-05, "loss": 2.3203, "step": 25650 }, { "epoch": 0.22, "learning_rate": 8.869946719148301e-05, "loss": 2.392, "step": 25655 }, { "epoch": 0.22, "learning_rate": 8.869521942650486e-05, "loss": 2.3332, "step": 25660 }, { "epoch": 0.22, "learning_rate": 8.86909709650812e-05, "loss": 2.2912, "step": 25665 }, { "epoch": 0.22, "learning_rate": 8.868672180728852e-05, "loss": 2.3344, "step": 25670 }, { "epoch": 0.22, "learning_rate": 8.868247195320331e-05, "loss": 2.3783, "step": 25675 }, { "epoch": 0.22, "learning_rate": 8.867822140290205e-05, "loss": 2.3487, "step": 25680 }, { "epoch": 0.22, "learning_rate": 8.867397015646124e-05, "loss": 2.387, "step": 25685 }, { "epoch": 0.22, "learning_rate": 8.866971821395737e-05, "loss": 2.2919, "step": 25690 }, { "epoch": 0.22, "learning_rate": 8.8665465575467e-05, "loss": 2.3308, "step": 25695 }, { "epoch": 0.22, "learning_rate": 8.866121224106666e-05, "loss": 2.3422, "step": 25700 }, { "epoch": 0.22, "learning_rate": 8.865695821083292e-05, "loss": 2.2717, "step": 25705 }, { "epoch": 0.22, "learning_rate": 8.865270348484231e-05, "loss": 2.3311, "step": 25710 }, { "epoch": 0.22, "learning_rate": 8.864844806317144e-05, "loss": 2.3076, "step": 25715 }, { "epoch": 0.22, "learning_rate": 8.864419194589687e-05, "loss": 2.3322, "step": 25720 }, { "epoch": 0.22, "learning_rate": 8.863993513309523e-05, "loss": 2.3233, "step": 25725 }, { "epoch": 0.22, "learning_rate": 8.86356776248431e-05, "loss": 2.3605, "step": 25730 }, { "epoch": 0.22, "learning_rate": 8.863141942121716e-05, "loss": 2.3412, "step": 25735 }, { "epoch": 0.22, "learning_rate": 8.8627160522294e-05, "loss": 2.3332, "step": 25740 }, { "epoch": 0.22, "learning_rate": 8.862290092815031e-05, "loss": 2.3287, "step": 25745 }, { "epoch": 0.22, "learning_rate": 8.861864063886274e-05, "loss": 2.3553, "step": 25750 }, { "epoch": 0.22, "learning_rate": 8.861437965450793e-05, "loss": 2.3579, "step": 25755 }, { "epoch": 0.22, "learning_rate": 8.861011797516265e-05, "loss": 2.3965, "step": 25760 }, { "epoch": 0.22, "learning_rate": 8.860585560090353e-05, "loss": 2.3283, "step": 25765 }, { "epoch": 0.22, "learning_rate": 8.860159253180733e-05, "loss": 2.3639, "step": 25770 }, { "epoch": 0.22, "learning_rate": 8.859732876795076e-05, "loss": 2.3114, "step": 25775 }, { "epoch": 0.22, "learning_rate": 8.859306430941056e-05, "loss": 2.3521, "step": 25780 }, { "epoch": 0.22, "learning_rate": 8.858879915626348e-05, "loss": 2.3311, "step": 25785 }, { "epoch": 0.22, "learning_rate": 8.858453330858629e-05, "loss": 2.327, "step": 25790 }, { "epoch": 0.22, "learning_rate": 8.858026676645579e-05, "loss": 2.3527, "step": 25795 }, { "epoch": 0.22, "learning_rate": 8.857599952994873e-05, "loss": 2.4514, "step": 25800 }, { "epoch": 0.22, "learning_rate": 8.857173159914192e-05, "loss": 2.3364, "step": 25805 }, { "epoch": 0.22, "learning_rate": 8.856746297411221e-05, "loss": 2.352, "step": 25810 }, { "epoch": 0.22, "learning_rate": 8.856319365493638e-05, "loss": 2.3612, "step": 25815 }, { "epoch": 0.22, "learning_rate": 8.85589236416913e-05, "loss": 2.2856, "step": 25820 }, { "epoch": 0.22, "learning_rate": 8.855465293445382e-05, "loss": 2.359, "step": 25825 }, { "epoch": 0.22, "learning_rate": 8.855038153330081e-05, "loss": 2.3766, "step": 25830 }, { "epoch": 0.22, "learning_rate": 8.854610943830913e-05, "loss": 2.3614, "step": 25835 }, { "epoch": 0.22, "learning_rate": 8.854183664955567e-05, "loss": 2.4255, "step": 25840 }, { "epoch": 0.22, "learning_rate": 8.853756316711736e-05, "loss": 2.2619, "step": 25845 }, { "epoch": 0.22, "learning_rate": 8.853328899107109e-05, "loss": 2.2959, "step": 25850 }, { "epoch": 0.22, "learning_rate": 8.852901412149379e-05, "loss": 2.3818, "step": 25855 }, { "epoch": 0.22, "learning_rate": 8.852473855846242e-05, "loss": 2.3785, "step": 25860 }, { "epoch": 0.22, "learning_rate": 8.852046230205391e-05, "loss": 2.3622, "step": 25865 }, { "epoch": 0.22, "learning_rate": 8.851618535234523e-05, "loss": 2.3812, "step": 25870 }, { "epoch": 0.22, "learning_rate": 8.851190770941335e-05, "loss": 2.345, "step": 25875 }, { "epoch": 0.22, "learning_rate": 8.850762937333529e-05, "loss": 2.3286, "step": 25880 }, { "epoch": 0.22, "learning_rate": 8.850335034418802e-05, "loss": 2.3486, "step": 25885 }, { "epoch": 0.22, "learning_rate": 8.849907062204857e-05, "loss": 2.4114, "step": 25890 }, { "epoch": 0.22, "learning_rate": 8.849479020699397e-05, "loss": 2.3541, "step": 25895 }, { "epoch": 0.22, "learning_rate": 8.849050909910124e-05, "loss": 2.3741, "step": 25900 }, { "epoch": 0.22, "learning_rate": 8.848622729844747e-05, "loss": 2.2993, "step": 25905 }, { "epoch": 0.22, "learning_rate": 8.848194480510969e-05, "loss": 2.369, "step": 25910 }, { "epoch": 0.22, "learning_rate": 8.847766161916497e-05, "loss": 2.4571, "step": 25915 }, { "epoch": 0.22, "learning_rate": 8.847337774069044e-05, "loss": 2.3484, "step": 25920 }, { "epoch": 0.22, "learning_rate": 8.84690931697632e-05, "loss": 2.2709, "step": 25925 }, { "epoch": 0.22, "learning_rate": 8.846480790646032e-05, "loss": 2.2905, "step": 25930 }, { "epoch": 0.22, "learning_rate": 8.846052195085895e-05, "loss": 2.4091, "step": 25935 }, { "epoch": 0.22, "learning_rate": 8.845623530303623e-05, "loss": 2.388, "step": 25940 }, { "epoch": 0.22, "learning_rate": 8.845194796306935e-05, "loss": 2.3619, "step": 25945 }, { "epoch": 0.22, "learning_rate": 8.844765993103541e-05, "loss": 2.3146, "step": 25950 }, { "epoch": 0.22, "learning_rate": 8.844337120701163e-05, "loss": 2.3946, "step": 25955 }, { "epoch": 0.22, "learning_rate": 8.843908179107516e-05, "loss": 2.3407, "step": 25960 }, { "epoch": 0.22, "learning_rate": 8.843479168330325e-05, "loss": 2.4041, "step": 25965 }, { "epoch": 0.22, "learning_rate": 8.843050088377309e-05, "loss": 2.3449, "step": 25970 }, { "epoch": 0.22, "learning_rate": 8.842620939256191e-05, "loss": 2.4788, "step": 25975 }, { "epoch": 0.22, "learning_rate": 8.842191720974695e-05, "loss": 2.3476, "step": 25980 }, { "epoch": 0.22, "learning_rate": 8.841762433540545e-05, "loss": 2.3962, "step": 25985 }, { "epoch": 0.22, "learning_rate": 8.841333076961468e-05, "loss": 2.3323, "step": 25990 }, { "epoch": 0.22, "learning_rate": 8.840903651245194e-05, "loss": 2.3738, "step": 25995 }, { "epoch": 0.22, "learning_rate": 8.840474156399449e-05, "loss": 2.3484, "step": 26000 }, { "epoch": 0.22, "learning_rate": 8.840044592431964e-05, "loss": 2.2368, "step": 26005 }, { "epoch": 0.22, "learning_rate": 8.839614959350471e-05, "loss": 2.3496, "step": 26010 }, { "epoch": 0.22, "learning_rate": 8.839185257162701e-05, "loss": 2.3892, "step": 26015 }, { "epoch": 0.22, "learning_rate": 8.83875548587639e-05, "loss": 2.3004, "step": 26020 }, { "epoch": 0.22, "learning_rate": 8.838325645499271e-05, "loss": 2.2848, "step": 26025 }, { "epoch": 0.22, "learning_rate": 8.837895736039083e-05, "loss": 2.2479, "step": 26030 }, { "epoch": 0.22, "learning_rate": 8.837465757503562e-05, "loss": 2.3245, "step": 26035 }, { "epoch": 0.22, "learning_rate": 8.837035709900446e-05, "loss": 2.3719, "step": 26040 }, { "epoch": 0.22, "learning_rate": 8.836605593237475e-05, "loss": 2.3067, "step": 26045 }, { "epoch": 0.22, "learning_rate": 8.836175407522394e-05, "loss": 2.3395, "step": 26050 }, { "epoch": 0.22, "learning_rate": 8.835745152762942e-05, "loss": 2.3716, "step": 26055 }, { "epoch": 0.22, "learning_rate": 8.835314828966863e-05, "loss": 2.3591, "step": 26060 }, { "epoch": 0.22, "learning_rate": 8.834884436141904e-05, "loss": 2.3376, "step": 26065 }, { "epoch": 0.22, "learning_rate": 8.83445397429581e-05, "loss": 2.3647, "step": 26070 }, { "epoch": 0.22, "learning_rate": 8.834023443436328e-05, "loss": 2.2946, "step": 26075 }, { "epoch": 0.22, "learning_rate": 8.833592843571207e-05, "loss": 2.3452, "step": 26080 }, { "epoch": 0.22, "learning_rate": 8.8331621747082e-05, "loss": 2.3318, "step": 26085 }, { "epoch": 0.22, "learning_rate": 8.832731436855054e-05, "loss": 2.343, "step": 26090 }, { "epoch": 0.22, "learning_rate": 8.832300630019523e-05, "loss": 2.3296, "step": 26095 }, { "epoch": 0.22, "learning_rate": 8.831869754209363e-05, "loss": 2.3105, "step": 26100 }, { "epoch": 0.22, "learning_rate": 8.831438809432325e-05, "loss": 2.3687, "step": 26105 }, { "epoch": 0.22, "learning_rate": 8.831007795696169e-05, "loss": 2.3594, "step": 26110 }, { "epoch": 0.22, "learning_rate": 8.83057671300865e-05, "loss": 2.3241, "step": 26115 }, { "epoch": 0.22, "learning_rate": 8.830145561377527e-05, "loss": 2.3771, "step": 26120 }, { "epoch": 0.22, "learning_rate": 8.829714340810562e-05, "loss": 2.3688, "step": 26125 }, { "epoch": 0.22, "learning_rate": 8.829283051315514e-05, "loss": 2.3774, "step": 26130 }, { "epoch": 0.22, "learning_rate": 8.828851692900147e-05, "loss": 2.2829, "step": 26135 }, { "epoch": 0.22, "learning_rate": 8.828420265572222e-05, "loss": 2.3658, "step": 26140 }, { "epoch": 0.22, "learning_rate": 8.827988769339508e-05, "loss": 2.3568, "step": 26145 }, { "epoch": 0.22, "learning_rate": 8.827557204209768e-05, "loss": 2.3754, "step": 26150 }, { "epoch": 0.22, "learning_rate": 8.827125570190771e-05, "loss": 2.3895, "step": 26155 }, { "epoch": 0.22, "learning_rate": 8.826693867290283e-05, "loss": 2.3319, "step": 26160 }, { "epoch": 0.22, "learning_rate": 8.826262095516077e-05, "loss": 2.25, "step": 26165 }, { "epoch": 0.22, "learning_rate": 8.825830254875925e-05, "loss": 2.3584, "step": 26170 }, { "epoch": 0.22, "learning_rate": 8.825398345377595e-05, "loss": 2.2977, "step": 26175 }, { "epoch": 0.22, "learning_rate": 8.824966367028864e-05, "loss": 2.3465, "step": 26180 }, { "epoch": 0.22, "learning_rate": 8.824534319837505e-05, "loss": 2.3663, "step": 26185 }, { "epoch": 0.22, "learning_rate": 8.824102203811296e-05, "loss": 2.415, "step": 26190 }, { "epoch": 0.22, "learning_rate": 8.823670018958013e-05, "loss": 2.3436, "step": 26195 }, { "epoch": 0.22, "learning_rate": 8.823237765285435e-05, "loss": 2.304, "step": 26200 }, { "epoch": 0.22, "learning_rate": 8.822805442801342e-05, "loss": 2.3614, "step": 26205 }, { "epoch": 0.22, "learning_rate": 8.822373051513514e-05, "loss": 2.2331, "step": 26210 }, { "epoch": 0.22, "learning_rate": 8.821940591429734e-05, "loss": 2.3785, "step": 26215 }, { "epoch": 0.22, "learning_rate": 8.821508062557786e-05, "loss": 2.3458, "step": 26220 }, { "epoch": 0.22, "learning_rate": 8.821075464905453e-05, "loss": 2.3956, "step": 26225 }, { "epoch": 0.22, "learning_rate": 8.820642798480524e-05, "loss": 2.2962, "step": 26230 }, { "epoch": 0.22, "learning_rate": 8.820210063290783e-05, "loss": 2.4101, "step": 26235 }, { "epoch": 0.22, "learning_rate": 8.819777259344022e-05, "loss": 2.3219, "step": 26240 }, { "epoch": 0.22, "learning_rate": 8.819344386648025e-05, "loss": 2.3763, "step": 26245 }, { "epoch": 0.22, "learning_rate": 8.818911445210589e-05, "loss": 2.3824, "step": 26250 }, { "epoch": 0.22, "learning_rate": 8.818478435039504e-05, "loss": 2.348, "step": 26255 }, { "epoch": 0.22, "learning_rate": 8.818045356142564e-05, "loss": 2.2709, "step": 26260 }, { "epoch": 0.22, "learning_rate": 8.817612208527561e-05, "loss": 2.319, "step": 26265 }, { "epoch": 0.22, "learning_rate": 8.817178992202293e-05, "loss": 2.3717, "step": 26270 }, { "epoch": 0.22, "learning_rate": 8.816745707174556e-05, "loss": 2.322, "step": 26275 }, { "epoch": 0.22, "learning_rate": 8.816312353452151e-05, "loss": 2.2881, "step": 26280 }, { "epoch": 0.22, "learning_rate": 8.815878931042876e-05, "loss": 2.3351, "step": 26285 }, { "epoch": 0.22, "learning_rate": 8.81544543995453e-05, "loss": 2.3827, "step": 26290 }, { "epoch": 0.22, "learning_rate": 8.815011880194917e-05, "loss": 2.3165, "step": 26295 }, { "epoch": 0.22, "learning_rate": 8.81457825177184e-05, "loss": 2.3161, "step": 26300 }, { "epoch": 0.22, "learning_rate": 8.814144554693105e-05, "loss": 2.3791, "step": 26305 }, { "epoch": 0.22, "learning_rate": 8.813710788966517e-05, "loss": 2.3436, "step": 26310 }, { "epoch": 0.22, "learning_rate": 8.81327695459988e-05, "loss": 2.3222, "step": 26315 }, { "epoch": 0.22, "learning_rate": 8.812843051601004e-05, "loss": 2.3074, "step": 26320 }, { "epoch": 0.22, "learning_rate": 8.812409079977701e-05, "loss": 2.2987, "step": 26325 }, { "epoch": 0.22, "learning_rate": 8.811975039737778e-05, "loss": 2.2509, "step": 26330 }, { "epoch": 0.22, "learning_rate": 8.811540930889051e-05, "loss": 2.3248, "step": 26335 }, { "epoch": 0.22, "learning_rate": 8.81110675343933e-05, "loss": 2.402, "step": 26340 }, { "epoch": 0.22, "learning_rate": 8.810672507396432e-05, "loss": 2.343, "step": 26345 }, { "epoch": 0.22, "learning_rate": 8.810238192768169e-05, "loss": 2.3877, "step": 26350 }, { "epoch": 0.22, "learning_rate": 8.80980380956236e-05, "loss": 2.3358, "step": 26355 }, { "epoch": 0.22, "learning_rate": 8.809369357786825e-05, "loss": 2.3214, "step": 26360 }, { "epoch": 0.22, "learning_rate": 8.808934837449379e-05, "loss": 2.4234, "step": 26365 }, { "epoch": 0.23, "learning_rate": 8.808500248557847e-05, "loss": 2.3188, "step": 26370 }, { "epoch": 0.23, "learning_rate": 8.808065591120047e-05, "loss": 2.3713, "step": 26375 }, { "epoch": 0.23, "learning_rate": 8.807630865143805e-05, "loss": 2.3003, "step": 26380 }, { "epoch": 0.23, "learning_rate": 8.807196070636946e-05, "loss": 2.3457, "step": 26385 }, { "epoch": 0.23, "learning_rate": 8.80676120760729e-05, "loss": 2.3448, "step": 26390 }, { "epoch": 0.23, "learning_rate": 8.80632627606267e-05, "loss": 2.2532, "step": 26395 }, { "epoch": 0.23, "learning_rate": 8.805891276010912e-05, "loss": 2.3007, "step": 26400 }, { "epoch": 0.23, "learning_rate": 8.805456207459843e-05, "loss": 2.3695, "step": 26405 }, { "epoch": 0.23, "learning_rate": 8.805021070417297e-05, "loss": 2.3278, "step": 26410 }, { "epoch": 0.23, "learning_rate": 8.804585864891102e-05, "loss": 2.3555, "step": 26415 }, { "epoch": 0.23, "learning_rate": 8.804150590889094e-05, "loss": 2.3317, "step": 26420 }, { "epoch": 0.23, "learning_rate": 8.803715248419106e-05, "loss": 2.4085, "step": 26425 }, { "epoch": 0.23, "learning_rate": 8.803279837488973e-05, "loss": 2.4045, "step": 26430 }, { "epoch": 0.23, "learning_rate": 8.802844358106532e-05, "loss": 2.4026, "step": 26435 }, { "epoch": 0.23, "learning_rate": 8.802408810279621e-05, "loss": 2.3999, "step": 26440 }, { "epoch": 0.23, "learning_rate": 8.80197319401608e-05, "loss": 2.25, "step": 26445 }, { "epoch": 0.23, "learning_rate": 8.801537509323748e-05, "loss": 2.3965, "step": 26450 }, { "epoch": 0.23, "learning_rate": 8.801101756210467e-05, "loss": 2.2898, "step": 26455 }, { "epoch": 0.23, "learning_rate": 8.800665934684078e-05, "loss": 2.3579, "step": 26460 }, { "epoch": 0.23, "learning_rate": 8.800230044752427e-05, "loss": 2.329, "step": 26465 }, { "epoch": 0.23, "learning_rate": 8.799794086423361e-05, "loss": 2.2736, "step": 26470 }, { "epoch": 0.23, "learning_rate": 8.799358059704721e-05, "loss": 2.2436, "step": 26475 }, { "epoch": 0.23, "learning_rate": 8.798921964604361e-05, "loss": 2.31, "step": 26480 }, { "epoch": 0.23, "learning_rate": 8.798485801130127e-05, "loss": 2.2721, "step": 26485 }, { "epoch": 0.23, "learning_rate": 8.798049569289868e-05, "loss": 2.3877, "step": 26490 }, { "epoch": 0.23, "learning_rate": 8.797613269091435e-05, "loss": 2.33, "step": 26495 }, { "epoch": 0.23, "learning_rate": 8.797176900542686e-05, "loss": 2.3897, "step": 26500 }, { "epoch": 0.23, "learning_rate": 8.796740463651469e-05, "loss": 2.3246, "step": 26505 }, { "epoch": 0.23, "learning_rate": 8.796303958425643e-05, "loss": 2.3236, "step": 26510 }, { "epoch": 0.23, "learning_rate": 8.79586738487306e-05, "loss": 2.3368, "step": 26515 }, { "epoch": 0.23, "learning_rate": 8.79543074300158e-05, "loss": 2.3859, "step": 26520 }, { "epoch": 0.23, "learning_rate": 8.794994032819063e-05, "loss": 2.4123, "step": 26525 }, { "epoch": 0.23, "learning_rate": 8.794557254333369e-05, "loss": 2.3437, "step": 26530 }, { "epoch": 0.23, "learning_rate": 8.794120407552356e-05, "loss": 2.3725, "step": 26535 }, { "epoch": 0.23, "learning_rate": 8.793683492483891e-05, "loss": 2.3512, "step": 26540 }, { "epoch": 0.23, "learning_rate": 8.793246509135833e-05, "loss": 2.3143, "step": 26545 }, { "epoch": 0.23, "learning_rate": 8.79280945751605e-05, "loss": 2.3668, "step": 26550 }, { "epoch": 0.23, "learning_rate": 8.792372337632407e-05, "loss": 2.3463, "step": 26555 }, { "epoch": 0.23, "learning_rate": 8.791935149492772e-05, "loss": 2.3228, "step": 26560 }, { "epoch": 0.23, "learning_rate": 8.791497893105014e-05, "loss": 2.3504, "step": 26565 }, { "epoch": 0.23, "learning_rate": 8.791060568477002e-05, "loss": 2.3886, "step": 26570 }, { "epoch": 0.23, "learning_rate": 8.790623175616607e-05, "loss": 2.4289, "step": 26575 }, { "epoch": 0.23, "learning_rate": 8.790185714531701e-05, "loss": 2.3758, "step": 26580 }, { "epoch": 0.23, "learning_rate": 8.789748185230159e-05, "loss": 2.2827, "step": 26585 }, { "epoch": 0.23, "learning_rate": 8.789310587719855e-05, "loss": 2.3813, "step": 26590 }, { "epoch": 0.23, "learning_rate": 8.788872922008664e-05, "loss": 2.3393, "step": 26595 }, { "epoch": 0.23, "learning_rate": 8.788435188104463e-05, "loss": 2.331, "step": 26600 }, { "epoch": 0.23, "learning_rate": 8.787997386015134e-05, "loss": 2.3719, "step": 26605 }, { "epoch": 0.23, "learning_rate": 8.787559515748552e-05, "loss": 2.3629, "step": 26610 }, { "epoch": 0.23, "learning_rate": 8.787121577312601e-05, "loss": 2.3556, "step": 26615 }, { "epoch": 0.23, "learning_rate": 8.786683570715162e-05, "loss": 2.3265, "step": 26620 }, { "epoch": 0.23, "learning_rate": 8.786245495964119e-05, "loss": 2.4077, "step": 26625 }, { "epoch": 0.23, "learning_rate": 8.785807353067355e-05, "loss": 2.3293, "step": 26630 }, { "epoch": 0.23, "learning_rate": 8.785369142032758e-05, "loss": 2.3559, "step": 26635 }, { "epoch": 0.23, "learning_rate": 8.784930862868212e-05, "loss": 2.278, "step": 26640 }, { "epoch": 0.23, "learning_rate": 8.78449251558161e-05, "loss": 2.2319, "step": 26645 }, { "epoch": 0.23, "learning_rate": 8.784054100180836e-05, "loss": 2.3864, "step": 26650 }, { "epoch": 0.23, "learning_rate": 8.783615616673784e-05, "loss": 2.3312, "step": 26655 }, { "epoch": 0.23, "learning_rate": 8.783177065068347e-05, "loss": 2.3141, "step": 26660 }, { "epoch": 0.23, "learning_rate": 8.782738445372414e-05, "loss": 2.2485, "step": 26665 }, { "epoch": 0.23, "learning_rate": 8.782299757593883e-05, "loss": 2.3441, "step": 26670 }, { "epoch": 0.23, "learning_rate": 8.781861001740648e-05, "loss": 2.3009, "step": 26675 }, { "epoch": 0.23, "learning_rate": 8.781422177820607e-05, "loss": 2.3565, "step": 26680 }, { "epoch": 0.23, "learning_rate": 8.780983285841655e-05, "loss": 2.4205, "step": 26685 }, { "epoch": 0.23, "learning_rate": 8.780544325811694e-05, "loss": 2.2655, "step": 26690 }, { "epoch": 0.23, "learning_rate": 8.780105297738625e-05, "loss": 2.3755, "step": 26695 }, { "epoch": 0.23, "learning_rate": 8.77966620163035e-05, "loss": 2.3875, "step": 26700 }, { "epoch": 0.23, "learning_rate": 8.77922703749477e-05, "loss": 2.396, "step": 26705 }, { "epoch": 0.23, "learning_rate": 8.778787805339789e-05, "loss": 2.3673, "step": 26710 }, { "epoch": 0.23, "learning_rate": 8.778348505173312e-05, "loss": 2.3099, "step": 26715 }, { "epoch": 0.23, "learning_rate": 8.777909137003251e-05, "loss": 2.3717, "step": 26720 }, { "epoch": 0.23, "learning_rate": 8.777469700837507e-05, "loss": 2.284, "step": 26725 }, { "epoch": 0.23, "learning_rate": 8.777030196683991e-05, "loss": 2.3323, "step": 26730 }, { "epoch": 0.23, "learning_rate": 8.776590624550615e-05, "loss": 2.3784, "step": 26735 }, { "epoch": 0.23, "learning_rate": 8.77615098444529e-05, "loss": 2.3425, "step": 26740 }, { "epoch": 0.23, "learning_rate": 8.775711276375929e-05, "loss": 2.272, "step": 26745 }, { "epoch": 0.23, "learning_rate": 8.775271500350445e-05, "loss": 2.4207, "step": 26750 }, { "epoch": 0.23, "learning_rate": 8.774831656376752e-05, "loss": 2.2486, "step": 26755 }, { "epoch": 0.23, "learning_rate": 8.77439174446277e-05, "loss": 2.3176, "step": 26760 }, { "epoch": 0.23, "learning_rate": 8.773951764616414e-05, "loss": 2.3429, "step": 26765 }, { "epoch": 0.23, "learning_rate": 8.773511716845603e-05, "loss": 2.3297, "step": 26770 }, { "epoch": 0.23, "learning_rate": 8.773071601158259e-05, "loss": 2.3575, "step": 26775 }, { "epoch": 0.23, "learning_rate": 8.7726314175623e-05, "loss": 2.3595, "step": 26780 }, { "epoch": 0.23, "learning_rate": 8.772191166065651e-05, "loss": 2.3853, "step": 26785 }, { "epoch": 0.23, "learning_rate": 8.771750846676235e-05, "loss": 2.1992, "step": 26790 }, { "epoch": 0.23, "learning_rate": 8.771310459401978e-05, "loss": 2.3156, "step": 26795 }, { "epoch": 0.23, "learning_rate": 8.770870004250805e-05, "loss": 2.3314, "step": 26800 }, { "epoch": 0.23, "learning_rate": 8.770429481230642e-05, "loss": 2.3675, "step": 26805 }, { "epoch": 0.23, "learning_rate": 8.769988890349422e-05, "loss": 2.3432, "step": 26810 }, { "epoch": 0.23, "learning_rate": 8.76954823161507e-05, "loss": 2.3355, "step": 26815 }, { "epoch": 0.23, "learning_rate": 8.769107505035518e-05, "loss": 2.3194, "step": 26820 }, { "epoch": 0.23, "learning_rate": 8.768666710618702e-05, "loss": 2.3352, "step": 26825 }, { "epoch": 0.23, "learning_rate": 8.768225848372553e-05, "loss": 2.3431, "step": 26830 }, { "epoch": 0.23, "learning_rate": 8.767784918305007e-05, "loss": 2.2601, "step": 26835 }, { "epoch": 0.23, "learning_rate": 8.767343920423997e-05, "loss": 2.2697, "step": 26840 }, { "epoch": 0.23, "learning_rate": 8.766902854737462e-05, "loss": 2.3731, "step": 26845 }, { "epoch": 0.23, "learning_rate": 8.766461721253341e-05, "loss": 2.3534, "step": 26850 }, { "epoch": 0.23, "learning_rate": 8.766020519979572e-05, "loss": 2.3655, "step": 26855 }, { "epoch": 0.23, "learning_rate": 8.765579250924096e-05, "loss": 2.3887, "step": 26860 }, { "epoch": 0.23, "learning_rate": 8.765137914094858e-05, "loss": 2.4235, "step": 26865 }, { "epoch": 0.23, "learning_rate": 8.764696509499798e-05, "loss": 2.3377, "step": 26870 }, { "epoch": 0.23, "learning_rate": 8.764255037146864e-05, "loss": 2.2478, "step": 26875 }, { "epoch": 0.23, "learning_rate": 8.763813497043997e-05, "loss": 2.3579, "step": 26880 }, { "epoch": 0.23, "learning_rate": 8.763371889199147e-05, "loss": 2.3553, "step": 26885 }, { "epoch": 0.23, "learning_rate": 8.762930213620262e-05, "loss": 2.3483, "step": 26890 }, { "epoch": 0.23, "learning_rate": 8.76248847031529e-05, "loss": 2.303, "step": 26895 }, { "epoch": 0.23, "learning_rate": 8.762046659292183e-05, "loss": 2.3577, "step": 26900 }, { "epoch": 0.23, "learning_rate": 8.761604780558892e-05, "loss": 2.3265, "step": 26905 }, { "epoch": 0.23, "learning_rate": 8.76116283412337e-05, "loss": 2.2858, "step": 26910 }, { "epoch": 0.23, "learning_rate": 8.760720819993572e-05, "loss": 2.3313, "step": 26915 }, { "epoch": 0.23, "learning_rate": 8.760278738177453e-05, "loss": 2.2485, "step": 26920 }, { "epoch": 0.23, "learning_rate": 8.75983658868297e-05, "loss": 2.3387, "step": 26925 }, { "epoch": 0.23, "learning_rate": 8.75939437151808e-05, "loss": 2.3823, "step": 26930 }, { "epoch": 0.23, "learning_rate": 8.758952086690744e-05, "loss": 2.3689, "step": 26935 }, { "epoch": 0.23, "learning_rate": 8.758509734208919e-05, "loss": 2.3292, "step": 26940 }, { "epoch": 0.23, "learning_rate": 8.758067314080571e-05, "loss": 2.3682, "step": 26945 }, { "epoch": 0.23, "learning_rate": 8.75762482631366e-05, "loss": 2.3396, "step": 26950 }, { "epoch": 0.23, "learning_rate": 8.75718227091615e-05, "loss": 2.3158, "step": 26955 }, { "epoch": 0.23, "learning_rate": 8.756739647896007e-05, "loss": 2.4095, "step": 26960 }, { "epoch": 0.23, "learning_rate": 8.756296957261196e-05, "loss": 2.4081, "step": 26965 }, { "epoch": 0.23, "learning_rate": 8.755854199019687e-05, "loss": 2.3552, "step": 26970 }, { "epoch": 0.23, "learning_rate": 8.755411373179447e-05, "loss": 2.2711, "step": 26975 }, { "epoch": 0.23, "learning_rate": 8.754968479748446e-05, "loss": 2.3421, "step": 26980 }, { "epoch": 0.23, "learning_rate": 8.754525518734657e-05, "loss": 2.3604, "step": 26985 }, { "epoch": 0.23, "learning_rate": 8.754082490146051e-05, "loss": 2.3384, "step": 26990 }, { "epoch": 0.23, "learning_rate": 8.753639393990604e-05, "loss": 2.3599, "step": 26995 }, { "epoch": 0.23, "learning_rate": 8.753196230276288e-05, "loss": 2.3152, "step": 27000 }, { "epoch": 0.23, "learning_rate": 8.75275299901108e-05, "loss": 2.3679, "step": 27005 }, { "epoch": 0.23, "learning_rate": 8.752309700202959e-05, "loss": 2.2504, "step": 27010 }, { "epoch": 0.23, "learning_rate": 8.7518663338599e-05, "loss": 2.3121, "step": 27015 }, { "epoch": 0.23, "learning_rate": 8.751422899989887e-05, "loss": 2.3631, "step": 27020 }, { "epoch": 0.23, "learning_rate": 8.750979398600898e-05, "loss": 2.3868, "step": 27025 }, { "epoch": 0.23, "learning_rate": 8.750535829700918e-05, "loss": 2.3037, "step": 27030 }, { "epoch": 0.23, "learning_rate": 8.750092193297927e-05, "loss": 2.2721, "step": 27035 }, { "epoch": 0.23, "learning_rate": 8.749648489399913e-05, "loss": 2.2667, "step": 27040 }, { "epoch": 0.23, "learning_rate": 8.749204718014859e-05, "loss": 2.3552, "step": 27045 }, { "epoch": 0.23, "learning_rate": 8.748760879150755e-05, "loss": 2.2966, "step": 27050 }, { "epoch": 0.23, "learning_rate": 8.748316972815586e-05, "loss": 2.3426, "step": 27055 }, { "epoch": 0.23, "learning_rate": 8.747872999017346e-05, "loss": 2.3172, "step": 27060 }, { "epoch": 0.23, "learning_rate": 8.747428957764021e-05, "loss": 2.2459, "step": 27065 }, { "epoch": 0.23, "learning_rate": 8.746984849063607e-05, "loss": 2.378, "step": 27070 }, { "epoch": 0.23, "learning_rate": 8.746540672924093e-05, "loss": 2.336, "step": 27075 }, { "epoch": 0.23, "learning_rate": 8.746096429353476e-05, "loss": 2.2877, "step": 27080 }, { "epoch": 0.23, "learning_rate": 8.745652118359752e-05, "loss": 2.3525, "step": 27085 }, { "epoch": 0.23, "learning_rate": 8.745207739950915e-05, "loss": 2.4081, "step": 27090 }, { "epoch": 0.23, "learning_rate": 8.744763294134969e-05, "loss": 2.2741, "step": 27095 }, { "epoch": 0.23, "learning_rate": 8.744318780919907e-05, "loss": 2.3205, "step": 27100 }, { "epoch": 0.23, "learning_rate": 8.74387420031373e-05, "loss": 2.3375, "step": 27105 }, { "epoch": 0.23, "learning_rate": 8.743429552324444e-05, "loss": 2.3517, "step": 27110 }, { "epoch": 0.23, "learning_rate": 8.74298483696005e-05, "loss": 2.3259, "step": 27115 }, { "epoch": 0.23, "learning_rate": 8.74254005422855e-05, "loss": 2.4193, "step": 27120 }, { "epoch": 0.23, "learning_rate": 8.74209520413795e-05, "loss": 2.3272, "step": 27125 }, { "epoch": 0.23, "learning_rate": 8.741650286696258e-05, "loss": 2.3515, "step": 27130 }, { "epoch": 0.23, "learning_rate": 8.74120530191148e-05, "loss": 2.4112, "step": 27135 }, { "epoch": 0.23, "learning_rate": 8.740760249791628e-05, "loss": 2.2921, "step": 27140 }, { "epoch": 0.23, "learning_rate": 8.740315130344707e-05, "loss": 2.341, "step": 27145 }, { "epoch": 0.23, "learning_rate": 8.739869943578733e-05, "loss": 2.3504, "step": 27150 }, { "epoch": 0.23, "learning_rate": 8.739424689501718e-05, "loss": 2.3451, "step": 27155 }, { "epoch": 0.23, "learning_rate": 8.738979368121674e-05, "loss": 2.3499, "step": 27160 }, { "epoch": 0.23, "learning_rate": 8.738533979446614e-05, "loss": 2.3032, "step": 27165 }, { "epoch": 0.23, "learning_rate": 8.73808852348456e-05, "loss": 2.422, "step": 27170 }, { "epoch": 0.23, "learning_rate": 8.737643000243525e-05, "loss": 2.3158, "step": 27175 }, { "epoch": 0.23, "learning_rate": 8.73719740973153e-05, "loss": 2.342, "step": 27180 }, { "epoch": 0.23, "learning_rate": 8.736751751956594e-05, "loss": 2.303, "step": 27185 }, { "epoch": 0.23, "learning_rate": 8.736306026926737e-05, "loss": 2.3569, "step": 27190 }, { "epoch": 0.23, "learning_rate": 8.735860234649983e-05, "loss": 2.268, "step": 27195 }, { "epoch": 0.23, "learning_rate": 8.735414375134354e-05, "loss": 2.2314, "step": 27200 }, { "epoch": 0.23, "learning_rate": 8.734968448387875e-05, "loss": 2.3129, "step": 27205 }, { "epoch": 0.23, "learning_rate": 8.734522454418572e-05, "loss": 2.2971, "step": 27210 }, { "epoch": 0.23, "learning_rate": 8.734076393234474e-05, "loss": 2.3131, "step": 27215 }, { "epoch": 0.23, "learning_rate": 8.733630264843606e-05, "loss": 2.2662, "step": 27220 }, { "epoch": 0.23, "learning_rate": 8.733184069253999e-05, "loss": 2.361, "step": 27225 }, { "epoch": 0.23, "learning_rate": 8.732737806473685e-05, "loss": 2.2297, "step": 27230 }, { "epoch": 0.23, "learning_rate": 8.732291476510694e-05, "loss": 2.353, "step": 27235 }, { "epoch": 0.23, "learning_rate": 8.73184507937306e-05, "loss": 2.3396, "step": 27240 }, { "epoch": 0.23, "learning_rate": 8.731398615068818e-05, "loss": 2.2641, "step": 27245 }, { "epoch": 0.23, "learning_rate": 8.730952083606e-05, "loss": 2.3037, "step": 27250 }, { "epoch": 0.23, "learning_rate": 8.73050548499265e-05, "loss": 2.355, "step": 27255 }, { "epoch": 0.23, "learning_rate": 8.730058819236799e-05, "loss": 2.2985, "step": 27260 }, { "epoch": 0.23, "learning_rate": 8.729612086346489e-05, "loss": 2.3467, "step": 27265 }, { "epoch": 0.23, "learning_rate": 8.729165286329762e-05, "loss": 2.3008, "step": 27270 }, { "epoch": 0.23, "learning_rate": 8.728718419194655e-05, "loss": 2.3509, "step": 27275 }, { "epoch": 0.23, "learning_rate": 8.728271484949215e-05, "loss": 2.2402, "step": 27280 }, { "epoch": 0.23, "learning_rate": 8.727824483601485e-05, "loss": 2.3902, "step": 27285 }, { "epoch": 0.23, "learning_rate": 8.72737741515951e-05, "loss": 2.3228, "step": 27290 }, { "epoch": 0.23, "learning_rate": 8.726930279631335e-05, "loss": 2.3427, "step": 27295 }, { "epoch": 0.23, "learning_rate": 8.72648307702501e-05, "loss": 2.3253, "step": 27300 }, { "epoch": 0.23, "learning_rate": 8.726035807348582e-05, "loss": 2.2602, "step": 27305 }, { "epoch": 0.23, "learning_rate": 8.725588470610104e-05, "loss": 2.2982, "step": 27310 }, { "epoch": 0.23, "learning_rate": 8.725141066817623e-05, "loss": 2.3644, "step": 27315 }, { "epoch": 0.23, "learning_rate": 8.724693595979197e-05, "loss": 2.3304, "step": 27320 }, { "epoch": 0.23, "learning_rate": 8.724246058102872e-05, "loss": 2.3136, "step": 27325 }, { "epoch": 0.23, "learning_rate": 8.723798453196709e-05, "loss": 2.2672, "step": 27330 }, { "epoch": 0.23, "learning_rate": 8.723350781268763e-05, "loss": 2.2494, "step": 27335 }, { "epoch": 0.23, "learning_rate": 8.72290304232709e-05, "loss": 2.2862, "step": 27340 }, { "epoch": 0.23, "learning_rate": 8.72245523637975e-05, "loss": 2.3528, "step": 27345 }, { "epoch": 0.23, "learning_rate": 8.7220073634348e-05, "loss": 2.3059, "step": 27350 }, { "epoch": 0.23, "learning_rate": 8.721559423500305e-05, "loss": 2.318, "step": 27355 }, { "epoch": 0.23, "learning_rate": 8.721111416584324e-05, "loss": 2.3331, "step": 27360 }, { "epoch": 0.23, "learning_rate": 8.720663342694922e-05, "loss": 2.4293, "step": 27365 }, { "epoch": 0.23, "learning_rate": 8.72021520184016e-05, "loss": 2.4036, "step": 27370 }, { "epoch": 0.23, "learning_rate": 8.719766994028109e-05, "loss": 2.3482, "step": 27375 }, { "epoch": 0.23, "learning_rate": 8.719318719266834e-05, "loss": 2.311, "step": 27380 }, { "epoch": 0.23, "learning_rate": 8.718870377564401e-05, "loss": 2.3608, "step": 27385 }, { "epoch": 0.23, "learning_rate": 8.71842196892888e-05, "loss": 2.3343, "step": 27390 }, { "epoch": 0.23, "learning_rate": 8.717973493368345e-05, "loss": 2.3697, "step": 27395 }, { "epoch": 0.23, "learning_rate": 8.717524950890863e-05, "loss": 2.362, "step": 27400 }, { "epoch": 0.23, "learning_rate": 8.717076341504511e-05, "loss": 2.3567, "step": 27405 }, { "epoch": 0.23, "learning_rate": 8.716627665217362e-05, "loss": 2.3286, "step": 27410 }, { "epoch": 0.23, "learning_rate": 8.716178922037489e-05, "loss": 2.3426, "step": 27415 }, { "epoch": 0.23, "learning_rate": 8.715730111972972e-05, "loss": 2.3416, "step": 27420 }, { "epoch": 0.23, "learning_rate": 8.715281235031886e-05, "loss": 2.3805, "step": 27425 }, { "epoch": 0.23, "learning_rate": 8.714832291222312e-05, "loss": 2.3362, "step": 27430 }, { "epoch": 0.23, "learning_rate": 8.714383280552329e-05, "loss": 2.4035, "step": 27435 }, { "epoch": 0.23, "learning_rate": 8.713934203030018e-05, "loss": 2.2852, "step": 27440 }, { "epoch": 0.23, "learning_rate": 8.713485058663464e-05, "loss": 2.37, "step": 27445 }, { "epoch": 0.23, "learning_rate": 8.713035847460748e-05, "loss": 2.2501, "step": 27450 }, { "epoch": 0.23, "learning_rate": 8.712586569429957e-05, "loss": 2.3357, "step": 27455 }, { "epoch": 0.23, "learning_rate": 8.712137224579175e-05, "loss": 2.4689, "step": 27460 }, { "epoch": 0.23, "learning_rate": 8.711687812916492e-05, "loss": 2.3633, "step": 27465 }, { "epoch": 0.23, "learning_rate": 8.711238334449996e-05, "loss": 2.288, "step": 27470 }, { "epoch": 0.23, "learning_rate": 8.710788789187774e-05, "loss": 2.2722, "step": 27475 }, { "epoch": 0.23, "learning_rate": 8.710339177137922e-05, "loss": 2.4025, "step": 27480 }, { "epoch": 0.23, "learning_rate": 8.709889498308528e-05, "loss": 2.3209, "step": 27485 }, { "epoch": 0.23, "learning_rate": 8.709439752707687e-05, "loss": 2.3776, "step": 27490 }, { "epoch": 0.23, "learning_rate": 8.708989940343494e-05, "loss": 2.2698, "step": 27495 }, { "epoch": 0.23, "learning_rate": 8.708540061224044e-05, "loss": 2.3255, "step": 27500 }, { "epoch": 0.23, "learning_rate": 8.708090115357434e-05, "loss": 2.2695, "step": 27505 }, { "epoch": 0.23, "learning_rate": 8.707640102751764e-05, "loss": 2.3228, "step": 27510 }, { "epoch": 0.23, "learning_rate": 8.707190023415131e-05, "loss": 2.2834, "step": 27515 }, { "epoch": 0.23, "learning_rate": 8.706739877355637e-05, "loss": 2.2692, "step": 27520 }, { "epoch": 0.23, "learning_rate": 8.706289664581382e-05, "loss": 2.3302, "step": 27525 }, { "epoch": 0.23, "learning_rate": 8.705839385100471e-05, "loss": 2.3898, "step": 27530 }, { "epoch": 0.23, "learning_rate": 8.70538903892101e-05, "loss": 2.3047, "step": 27535 }, { "epoch": 0.24, "learning_rate": 8.7049386260511e-05, "loss": 2.3204, "step": 27540 }, { "epoch": 0.24, "learning_rate": 8.704488146498851e-05, "loss": 2.3652, "step": 27545 }, { "epoch": 0.24, "learning_rate": 8.70403760027237e-05, "loss": 2.3611, "step": 27550 }, { "epoch": 0.24, "learning_rate": 8.703586987379765e-05, "loss": 2.3599, "step": 27555 }, { "epoch": 0.24, "learning_rate": 8.703136307829147e-05, "loss": 2.3593, "step": 27560 }, { "epoch": 0.24, "learning_rate": 8.702685561628628e-05, "loss": 2.3549, "step": 27565 }, { "epoch": 0.24, "learning_rate": 8.702234748786319e-05, "loss": 2.4016, "step": 27570 }, { "epoch": 0.24, "learning_rate": 8.701783869310335e-05, "loss": 2.3412, "step": 27575 }, { "epoch": 0.24, "learning_rate": 8.701332923208791e-05, "loss": 2.2373, "step": 27580 }, { "epoch": 0.24, "learning_rate": 8.700881910489805e-05, "loss": 2.3053, "step": 27585 }, { "epoch": 0.24, "learning_rate": 8.70043083116149e-05, "loss": 2.2703, "step": 27590 }, { "epoch": 0.24, "learning_rate": 8.699979685231968e-05, "loss": 2.3666, "step": 27595 }, { "epoch": 0.24, "learning_rate": 8.699528472709358e-05, "loss": 2.3503, "step": 27600 }, { "epoch": 0.24, "learning_rate": 8.699077193601781e-05, "loss": 2.3558, "step": 27605 }, { "epoch": 0.24, "learning_rate": 8.698625847917358e-05, "loss": 2.3197, "step": 27610 }, { "epoch": 0.24, "learning_rate": 8.698174435664217e-05, "loss": 2.3394, "step": 27615 }, { "epoch": 0.24, "learning_rate": 8.697722956850478e-05, "loss": 2.4157, "step": 27620 }, { "epoch": 0.24, "learning_rate": 8.697271411484266e-05, "loss": 2.3906, "step": 27625 }, { "epoch": 0.24, "learning_rate": 8.696819799573713e-05, "loss": 2.3589, "step": 27630 }, { "epoch": 0.24, "learning_rate": 8.696368121126943e-05, "loss": 2.3147, "step": 27635 }, { "epoch": 0.24, "learning_rate": 8.695916376152087e-05, "loss": 2.3231, "step": 27640 }, { "epoch": 0.24, "learning_rate": 8.695464564657274e-05, "loss": 2.3919, "step": 27645 }, { "epoch": 0.24, "learning_rate": 8.695012686650638e-05, "loss": 2.3055, "step": 27650 }, { "epoch": 0.24, "learning_rate": 8.694560742140314e-05, "loss": 2.2706, "step": 27655 }, { "epoch": 0.24, "learning_rate": 8.694108731134429e-05, "loss": 2.3036, "step": 27660 }, { "epoch": 0.24, "learning_rate": 8.693656653641126e-05, "loss": 2.364, "step": 27665 }, { "epoch": 0.24, "learning_rate": 8.693204509668538e-05, "loss": 2.4054, "step": 27670 }, { "epoch": 0.24, "learning_rate": 8.692752299224801e-05, "loss": 2.3102, "step": 27675 }, { "epoch": 0.24, "learning_rate": 8.692300022318059e-05, "loss": 2.343, "step": 27680 }, { "epoch": 0.24, "learning_rate": 8.691847678956446e-05, "loss": 2.2602, "step": 27685 }, { "epoch": 0.24, "learning_rate": 8.69139526914811e-05, "loss": 2.343, "step": 27690 }, { "epoch": 0.24, "learning_rate": 8.690942792901189e-05, "loss": 2.308, "step": 27695 }, { "epoch": 0.24, "learning_rate": 8.690490250223829e-05, "loss": 2.4132, "step": 27700 }, { "epoch": 0.24, "learning_rate": 8.690037641124172e-05, "loss": 2.3212, "step": 27705 }, { "epoch": 0.24, "learning_rate": 8.689584965610367e-05, "loss": 2.3029, "step": 27710 }, { "epoch": 0.24, "learning_rate": 8.689132223690562e-05, "loss": 2.2771, "step": 27715 }, { "epoch": 0.24, "learning_rate": 8.688679415372902e-05, "loss": 2.3485, "step": 27720 }, { "epoch": 0.24, "learning_rate": 8.68822654066554e-05, "loss": 2.415, "step": 27725 }, { "epoch": 0.24, "learning_rate": 8.687773599576626e-05, "loss": 2.3585, "step": 27730 }, { "epoch": 0.24, "learning_rate": 8.687320592114311e-05, "loss": 2.3126, "step": 27735 }, { "epoch": 0.24, "learning_rate": 8.686867518286751e-05, "loss": 2.2852, "step": 27740 }, { "epoch": 0.24, "learning_rate": 8.686414378102097e-05, "loss": 2.3597, "step": 27745 }, { "epoch": 0.24, "learning_rate": 8.685961171568508e-05, "loss": 2.3323, "step": 27750 }, { "epoch": 0.24, "learning_rate": 8.685507898694139e-05, "loss": 2.2633, "step": 27755 }, { "epoch": 0.24, "learning_rate": 8.685054559487148e-05, "loss": 2.2879, "step": 27760 }, { "epoch": 0.24, "learning_rate": 8.684601153955696e-05, "loss": 2.3401, "step": 27765 }, { "epoch": 0.24, "learning_rate": 8.684147682107941e-05, "loss": 2.3365, "step": 27770 }, { "epoch": 0.24, "learning_rate": 8.683694143952046e-05, "loss": 2.2852, "step": 27775 }, { "epoch": 0.24, "learning_rate": 8.683240539496175e-05, "loss": 2.3696, "step": 27780 }, { "epoch": 0.24, "learning_rate": 8.682786868748492e-05, "loss": 2.3703, "step": 27785 }, { "epoch": 0.24, "learning_rate": 8.682333131717159e-05, "loss": 2.307, "step": 27790 }, { "epoch": 0.24, "learning_rate": 8.681879328410347e-05, "loss": 2.3758, "step": 27795 }, { "epoch": 0.24, "learning_rate": 8.681425458836219e-05, "loss": 2.3759, "step": 27800 }, { "epoch": 0.24, "learning_rate": 8.680971523002947e-05, "loss": 2.3071, "step": 27805 }, { "epoch": 0.24, "learning_rate": 8.680517520918701e-05, "loss": 2.3374, "step": 27810 }, { "epoch": 0.24, "learning_rate": 8.680063452591652e-05, "loss": 2.325, "step": 27815 }, { "epoch": 0.24, "learning_rate": 8.679609318029971e-05, "loss": 2.3047, "step": 27820 }, { "epoch": 0.24, "learning_rate": 8.679155117241832e-05, "loss": 2.3072, "step": 27825 }, { "epoch": 0.24, "learning_rate": 8.678700850235413e-05, "loss": 2.3298, "step": 27830 }, { "epoch": 0.24, "learning_rate": 8.678246517018884e-05, "loss": 2.2842, "step": 27835 }, { "epoch": 0.24, "learning_rate": 8.677792117600428e-05, "loss": 2.3593, "step": 27840 }, { "epoch": 0.24, "learning_rate": 8.67733765198822e-05, "loss": 2.313, "step": 27845 }, { "epoch": 0.24, "learning_rate": 8.67688312019044e-05, "loss": 2.3309, "step": 27850 }, { "epoch": 0.24, "learning_rate": 8.67642852221527e-05, "loss": 2.2617, "step": 27855 }, { "epoch": 0.24, "learning_rate": 8.675973858070892e-05, "loss": 2.2793, "step": 27860 }, { "epoch": 0.24, "learning_rate": 8.675519127765488e-05, "loss": 2.3335, "step": 27865 }, { "epoch": 0.24, "learning_rate": 8.675064331307242e-05, "loss": 2.3052, "step": 27870 }, { "epoch": 0.24, "learning_rate": 8.67460946870434e-05, "loss": 2.2963, "step": 27875 }, { "epoch": 0.24, "learning_rate": 8.674154539964971e-05, "loss": 2.4229, "step": 27880 }, { "epoch": 0.24, "learning_rate": 8.67369954509732e-05, "loss": 2.3877, "step": 27885 }, { "epoch": 0.24, "learning_rate": 8.673244484109574e-05, "loss": 2.2836, "step": 27890 }, { "epoch": 0.24, "learning_rate": 8.672789357009931e-05, "loss": 2.3669, "step": 27895 }, { "epoch": 0.24, "learning_rate": 8.672334163806577e-05, "loss": 2.3121, "step": 27900 }, { "epoch": 0.24, "learning_rate": 8.671878904507704e-05, "loss": 2.2901, "step": 27905 }, { "epoch": 0.24, "learning_rate": 8.671423579121507e-05, "loss": 2.3921, "step": 27910 }, { "epoch": 0.24, "learning_rate": 8.670968187656182e-05, "loss": 2.339, "step": 27915 }, { "epoch": 0.24, "learning_rate": 8.670512730119925e-05, "loss": 2.413, "step": 27920 }, { "epoch": 0.24, "learning_rate": 8.670057206520934e-05, "loss": 2.3212, "step": 27925 }, { "epoch": 0.24, "learning_rate": 8.669601616867405e-05, "loss": 2.2936, "step": 27930 }, { "epoch": 0.24, "learning_rate": 8.669145961167539e-05, "loss": 2.3499, "step": 27935 }, { "epoch": 0.24, "learning_rate": 8.66869023942954e-05, "loss": 2.3364, "step": 27940 }, { "epoch": 0.24, "learning_rate": 8.668234451661605e-05, "loss": 2.3077, "step": 27945 }, { "epoch": 0.24, "learning_rate": 8.667778597871943e-05, "loss": 2.3295, "step": 27950 }, { "epoch": 0.24, "learning_rate": 8.667322678068752e-05, "loss": 2.2907, "step": 27955 }, { "epoch": 0.24, "learning_rate": 8.666866692260245e-05, "loss": 2.3856, "step": 27960 }, { "epoch": 0.24, "learning_rate": 8.666410640454623e-05, "loss": 2.3044, "step": 27965 }, { "epoch": 0.24, "learning_rate": 8.665954522660097e-05, "loss": 2.3106, "step": 27970 }, { "epoch": 0.24, "learning_rate": 8.665498338884876e-05, "loss": 2.2884, "step": 27975 }, { "epoch": 0.24, "learning_rate": 8.66504208913717e-05, "loss": 2.3766, "step": 27980 }, { "epoch": 0.24, "learning_rate": 8.66458577342519e-05, "loss": 2.361, "step": 27985 }, { "epoch": 0.24, "learning_rate": 8.664129391757151e-05, "loss": 2.4138, "step": 27990 }, { "epoch": 0.24, "learning_rate": 8.663672944141266e-05, "loss": 2.2947, "step": 27995 }, { "epoch": 0.24, "learning_rate": 8.66321643058575e-05, "loss": 2.3011, "step": 28000 }, { "epoch": 0.24, "learning_rate": 8.662759851098819e-05, "loss": 2.3211, "step": 28005 }, { "epoch": 0.24, "learning_rate": 8.66230320568869e-05, "loss": 2.3329, "step": 28010 }, { "epoch": 0.24, "learning_rate": 8.661846494363585e-05, "loss": 2.3988, "step": 28015 }, { "epoch": 0.24, "learning_rate": 8.661389717131722e-05, "loss": 2.3489, "step": 28020 }, { "epoch": 0.24, "learning_rate": 8.660932874001322e-05, "loss": 2.38, "step": 28025 }, { "epoch": 0.24, "learning_rate": 8.660475964980607e-05, "loss": 2.3772, "step": 28030 }, { "epoch": 0.24, "learning_rate": 8.660018990077801e-05, "loss": 2.3899, "step": 28035 }, { "epoch": 0.24, "learning_rate": 8.659561949301129e-05, "loss": 2.3137, "step": 28040 }, { "epoch": 0.24, "learning_rate": 8.659104842658816e-05, "loss": 2.3405, "step": 28045 }, { "epoch": 0.24, "learning_rate": 8.658647670159091e-05, "loss": 2.2816, "step": 28050 }, { "epoch": 0.24, "learning_rate": 8.65819043181018e-05, "loss": 2.3744, "step": 28055 }, { "epoch": 0.24, "learning_rate": 8.657733127620316e-05, "loss": 2.3302, "step": 28060 }, { "epoch": 0.24, "learning_rate": 8.657275757597725e-05, "loss": 2.2937, "step": 28065 }, { "epoch": 0.24, "learning_rate": 8.656818321750642e-05, "loss": 2.3184, "step": 28070 }, { "epoch": 0.24, "learning_rate": 8.6563608200873e-05, "loss": 2.3834, "step": 28075 }, { "epoch": 0.24, "learning_rate": 8.65590325261593e-05, "loss": 2.3402, "step": 28080 }, { "epoch": 0.24, "learning_rate": 8.655445619344772e-05, "loss": 2.4245, "step": 28085 }, { "epoch": 0.24, "learning_rate": 8.654987920282059e-05, "loss": 2.2974, "step": 28090 }, { "epoch": 0.24, "learning_rate": 8.654530155436032e-05, "loss": 2.348, "step": 28095 }, { "epoch": 0.24, "learning_rate": 8.654072324814926e-05, "loss": 2.3093, "step": 28100 }, { "epoch": 0.24, "learning_rate": 8.653614428426983e-05, "loss": 2.2728, "step": 28105 }, { "epoch": 0.24, "learning_rate": 8.653156466280447e-05, "loss": 2.3146, "step": 28110 }, { "epoch": 0.24, "learning_rate": 8.652698438383557e-05, "loss": 2.4058, "step": 28115 }, { "epoch": 0.24, "learning_rate": 8.652240344744557e-05, "loss": 2.299, "step": 28120 }, { "epoch": 0.24, "learning_rate": 8.651782185371696e-05, "loss": 2.3617, "step": 28125 }, { "epoch": 0.24, "learning_rate": 8.651323960273214e-05, "loss": 2.3004, "step": 28130 }, { "epoch": 0.24, "learning_rate": 8.65086566945736e-05, "loss": 2.3902, "step": 28135 }, { "epoch": 0.24, "learning_rate": 8.650407312932384e-05, "loss": 2.3488, "step": 28140 }, { "epoch": 0.24, "learning_rate": 8.649948890706536e-05, "loss": 2.3752, "step": 28145 }, { "epoch": 0.24, "learning_rate": 8.649490402788065e-05, "loss": 2.3341, "step": 28150 }, { "epoch": 0.24, "learning_rate": 8.649031849185226e-05, "loss": 2.3315, "step": 28155 }, { "epoch": 0.24, "learning_rate": 8.648573229906267e-05, "loss": 2.3071, "step": 28160 }, { "epoch": 0.24, "learning_rate": 8.648114544959447e-05, "loss": 2.3704, "step": 28165 }, { "epoch": 0.24, "learning_rate": 8.647655794353018e-05, "loss": 2.3894, "step": 28170 }, { "epoch": 0.24, "learning_rate": 8.64719697809524e-05, "loss": 2.3039, "step": 28175 }, { "epoch": 0.24, "learning_rate": 8.646738096194368e-05, "loss": 2.4238, "step": 28180 }, { "epoch": 0.24, "learning_rate": 8.646279148658665e-05, "loss": 2.4052, "step": 28185 }, { "epoch": 0.24, "learning_rate": 8.645820135496388e-05, "loss": 2.3302, "step": 28190 }, { "epoch": 0.24, "learning_rate": 8.645361056715797e-05, "loss": 2.3731, "step": 28195 }, { "epoch": 0.24, "learning_rate": 8.644901912325158e-05, "loss": 2.3767, "step": 28200 }, { "epoch": 0.24, "learning_rate": 8.644442702332733e-05, "loss": 2.2888, "step": 28205 }, { "epoch": 0.24, "learning_rate": 8.643983426746787e-05, "loss": 2.3231, "step": 28210 }, { "epoch": 0.24, "learning_rate": 8.643524085575587e-05, "loss": 2.3764, "step": 28215 }, { "epoch": 0.24, "learning_rate": 8.643064678827402e-05, "loss": 2.3114, "step": 28220 }, { "epoch": 0.24, "learning_rate": 8.642605206510496e-05, "loss": 2.3161, "step": 28225 }, { "epoch": 0.24, "learning_rate": 8.642145668633142e-05, "loss": 2.3651, "step": 28230 }, { "epoch": 0.24, "learning_rate": 8.64168606520361e-05, "loss": 2.3651, "step": 28235 }, { "epoch": 0.24, "learning_rate": 8.641226396230171e-05, "loss": 2.2613, "step": 28240 }, { "epoch": 0.24, "learning_rate": 8.6407666617211e-05, "loss": 2.3383, "step": 28245 }, { "epoch": 0.24, "learning_rate": 8.640306861684671e-05, "loss": 2.2855, "step": 28250 }, { "epoch": 0.24, "learning_rate": 8.63984699612916e-05, "loss": 2.3449, "step": 28255 }, { "epoch": 0.24, "learning_rate": 8.63938706506284e-05, "loss": 2.3348, "step": 28260 }, { "epoch": 0.24, "learning_rate": 8.638927068493995e-05, "loss": 2.3972, "step": 28265 }, { "epoch": 0.24, "learning_rate": 8.6384670064309e-05, "loss": 2.4303, "step": 28270 }, { "epoch": 0.24, "learning_rate": 8.638006878881837e-05, "loss": 2.3986, "step": 28275 }, { "epoch": 0.24, "learning_rate": 8.637546685855085e-05, "loss": 2.3389, "step": 28280 }, { "epoch": 0.24, "learning_rate": 8.637086427358932e-05, "loss": 2.3578, "step": 28285 }, { "epoch": 0.24, "learning_rate": 8.636626103401655e-05, "loss": 2.3527, "step": 28290 }, { "epoch": 0.24, "learning_rate": 8.636165713991544e-05, "loss": 2.382, "step": 28295 }, { "epoch": 0.24, "learning_rate": 8.635705259136884e-05, "loss": 2.304, "step": 28300 }, { "epoch": 0.24, "learning_rate": 8.63524473884596e-05, "loss": 2.3451, "step": 28305 }, { "epoch": 0.24, "learning_rate": 8.634784153127064e-05, "loss": 2.3798, "step": 28310 }, { "epoch": 0.24, "learning_rate": 8.634323501988484e-05, "loss": 2.2789, "step": 28315 }, { "epoch": 0.24, "learning_rate": 8.633862785438511e-05, "loss": 2.3124, "step": 28320 }, { "epoch": 0.24, "learning_rate": 8.633402003485438e-05, "loss": 2.4011, "step": 28325 }, { "epoch": 0.24, "learning_rate": 8.632941156137558e-05, "loss": 2.3447, "step": 28330 }, { "epoch": 0.24, "learning_rate": 8.632480243403162e-05, "loss": 2.3286, "step": 28335 }, { "epoch": 0.24, "learning_rate": 8.632019265290551e-05, "loss": 2.3728, "step": 28340 }, { "epoch": 0.24, "learning_rate": 8.631558221808019e-05, "loss": 2.2979, "step": 28345 }, { "epoch": 0.24, "learning_rate": 8.631097112963864e-05, "loss": 2.3485, "step": 28350 }, { "epoch": 0.24, "learning_rate": 8.630635938766384e-05, "loss": 2.3912, "step": 28355 }, { "epoch": 0.24, "learning_rate": 8.630174699223883e-05, "loss": 2.3165, "step": 28360 }, { "epoch": 0.24, "learning_rate": 8.629713394344659e-05, "loss": 2.334, "step": 28365 }, { "epoch": 0.24, "learning_rate": 8.629252024137017e-05, "loss": 2.3871, "step": 28370 }, { "epoch": 0.24, "learning_rate": 8.628790588609259e-05, "loss": 2.3437, "step": 28375 }, { "epoch": 0.24, "learning_rate": 8.628329087769692e-05, "loss": 2.3778, "step": 28380 }, { "epoch": 0.24, "learning_rate": 8.627867521626618e-05, "loss": 2.3492, "step": 28385 }, { "epoch": 0.24, "learning_rate": 8.62740589018835e-05, "loss": 2.3966, "step": 28390 }, { "epoch": 0.24, "learning_rate": 8.626944193463194e-05, "loss": 2.25, "step": 28395 }, { "epoch": 0.24, "learning_rate": 8.626482431459458e-05, "loss": 2.3477, "step": 28400 }, { "epoch": 0.24, "learning_rate": 8.626020604185456e-05, "loss": 2.3181, "step": 28405 }, { "epoch": 0.24, "learning_rate": 8.625558711649497e-05, "loss": 2.3651, "step": 28410 }, { "epoch": 0.24, "learning_rate": 8.625096753859899e-05, "loss": 2.3747, "step": 28415 }, { "epoch": 0.24, "learning_rate": 8.624634730824969e-05, "loss": 2.2813, "step": 28420 }, { "epoch": 0.24, "learning_rate": 8.62417264255303e-05, "loss": 2.3696, "step": 28425 }, { "epoch": 0.24, "learning_rate": 8.623710489052394e-05, "loss": 2.3234, "step": 28430 }, { "epoch": 0.24, "learning_rate": 8.623248270331383e-05, "loss": 2.2818, "step": 28435 }, { "epoch": 0.24, "learning_rate": 8.62278598639831e-05, "loss": 2.2769, "step": 28440 }, { "epoch": 0.24, "learning_rate": 8.622323637261502e-05, "loss": 2.3356, "step": 28445 }, { "epoch": 0.24, "learning_rate": 8.621861222929277e-05, "loss": 2.3218, "step": 28450 }, { "epoch": 0.24, "learning_rate": 8.621398743409957e-05, "loss": 2.3323, "step": 28455 }, { "epoch": 0.24, "learning_rate": 8.620936198711868e-05, "loss": 2.3991, "step": 28460 }, { "epoch": 0.24, "learning_rate": 8.620473588843334e-05, "loss": 2.3493, "step": 28465 }, { "epoch": 0.24, "learning_rate": 8.620010913812681e-05, "loss": 2.3778, "step": 28470 }, { "epoch": 0.24, "learning_rate": 8.619548173628236e-05, "loss": 2.3341, "step": 28475 }, { "epoch": 0.24, "learning_rate": 8.619085368298327e-05, "loss": 2.3455, "step": 28480 }, { "epoch": 0.24, "learning_rate": 8.618622497831285e-05, "loss": 2.3671, "step": 28485 }, { "epoch": 0.24, "learning_rate": 8.618159562235441e-05, "loss": 2.4057, "step": 28490 }, { "epoch": 0.24, "learning_rate": 8.617696561519126e-05, "loss": 2.3336, "step": 28495 }, { "epoch": 0.24, "learning_rate": 8.617233495690675e-05, "loss": 2.3221, "step": 28500 }, { "epoch": 0.24, "learning_rate": 8.61677036475842e-05, "loss": 2.3727, "step": 28505 }, { "epoch": 0.24, "learning_rate": 8.616307168730698e-05, "loss": 2.3354, "step": 28510 }, { "epoch": 0.24, "learning_rate": 8.615843907615844e-05, "loss": 2.4195, "step": 28515 }, { "epoch": 0.24, "learning_rate": 8.615380581422199e-05, "loss": 2.3392, "step": 28520 }, { "epoch": 0.24, "learning_rate": 8.614917190158099e-05, "loss": 2.2908, "step": 28525 }, { "epoch": 0.24, "learning_rate": 8.614453733831887e-05, "loss": 2.4039, "step": 28530 }, { "epoch": 0.24, "learning_rate": 8.613990212451902e-05, "loss": 2.4119, "step": 28535 }, { "epoch": 0.24, "learning_rate": 8.613526626026485e-05, "loss": 2.3221, "step": 28540 }, { "epoch": 0.24, "learning_rate": 8.613062974563985e-05, "loss": 2.3207, "step": 28545 }, { "epoch": 0.24, "learning_rate": 8.612599258072741e-05, "loss": 2.2836, "step": 28550 }, { "epoch": 0.24, "learning_rate": 8.612135476561105e-05, "loss": 2.3269, "step": 28555 }, { "epoch": 0.24, "learning_rate": 8.611671630037421e-05, "loss": 2.3437, "step": 28560 }, { "epoch": 0.24, "learning_rate": 8.611207718510037e-05, "loss": 2.3464, "step": 28565 }, { "epoch": 0.24, "learning_rate": 8.610743741987304e-05, "loss": 2.2398, "step": 28570 }, { "epoch": 0.24, "learning_rate": 8.610279700477573e-05, "loss": 2.31, "step": 28575 }, { "epoch": 0.24, "learning_rate": 8.609815593989193e-05, "loss": 2.3943, "step": 28580 }, { "epoch": 0.24, "learning_rate": 8.609351422530519e-05, "loss": 2.3857, "step": 28585 }, { "epoch": 0.24, "learning_rate": 8.608887186109906e-05, "loss": 2.3694, "step": 28590 }, { "epoch": 0.24, "learning_rate": 8.608422884735709e-05, "loss": 2.2925, "step": 28595 }, { "epoch": 0.24, "learning_rate": 8.607958518416286e-05, "loss": 2.3724, "step": 28600 }, { "epoch": 0.24, "learning_rate": 8.607494087159991e-05, "loss": 2.3563, "step": 28605 }, { "epoch": 0.24, "learning_rate": 8.607029590975187e-05, "loss": 2.3315, "step": 28610 }, { "epoch": 0.24, "learning_rate": 8.606565029870231e-05, "loss": 2.2485, "step": 28615 }, { "epoch": 0.24, "learning_rate": 8.606100403853485e-05, "loss": 2.3204, "step": 28620 }, { "epoch": 0.24, "learning_rate": 8.605635712933314e-05, "loss": 2.2361, "step": 28625 }, { "epoch": 0.24, "learning_rate": 8.605170957118078e-05, "loss": 2.317, "step": 28630 }, { "epoch": 0.24, "learning_rate": 8.604706136416143e-05, "loss": 2.3498, "step": 28635 }, { "epoch": 0.24, "learning_rate": 8.604241250835876e-05, "loss": 2.3274, "step": 28640 }, { "epoch": 0.24, "learning_rate": 8.603776300385644e-05, "loss": 2.383, "step": 28645 }, { "epoch": 0.24, "learning_rate": 8.603311285073813e-05, "loss": 2.275, "step": 28650 }, { "epoch": 0.24, "learning_rate": 8.602846204908757e-05, "loss": 2.3454, "step": 28655 }, { "epoch": 0.24, "learning_rate": 8.60238105989884e-05, "loss": 2.341, "step": 28660 }, { "epoch": 0.24, "learning_rate": 8.60191585005244e-05, "loss": 2.4038, "step": 28665 }, { "epoch": 0.24, "learning_rate": 8.601450575377928e-05, "loss": 2.4101, "step": 28670 }, { "epoch": 0.24, "learning_rate": 8.600985235883676e-05, "loss": 2.4148, "step": 28675 }, { "epoch": 0.24, "learning_rate": 8.600519831578063e-05, "loss": 2.3171, "step": 28680 }, { "epoch": 0.24, "learning_rate": 8.600054362469462e-05, "loss": 2.333, "step": 28685 }, { "epoch": 0.24, "learning_rate": 8.599588828566252e-05, "loss": 2.3586, "step": 28690 }, { "epoch": 0.24, "learning_rate": 8.599123229876814e-05, "loss": 2.3741, "step": 28695 }, { "epoch": 0.24, "learning_rate": 8.598657566409522e-05, "loss": 2.2841, "step": 28700 }, { "epoch": 0.24, "learning_rate": 8.598191838172763e-05, "loss": 2.3549, "step": 28705 }, { "epoch": 0.24, "learning_rate": 8.597726045174916e-05, "loss": 2.3693, "step": 28710 }, { "epoch": 0.25, "learning_rate": 8.597260187424368e-05, "loss": 2.3574, "step": 28715 }, { "epoch": 0.25, "learning_rate": 8.596794264929499e-05, "loss": 2.268, "step": 28720 }, { "epoch": 0.25, "learning_rate": 8.596328277698698e-05, "loss": 2.2248, "step": 28725 }, { "epoch": 0.25, "learning_rate": 8.595862225740351e-05, "loss": 2.3262, "step": 28730 }, { "epoch": 0.25, "learning_rate": 8.595396109062845e-05, "loss": 2.3251, "step": 28735 }, { "epoch": 0.25, "learning_rate": 8.594929927674572e-05, "loss": 2.4234, "step": 28740 }, { "epoch": 0.25, "learning_rate": 8.59446368158392e-05, "loss": 2.3687, "step": 28745 }, { "epoch": 0.25, "learning_rate": 8.593997370799282e-05, "loss": 2.3566, "step": 28750 }, { "epoch": 0.25, "learning_rate": 8.593530995329049e-05, "loss": 2.3764, "step": 28755 }, { "epoch": 0.25, "learning_rate": 8.593064555181617e-05, "loss": 2.3765, "step": 28760 }, { "epoch": 0.25, "learning_rate": 8.592598050365379e-05, "loss": 2.2209, "step": 28765 }, { "epoch": 0.25, "learning_rate": 8.592131480888734e-05, "loss": 2.3219, "step": 28770 }, { "epoch": 0.25, "learning_rate": 8.591664846760077e-05, "loss": 2.3428, "step": 28775 }, { "epoch": 0.25, "learning_rate": 8.591198147987808e-05, "loss": 2.3171, "step": 28780 }, { "epoch": 0.25, "learning_rate": 8.590731384580324e-05, "loss": 2.3984, "step": 28785 }, { "epoch": 0.25, "learning_rate": 8.590264556546032e-05, "loss": 2.3387, "step": 28790 }, { "epoch": 0.25, "learning_rate": 8.589797663893328e-05, "loss": 2.353, "step": 28795 }, { "epoch": 0.25, "learning_rate": 8.589330706630618e-05, "loss": 2.3567, "step": 28800 }, { "epoch": 0.25, "learning_rate": 8.588863684766305e-05, "loss": 2.3204, "step": 28805 }, { "epoch": 0.25, "learning_rate": 8.588396598308796e-05, "loss": 2.2706, "step": 28810 }, { "epoch": 0.25, "learning_rate": 8.587929447266496e-05, "loss": 2.4131, "step": 28815 }, { "epoch": 0.25, "learning_rate": 8.587462231647816e-05, "loss": 2.3634, "step": 28820 }, { "epoch": 0.25, "learning_rate": 8.586994951461163e-05, "loss": 2.4199, "step": 28825 }, { "epoch": 0.25, "learning_rate": 8.586527606714945e-05, "loss": 2.3305, "step": 28830 }, { "epoch": 0.25, "learning_rate": 8.586060197417578e-05, "loss": 2.3645, "step": 28835 }, { "epoch": 0.25, "learning_rate": 8.585592723577472e-05, "loss": 2.3458, "step": 28840 }, { "epoch": 0.25, "learning_rate": 8.58512518520304e-05, "loss": 2.2338, "step": 28845 }, { "epoch": 0.25, "learning_rate": 8.584657582302697e-05, "loss": 2.3288, "step": 28850 }, { "epoch": 0.25, "learning_rate": 8.584189914884862e-05, "loss": 2.421, "step": 28855 }, { "epoch": 0.25, "learning_rate": 8.58372218295795e-05, "loss": 2.3086, "step": 28860 }, { "epoch": 0.25, "learning_rate": 8.583254386530377e-05, "loss": 2.3944, "step": 28865 }, { "epoch": 0.25, "learning_rate": 8.582786525610567e-05, "loss": 2.3388, "step": 28870 }, { "epoch": 0.25, "learning_rate": 8.582318600206937e-05, "loss": 2.3029, "step": 28875 }, { "epoch": 0.25, "learning_rate": 8.581850610327911e-05, "loss": 2.2746, "step": 28880 }, { "epoch": 0.25, "learning_rate": 8.581382555981913e-05, "loss": 2.333, "step": 28885 }, { "epoch": 0.25, "learning_rate": 8.580914437177363e-05, "loss": 2.2872, "step": 28890 }, { "epoch": 0.25, "learning_rate": 8.58044625392269e-05, "loss": 2.4, "step": 28895 }, { "epoch": 0.25, "learning_rate": 8.579978006226319e-05, "loss": 2.3097, "step": 28900 }, { "epoch": 0.25, "learning_rate": 8.579509694096678e-05, "loss": 2.249, "step": 28905 }, { "epoch": 0.25, "learning_rate": 8.579041317542197e-05, "loss": 2.388, "step": 28910 }, { "epoch": 0.25, "learning_rate": 8.578572876571302e-05, "loss": 2.4453, "step": 28915 }, { "epoch": 0.25, "learning_rate": 8.578104371192428e-05, "loss": 2.3304, "step": 28920 }, { "epoch": 0.25, "learning_rate": 8.577635801414008e-05, "loss": 2.2692, "step": 28925 }, { "epoch": 0.25, "learning_rate": 8.57716716724447e-05, "loss": 2.2616, "step": 28930 }, { "epoch": 0.25, "learning_rate": 8.576698468692254e-05, "loss": 2.3491, "step": 28935 }, { "epoch": 0.25, "learning_rate": 8.576229705765794e-05, "loss": 2.37, "step": 28940 }, { "epoch": 0.25, "learning_rate": 8.575760878473527e-05, "loss": 2.3181, "step": 28945 }, { "epoch": 0.25, "learning_rate": 8.57529198682389e-05, "loss": 2.3737, "step": 28950 }, { "epoch": 0.25, "learning_rate": 8.574823030825323e-05, "loss": 2.2608, "step": 28955 }, { "epoch": 0.25, "learning_rate": 8.574354010486266e-05, "loss": 2.3687, "step": 28960 }, { "epoch": 0.25, "learning_rate": 8.573884925815161e-05, "loss": 2.3802, "step": 28965 }, { "epoch": 0.25, "learning_rate": 8.573415776820451e-05, "loss": 2.3436, "step": 28970 }, { "epoch": 0.25, "learning_rate": 8.57294656351058e-05, "loss": 2.3659, "step": 28975 }, { "epoch": 0.25, "learning_rate": 8.572477285893991e-05, "loss": 2.4256, "step": 28980 }, { "epoch": 0.25, "learning_rate": 8.572007943979132e-05, "loss": 2.3332, "step": 28985 }, { "epoch": 0.25, "learning_rate": 8.57153853777445e-05, "loss": 2.3201, "step": 28990 }, { "epoch": 0.25, "learning_rate": 8.571069067288393e-05, "loss": 2.2557, "step": 28995 }, { "epoch": 0.25, "learning_rate": 8.570599532529413e-05, "loss": 2.3718, "step": 29000 }, { "epoch": 0.25, "learning_rate": 8.570129933505957e-05, "loss": 2.327, "step": 29005 }, { "epoch": 0.25, "learning_rate": 8.56966027022648e-05, "loss": 2.3752, "step": 29010 }, { "epoch": 0.25, "learning_rate": 8.569190542699433e-05, "loss": 2.3113, "step": 29015 }, { "epoch": 0.25, "learning_rate": 8.568720750933271e-05, "loss": 2.297, "step": 29020 }, { "epoch": 0.25, "learning_rate": 8.56825089493645e-05, "loss": 2.3841, "step": 29025 }, { "epoch": 0.25, "learning_rate": 8.567780974717427e-05, "loss": 2.3319, "step": 29030 }, { "epoch": 0.25, "learning_rate": 8.567310990284658e-05, "loss": 2.292, "step": 29035 }, { "epoch": 0.25, "learning_rate": 8.566840941646603e-05, "loss": 2.297, "step": 29040 }, { "epoch": 0.25, "learning_rate": 8.566370828811721e-05, "loss": 2.3644, "step": 29045 }, { "epoch": 0.25, "learning_rate": 8.565900651788476e-05, "loss": 2.3012, "step": 29050 }, { "epoch": 0.25, "learning_rate": 8.565430410585327e-05, "loss": 2.3461, "step": 29055 }, { "epoch": 0.25, "learning_rate": 8.564960105210738e-05, "loss": 2.3605, "step": 29060 }, { "epoch": 0.25, "learning_rate": 8.564489735673176e-05, "loss": 2.3031, "step": 29065 }, { "epoch": 0.25, "learning_rate": 8.564019301981106e-05, "loss": 2.3463, "step": 29070 }, { "epoch": 0.25, "learning_rate": 8.563548804142993e-05, "loss": 2.3464, "step": 29075 }, { "epoch": 0.25, "learning_rate": 8.563078242167306e-05, "loss": 2.3245, "step": 29080 }, { "epoch": 0.25, "learning_rate": 8.562607616062517e-05, "loss": 2.4296, "step": 29085 }, { "epoch": 0.25, "learning_rate": 8.562136925837092e-05, "loss": 2.2868, "step": 29090 }, { "epoch": 0.25, "learning_rate": 8.561666171499506e-05, "loss": 2.2871, "step": 29095 }, { "epoch": 0.25, "learning_rate": 8.56119535305823e-05, "loss": 2.2933, "step": 29100 }, { "epoch": 0.25, "learning_rate": 8.560724470521739e-05, "loss": 2.3552, "step": 29105 }, { "epoch": 0.25, "learning_rate": 8.560253523898508e-05, "loss": 2.3328, "step": 29110 }, { "epoch": 0.25, "learning_rate": 8.55978251319701e-05, "loss": 2.3563, "step": 29115 }, { "epoch": 0.25, "learning_rate": 8.559311438425728e-05, "loss": 2.4121, "step": 29120 }, { "epoch": 0.25, "learning_rate": 8.558840299593137e-05, "loss": 2.3331, "step": 29125 }, { "epoch": 0.25, "learning_rate": 8.558369096707716e-05, "loss": 2.343, "step": 29130 }, { "epoch": 0.25, "learning_rate": 8.557897829777948e-05, "loss": 2.2616, "step": 29135 }, { "epoch": 0.25, "learning_rate": 8.557426498812314e-05, "loss": 2.3048, "step": 29140 }, { "epoch": 0.25, "learning_rate": 8.556955103819295e-05, "loss": 2.2586, "step": 29145 }, { "epoch": 0.25, "learning_rate": 8.55648364480738e-05, "loss": 2.2674, "step": 29150 }, { "epoch": 0.25, "learning_rate": 8.556012121785052e-05, "loss": 2.4078, "step": 29155 }, { "epoch": 0.25, "learning_rate": 8.555540534760797e-05, "loss": 2.2927, "step": 29160 }, { "epoch": 0.25, "learning_rate": 8.555068883743103e-05, "loss": 2.3031, "step": 29165 }, { "epoch": 0.25, "learning_rate": 8.554597168740458e-05, "loss": 2.3988, "step": 29170 }, { "epoch": 0.25, "learning_rate": 8.554125389761353e-05, "loss": 2.3311, "step": 29175 }, { "epoch": 0.25, "learning_rate": 8.553653546814282e-05, "loss": 2.4417, "step": 29180 }, { "epoch": 0.25, "learning_rate": 8.553181639907732e-05, "loss": 2.2869, "step": 29185 }, { "epoch": 0.25, "learning_rate": 8.552709669050201e-05, "loss": 2.3275, "step": 29190 }, { "epoch": 0.25, "learning_rate": 8.55223763425018e-05, "loss": 2.3976, "step": 29195 }, { "epoch": 0.25, "learning_rate": 8.551765535516167e-05, "loss": 2.3561, "step": 29200 }, { "epoch": 0.25, "learning_rate": 8.55129337285666e-05, "loss": 2.3469, "step": 29205 }, { "epoch": 0.25, "learning_rate": 8.550821146280153e-05, "loss": 2.4003, "step": 29210 }, { "epoch": 0.25, "learning_rate": 8.55034885579515e-05, "loss": 2.3471, "step": 29215 }, { "epoch": 0.25, "learning_rate": 8.549876501410148e-05, "loss": 2.3597, "step": 29220 }, { "epoch": 0.25, "learning_rate": 8.54940408313365e-05, "loss": 2.3651, "step": 29225 }, { "epoch": 0.25, "learning_rate": 8.548931600974159e-05, "loss": 2.3313, "step": 29230 }, { "epoch": 0.25, "learning_rate": 8.548459054940176e-05, "loss": 2.358, "step": 29235 }, { "epoch": 0.25, "learning_rate": 8.54798644504021e-05, "loss": 2.3493, "step": 29240 }, { "epoch": 0.25, "learning_rate": 8.547513771282766e-05, "loss": 2.3051, "step": 29245 }, { "epoch": 0.25, "learning_rate": 8.54704103367635e-05, "loss": 2.3613, "step": 29250 }, { "epoch": 0.25, "learning_rate": 8.546568232229473e-05, "loss": 2.3485, "step": 29255 }, { "epoch": 0.25, "learning_rate": 8.54609536695064e-05, "loss": 2.387, "step": 29260 }, { "epoch": 0.25, "learning_rate": 8.545622437848366e-05, "loss": 2.3956, "step": 29265 }, { "epoch": 0.25, "learning_rate": 8.54514944493116e-05, "loss": 2.3018, "step": 29270 }, { "epoch": 0.25, "learning_rate": 8.544676388207537e-05, "loss": 2.3784, "step": 29275 }, { "epoch": 0.25, "learning_rate": 8.544203267686012e-05, "loss": 2.3157, "step": 29280 }, { "epoch": 0.25, "learning_rate": 8.543730083375098e-05, "loss": 2.386, "step": 29285 }, { "epoch": 0.25, "learning_rate": 8.543256835283312e-05, "loss": 2.3447, "step": 29290 }, { "epoch": 0.25, "learning_rate": 8.542783523419171e-05, "loss": 2.2652, "step": 29295 }, { "epoch": 0.25, "learning_rate": 8.542310147791197e-05, "loss": 2.3481, "step": 29300 }, { "epoch": 0.25, "learning_rate": 8.541836708407906e-05, "loss": 2.3315, "step": 29305 }, { "epoch": 0.25, "learning_rate": 8.541363205277823e-05, "loss": 2.2826, "step": 29310 }, { "epoch": 0.25, "learning_rate": 8.540889638409466e-05, "loss": 2.3336, "step": 29315 }, { "epoch": 0.25, "learning_rate": 8.54041600781136e-05, "loss": 2.3301, "step": 29320 }, { "epoch": 0.25, "learning_rate": 8.53994231349203e-05, "loss": 2.3184, "step": 29325 }, { "epoch": 0.25, "learning_rate": 8.539468555460004e-05, "loss": 2.4378, "step": 29330 }, { "epoch": 0.25, "learning_rate": 8.538994733723804e-05, "loss": 2.3129, "step": 29335 }, { "epoch": 0.25, "learning_rate": 8.538520848291962e-05, "loss": 2.3537, "step": 29340 }, { "epoch": 0.25, "learning_rate": 8.538046899173004e-05, "loss": 2.3552, "step": 29345 }, { "epoch": 0.25, "learning_rate": 8.537572886375462e-05, "loss": 2.3276, "step": 29350 }, { "epoch": 0.25, "learning_rate": 8.537098809907868e-05, "loss": 2.3358, "step": 29355 }, { "epoch": 0.25, "learning_rate": 8.536624669778752e-05, "loss": 2.3019, "step": 29360 }, { "epoch": 0.25, "learning_rate": 8.536150465996651e-05, "loss": 2.3551, "step": 29365 }, { "epoch": 0.25, "learning_rate": 8.535676198570096e-05, "loss": 2.3429, "step": 29370 }, { "epoch": 0.25, "learning_rate": 8.535201867507627e-05, "loss": 2.3284, "step": 29375 }, { "epoch": 0.25, "learning_rate": 8.534727472817778e-05, "loss": 2.3613, "step": 29380 }, { "epoch": 0.25, "learning_rate": 8.534253014509088e-05, "loss": 2.3748, "step": 29385 }, { "epoch": 0.25, "learning_rate": 8.533778492590098e-05, "loss": 2.2775, "step": 29390 }, { "epoch": 0.25, "learning_rate": 8.533303907069348e-05, "loss": 2.3404, "step": 29395 }, { "epoch": 0.25, "learning_rate": 8.532829257955379e-05, "loss": 2.349, "step": 29400 }, { "epoch": 0.25, "learning_rate": 8.532354545256732e-05, "loss": 2.3368, "step": 29405 }, { "epoch": 0.25, "learning_rate": 8.531879768981954e-05, "loss": 2.4193, "step": 29410 }, { "epoch": 0.25, "learning_rate": 8.53140492913959e-05, "loss": 2.2613, "step": 29415 }, { "epoch": 0.25, "learning_rate": 8.530930025738184e-05, "loss": 2.3601, "step": 29420 }, { "epoch": 0.25, "learning_rate": 8.530455058786287e-05, "loss": 2.3314, "step": 29425 }, { "epoch": 0.25, "learning_rate": 8.529980028292443e-05, "loss": 2.401, "step": 29430 }, { "epoch": 0.25, "learning_rate": 8.529504934265205e-05, "loss": 2.3696, "step": 29435 }, { "epoch": 0.25, "learning_rate": 8.529029776713122e-05, "loss": 2.3427, "step": 29440 }, { "epoch": 0.25, "learning_rate": 8.528554555644748e-05, "loss": 2.2582, "step": 29445 }, { "epoch": 0.25, "learning_rate": 8.528079271068634e-05, "loss": 2.3946, "step": 29450 }, { "epoch": 0.25, "learning_rate": 8.527603922993336e-05, "loss": 2.2975, "step": 29455 }, { "epoch": 0.25, "learning_rate": 8.527128511427409e-05, "loss": 2.3647, "step": 29460 }, { "epoch": 0.25, "learning_rate": 8.526653036379408e-05, "loss": 2.272, "step": 29465 }, { "epoch": 0.25, "learning_rate": 8.526177497857895e-05, "loss": 2.356, "step": 29470 }, { "epoch": 0.25, "learning_rate": 8.525701895871422e-05, "loss": 2.3428, "step": 29475 }, { "epoch": 0.25, "learning_rate": 8.525226230428555e-05, "loss": 2.3232, "step": 29480 }, { "epoch": 0.25, "learning_rate": 8.524750501537855e-05, "loss": 2.2778, "step": 29485 }, { "epoch": 0.25, "learning_rate": 8.524274709207879e-05, "loss": 2.3628, "step": 29490 }, { "epoch": 0.25, "learning_rate": 8.523798853447194e-05, "loss": 2.3719, "step": 29495 }, { "epoch": 0.25, "learning_rate": 8.523322934264366e-05, "loss": 2.3646, "step": 29500 }, { "epoch": 0.25, "learning_rate": 8.522846951667958e-05, "loss": 2.3812, "step": 29505 }, { "epoch": 0.25, "learning_rate": 8.522370905666539e-05, "loss": 2.2827, "step": 29510 }, { "epoch": 0.25, "learning_rate": 8.521894796268675e-05, "loss": 2.2775, "step": 29515 }, { "epoch": 0.25, "learning_rate": 8.521418623482936e-05, "loss": 2.2931, "step": 29520 }, { "epoch": 0.25, "learning_rate": 8.520942387317891e-05, "loss": 2.3774, "step": 29525 }, { "epoch": 0.25, "learning_rate": 8.520466087782113e-05, "loss": 2.3921, "step": 29530 }, { "epoch": 0.25, "learning_rate": 8.519989724884175e-05, "loss": 2.3065, "step": 29535 }, { "epoch": 0.25, "learning_rate": 8.51951329863265e-05, "loss": 2.3623, "step": 29540 }, { "epoch": 0.25, "learning_rate": 8.519036809036112e-05, "loss": 2.3313, "step": 29545 }, { "epoch": 0.25, "learning_rate": 8.518560256103136e-05, "loss": 2.3017, "step": 29550 }, { "epoch": 0.25, "learning_rate": 8.518083639842304e-05, "loss": 2.2808, "step": 29555 }, { "epoch": 0.25, "learning_rate": 8.517606960262188e-05, "loss": 2.3733, "step": 29560 }, { "epoch": 0.25, "learning_rate": 8.517130217371375e-05, "loss": 2.318, "step": 29565 }, { "epoch": 0.25, "learning_rate": 8.516653411178437e-05, "loss": 2.3286, "step": 29570 }, { "epoch": 0.25, "learning_rate": 8.516176541691959e-05, "loss": 2.3481, "step": 29575 }, { "epoch": 0.25, "learning_rate": 8.515699608920527e-05, "loss": 2.3758, "step": 29580 }, { "epoch": 0.25, "learning_rate": 8.515222612872721e-05, "loss": 2.3646, "step": 29585 }, { "epoch": 0.25, "learning_rate": 8.514745553557128e-05, "loss": 2.398, "step": 29590 }, { "epoch": 0.25, "learning_rate": 8.514268430982333e-05, "loss": 2.3678, "step": 29595 }, { "epoch": 0.25, "learning_rate": 8.513791245156924e-05, "loss": 2.4104, "step": 29600 }, { "epoch": 0.25, "learning_rate": 8.51331399608949e-05, "loss": 2.3642, "step": 29605 }, { "epoch": 0.25, "learning_rate": 8.512836683788619e-05, "loss": 2.3942, "step": 29610 }, { "epoch": 0.25, "learning_rate": 8.512359308262905e-05, "loss": 2.267, "step": 29615 }, { "epoch": 0.25, "learning_rate": 8.511881869520937e-05, "loss": 2.337, "step": 29620 }, { "epoch": 0.25, "learning_rate": 8.511404367571307e-05, "loss": 2.2333, "step": 29625 }, { "epoch": 0.25, "learning_rate": 8.510926802422615e-05, "loss": 2.2503, "step": 29630 }, { "epoch": 0.25, "learning_rate": 8.51044917408345e-05, "loss": 2.344, "step": 29635 }, { "epoch": 0.25, "learning_rate": 8.50997148256241e-05, "loss": 2.2804, "step": 29640 }, { "epoch": 0.25, "learning_rate": 8.509493727868095e-05, "loss": 2.2841, "step": 29645 }, { "epoch": 0.25, "learning_rate": 8.5090159100091e-05, "loss": 2.4416, "step": 29650 }, { "epoch": 0.25, "learning_rate": 8.50853802899403e-05, "loss": 2.3685, "step": 29655 }, { "epoch": 0.25, "learning_rate": 8.508060084831482e-05, "loss": 2.338, "step": 29660 }, { "epoch": 0.25, "learning_rate": 8.507582077530058e-05, "loss": 2.3165, "step": 29665 }, { "epoch": 0.25, "learning_rate": 8.507104007098365e-05, "loss": 2.2629, "step": 29670 }, { "epoch": 0.25, "learning_rate": 8.506625873545003e-05, "loss": 2.3297, "step": 29675 }, { "epoch": 0.25, "learning_rate": 8.50614767687858e-05, "loss": 2.3172, "step": 29680 }, { "epoch": 0.25, "learning_rate": 8.505669417107703e-05, "loss": 2.3665, "step": 29685 }, { "epoch": 0.25, "learning_rate": 8.505191094240978e-05, "loss": 2.3441, "step": 29690 }, { "epoch": 0.25, "learning_rate": 8.504712708287016e-05, "loss": 2.246, "step": 29695 }, { "epoch": 0.25, "learning_rate": 8.504234259254425e-05, "loss": 2.2917, "step": 29700 }, { "epoch": 0.25, "learning_rate": 8.503755747151819e-05, "loss": 2.3507, "step": 29705 }, { "epoch": 0.25, "learning_rate": 8.503277171987807e-05, "loss": 2.2831, "step": 29710 }, { "epoch": 0.25, "learning_rate": 8.502798533771006e-05, "loss": 2.3585, "step": 29715 }, { "epoch": 0.25, "learning_rate": 8.502319832510027e-05, "loss": 2.2757, "step": 29720 }, { "epoch": 0.25, "learning_rate": 8.501841068213488e-05, "loss": 2.2871, "step": 29725 }, { "epoch": 0.25, "learning_rate": 8.501362240890006e-05, "loss": 2.3292, "step": 29730 }, { "epoch": 0.25, "learning_rate": 8.500883350548198e-05, "loss": 2.4178, "step": 29735 }, { "epoch": 0.25, "learning_rate": 8.500404397196686e-05, "loss": 2.3635, "step": 29740 }, { "epoch": 0.25, "learning_rate": 8.499925380844086e-05, "loss": 2.2627, "step": 29745 }, { "epoch": 0.25, "learning_rate": 8.49944630149902e-05, "loss": 2.2069, "step": 29750 }, { "epoch": 0.25, "learning_rate": 8.498967159170116e-05, "loss": 2.3743, "step": 29755 }, { "epoch": 0.25, "learning_rate": 8.498487953865992e-05, "loss": 2.3665, "step": 29760 }, { "epoch": 0.25, "learning_rate": 8.498008685595274e-05, "loss": 2.352, "step": 29765 }, { "epoch": 0.25, "learning_rate": 8.497529354366589e-05, "loss": 2.3678, "step": 29770 }, { "epoch": 0.25, "learning_rate": 8.497049960188565e-05, "loss": 2.2869, "step": 29775 }, { "epoch": 0.25, "learning_rate": 8.496570503069829e-05, "loss": 2.4418, "step": 29780 }, { "epoch": 0.25, "learning_rate": 8.496090983019008e-05, "loss": 2.37, "step": 29785 }, { "epoch": 0.25, "learning_rate": 8.495611400044738e-05, "loss": 2.4083, "step": 29790 }, { "epoch": 0.25, "learning_rate": 8.495131754155645e-05, "loss": 2.3086, "step": 29795 }, { "epoch": 0.25, "learning_rate": 8.494652045360364e-05, "loss": 2.3563, "step": 29800 }, { "epoch": 0.25, "learning_rate": 8.494172273667532e-05, "loss": 2.2828, "step": 29805 }, { "epoch": 0.25, "learning_rate": 8.493692439085779e-05, "loss": 2.4181, "step": 29810 }, { "epoch": 0.25, "learning_rate": 8.493212541623745e-05, "loss": 2.3296, "step": 29815 }, { "epoch": 0.25, "learning_rate": 8.492732581290065e-05, "loss": 2.3019, "step": 29820 }, { "epoch": 0.25, "learning_rate": 8.49225255809338e-05, "loss": 2.3295, "step": 29825 }, { "epoch": 0.25, "learning_rate": 8.491772472042325e-05, "loss": 2.4127, "step": 29830 }, { "epoch": 0.25, "learning_rate": 8.491292323145543e-05, "loss": 2.3079, "step": 29835 }, { "epoch": 0.25, "learning_rate": 8.490812111411679e-05, "loss": 2.3897, "step": 29840 }, { "epoch": 0.25, "learning_rate": 8.490331836849373e-05, "loss": 2.3719, "step": 29845 }, { "epoch": 0.25, "learning_rate": 8.489851499467268e-05, "loss": 2.431, "step": 29850 }, { "epoch": 0.25, "learning_rate": 8.489371099274011e-05, "loss": 2.3238, "step": 29855 }, { "epoch": 0.25, "learning_rate": 8.488890636278247e-05, "loss": 2.2705, "step": 29860 }, { "epoch": 0.25, "learning_rate": 8.488410110488625e-05, "loss": 2.3742, "step": 29865 }, { "epoch": 0.25, "learning_rate": 8.487929521913794e-05, "loss": 2.4445, "step": 29870 }, { "epoch": 0.25, "learning_rate": 8.487448870562402e-05, "loss": 2.333, "step": 29875 }, { "epoch": 0.25, "learning_rate": 8.486968156443101e-05, "loss": 2.2726, "step": 29880 }, { "epoch": 0.26, "learning_rate": 8.486487379564542e-05, "loss": 2.3562, "step": 29885 }, { "epoch": 0.26, "learning_rate": 8.48600653993538e-05, "loss": 2.3748, "step": 29890 }, { "epoch": 0.26, "learning_rate": 8.485525637564267e-05, "loss": 2.3495, "step": 29895 }, { "epoch": 0.26, "learning_rate": 8.485044672459861e-05, "loss": 2.3632, "step": 29900 }, { "epoch": 0.26, "learning_rate": 8.484563644630814e-05, "loss": 2.3364, "step": 29905 }, { "epoch": 0.26, "learning_rate": 8.484082554085788e-05, "loss": 2.2983, "step": 29910 }, { "epoch": 0.26, "learning_rate": 8.483601400833441e-05, "loss": 2.2869, "step": 29915 }, { "epoch": 0.26, "learning_rate": 8.483120184882433e-05, "loss": 2.3589, "step": 29920 }, { "epoch": 0.26, "learning_rate": 8.482638906241422e-05, "loss": 2.4015, "step": 29925 }, { "epoch": 0.26, "learning_rate": 8.482157564919076e-05, "loss": 2.2833, "step": 29930 }, { "epoch": 0.26, "learning_rate": 8.481676160924051e-05, "loss": 2.3458, "step": 29935 }, { "epoch": 0.26, "learning_rate": 8.481194694265017e-05, "loss": 2.3808, "step": 29940 }, { "epoch": 0.26, "learning_rate": 8.480713164950638e-05, "loss": 2.3131, "step": 29945 }, { "epoch": 0.26, "learning_rate": 8.48023157298958e-05, "loss": 2.3017, "step": 29950 }, { "epoch": 0.26, "learning_rate": 8.47974991839051e-05, "loss": 2.4075, "step": 29955 }, { "epoch": 0.26, "learning_rate": 8.4792682011621e-05, "loss": 2.3644, "step": 29960 }, { "epoch": 0.26, "learning_rate": 8.478786421313019e-05, "loss": 2.3356, "step": 29965 }, { "epoch": 0.26, "learning_rate": 8.478304578851934e-05, "loss": 2.325, "step": 29970 }, { "epoch": 0.26, "learning_rate": 8.477822673787523e-05, "loss": 2.3763, "step": 29975 }, { "epoch": 0.26, "learning_rate": 8.477340706128458e-05, "loss": 2.3505, "step": 29980 }, { "epoch": 0.26, "learning_rate": 8.476858675883412e-05, "loss": 2.321, "step": 29985 }, { "epoch": 0.26, "learning_rate": 8.476376583061061e-05, "loss": 2.2972, "step": 29990 }, { "epoch": 0.26, "learning_rate": 8.475894427670082e-05, "loss": 2.4223, "step": 29995 }, { "epoch": 0.26, "learning_rate": 8.475412209719154e-05, "loss": 2.3354, "step": 30000 }, { "epoch": 0.26, "learning_rate": 8.474929929216954e-05, "loss": 2.3533, "step": 30005 }, { "epoch": 0.26, "learning_rate": 8.474447586172164e-05, "loss": 2.4419, "step": 30010 }, { "epoch": 0.26, "learning_rate": 8.473965180593465e-05, "loss": 2.3262, "step": 30015 }, { "epoch": 0.26, "learning_rate": 8.47348271248954e-05, "loss": 2.3811, "step": 30020 }, { "epoch": 0.26, "learning_rate": 8.47300018186907e-05, "loss": 2.3975, "step": 30025 }, { "epoch": 0.26, "learning_rate": 8.472517588740742e-05, "loss": 2.3372, "step": 30030 }, { "epoch": 0.26, "learning_rate": 8.472034933113242e-05, "loss": 2.3058, "step": 30035 }, { "epoch": 0.26, "learning_rate": 8.471552214995257e-05, "loss": 2.3226, "step": 30040 }, { "epoch": 0.26, "learning_rate": 8.471069434395474e-05, "loss": 2.386, "step": 30045 }, { "epoch": 0.26, "learning_rate": 8.47058659132258e-05, "loss": 2.2658, "step": 30050 }, { "epoch": 0.26, "learning_rate": 8.47010368578527e-05, "loss": 2.3588, "step": 30055 }, { "epoch": 0.26, "learning_rate": 8.469620717792232e-05, "loss": 2.2974, "step": 30060 }, { "epoch": 0.26, "learning_rate": 8.469137687352163e-05, "loss": 2.3953, "step": 30065 }, { "epoch": 0.26, "learning_rate": 8.46865459447375e-05, "loss": 2.3866, "step": 30070 }, { "epoch": 0.26, "learning_rate": 8.468171439165693e-05, "loss": 2.3807, "step": 30075 }, { "epoch": 0.26, "learning_rate": 8.467688221436685e-05, "loss": 2.3177, "step": 30080 }, { "epoch": 0.26, "learning_rate": 8.467204941295427e-05, "loss": 2.3486, "step": 30085 }, { "epoch": 0.26, "learning_rate": 8.466721598750613e-05, "loss": 2.2811, "step": 30090 }, { "epoch": 0.26, "learning_rate": 8.466238193810943e-05, "loss": 2.355, "step": 30095 }, { "epoch": 0.26, "learning_rate": 8.46575472648512e-05, "loss": 2.326, "step": 30100 }, { "epoch": 0.26, "learning_rate": 8.465271196781843e-05, "loss": 2.3619, "step": 30105 }, { "epoch": 0.26, "learning_rate": 8.464787604709815e-05, "loss": 2.353, "step": 30110 }, { "epoch": 0.26, "learning_rate": 8.464303950277741e-05, "loss": 2.4327, "step": 30115 }, { "epoch": 0.26, "learning_rate": 8.463820233494325e-05, "loss": 2.2902, "step": 30120 }, { "epoch": 0.26, "learning_rate": 8.463336454368273e-05, "loss": 2.3385, "step": 30125 }, { "epoch": 0.26, "learning_rate": 8.462852612908294e-05, "loss": 2.3488, "step": 30130 }, { "epoch": 0.26, "learning_rate": 8.462368709123094e-05, "loss": 2.3963, "step": 30135 }, { "epoch": 0.26, "learning_rate": 8.461884743021382e-05, "loss": 2.2857, "step": 30140 }, { "epoch": 0.26, "learning_rate": 8.461400714611871e-05, "loss": 2.3761, "step": 30145 }, { "epoch": 0.26, "learning_rate": 8.460916623903271e-05, "loss": 2.3382, "step": 30150 }, { "epoch": 0.26, "learning_rate": 8.460432470904294e-05, "loss": 2.3216, "step": 30155 }, { "epoch": 0.26, "learning_rate": 8.459948255623657e-05, "loss": 2.3797, "step": 30160 }, { "epoch": 0.26, "learning_rate": 8.459463978070072e-05, "loss": 2.3399, "step": 30165 }, { "epoch": 0.26, "learning_rate": 8.458979638252256e-05, "loss": 2.2626, "step": 30170 }, { "epoch": 0.26, "learning_rate": 8.458495236178927e-05, "loss": 2.3892, "step": 30175 }, { "epoch": 0.26, "learning_rate": 8.458010771858803e-05, "loss": 2.3362, "step": 30180 }, { "epoch": 0.26, "learning_rate": 8.457526245300602e-05, "loss": 2.3614, "step": 30185 }, { "epoch": 0.26, "learning_rate": 8.457041656513048e-05, "loss": 2.29, "step": 30190 }, { "epoch": 0.26, "learning_rate": 8.456557005504859e-05, "loss": 2.3778, "step": 30195 }, { "epoch": 0.26, "learning_rate": 8.456072292284762e-05, "loss": 2.3527, "step": 30200 }, { "epoch": 0.26, "learning_rate": 8.455587516861476e-05, "loss": 2.3963, "step": 30205 }, { "epoch": 0.26, "learning_rate": 8.45510267924373e-05, "loss": 2.372, "step": 30210 }, { "epoch": 0.26, "learning_rate": 8.454617779440248e-05, "loss": 2.3331, "step": 30215 }, { "epoch": 0.26, "learning_rate": 8.454132817459758e-05, "loss": 2.318, "step": 30220 }, { "epoch": 0.26, "learning_rate": 8.45364779331099e-05, "loss": 2.3739, "step": 30225 }, { "epoch": 0.26, "learning_rate": 8.45316270700267e-05, "loss": 2.3332, "step": 30230 }, { "epoch": 0.26, "learning_rate": 8.452677558543534e-05, "loss": 2.3284, "step": 30235 }, { "epoch": 0.26, "learning_rate": 8.452192347942309e-05, "loss": 2.249, "step": 30240 }, { "epoch": 0.26, "learning_rate": 8.451707075207728e-05, "loss": 2.3463, "step": 30245 }, { "epoch": 0.26, "learning_rate": 8.451221740348529e-05, "loss": 2.3171, "step": 30250 }, { "epoch": 0.26, "learning_rate": 8.450736343373444e-05, "loss": 2.3835, "step": 30255 }, { "epoch": 0.26, "learning_rate": 8.450250884291211e-05, "loss": 2.3923, "step": 30260 }, { "epoch": 0.26, "learning_rate": 8.449765363110566e-05, "loss": 2.3332, "step": 30265 }, { "epoch": 0.26, "learning_rate": 8.449279779840249e-05, "loss": 2.3604, "step": 30270 }, { "epoch": 0.26, "learning_rate": 8.448794134488997e-05, "loss": 2.3634, "step": 30275 }, { "epoch": 0.26, "learning_rate": 8.448308427065554e-05, "loss": 2.3638, "step": 30280 }, { "epoch": 0.26, "learning_rate": 8.44782265757866e-05, "loss": 2.3351, "step": 30285 }, { "epoch": 0.26, "learning_rate": 8.447336826037058e-05, "loss": 2.3846, "step": 30290 }, { "epoch": 0.26, "learning_rate": 8.446850932449494e-05, "loss": 2.3634, "step": 30295 }, { "epoch": 0.26, "learning_rate": 8.44636497682471e-05, "loss": 2.3754, "step": 30300 }, { "epoch": 0.26, "learning_rate": 8.445878959171453e-05, "loss": 2.3825, "step": 30305 }, { "epoch": 0.26, "learning_rate": 8.445392879498474e-05, "loss": 2.4185, "step": 30310 }, { "epoch": 0.26, "learning_rate": 8.444906737814517e-05, "loss": 2.2643, "step": 30315 }, { "epoch": 0.26, "learning_rate": 8.444420534128337e-05, "loss": 2.281, "step": 30320 }, { "epoch": 0.26, "learning_rate": 8.44393426844868e-05, "loss": 2.3522, "step": 30325 }, { "epoch": 0.26, "learning_rate": 8.443447940784297e-05, "loss": 2.2873, "step": 30330 }, { "epoch": 0.26, "learning_rate": 8.442961551143947e-05, "loss": 2.4049, "step": 30335 }, { "epoch": 0.26, "learning_rate": 8.442475099536377e-05, "loss": 2.3607, "step": 30340 }, { "epoch": 0.26, "learning_rate": 8.44198858597035e-05, "loss": 2.2402, "step": 30345 }, { "epoch": 0.26, "learning_rate": 8.441502010454616e-05, "loss": 2.3389, "step": 30350 }, { "epoch": 0.26, "learning_rate": 8.441015372997936e-05, "loss": 2.3117, "step": 30355 }, { "epoch": 0.26, "learning_rate": 8.440528673609066e-05, "loss": 2.2556, "step": 30360 }, { "epoch": 0.26, "learning_rate": 8.440041912296767e-05, "loss": 2.2671, "step": 30365 }, { "epoch": 0.26, "learning_rate": 8.439555089069802e-05, "loss": 2.3054, "step": 30370 }, { "epoch": 0.26, "learning_rate": 8.43906820393693e-05, "loss": 2.4275, "step": 30375 }, { "epoch": 0.26, "learning_rate": 8.438581256906915e-05, "loss": 2.3797, "step": 30380 }, { "epoch": 0.26, "learning_rate": 8.438094247988521e-05, "loss": 2.3288, "step": 30385 }, { "epoch": 0.26, "learning_rate": 8.437607177190514e-05, "loss": 2.3099, "step": 30390 }, { "epoch": 0.26, "learning_rate": 8.437120044521659e-05, "loss": 2.3124, "step": 30395 }, { "epoch": 0.26, "learning_rate": 8.436632849990726e-05, "loss": 2.3058, "step": 30400 }, { "epoch": 0.26, "learning_rate": 8.436145593606481e-05, "loss": 2.3945, "step": 30405 }, { "epoch": 0.26, "learning_rate": 8.435658275377696e-05, "loss": 2.3418, "step": 30410 }, { "epoch": 0.26, "learning_rate": 8.435170895313138e-05, "loss": 2.3371, "step": 30415 }, { "epoch": 0.26, "learning_rate": 8.434683453421583e-05, "loss": 2.2903, "step": 30420 }, { "epoch": 0.26, "learning_rate": 8.434195949711805e-05, "loss": 2.3506, "step": 30425 }, { "epoch": 0.26, "learning_rate": 8.433708384192574e-05, "loss": 2.2975, "step": 30430 }, { "epoch": 0.26, "learning_rate": 8.433220756872668e-05, "loss": 2.2886, "step": 30435 }, { "epoch": 0.26, "learning_rate": 8.432733067760862e-05, "loss": 2.2222, "step": 30440 }, { "epoch": 0.26, "learning_rate": 8.432245316865935e-05, "loss": 2.2704, "step": 30445 }, { "epoch": 0.26, "learning_rate": 8.431757504196664e-05, "loss": 2.3283, "step": 30450 }, { "epoch": 0.26, "learning_rate": 8.43126962976183e-05, "loss": 2.2335, "step": 30455 }, { "epoch": 0.26, "learning_rate": 8.430781693570216e-05, "loss": 2.3343, "step": 30460 }, { "epoch": 0.26, "learning_rate": 8.430293695630598e-05, "loss": 2.4381, "step": 30465 }, { "epoch": 0.26, "learning_rate": 8.429805635951764e-05, "loss": 2.3405, "step": 30470 }, { "epoch": 0.26, "learning_rate": 8.429317514542498e-05, "loss": 2.3778, "step": 30475 }, { "epoch": 0.26, "learning_rate": 8.428829331411582e-05, "loss": 2.3907, "step": 30480 }, { "epoch": 0.26, "learning_rate": 8.428341086567807e-05, "loss": 2.2871, "step": 30485 }, { "epoch": 0.26, "learning_rate": 8.427852780019956e-05, "loss": 2.2739, "step": 30490 }, { "epoch": 0.26, "learning_rate": 8.427364411776822e-05, "loss": 2.3333, "step": 30495 }, { "epoch": 0.26, "learning_rate": 8.426875981847192e-05, "loss": 2.3944, "step": 30500 }, { "epoch": 0.26, "learning_rate": 8.426387490239858e-05, "loss": 2.2742, "step": 30505 }, { "epoch": 0.26, "learning_rate": 8.42589893696361e-05, "loss": 2.2588, "step": 30510 }, { "epoch": 0.26, "learning_rate": 8.425410322027243e-05, "loss": 2.4273, "step": 30515 }, { "epoch": 0.26, "learning_rate": 8.424921645439549e-05, "loss": 2.3309, "step": 30520 }, { "epoch": 0.26, "learning_rate": 8.424432907209328e-05, "loss": 2.2473, "step": 30525 }, { "epoch": 0.26, "learning_rate": 8.423944107345371e-05, "loss": 2.333, "step": 30530 }, { "epoch": 0.26, "learning_rate": 8.423455245856481e-05, "loss": 2.2837, "step": 30535 }, { "epoch": 0.26, "learning_rate": 8.422966322751452e-05, "loss": 2.3984, "step": 30540 }, { "epoch": 0.26, "learning_rate": 8.422477338039085e-05, "loss": 2.2691, "step": 30545 }, { "epoch": 0.26, "learning_rate": 8.421988291728182e-05, "loss": 2.3268, "step": 30550 }, { "epoch": 0.26, "learning_rate": 8.421499183827544e-05, "loss": 2.3307, "step": 30555 }, { "epoch": 0.26, "learning_rate": 8.421010014345975e-05, "loss": 2.3311, "step": 30560 }, { "epoch": 0.26, "learning_rate": 8.420520783292279e-05, "loss": 2.3481, "step": 30565 }, { "epoch": 0.26, "learning_rate": 8.420031490675257e-05, "loss": 2.2782, "step": 30570 }, { "epoch": 0.26, "learning_rate": 8.419542136503723e-05, "loss": 2.3294, "step": 30575 }, { "epoch": 0.26, "learning_rate": 8.41905272078648e-05, "loss": 2.3305, "step": 30580 }, { "epoch": 0.26, "learning_rate": 8.418563243532336e-05, "loss": 2.3259, "step": 30585 }, { "epoch": 0.26, "learning_rate": 8.418073704750103e-05, "loss": 2.3261, "step": 30590 }, { "epoch": 0.26, "learning_rate": 8.417584104448591e-05, "loss": 2.3479, "step": 30595 }, { "epoch": 0.26, "learning_rate": 8.417094442636612e-05, "loss": 2.3671, "step": 30600 }, { "epoch": 0.26, "learning_rate": 8.416604719322979e-05, "loss": 2.252, "step": 30605 }, { "epoch": 0.26, "learning_rate": 8.416114934516506e-05, "loss": 2.3511, "step": 30610 }, { "epoch": 0.26, "learning_rate": 8.415625088226007e-05, "loss": 2.3273, "step": 30615 }, { "epoch": 0.26, "learning_rate": 8.4151351804603e-05, "loss": 2.3098, "step": 30620 }, { "epoch": 0.26, "learning_rate": 8.414645211228202e-05, "loss": 2.3649, "step": 30625 }, { "epoch": 0.26, "learning_rate": 8.414155180538533e-05, "loss": 2.2938, "step": 30630 }, { "epoch": 0.26, "learning_rate": 8.413665088400111e-05, "loss": 2.3356, "step": 30635 }, { "epoch": 0.26, "learning_rate": 8.413174934821758e-05, "loss": 2.36, "step": 30640 }, { "epoch": 0.26, "learning_rate": 8.412684719812294e-05, "loss": 2.3172, "step": 30645 }, { "epoch": 0.26, "learning_rate": 8.412194443380542e-05, "loss": 2.3333, "step": 30650 }, { "epoch": 0.26, "learning_rate": 8.41170410553533e-05, "loss": 2.3901, "step": 30655 }, { "epoch": 0.26, "learning_rate": 8.411213706285477e-05, "loss": 2.3227, "step": 30660 }, { "epoch": 0.26, "learning_rate": 8.410723245639815e-05, "loss": 2.3001, "step": 30665 }, { "epoch": 0.26, "learning_rate": 8.410232723607168e-05, "loss": 2.2428, "step": 30670 }, { "epoch": 0.26, "learning_rate": 8.409742140196366e-05, "loss": 2.3801, "step": 30675 }, { "epoch": 0.26, "learning_rate": 8.40925149541624e-05, "loss": 2.3047, "step": 30680 }, { "epoch": 0.26, "learning_rate": 8.408760789275616e-05, "loss": 2.2903, "step": 30685 }, { "epoch": 0.26, "learning_rate": 8.408270021783331e-05, "loss": 2.3717, "step": 30690 }, { "epoch": 0.26, "learning_rate": 8.407779192948216e-05, "loss": 2.3394, "step": 30695 }, { "epoch": 0.26, "learning_rate": 8.407288302779104e-05, "loss": 2.3304, "step": 30700 }, { "epoch": 0.26, "learning_rate": 8.40679735128483e-05, "loss": 2.2656, "step": 30705 }, { "epoch": 0.26, "learning_rate": 8.406306338474234e-05, "loss": 2.342, "step": 30710 }, { "epoch": 0.26, "learning_rate": 8.405815264356149e-05, "loss": 2.2693, "step": 30715 }, { "epoch": 0.26, "learning_rate": 8.405324128939416e-05, "loss": 2.2604, "step": 30720 }, { "epoch": 0.26, "learning_rate": 8.404832932232872e-05, "loss": 2.3541, "step": 30725 }, { "epoch": 0.26, "learning_rate": 8.40434167424536e-05, "loss": 2.3083, "step": 30730 }, { "epoch": 0.26, "learning_rate": 8.403850354985723e-05, "loss": 2.3867, "step": 30735 }, { "epoch": 0.26, "learning_rate": 8.4033589744628e-05, "loss": 2.3177, "step": 30740 }, { "epoch": 0.26, "learning_rate": 8.402867532685436e-05, "loss": 2.3282, "step": 30745 }, { "epoch": 0.26, "learning_rate": 8.40237602966248e-05, "loss": 2.2568, "step": 30750 }, { "epoch": 0.26, "learning_rate": 8.401884465402775e-05, "loss": 2.3156, "step": 30755 }, { "epoch": 0.26, "learning_rate": 8.401392839915166e-05, "loss": 2.3923, "step": 30760 }, { "epoch": 0.26, "learning_rate": 8.400901153208508e-05, "loss": 2.341, "step": 30765 }, { "epoch": 0.26, "learning_rate": 8.400409405291643e-05, "loss": 2.4279, "step": 30770 }, { "epoch": 0.26, "learning_rate": 8.399917596173424e-05, "loss": 2.3333, "step": 30775 }, { "epoch": 0.26, "learning_rate": 8.399425725862706e-05, "loss": 2.3758, "step": 30780 }, { "epoch": 0.26, "learning_rate": 8.398933794368338e-05, "loss": 2.3097, "step": 30785 }, { "epoch": 0.26, "learning_rate": 8.398441801699178e-05, "loss": 2.2967, "step": 30790 }, { "epoch": 0.26, "learning_rate": 8.397949747864076e-05, "loss": 2.3136, "step": 30795 }, { "epoch": 0.26, "learning_rate": 8.397457632871893e-05, "loss": 2.2727, "step": 30800 }, { "epoch": 0.26, "learning_rate": 8.396965456731482e-05, "loss": 2.372, "step": 30805 }, { "epoch": 0.26, "learning_rate": 8.396473219451702e-05, "loss": 2.306, "step": 30810 }, { "epoch": 0.26, "learning_rate": 8.395980921041416e-05, "loss": 2.3469, "step": 30815 }, { "epoch": 0.26, "learning_rate": 8.39548856150948e-05, "loss": 2.2854, "step": 30820 }, { "epoch": 0.26, "learning_rate": 8.394996140864758e-05, "loss": 2.3137, "step": 30825 }, { "epoch": 0.26, "learning_rate": 8.394503659116111e-05, "loss": 2.3052, "step": 30830 }, { "epoch": 0.26, "learning_rate": 8.394011116272406e-05, "loss": 2.3345, "step": 30835 }, { "epoch": 0.26, "learning_rate": 8.393518512342504e-05, "loss": 2.3185, "step": 30840 }, { "epoch": 0.26, "learning_rate": 8.393025847335274e-05, "loss": 2.3438, "step": 30845 }, { "epoch": 0.26, "learning_rate": 8.392533121259582e-05, "loss": 2.3045, "step": 30850 }, { "epoch": 0.26, "learning_rate": 8.392040334124297e-05, "loss": 2.3594, "step": 30855 }, { "epoch": 0.26, "learning_rate": 8.391547485938287e-05, "loss": 2.3887, "step": 30860 }, { "epoch": 0.26, "learning_rate": 8.391054576710423e-05, "loss": 2.3269, "step": 30865 }, { "epoch": 0.26, "learning_rate": 8.390561606449577e-05, "loss": 2.3233, "step": 30870 }, { "epoch": 0.26, "learning_rate": 8.390068575164618e-05, "loss": 2.3794, "step": 30875 }, { "epoch": 0.26, "learning_rate": 8.389575482864425e-05, "loss": 2.2404, "step": 30880 }, { "epoch": 0.26, "learning_rate": 8.38908232955787e-05, "loss": 2.2402, "step": 30885 }, { "epoch": 0.26, "learning_rate": 8.388589115253829e-05, "loss": 2.3148, "step": 30890 }, { "epoch": 0.26, "learning_rate": 8.38809583996118e-05, "loss": 2.2468, "step": 30895 }, { "epoch": 0.26, "learning_rate": 8.3876025036888e-05, "loss": 2.3367, "step": 30900 }, { "epoch": 0.26, "learning_rate": 8.38710910644557e-05, "loss": 2.3482, "step": 30905 }, { "epoch": 0.26, "learning_rate": 8.386615648240367e-05, "loss": 2.3603, "step": 30910 }, { "epoch": 0.26, "learning_rate": 8.386122129082074e-05, "loss": 2.2694, "step": 30915 }, { "epoch": 0.26, "learning_rate": 8.385628548979576e-05, "loss": 2.3207, "step": 30920 }, { "epoch": 0.26, "learning_rate": 8.385134907941752e-05, "loss": 2.3795, "step": 30925 }, { "epoch": 0.26, "learning_rate": 8.38464120597749e-05, "loss": 2.4128, "step": 30930 }, { "epoch": 0.26, "learning_rate": 8.384147443095675e-05, "loss": 2.3957, "step": 30935 }, { "epoch": 0.26, "learning_rate": 8.383653619305192e-05, "loss": 2.4207, "step": 30940 }, { "epoch": 0.26, "learning_rate": 8.383159734614931e-05, "loss": 2.4177, "step": 30945 }, { "epoch": 0.26, "learning_rate": 8.382665789033784e-05, "loss": 2.3241, "step": 30950 }, { "epoch": 0.26, "learning_rate": 8.382171782570634e-05, "loss": 2.3963, "step": 30955 }, { "epoch": 0.26, "learning_rate": 8.381677715234378e-05, "loss": 2.3777, "step": 30960 }, { "epoch": 0.26, "learning_rate": 8.381183587033904e-05, "loss": 2.3103, "step": 30965 }, { "epoch": 0.26, "learning_rate": 8.38068939797811e-05, "loss": 2.3353, "step": 30970 }, { "epoch": 0.26, "learning_rate": 8.380195148075887e-05, "loss": 2.3226, "step": 30975 }, { "epoch": 0.26, "learning_rate": 8.37970083733613e-05, "loss": 2.3499, "step": 30980 }, { "epoch": 0.26, "learning_rate": 8.379206465767742e-05, "loss": 2.3486, "step": 30985 }, { "epoch": 0.26, "learning_rate": 8.378712033379613e-05, "loss": 2.3088, "step": 30990 }, { "epoch": 0.26, "learning_rate": 8.378217540180646e-05, "loss": 2.3105, "step": 30995 }, { "epoch": 0.26, "learning_rate": 8.377722986179741e-05, "loss": 2.2806, "step": 31000 }, { "epoch": 0.26, "learning_rate": 8.377228371385799e-05, "loss": 2.3794, "step": 31005 }, { "epoch": 0.26, "learning_rate": 8.376733695807722e-05, "loss": 2.3802, "step": 31010 }, { "epoch": 0.26, "learning_rate": 8.376238959454411e-05, "loss": 2.31, "step": 31015 }, { "epoch": 0.26, "learning_rate": 8.375744162334773e-05, "loss": 2.3189, "step": 31020 }, { "epoch": 0.26, "learning_rate": 8.375249304457712e-05, "loss": 2.3542, "step": 31025 }, { "epoch": 0.26, "learning_rate": 8.374754385832137e-05, "loss": 2.387, "step": 31030 }, { "epoch": 0.26, "learning_rate": 8.374259406466954e-05, "loss": 2.2924, "step": 31035 }, { "epoch": 0.26, "learning_rate": 8.37376436637107e-05, "loss": 2.3237, "step": 31040 }, { "epoch": 0.26, "learning_rate": 8.373269265553397e-05, "loss": 2.3306, "step": 31045 }, { "epoch": 0.26, "learning_rate": 8.372774104022847e-05, "loss": 2.382, "step": 31050 }, { "epoch": 0.27, "learning_rate": 8.37227888178833e-05, "loss": 2.2594, "step": 31055 }, { "epoch": 0.27, "learning_rate": 8.371783598858758e-05, "loss": 2.3336, "step": 31060 }, { "epoch": 0.27, "learning_rate": 8.371288255243048e-05, "loss": 2.3554, "step": 31065 }, { "epoch": 0.27, "learning_rate": 8.370792850950115e-05, "loss": 2.3063, "step": 31070 }, { "epoch": 0.27, "learning_rate": 8.370297385988875e-05, "loss": 2.2078, "step": 31075 }, { "epoch": 0.27, "learning_rate": 8.369801860368242e-05, "loss": 2.3754, "step": 31080 }, { "epoch": 0.27, "learning_rate": 8.36930627409714e-05, "loss": 2.3166, "step": 31085 }, { "epoch": 0.27, "learning_rate": 8.368810627184486e-05, "loss": 2.3142, "step": 31090 }, { "epoch": 0.27, "learning_rate": 8.368314919639202e-05, "loss": 2.3294, "step": 31095 }, { "epoch": 0.27, "learning_rate": 8.367819151470208e-05, "loss": 2.3243, "step": 31100 }, { "epoch": 0.27, "learning_rate": 8.367323322686426e-05, "loss": 2.349, "step": 31105 }, { "epoch": 0.27, "learning_rate": 8.366827433296787e-05, "loss": 2.3984, "step": 31110 }, { "epoch": 0.27, "learning_rate": 8.366331483310207e-05, "loss": 2.3647, "step": 31115 }, { "epoch": 0.27, "learning_rate": 8.365835472735616e-05, "loss": 2.3279, "step": 31120 }, { "epoch": 0.27, "learning_rate": 8.365339401581944e-05, "loss": 2.2666, "step": 31125 }, { "epoch": 0.27, "learning_rate": 8.364843269858117e-05, "loss": 2.2697, "step": 31130 }, { "epoch": 0.27, "learning_rate": 8.364347077573063e-05, "loss": 2.243, "step": 31135 }, { "epoch": 0.27, "learning_rate": 8.363850824735715e-05, "loss": 2.2888, "step": 31140 }, { "epoch": 0.27, "learning_rate": 8.363354511355003e-05, "loss": 2.3381, "step": 31145 }, { "epoch": 0.27, "learning_rate": 8.362858137439862e-05, "loss": 2.3129, "step": 31150 }, { "epoch": 0.27, "learning_rate": 8.362361702999224e-05, "loss": 2.3658, "step": 31155 }, { "epoch": 0.27, "learning_rate": 8.361865208042023e-05, "loss": 2.3442, "step": 31160 }, { "epoch": 0.27, "learning_rate": 8.361368652577198e-05, "loss": 2.3485, "step": 31165 }, { "epoch": 0.27, "learning_rate": 8.360872036613683e-05, "loss": 2.3333, "step": 31170 }, { "epoch": 0.27, "learning_rate": 8.36037536016042e-05, "loss": 2.2917, "step": 31175 }, { "epoch": 0.27, "learning_rate": 8.359878623226345e-05, "loss": 2.3823, "step": 31180 }, { "epoch": 0.27, "learning_rate": 8.359381825820398e-05, "loss": 2.3342, "step": 31185 }, { "epoch": 0.27, "learning_rate": 8.358884967951522e-05, "loss": 2.3095, "step": 31190 }, { "epoch": 0.27, "learning_rate": 8.35838804962866e-05, "loss": 2.2929, "step": 31195 }, { "epoch": 0.27, "learning_rate": 8.357891070860757e-05, "loss": 2.3518, "step": 31200 }, { "epoch": 0.27, "learning_rate": 8.357394031656754e-05, "loss": 2.4324, "step": 31205 }, { "epoch": 0.27, "learning_rate": 8.356896932025598e-05, "loss": 2.2873, "step": 31210 }, { "epoch": 0.27, "learning_rate": 8.356399771976237e-05, "loss": 2.3662, "step": 31215 }, { "epoch": 0.27, "learning_rate": 8.35590255151762e-05, "loss": 2.3214, "step": 31220 }, { "epoch": 0.27, "learning_rate": 8.355405270658695e-05, "loss": 2.2873, "step": 31225 }, { "epoch": 0.27, "learning_rate": 8.354907929408408e-05, "loss": 2.3513, "step": 31230 }, { "epoch": 0.27, "learning_rate": 8.354410527775716e-05, "loss": 2.2963, "step": 31235 }, { "epoch": 0.27, "learning_rate": 8.353913065769571e-05, "loss": 2.4014, "step": 31240 }, { "epoch": 0.27, "learning_rate": 8.353415543398924e-05, "loss": 2.3015, "step": 31245 }, { "epoch": 0.27, "learning_rate": 8.35291796067273e-05, "loss": 2.3503, "step": 31250 }, { "epoch": 0.27, "learning_rate": 8.352420317599944e-05, "loss": 2.3976, "step": 31255 }, { "epoch": 0.27, "learning_rate": 8.351922614189526e-05, "loss": 2.349, "step": 31260 }, { "epoch": 0.27, "learning_rate": 8.35142485045043e-05, "loss": 2.2742, "step": 31265 }, { "epoch": 0.27, "learning_rate": 8.350927026391618e-05, "loss": 2.4846, "step": 31270 }, { "epoch": 0.27, "learning_rate": 8.350429142022045e-05, "loss": 2.3783, "step": 31275 }, { "epoch": 0.27, "learning_rate": 8.349931197350678e-05, "loss": 2.3316, "step": 31280 }, { "epoch": 0.27, "learning_rate": 8.349433192386476e-05, "loss": 2.3687, "step": 31285 }, { "epoch": 0.27, "learning_rate": 8.348935127138402e-05, "loss": 2.2813, "step": 31290 }, { "epoch": 0.27, "learning_rate": 8.348437001615421e-05, "loss": 2.3456, "step": 31295 }, { "epoch": 0.27, "learning_rate": 8.347938815826499e-05, "loss": 2.4024, "step": 31300 }, { "epoch": 0.27, "learning_rate": 8.347440569780602e-05, "loss": 2.3036, "step": 31305 }, { "epoch": 0.27, "learning_rate": 8.346942263486697e-05, "loss": 2.376, "step": 31310 }, { "epoch": 0.27, "learning_rate": 8.346443896953753e-05, "loss": 2.3997, "step": 31315 }, { "epoch": 0.27, "learning_rate": 8.34594547019074e-05, "loss": 2.3251, "step": 31320 }, { "epoch": 0.27, "learning_rate": 8.345446983206627e-05, "loss": 2.3139, "step": 31325 }, { "epoch": 0.27, "learning_rate": 8.344948436010388e-05, "loss": 2.3957, "step": 31330 }, { "epoch": 0.27, "learning_rate": 8.344449828610996e-05, "loss": 2.3042, "step": 31335 }, { "epoch": 0.27, "learning_rate": 8.343951161017424e-05, "loss": 2.369, "step": 31340 }, { "epoch": 0.27, "learning_rate": 8.343452433238647e-05, "loss": 2.3503, "step": 31345 }, { "epoch": 0.27, "learning_rate": 8.342953645283643e-05, "loss": 2.3064, "step": 31350 }, { "epoch": 0.27, "learning_rate": 8.342454797161388e-05, "loss": 2.3072, "step": 31355 }, { "epoch": 0.27, "learning_rate": 8.34195588888086e-05, "loss": 2.3715, "step": 31360 }, { "epoch": 0.27, "learning_rate": 8.341456920451039e-05, "loss": 2.3817, "step": 31365 }, { "epoch": 0.27, "learning_rate": 8.340957891880905e-05, "loss": 2.3017, "step": 31370 }, { "epoch": 0.27, "learning_rate": 8.34045880317944e-05, "loss": 2.3322, "step": 31375 }, { "epoch": 0.27, "learning_rate": 8.339959654355628e-05, "loss": 2.3561, "step": 31380 }, { "epoch": 0.27, "learning_rate": 8.33946044541845e-05, "loss": 2.2589, "step": 31385 }, { "epoch": 0.27, "learning_rate": 8.338961176376894e-05, "loss": 2.3054, "step": 31390 }, { "epoch": 0.27, "learning_rate": 8.338461847239942e-05, "loss": 2.2822, "step": 31395 }, { "epoch": 0.27, "learning_rate": 8.337962458016586e-05, "loss": 2.2962, "step": 31400 }, { "epoch": 0.27, "learning_rate": 8.337463008715811e-05, "loss": 2.3743, "step": 31405 }, { "epoch": 0.27, "learning_rate": 8.336963499346606e-05, "loss": 2.3716, "step": 31410 }, { "epoch": 0.27, "learning_rate": 8.336463929917963e-05, "loss": 2.29, "step": 31415 }, { "epoch": 0.27, "learning_rate": 8.335964300438872e-05, "loss": 2.4136, "step": 31420 }, { "epoch": 0.27, "learning_rate": 8.335464610918326e-05, "loss": 2.3241, "step": 31425 }, { "epoch": 0.27, "learning_rate": 8.334964861365317e-05, "loss": 2.3123, "step": 31430 }, { "epoch": 0.27, "learning_rate": 8.334465051788844e-05, "loss": 2.3552, "step": 31435 }, { "epoch": 0.27, "learning_rate": 8.333965182197898e-05, "loss": 2.2925, "step": 31440 }, { "epoch": 0.27, "learning_rate": 8.333465252601476e-05, "loss": 2.349, "step": 31445 }, { "epoch": 0.27, "learning_rate": 8.332965263008578e-05, "loss": 2.3662, "step": 31450 }, { "epoch": 0.27, "learning_rate": 8.332465213428204e-05, "loss": 2.3922, "step": 31455 }, { "epoch": 0.27, "learning_rate": 8.331965103869353e-05, "loss": 2.3853, "step": 31460 }, { "epoch": 0.27, "learning_rate": 8.331464934341023e-05, "loss": 2.3165, "step": 31465 }, { "epoch": 0.27, "learning_rate": 8.33096470485222e-05, "loss": 2.344, "step": 31470 }, { "epoch": 0.27, "learning_rate": 8.330464415411945e-05, "loss": 2.3355, "step": 31475 }, { "epoch": 0.27, "learning_rate": 8.329964066029202e-05, "loss": 2.3378, "step": 31480 }, { "epoch": 0.27, "learning_rate": 8.329463656712999e-05, "loss": 2.2729, "step": 31485 }, { "epoch": 0.27, "learning_rate": 8.328963187472341e-05, "loss": 2.3223, "step": 31490 }, { "epoch": 0.27, "learning_rate": 8.328462658316233e-05, "loss": 2.363, "step": 31495 }, { "epoch": 0.27, "learning_rate": 8.327962069253689e-05, "loss": 2.3273, "step": 31500 }, { "epoch": 0.27, "learning_rate": 8.327461420293716e-05, "loss": 2.363, "step": 31505 }, { "epoch": 0.27, "learning_rate": 8.326960711445324e-05, "loss": 2.3444, "step": 31510 }, { "epoch": 0.27, "learning_rate": 8.326459942717526e-05, "loss": 2.321, "step": 31515 }, { "epoch": 0.27, "learning_rate": 8.325959114119332e-05, "loss": 2.2008, "step": 31520 }, { "epoch": 0.27, "learning_rate": 8.325458225659762e-05, "loss": 2.3365, "step": 31525 }, { "epoch": 0.27, "learning_rate": 8.324957277347827e-05, "loss": 2.3597, "step": 31530 }, { "epoch": 0.27, "learning_rate": 8.324456269192542e-05, "loss": 2.3125, "step": 31535 }, { "epoch": 0.27, "learning_rate": 8.323955201202927e-05, "loss": 2.282, "step": 31540 }, { "epoch": 0.27, "learning_rate": 8.323454073387999e-05, "loss": 2.3508, "step": 31545 }, { "epoch": 0.27, "learning_rate": 8.322952885756779e-05, "loss": 2.3851, "step": 31550 }, { "epoch": 0.27, "learning_rate": 8.322451638318285e-05, "loss": 2.3956, "step": 31555 }, { "epoch": 0.27, "learning_rate": 8.32195033108154e-05, "loss": 2.3162, "step": 31560 }, { "epoch": 0.27, "learning_rate": 8.321448964055569e-05, "loss": 2.3179, "step": 31565 }, { "epoch": 0.27, "learning_rate": 8.32094753724939e-05, "loss": 2.3193, "step": 31570 }, { "epoch": 0.27, "learning_rate": 8.320446050672033e-05, "loss": 2.297, "step": 31575 }, { "epoch": 0.27, "learning_rate": 8.319944504332522e-05, "loss": 2.3707, "step": 31580 }, { "epoch": 0.27, "learning_rate": 8.319442898239881e-05, "loss": 2.3365, "step": 31585 }, { "epoch": 0.27, "learning_rate": 8.318941232403145e-05, "loss": 2.3535, "step": 31590 }, { "epoch": 0.27, "learning_rate": 8.318439506831337e-05, "loss": 2.314, "step": 31595 }, { "epoch": 0.27, "learning_rate": 8.317937721533488e-05, "loss": 2.266, "step": 31600 }, { "epoch": 0.27, "learning_rate": 8.317435876518633e-05, "loss": 2.3985, "step": 31605 }, { "epoch": 0.27, "learning_rate": 8.316933971795799e-05, "loss": 2.335, "step": 31610 }, { "epoch": 0.27, "learning_rate": 8.316432007374024e-05, "loss": 2.3697, "step": 31615 }, { "epoch": 0.27, "learning_rate": 8.31592998326234e-05, "loss": 2.308, "step": 31620 }, { "epoch": 0.27, "learning_rate": 8.315427899469784e-05, "loss": 2.2738, "step": 31625 }, { "epoch": 0.27, "learning_rate": 8.314925756005392e-05, "loss": 2.3866, "step": 31630 }, { "epoch": 0.27, "learning_rate": 8.314423552878201e-05, "loss": 2.2987, "step": 31635 }, { "epoch": 0.27, "learning_rate": 8.313921290097249e-05, "loss": 2.3324, "step": 31640 }, { "epoch": 0.27, "learning_rate": 8.313418967671577e-05, "loss": 2.3822, "step": 31645 }, { "epoch": 0.27, "learning_rate": 8.312916585610227e-05, "loss": 2.316, "step": 31650 }, { "epoch": 0.27, "learning_rate": 8.312414143922241e-05, "loss": 2.3096, "step": 31655 }, { "epoch": 0.27, "learning_rate": 8.311911642616659e-05, "loss": 2.3322, "step": 31660 }, { "epoch": 0.27, "learning_rate": 8.311409081702528e-05, "loss": 2.2854, "step": 31665 }, { "epoch": 0.27, "learning_rate": 8.310906461188893e-05, "loss": 2.361, "step": 31670 }, { "epoch": 0.27, "learning_rate": 8.3104037810848e-05, "loss": 2.3337, "step": 31675 }, { "epoch": 0.27, "learning_rate": 8.309901041399295e-05, "loss": 2.3508, "step": 31680 }, { "epoch": 0.27, "learning_rate": 8.309398242141428e-05, "loss": 2.3691, "step": 31685 }, { "epoch": 0.27, "learning_rate": 8.308895383320247e-05, "loss": 2.3101, "step": 31690 }, { "epoch": 0.27, "learning_rate": 8.308392464944804e-05, "loss": 2.4028, "step": 31695 }, { "epoch": 0.27, "learning_rate": 8.30788948702415e-05, "loss": 2.2364, "step": 31700 }, { "epoch": 0.27, "learning_rate": 8.307386449567338e-05, "loss": 2.2977, "step": 31705 }, { "epoch": 0.27, "learning_rate": 8.306883352583421e-05, "loss": 2.3015, "step": 31710 }, { "epoch": 0.27, "learning_rate": 8.306380196081456e-05, "loss": 2.3018, "step": 31715 }, { "epoch": 0.27, "learning_rate": 8.305876980070497e-05, "loss": 2.2947, "step": 31720 }, { "epoch": 0.27, "learning_rate": 8.3053737045596e-05, "loss": 2.3456, "step": 31725 }, { "epoch": 0.27, "learning_rate": 8.304870369557827e-05, "loss": 2.3026, "step": 31730 }, { "epoch": 0.27, "learning_rate": 8.304366975074233e-05, "loss": 2.3574, "step": 31735 }, { "epoch": 0.27, "learning_rate": 8.30386352111788e-05, "loss": 2.3954, "step": 31740 }, { "epoch": 0.27, "learning_rate": 8.303360007697829e-05, "loss": 2.2419, "step": 31745 }, { "epoch": 0.27, "learning_rate": 8.302856434823141e-05, "loss": 2.3028, "step": 31750 }, { "epoch": 0.27, "learning_rate": 8.302352802502883e-05, "loss": 2.3425, "step": 31755 }, { "epoch": 0.27, "learning_rate": 8.301849110746117e-05, "loss": 2.343, "step": 31760 }, { "epoch": 0.27, "learning_rate": 8.30134535956191e-05, "loss": 2.3959, "step": 31765 }, { "epoch": 0.27, "learning_rate": 8.300841548959327e-05, "loss": 2.3538, "step": 31770 }, { "epoch": 0.27, "learning_rate": 8.300337678947434e-05, "loss": 2.3147, "step": 31775 }, { "epoch": 0.27, "learning_rate": 8.299833749535304e-05, "loss": 2.3719, "step": 31780 }, { "epoch": 0.27, "learning_rate": 8.299329760732004e-05, "loss": 2.2839, "step": 31785 }, { "epoch": 0.27, "learning_rate": 8.298825712546607e-05, "loss": 2.3289, "step": 31790 }, { "epoch": 0.27, "learning_rate": 8.298321604988184e-05, "loss": 2.3021, "step": 31795 }, { "epoch": 0.27, "learning_rate": 8.297817438065806e-05, "loss": 2.3604, "step": 31800 }, { "epoch": 0.27, "learning_rate": 8.297313211788549e-05, "loss": 2.2541, "step": 31805 }, { "epoch": 0.27, "learning_rate": 8.29680892616549e-05, "loss": 2.3359, "step": 31810 }, { "epoch": 0.27, "learning_rate": 8.296304581205703e-05, "loss": 2.3098, "step": 31815 }, { "epoch": 0.27, "learning_rate": 8.295800176918265e-05, "loss": 2.3591, "step": 31820 }, { "epoch": 0.27, "learning_rate": 8.295295713312254e-05, "loss": 2.3232, "step": 31825 }, { "epoch": 0.27, "learning_rate": 8.294791190396752e-05, "loss": 2.3474, "step": 31830 }, { "epoch": 0.27, "learning_rate": 8.294286608180837e-05, "loss": 2.3386, "step": 31835 }, { "epoch": 0.27, "learning_rate": 8.293781966673593e-05, "loss": 2.394, "step": 31840 }, { "epoch": 0.27, "learning_rate": 8.293277265884101e-05, "loss": 2.2778, "step": 31845 }, { "epoch": 0.27, "learning_rate": 8.292772505821445e-05, "loss": 2.3753, "step": 31850 }, { "epoch": 0.27, "learning_rate": 8.292267686494708e-05, "loss": 2.3431, "step": 31855 }, { "epoch": 0.27, "learning_rate": 8.291762807912978e-05, "loss": 2.3435, "step": 31860 }, { "epoch": 0.27, "learning_rate": 8.291257870085343e-05, "loss": 2.311, "step": 31865 }, { "epoch": 0.27, "learning_rate": 8.290752873020888e-05, "loss": 2.3658, "step": 31870 }, { "epoch": 0.27, "learning_rate": 8.290247816728704e-05, "loss": 2.2834, "step": 31875 }, { "epoch": 0.27, "learning_rate": 8.289742701217882e-05, "loss": 2.2769, "step": 31880 }, { "epoch": 0.27, "learning_rate": 8.289237526497512e-05, "loss": 2.3371, "step": 31885 }, { "epoch": 0.27, "learning_rate": 8.288732292576685e-05, "loss": 2.3832, "step": 31890 }, { "epoch": 0.27, "learning_rate": 8.288226999464495e-05, "loss": 2.2395, "step": 31895 }, { "epoch": 0.27, "learning_rate": 8.287721647170039e-05, "loss": 2.1795, "step": 31900 }, { "epoch": 0.27, "learning_rate": 8.287216235702408e-05, "loss": 2.3925, "step": 31905 }, { "epoch": 0.27, "learning_rate": 8.286710765070702e-05, "loss": 2.3751, "step": 31910 }, { "epoch": 0.27, "learning_rate": 8.286205235284017e-05, "loss": 2.3865, "step": 31915 }, { "epoch": 0.27, "learning_rate": 8.285699646351452e-05, "loss": 2.3991, "step": 31920 }, { "epoch": 0.27, "learning_rate": 8.285193998282107e-05, "loss": 2.33, "step": 31925 }, { "epoch": 0.27, "learning_rate": 8.284688291085082e-05, "loss": 2.433, "step": 31930 }, { "epoch": 0.27, "learning_rate": 8.284182524769481e-05, "loss": 2.2575, "step": 31935 }, { "epoch": 0.27, "learning_rate": 8.283676699344402e-05, "loss": 2.3185, "step": 31940 }, { "epoch": 0.27, "learning_rate": 8.283170814818955e-05, "loss": 2.2889, "step": 31945 }, { "epoch": 0.27, "learning_rate": 8.282664871202241e-05, "loss": 2.3999, "step": 31950 }, { "epoch": 0.27, "learning_rate": 8.282158868503367e-05, "loss": 2.2795, "step": 31955 }, { "epoch": 0.27, "learning_rate": 8.281652806731442e-05, "loss": 2.3582, "step": 31960 }, { "epoch": 0.27, "learning_rate": 8.281146685895571e-05, "loss": 2.3314, "step": 31965 }, { "epoch": 0.27, "learning_rate": 8.280640506004866e-05, "loss": 2.3953, "step": 31970 }, { "epoch": 0.27, "learning_rate": 8.280134267068437e-05, "loss": 2.2969, "step": 31975 }, { "epoch": 0.27, "learning_rate": 8.279627969095393e-05, "loss": 2.3464, "step": 31980 }, { "epoch": 0.27, "learning_rate": 8.279121612094849e-05, "loss": 2.3331, "step": 31985 }, { "epoch": 0.27, "learning_rate": 8.278615196075918e-05, "loss": 2.3643, "step": 31990 }, { "epoch": 0.27, "learning_rate": 8.278108721047715e-05, "loss": 2.3278, "step": 31995 }, { "epoch": 0.27, "learning_rate": 8.277602187019353e-05, "loss": 2.2975, "step": 32000 }, { "epoch": 0.27, "learning_rate": 8.277095593999953e-05, "loss": 2.2636, "step": 32005 }, { "epoch": 0.27, "learning_rate": 8.276588941998627e-05, "loss": 2.3793, "step": 32010 }, { "epoch": 0.27, "learning_rate": 8.2760822310245e-05, "loss": 2.4385, "step": 32015 }, { "epoch": 0.27, "learning_rate": 8.275575461086689e-05, "loss": 2.3258, "step": 32020 }, { "epoch": 0.27, "learning_rate": 8.275068632194314e-05, "loss": 2.3592, "step": 32025 }, { "epoch": 0.27, "learning_rate": 8.2745617443565e-05, "loss": 2.3384, "step": 32030 }, { "epoch": 0.27, "learning_rate": 8.274054797582366e-05, "loss": 2.3858, "step": 32035 }, { "epoch": 0.27, "learning_rate": 8.27354779188104e-05, "loss": 2.3521, "step": 32040 }, { "epoch": 0.27, "learning_rate": 8.273040727261645e-05, "loss": 2.3684, "step": 32045 }, { "epoch": 0.27, "learning_rate": 8.272533603733308e-05, "loss": 2.3141, "step": 32050 }, { "epoch": 0.27, "learning_rate": 8.272026421305156e-05, "loss": 2.3505, "step": 32055 }, { "epoch": 0.27, "learning_rate": 8.271519179986318e-05, "loss": 2.2883, "step": 32060 }, { "epoch": 0.27, "learning_rate": 8.271011879785923e-05, "loss": 2.2415, "step": 32065 }, { "epoch": 0.27, "learning_rate": 8.270504520713101e-05, "loss": 2.3251, "step": 32070 }, { "epoch": 0.27, "learning_rate": 8.269997102776984e-05, "loss": 2.3785, "step": 32075 }, { "epoch": 0.27, "learning_rate": 8.269489625986705e-05, "loss": 2.2934, "step": 32080 }, { "epoch": 0.27, "learning_rate": 8.268982090351398e-05, "loss": 2.2775, "step": 32085 }, { "epoch": 0.27, "learning_rate": 8.268474495880197e-05, "loss": 2.3319, "step": 32090 }, { "epoch": 0.27, "learning_rate": 8.267966842582238e-05, "loss": 2.273, "step": 32095 }, { "epoch": 0.27, "learning_rate": 8.267459130466657e-05, "loss": 2.3333, "step": 32100 }, { "epoch": 0.27, "learning_rate": 8.266951359542594e-05, "loss": 2.3246, "step": 32105 }, { "epoch": 0.27, "learning_rate": 8.266443529819185e-05, "loss": 2.271, "step": 32110 }, { "epoch": 0.27, "learning_rate": 8.265935641305574e-05, "loss": 2.3494, "step": 32115 }, { "epoch": 0.27, "learning_rate": 8.265427694010899e-05, "loss": 2.299, "step": 32120 }, { "epoch": 0.27, "learning_rate": 8.264919687944302e-05, "loss": 2.2466, "step": 32125 }, { "epoch": 0.27, "learning_rate": 8.264411623114927e-05, "loss": 2.2666, "step": 32130 }, { "epoch": 0.27, "learning_rate": 8.26390349953192e-05, "loss": 2.297, "step": 32135 }, { "epoch": 0.27, "learning_rate": 8.263395317204426e-05, "loss": 2.342, "step": 32140 }, { "epoch": 0.27, "learning_rate": 8.262887076141588e-05, "loss": 2.3237, "step": 32145 }, { "epoch": 0.27, "learning_rate": 8.262378776352555e-05, "loss": 2.3365, "step": 32150 }, { "epoch": 0.27, "learning_rate": 8.261870417846478e-05, "loss": 2.2986, "step": 32155 }, { "epoch": 0.27, "learning_rate": 8.261362000632502e-05, "loss": 2.3428, "step": 32160 }, { "epoch": 0.27, "learning_rate": 8.260853524719782e-05, "loss": 2.2977, "step": 32165 }, { "epoch": 0.27, "learning_rate": 8.260344990117469e-05, "loss": 2.372, "step": 32170 }, { "epoch": 0.27, "learning_rate": 8.259836396834714e-05, "loss": 2.3844, "step": 32175 }, { "epoch": 0.27, "learning_rate": 8.259327744880671e-05, "loss": 2.2788, "step": 32180 }, { "epoch": 0.27, "learning_rate": 8.258819034264496e-05, "loss": 2.2753, "step": 32185 }, { "epoch": 0.27, "learning_rate": 8.258310264995343e-05, "loss": 2.2606, "step": 32190 }, { "epoch": 0.27, "learning_rate": 8.257801437082371e-05, "loss": 2.3592, "step": 32195 }, { "epoch": 0.27, "learning_rate": 8.257292550534738e-05, "loss": 2.3304, "step": 32200 }, { "epoch": 0.27, "learning_rate": 8.256783605361601e-05, "loss": 2.2988, "step": 32205 }, { "epoch": 0.27, "learning_rate": 8.256274601572122e-05, "loss": 2.3175, "step": 32210 }, { "epoch": 0.27, "learning_rate": 8.25576553917546e-05, "loss": 2.3151, "step": 32215 }, { "epoch": 0.27, "learning_rate": 8.255256418180779e-05, "loss": 2.3493, "step": 32220 }, { "epoch": 0.27, "learning_rate": 8.254747238597243e-05, "loss": 2.4282, "step": 32225 }, { "epoch": 0.28, "learning_rate": 8.254238000434015e-05, "loss": 2.3328, "step": 32230 }, { "epoch": 0.28, "learning_rate": 8.25372870370026e-05, "loss": 2.2933, "step": 32235 }, { "epoch": 0.28, "learning_rate": 8.253219348405147e-05, "loss": 2.3247, "step": 32240 }, { "epoch": 0.28, "learning_rate": 8.252709934557841e-05, "loss": 2.3254, "step": 32245 }, { "epoch": 0.28, "learning_rate": 8.252200462167509e-05, "loss": 2.4149, "step": 32250 }, { "epoch": 0.28, "learning_rate": 8.251690931243326e-05, "loss": 2.2699, "step": 32255 }, { "epoch": 0.28, "learning_rate": 8.251181341794457e-05, "loss": 2.3843, "step": 32260 }, { "epoch": 0.28, "learning_rate": 8.250671693830077e-05, "loss": 2.3052, "step": 32265 }, { "epoch": 0.28, "learning_rate": 8.250161987359358e-05, "loss": 2.3631, "step": 32270 }, { "epoch": 0.28, "learning_rate": 8.249652222391472e-05, "loss": 2.3231, "step": 32275 }, { "epoch": 0.28, "learning_rate": 8.249142398935599e-05, "loss": 2.4161, "step": 32280 }, { "epoch": 0.28, "learning_rate": 8.248632517000909e-05, "loss": 2.4262, "step": 32285 }, { "epoch": 0.28, "learning_rate": 8.248122576596582e-05, "loss": 2.2747, "step": 32290 }, { "epoch": 0.28, "learning_rate": 8.247612577731796e-05, "loss": 2.2404, "step": 32295 }, { "epoch": 0.28, "learning_rate": 8.247102520415729e-05, "loss": 2.2983, "step": 32300 }, { "epoch": 0.28, "learning_rate": 8.246592404657562e-05, "loss": 2.3047, "step": 32305 }, { "epoch": 0.28, "learning_rate": 8.246082230466477e-05, "loss": 2.3016, "step": 32310 }, { "epoch": 0.28, "learning_rate": 8.245571997851653e-05, "loss": 2.331, "step": 32315 }, { "epoch": 0.28, "learning_rate": 8.245061706822276e-05, "loss": 2.3728, "step": 32320 }, { "epoch": 0.28, "learning_rate": 8.244551357387528e-05, "loss": 2.3115, "step": 32325 }, { "epoch": 0.28, "learning_rate": 8.2440409495566e-05, "loss": 2.331, "step": 32330 }, { "epoch": 0.28, "learning_rate": 8.243530483338673e-05, "loss": 2.2305, "step": 32335 }, { "epoch": 0.28, "learning_rate": 8.243019958742936e-05, "loss": 2.3319, "step": 32340 }, { "epoch": 0.28, "learning_rate": 8.242509375778578e-05, "loss": 2.3026, "step": 32345 }, { "epoch": 0.28, "learning_rate": 8.241998734454786e-05, "loss": 2.2829, "step": 32350 }, { "epoch": 0.28, "learning_rate": 8.241488034780755e-05, "loss": 2.3688, "step": 32355 }, { "epoch": 0.28, "learning_rate": 8.240977276765674e-05, "loss": 2.306, "step": 32360 }, { "epoch": 0.28, "learning_rate": 8.240466460418736e-05, "loss": 2.3404, "step": 32365 }, { "epoch": 0.28, "learning_rate": 8.239955585749135e-05, "loss": 2.3747, "step": 32370 }, { "epoch": 0.28, "learning_rate": 8.239444652766066e-05, "loss": 2.3097, "step": 32375 }, { "epoch": 0.28, "learning_rate": 8.238933661478725e-05, "loss": 2.291, "step": 32380 }, { "epoch": 0.28, "learning_rate": 8.238422611896309e-05, "loss": 2.3133, "step": 32385 }, { "epoch": 0.28, "learning_rate": 8.237911504028015e-05, "loss": 2.3464, "step": 32390 }, { "epoch": 0.28, "learning_rate": 8.237400337883044e-05, "loss": 2.3102, "step": 32395 }, { "epoch": 0.28, "learning_rate": 8.236889113470594e-05, "loss": 2.3318, "step": 32400 }, { "epoch": 0.28, "learning_rate": 8.236377830799867e-05, "loss": 2.3167, "step": 32405 }, { "epoch": 0.28, "learning_rate": 8.235866489880064e-05, "loss": 2.3652, "step": 32410 }, { "epoch": 0.28, "learning_rate": 8.235355090720392e-05, "loss": 2.3303, "step": 32415 }, { "epoch": 0.28, "learning_rate": 8.23484363333005e-05, "loss": 2.3323, "step": 32420 }, { "epoch": 0.28, "learning_rate": 8.234332117718246e-05, "loss": 2.3493, "step": 32425 }, { "epoch": 0.28, "learning_rate": 8.233820543894188e-05, "loss": 2.3528, "step": 32430 }, { "epoch": 0.28, "learning_rate": 8.233308911867082e-05, "loss": 2.2832, "step": 32435 }, { "epoch": 0.28, "learning_rate": 8.232797221646135e-05, "loss": 2.2644, "step": 32440 }, { "epoch": 0.28, "learning_rate": 8.232285473240557e-05, "loss": 2.2695, "step": 32445 }, { "epoch": 0.28, "learning_rate": 8.231773666659561e-05, "loss": 2.3019, "step": 32450 }, { "epoch": 0.28, "learning_rate": 8.231261801912358e-05, "loss": 2.3888, "step": 32455 }, { "epoch": 0.28, "learning_rate": 8.230749879008157e-05, "loss": 2.3426, "step": 32460 }, { "epoch": 0.28, "learning_rate": 8.230237897956176e-05, "loss": 2.3524, "step": 32465 }, { "epoch": 0.28, "learning_rate": 8.229725858765627e-05, "loss": 2.3116, "step": 32470 }, { "epoch": 0.28, "learning_rate": 8.229213761445727e-05, "loss": 2.3138, "step": 32475 }, { "epoch": 0.28, "learning_rate": 8.228701606005694e-05, "loss": 2.261, "step": 32480 }, { "epoch": 0.28, "learning_rate": 8.228189392454744e-05, "loss": 2.316, "step": 32485 }, { "epoch": 0.28, "learning_rate": 8.227677120802096e-05, "loss": 2.3649, "step": 32490 }, { "epoch": 0.28, "learning_rate": 8.22716479105697e-05, "loss": 2.301, "step": 32495 }, { "epoch": 0.28, "learning_rate": 8.226652403228588e-05, "loss": 2.3284, "step": 32500 }, { "epoch": 0.28, "learning_rate": 8.226139957326173e-05, "loss": 2.3939, "step": 32505 }, { "epoch": 0.28, "learning_rate": 8.225627453358946e-05, "loss": 2.2979, "step": 32510 }, { "epoch": 0.28, "learning_rate": 8.225114891336132e-05, "loss": 2.2684, "step": 32515 }, { "epoch": 0.28, "learning_rate": 8.224602271266955e-05, "loss": 2.3794, "step": 32520 }, { "epoch": 0.28, "learning_rate": 8.224089593160642e-05, "loss": 2.2391, "step": 32525 }, { "epoch": 0.28, "learning_rate": 8.223576857026422e-05, "loss": 2.333, "step": 32530 }, { "epoch": 0.28, "learning_rate": 8.223064062873522e-05, "loss": 2.2842, "step": 32535 }, { "epoch": 0.28, "learning_rate": 8.222551210711171e-05, "loss": 2.3191, "step": 32540 }, { "epoch": 0.28, "learning_rate": 8.222038300548602e-05, "loss": 2.4705, "step": 32545 }, { "epoch": 0.28, "learning_rate": 8.221525332395041e-05, "loss": 2.2927, "step": 32550 }, { "epoch": 0.28, "learning_rate": 8.221012306259725e-05, "loss": 2.3542, "step": 32555 }, { "epoch": 0.28, "learning_rate": 8.220499222151887e-05, "loss": 2.3391, "step": 32560 }, { "epoch": 0.28, "learning_rate": 8.219986080080762e-05, "loss": 2.3248, "step": 32565 }, { "epoch": 0.28, "learning_rate": 8.219472880055583e-05, "loss": 2.2817, "step": 32570 }, { "epoch": 0.28, "learning_rate": 8.218959622085588e-05, "loss": 2.3584, "step": 32575 }, { "epoch": 0.28, "learning_rate": 8.218446306180017e-05, "loss": 2.3645, "step": 32580 }, { "epoch": 0.28, "learning_rate": 8.217932932348104e-05, "loss": 2.332, "step": 32585 }, { "epoch": 0.28, "learning_rate": 8.217419500599095e-05, "loss": 2.2745, "step": 32590 }, { "epoch": 0.28, "learning_rate": 8.216906010942225e-05, "loss": 2.3508, "step": 32595 }, { "epoch": 0.28, "learning_rate": 8.216392463386739e-05, "loss": 2.35, "step": 32600 }, { "epoch": 0.28, "learning_rate": 8.215878857941881e-05, "loss": 2.3234, "step": 32605 }, { "epoch": 0.28, "learning_rate": 8.215365194616892e-05, "loss": 2.2898, "step": 32610 }, { "epoch": 0.28, "learning_rate": 8.21485147342102e-05, "loss": 2.3477, "step": 32615 }, { "epoch": 0.28, "learning_rate": 8.214337694363507e-05, "loss": 2.355, "step": 32620 }, { "epoch": 0.28, "learning_rate": 8.213823857453601e-05, "loss": 2.3697, "step": 32625 }, { "epoch": 0.28, "learning_rate": 8.213309962700556e-05, "loss": 2.333, "step": 32630 }, { "epoch": 0.28, "learning_rate": 8.212796010113615e-05, "loss": 2.3661, "step": 32635 }, { "epoch": 0.28, "learning_rate": 8.212281999702031e-05, "loss": 2.27, "step": 32640 }, { "epoch": 0.28, "learning_rate": 8.211767931475054e-05, "loss": 2.4112, "step": 32645 }, { "epoch": 0.28, "learning_rate": 8.211253805441937e-05, "loss": 2.2905, "step": 32650 }, { "epoch": 0.28, "learning_rate": 8.210739621611934e-05, "loss": 2.3067, "step": 32655 }, { "epoch": 0.28, "learning_rate": 8.210225379994296e-05, "loss": 2.2526, "step": 32660 }, { "epoch": 0.28, "learning_rate": 8.209711080598283e-05, "loss": 2.4097, "step": 32665 }, { "epoch": 0.28, "learning_rate": 8.20919672343315e-05, "loss": 2.2771, "step": 32670 }, { "epoch": 0.28, "learning_rate": 8.208682308508151e-05, "loss": 2.3069, "step": 32675 }, { "epoch": 0.28, "learning_rate": 8.208167835832551e-05, "loss": 2.2681, "step": 32680 }, { "epoch": 0.28, "learning_rate": 8.207653305415604e-05, "loss": 2.3402, "step": 32685 }, { "epoch": 0.28, "learning_rate": 8.207138717266573e-05, "loss": 2.2728, "step": 32690 }, { "epoch": 0.28, "learning_rate": 8.206624071394721e-05, "loss": 2.3288, "step": 32695 }, { "epoch": 0.28, "learning_rate": 8.206109367809309e-05, "loss": 2.3074, "step": 32700 }, { "epoch": 0.28, "learning_rate": 8.205594606519599e-05, "loss": 2.3205, "step": 32705 }, { "epoch": 0.28, "learning_rate": 8.20507978753486e-05, "loss": 2.3221, "step": 32710 }, { "epoch": 0.28, "learning_rate": 8.204564910864354e-05, "loss": 2.293, "step": 32715 }, { "epoch": 0.28, "learning_rate": 8.20404997651735e-05, "loss": 2.3366, "step": 32720 }, { "epoch": 0.28, "learning_rate": 8.203534984503114e-05, "loss": 2.3095, "step": 32725 }, { "epoch": 0.28, "learning_rate": 8.203019934830917e-05, "loss": 2.3605, "step": 32730 }, { "epoch": 0.28, "learning_rate": 8.20250482751003e-05, "loss": 2.4182, "step": 32735 }, { "epoch": 0.28, "learning_rate": 8.20198966254972e-05, "loss": 2.3116, "step": 32740 }, { "epoch": 0.28, "learning_rate": 8.201474439959262e-05, "loss": 2.3337, "step": 32745 }, { "epoch": 0.28, "learning_rate": 8.200959159747929e-05, "loss": 2.3482, "step": 32750 }, { "epoch": 0.28, "learning_rate": 8.200443821924993e-05, "loss": 2.3017, "step": 32755 }, { "epoch": 0.28, "learning_rate": 8.199928426499732e-05, "loss": 2.3404, "step": 32760 }, { "epoch": 0.28, "learning_rate": 8.199412973481422e-05, "loss": 2.3217, "step": 32765 }, { "epoch": 0.28, "learning_rate": 8.198897462879338e-05, "loss": 2.3114, "step": 32770 }, { "epoch": 0.28, "learning_rate": 8.198381894702757e-05, "loss": 2.234, "step": 32775 }, { "epoch": 0.28, "learning_rate": 8.197866268960966e-05, "loss": 2.3448, "step": 32780 }, { "epoch": 0.28, "learning_rate": 8.197350585663236e-05, "loss": 2.3343, "step": 32785 }, { "epoch": 0.28, "learning_rate": 8.196834844818854e-05, "loss": 2.2887, "step": 32790 }, { "epoch": 0.28, "learning_rate": 8.196319046437101e-05, "loss": 2.3045, "step": 32795 }, { "epoch": 0.28, "learning_rate": 8.19580319052726e-05, "loss": 2.3384, "step": 32800 }, { "epoch": 0.28, "learning_rate": 8.195287277098616e-05, "loss": 2.3772, "step": 32805 }, { "epoch": 0.28, "learning_rate": 8.194771306160455e-05, "loss": 2.3562, "step": 32810 }, { "epoch": 0.28, "learning_rate": 8.194255277722063e-05, "loss": 2.3591, "step": 32815 }, { "epoch": 0.28, "learning_rate": 8.193739191792727e-05, "loss": 2.3802, "step": 32820 }, { "epoch": 0.28, "learning_rate": 8.193223048381735e-05, "loss": 2.3931, "step": 32825 }, { "epoch": 0.28, "learning_rate": 8.19270684749838e-05, "loss": 2.3234, "step": 32830 }, { "epoch": 0.28, "learning_rate": 8.192190589151949e-05, "loss": 2.2312, "step": 32835 }, { "epoch": 0.28, "learning_rate": 8.191674273351736e-05, "loss": 2.312, "step": 32840 }, { "epoch": 0.28, "learning_rate": 8.191157900107034e-05, "loss": 2.3625, "step": 32845 }, { "epoch": 0.28, "learning_rate": 8.190641469427134e-05, "loss": 2.3292, "step": 32850 }, { "epoch": 0.28, "learning_rate": 8.190124981321334e-05, "loss": 2.3609, "step": 32855 }, { "epoch": 0.28, "learning_rate": 8.189608435798928e-05, "loss": 2.3323, "step": 32860 }, { "epoch": 0.28, "learning_rate": 8.189091832869213e-05, "loss": 2.2539, "step": 32865 }, { "epoch": 0.28, "learning_rate": 8.18857517254149e-05, "loss": 2.3816, "step": 32870 }, { "epoch": 0.28, "learning_rate": 8.188058454825054e-05, "loss": 2.4222, "step": 32875 }, { "epoch": 0.28, "learning_rate": 8.187541679729204e-05, "loss": 2.3165, "step": 32880 }, { "epoch": 0.28, "learning_rate": 8.187024847263246e-05, "loss": 2.3399, "step": 32885 }, { "epoch": 0.28, "learning_rate": 8.18650795743648e-05, "loss": 2.2722, "step": 32890 }, { "epoch": 0.28, "learning_rate": 8.185991010258207e-05, "loss": 2.4142, "step": 32895 }, { "epoch": 0.28, "learning_rate": 8.185474005737734e-05, "loss": 2.3206, "step": 32900 }, { "epoch": 0.28, "learning_rate": 8.184956943884365e-05, "loss": 2.3442, "step": 32905 }, { "epoch": 0.28, "learning_rate": 8.184439824707406e-05, "loss": 2.3744, "step": 32910 }, { "epoch": 0.28, "learning_rate": 8.183922648216162e-05, "loss": 2.3724, "step": 32915 }, { "epoch": 0.28, "learning_rate": 8.183405414419946e-05, "loss": 2.3214, "step": 32920 }, { "epoch": 0.28, "learning_rate": 8.182888123328065e-05, "loss": 2.3661, "step": 32925 }, { "epoch": 0.28, "learning_rate": 8.182370774949828e-05, "loss": 2.3382, "step": 32930 }, { "epoch": 0.28, "learning_rate": 8.181853369294549e-05, "loss": 2.3616, "step": 32935 }, { "epoch": 0.28, "learning_rate": 8.181335906371538e-05, "loss": 2.4009, "step": 32940 }, { "epoch": 0.28, "learning_rate": 8.18081838619011e-05, "loss": 2.2874, "step": 32945 }, { "epoch": 0.28, "learning_rate": 8.180300808759578e-05, "loss": 2.4009, "step": 32950 }, { "epoch": 0.28, "learning_rate": 8.17978317408926e-05, "loss": 2.2998, "step": 32955 }, { "epoch": 0.28, "learning_rate": 8.17926548218847e-05, "loss": 2.3331, "step": 32960 }, { "epoch": 0.28, "learning_rate": 8.178747733066525e-05, "loss": 2.3109, "step": 32965 }, { "epoch": 0.28, "learning_rate": 8.178229926732746e-05, "loss": 2.2479, "step": 32970 }, { "epoch": 0.28, "learning_rate": 8.177712063196453e-05, "loss": 2.3414, "step": 32975 }, { "epoch": 0.28, "learning_rate": 8.177194142466961e-05, "loss": 2.3224, "step": 32980 }, { "epoch": 0.28, "learning_rate": 8.176676164553599e-05, "loss": 2.2507, "step": 32985 }, { "epoch": 0.28, "learning_rate": 8.176158129465686e-05, "loss": 2.3431, "step": 32990 }, { "epoch": 0.28, "learning_rate": 8.175640037212546e-05, "loss": 2.2807, "step": 32995 }, { "epoch": 0.28, "learning_rate": 8.175121887803505e-05, "loss": 2.2764, "step": 33000 }, { "epoch": 0.28, "learning_rate": 8.174603681247887e-05, "loss": 2.3529, "step": 33005 }, { "epoch": 0.28, "learning_rate": 8.17408541755502e-05, "loss": 2.2943, "step": 33010 }, { "epoch": 0.28, "learning_rate": 8.173567096734232e-05, "loss": 2.3735, "step": 33015 }, { "epoch": 0.28, "learning_rate": 8.173048718794849e-05, "loss": 2.3057, "step": 33020 }, { "epoch": 0.28, "learning_rate": 8.172530283746205e-05, "loss": 2.3282, "step": 33025 }, { "epoch": 0.28, "learning_rate": 8.172011791597628e-05, "loss": 2.423, "step": 33030 }, { "epoch": 0.28, "learning_rate": 8.17149324235845e-05, "loss": 2.2632, "step": 33035 }, { "epoch": 0.28, "learning_rate": 8.170974636038007e-05, "loss": 2.4061, "step": 33040 }, { "epoch": 0.28, "learning_rate": 8.17045597264563e-05, "loss": 2.3554, "step": 33045 }, { "epoch": 0.28, "learning_rate": 8.169937252190654e-05, "loss": 2.3341, "step": 33050 }, { "epoch": 0.28, "learning_rate": 8.169418474682417e-05, "loss": 2.3112, "step": 33055 }, { "epoch": 0.28, "learning_rate": 8.168899640130257e-05, "loss": 2.332, "step": 33060 }, { "epoch": 0.28, "learning_rate": 8.168380748543507e-05, "loss": 2.3063, "step": 33065 }, { "epoch": 0.28, "learning_rate": 8.16786179993151e-05, "loss": 2.2873, "step": 33070 }, { "epoch": 0.28, "learning_rate": 8.167342794303607e-05, "loss": 2.334, "step": 33075 }, { "epoch": 0.28, "learning_rate": 8.166823731669138e-05, "loss": 2.3131, "step": 33080 }, { "epoch": 0.28, "learning_rate": 8.166304612037443e-05, "loss": 2.3889, "step": 33085 }, { "epoch": 0.28, "learning_rate": 8.165785435417868e-05, "loss": 2.3312, "step": 33090 }, { "epoch": 0.28, "learning_rate": 8.165266201819756e-05, "loss": 2.3135, "step": 33095 }, { "epoch": 0.28, "learning_rate": 8.164746911252453e-05, "loss": 2.3262, "step": 33100 }, { "epoch": 0.28, "learning_rate": 8.164227563725304e-05, "loss": 2.2915, "step": 33105 }, { "epoch": 0.28, "learning_rate": 8.163708159247658e-05, "loss": 2.2641, "step": 33110 }, { "epoch": 0.28, "learning_rate": 8.163188697828863e-05, "loss": 2.3337, "step": 33115 }, { "epoch": 0.28, "learning_rate": 8.162669179478268e-05, "loss": 2.3631, "step": 33120 }, { "epoch": 0.28, "learning_rate": 8.162149604205222e-05, "loss": 2.4443, "step": 33125 }, { "epoch": 0.28, "learning_rate": 8.16162997201908e-05, "loss": 2.3765, "step": 33130 }, { "epoch": 0.28, "learning_rate": 8.161110282929192e-05, "loss": 2.3913, "step": 33135 }, { "epoch": 0.28, "learning_rate": 8.16059053694491e-05, "loss": 2.3114, "step": 33140 }, { "epoch": 0.28, "learning_rate": 8.160070734075593e-05, "loss": 2.3616, "step": 33145 }, { "epoch": 0.28, "learning_rate": 8.159550874330593e-05, "loss": 2.3966, "step": 33150 }, { "epoch": 0.28, "learning_rate": 8.159030957719265e-05, "loss": 2.3314, "step": 33155 }, { "epoch": 0.28, "learning_rate": 8.158510984250972e-05, "loss": 2.3115, "step": 33160 }, { "epoch": 0.28, "learning_rate": 8.157990953935068e-05, "loss": 2.3167, "step": 33165 }, { "epoch": 0.28, "learning_rate": 8.157470866780916e-05, "loss": 2.2465, "step": 33170 }, { "epoch": 0.28, "learning_rate": 8.156950722797874e-05, "loss": 2.4335, "step": 33175 }, { "epoch": 0.28, "learning_rate": 8.156430521995304e-05, "loss": 2.3478, "step": 33180 }, { "epoch": 0.28, "learning_rate": 8.155910264382569e-05, "loss": 2.2794, "step": 33185 }, { "epoch": 0.28, "learning_rate": 8.155389949969033e-05, "loss": 2.292, "step": 33190 }, { "epoch": 0.28, "learning_rate": 8.154869578764061e-05, "loss": 2.3873, "step": 33195 }, { "epoch": 0.28, "learning_rate": 8.154349150777018e-05, "loss": 2.3394, "step": 33200 }, { "epoch": 0.28, "learning_rate": 8.153828666017274e-05, "loss": 2.3402, "step": 33205 }, { "epoch": 0.28, "learning_rate": 8.15330812449419e-05, "loss": 2.3869, "step": 33210 }, { "epoch": 0.28, "learning_rate": 8.152787526217142e-05, "loss": 2.2415, "step": 33215 }, { "epoch": 0.28, "learning_rate": 8.152266871195495e-05, "loss": 2.3166, "step": 33220 }, { "epoch": 0.28, "learning_rate": 8.151746159438622e-05, "loss": 2.3059, "step": 33225 }, { "epoch": 0.28, "learning_rate": 8.151225390955896e-05, "loss": 2.3804, "step": 33230 }, { "epoch": 0.28, "learning_rate": 8.150704565756687e-05, "loss": 2.3656, "step": 33235 }, { "epoch": 0.28, "learning_rate": 8.15018368385037e-05, "loss": 2.2569, "step": 33240 }, { "epoch": 0.28, "learning_rate": 8.14966274524632e-05, "loss": 2.3486, "step": 33245 }, { "epoch": 0.28, "learning_rate": 8.149141749953914e-05, "loss": 2.2896, "step": 33250 }, { "epoch": 0.28, "learning_rate": 8.14862069798253e-05, "loss": 2.3492, "step": 33255 }, { "epoch": 0.28, "learning_rate": 8.148099589341542e-05, "loss": 2.3101, "step": 33260 }, { "epoch": 0.28, "learning_rate": 8.147578424040332e-05, "loss": 2.3804, "step": 33265 }, { "epoch": 0.28, "learning_rate": 8.14705720208828e-05, "loss": 2.3379, "step": 33270 }, { "epoch": 0.28, "learning_rate": 8.146535923494765e-05, "loss": 2.3606, "step": 33275 }, { "epoch": 0.28, "learning_rate": 8.14601458826917e-05, "loss": 2.3338, "step": 33280 }, { "epoch": 0.28, "learning_rate": 8.145493196420882e-05, "loss": 2.2752, "step": 33285 }, { "epoch": 0.28, "learning_rate": 8.144971747959279e-05, "loss": 2.3515, "step": 33290 }, { "epoch": 0.28, "learning_rate": 8.144450242893749e-05, "loss": 2.3254, "step": 33295 }, { "epoch": 0.28, "learning_rate": 8.143928681233678e-05, "loss": 2.2801, "step": 33300 }, { "epoch": 0.28, "learning_rate": 8.143407062988454e-05, "loss": 2.3802, "step": 33305 }, { "epoch": 0.28, "learning_rate": 8.142885388167464e-05, "loss": 2.3059, "step": 33310 }, { "epoch": 0.28, "learning_rate": 8.142363656780099e-05, "loss": 2.2989, "step": 33315 }, { "epoch": 0.28, "learning_rate": 8.141841868835746e-05, "loss": 2.2888, "step": 33320 }, { "epoch": 0.28, "learning_rate": 8.141320024343799e-05, "loss": 2.3953, "step": 33325 }, { "epoch": 0.28, "learning_rate": 8.140798123313649e-05, "loss": 2.312, "step": 33330 }, { "epoch": 0.28, "learning_rate": 8.140276165754692e-05, "loss": 2.2673, "step": 33335 }, { "epoch": 0.28, "learning_rate": 8.139754151676317e-05, "loss": 2.3841, "step": 33340 }, { "epoch": 0.28, "learning_rate": 8.139232081087924e-05, "loss": 2.4118, "step": 33345 }, { "epoch": 0.28, "learning_rate": 8.138709953998907e-05, "loss": 2.3569, "step": 33350 }, { "epoch": 0.28, "learning_rate": 8.138187770418666e-05, "loss": 2.3161, "step": 33355 }, { "epoch": 0.28, "learning_rate": 8.137665530356596e-05, "loss": 2.3885, "step": 33360 }, { "epoch": 0.28, "learning_rate": 8.137143233822097e-05, "loss": 2.3635, "step": 33365 }, { "epoch": 0.28, "learning_rate": 8.136620880824573e-05, "loss": 2.3138, "step": 33370 }, { "epoch": 0.28, "learning_rate": 8.136098471373421e-05, "loss": 2.2867, "step": 33375 }, { "epoch": 0.28, "learning_rate": 8.135576005478045e-05, "loss": 2.317, "step": 33380 }, { "epoch": 0.28, "learning_rate": 8.13505348314785e-05, "loss": 2.3576, "step": 33385 }, { "epoch": 0.28, "learning_rate": 8.134530904392239e-05, "loss": 2.4095, "step": 33390 }, { "epoch": 0.28, "learning_rate": 8.134008269220614e-05, "loss": 2.3375, "step": 33395 }, { "epoch": 0.29, "learning_rate": 8.133485577642389e-05, "loss": 2.3437, "step": 33400 }, { "epoch": 0.29, "learning_rate": 8.132962829666966e-05, "loss": 2.2973, "step": 33405 }, { "epoch": 0.29, "learning_rate": 8.132440025303756e-05, "loss": 2.3177, "step": 33410 }, { "epoch": 0.29, "learning_rate": 8.131917164562168e-05, "loss": 2.362, "step": 33415 }, { "epoch": 0.29, "learning_rate": 8.131394247451611e-05, "loss": 2.2867, "step": 33420 }, { "epoch": 0.29, "learning_rate": 8.130871273981499e-05, "loss": 2.3693, "step": 33425 }, { "epoch": 0.29, "learning_rate": 8.130348244161245e-05, "loss": 2.3316, "step": 33430 }, { "epoch": 0.29, "learning_rate": 8.129825158000259e-05, "loss": 2.3526, "step": 33435 }, { "epoch": 0.29, "learning_rate": 8.129302015507959e-05, "loss": 2.3181, "step": 33440 }, { "epoch": 0.29, "learning_rate": 8.128778816693757e-05, "loss": 2.3308, "step": 33445 }, { "epoch": 0.29, "learning_rate": 8.128255561567073e-05, "loss": 2.2919, "step": 33450 }, { "epoch": 0.29, "learning_rate": 8.127732250137325e-05, "loss": 2.322, "step": 33455 }, { "epoch": 0.29, "learning_rate": 8.127208882413929e-05, "loss": 2.3829, "step": 33460 }, { "epoch": 0.29, "learning_rate": 8.126685458406306e-05, "loss": 2.2278, "step": 33465 }, { "epoch": 0.29, "learning_rate": 8.126161978123879e-05, "loss": 2.3182, "step": 33470 }, { "epoch": 0.29, "learning_rate": 8.125638441576065e-05, "loss": 2.369, "step": 33475 }, { "epoch": 0.29, "learning_rate": 8.12511484877229e-05, "loss": 2.3793, "step": 33480 }, { "epoch": 0.29, "learning_rate": 8.124591199721978e-05, "loss": 2.3044, "step": 33485 }, { "epoch": 0.29, "learning_rate": 8.124067494434552e-05, "loss": 2.3039, "step": 33490 }, { "epoch": 0.29, "learning_rate": 8.123543732919437e-05, "loss": 2.4095, "step": 33495 }, { "epoch": 0.29, "learning_rate": 8.123019915186063e-05, "loss": 2.3756, "step": 33500 }, { "epoch": 0.29, "learning_rate": 8.122496041243856e-05, "loss": 2.3067, "step": 33505 }, { "epoch": 0.29, "learning_rate": 8.121972111102245e-05, "loss": 2.2696, "step": 33510 }, { "epoch": 0.29, "learning_rate": 8.121448124770659e-05, "loss": 2.3409, "step": 33515 }, { "epoch": 0.29, "learning_rate": 8.12092408225853e-05, "loss": 2.3666, "step": 33520 }, { "epoch": 0.29, "learning_rate": 8.120399983575289e-05, "loss": 2.3798, "step": 33525 }, { "epoch": 0.29, "learning_rate": 8.11987582873037e-05, "loss": 2.3361, "step": 33530 }, { "epoch": 0.29, "learning_rate": 8.119351617733204e-05, "loss": 2.3036, "step": 33535 }, { "epoch": 0.29, "learning_rate": 8.11882735059323e-05, "loss": 2.3153, "step": 33540 }, { "epoch": 0.29, "learning_rate": 8.11830302731988e-05, "loss": 2.3499, "step": 33545 }, { "epoch": 0.29, "learning_rate": 8.117778647922594e-05, "loss": 2.3579, "step": 33550 }, { "epoch": 0.29, "learning_rate": 8.117254212410807e-05, "loss": 2.2663, "step": 33555 }, { "epoch": 0.29, "learning_rate": 8.116729720793963e-05, "loss": 2.3571, "step": 33560 }, { "epoch": 0.29, "learning_rate": 8.116205173081495e-05, "loss": 2.3197, "step": 33565 }, { "epoch": 0.29, "learning_rate": 8.115680569282849e-05, "loss": 2.3197, "step": 33570 }, { "epoch": 0.29, "learning_rate": 8.115155909407466e-05, "loss": 2.2418, "step": 33575 }, { "epoch": 0.29, "learning_rate": 8.114631193464787e-05, "loss": 2.2747, "step": 33580 }, { "epoch": 0.29, "learning_rate": 8.114106421464257e-05, "loss": 2.3622, "step": 33585 }, { "epoch": 0.29, "learning_rate": 8.113581593415322e-05, "loss": 2.3059, "step": 33590 }, { "epoch": 0.29, "learning_rate": 8.113056709327427e-05, "loss": 2.3226, "step": 33595 }, { "epoch": 0.29, "learning_rate": 8.112531769210017e-05, "loss": 2.3737, "step": 33600 }, { "epoch": 0.29, "learning_rate": 8.112006773072544e-05, "loss": 2.2288, "step": 33605 }, { "epoch": 0.29, "learning_rate": 8.111481720924457e-05, "loss": 2.3537, "step": 33610 }, { "epoch": 0.29, "learning_rate": 8.110956612775203e-05, "loss": 2.3811, "step": 33615 }, { "epoch": 0.29, "learning_rate": 8.110431448634232e-05, "loss": 2.2728, "step": 33620 }, { "epoch": 0.29, "learning_rate": 8.109906228510999e-05, "loss": 2.3787, "step": 33625 }, { "epoch": 0.29, "learning_rate": 8.109380952414958e-05, "loss": 2.3389, "step": 33630 }, { "epoch": 0.29, "learning_rate": 8.10885562035556e-05, "loss": 2.3121, "step": 33635 }, { "epoch": 0.29, "learning_rate": 8.108330232342261e-05, "loss": 2.4081, "step": 33640 }, { "epoch": 0.29, "learning_rate": 8.107804788384519e-05, "loss": 2.3247, "step": 33645 }, { "epoch": 0.29, "learning_rate": 8.107279288491786e-05, "loss": 2.3487, "step": 33650 }, { "epoch": 0.29, "learning_rate": 8.106753732673527e-05, "loss": 2.3851, "step": 33655 }, { "epoch": 0.29, "learning_rate": 8.106228120939197e-05, "loss": 2.3709, "step": 33660 }, { "epoch": 0.29, "learning_rate": 8.105702453298256e-05, "loss": 2.3257, "step": 33665 }, { "epoch": 0.29, "learning_rate": 8.105176729760166e-05, "loss": 2.3175, "step": 33670 }, { "epoch": 0.29, "learning_rate": 8.104650950334388e-05, "loss": 2.2795, "step": 33675 }, { "epoch": 0.29, "learning_rate": 8.104125115030387e-05, "loss": 2.2517, "step": 33680 }, { "epoch": 0.29, "learning_rate": 8.103599223857625e-05, "loss": 2.2589, "step": 33685 }, { "epoch": 0.29, "learning_rate": 8.103073276825569e-05, "loss": 2.3308, "step": 33690 }, { "epoch": 0.29, "learning_rate": 8.102547273943683e-05, "loss": 2.3157, "step": 33695 }, { "epoch": 0.29, "learning_rate": 8.102021215221436e-05, "loss": 2.3692, "step": 33700 }, { "epoch": 0.29, "learning_rate": 8.101495100668297e-05, "loss": 2.3225, "step": 33705 }, { "epoch": 0.29, "learning_rate": 8.100968930293732e-05, "loss": 2.3723, "step": 33710 }, { "epoch": 0.29, "learning_rate": 8.100442704107214e-05, "loss": 2.3616, "step": 33715 }, { "epoch": 0.29, "learning_rate": 8.099916422118212e-05, "loss": 2.3973, "step": 33720 }, { "epoch": 0.29, "learning_rate": 8.099390084336198e-05, "loss": 2.3095, "step": 33725 }, { "epoch": 0.29, "learning_rate": 8.098863690770648e-05, "loss": 2.3135, "step": 33730 }, { "epoch": 0.29, "learning_rate": 8.098337241431035e-05, "loss": 2.3098, "step": 33735 }, { "epoch": 0.29, "learning_rate": 8.097810736326832e-05, "loss": 2.3408, "step": 33740 }, { "epoch": 0.29, "learning_rate": 8.097284175467517e-05, "loss": 2.3128, "step": 33745 }, { "epoch": 0.29, "learning_rate": 8.096757558862567e-05, "loss": 2.3546, "step": 33750 }, { "epoch": 0.29, "learning_rate": 8.096230886521459e-05, "loss": 2.3555, "step": 33755 }, { "epoch": 0.29, "learning_rate": 8.095704158453674e-05, "loss": 2.3158, "step": 33760 }, { "epoch": 0.29, "learning_rate": 8.095177374668693e-05, "loss": 2.3326, "step": 33765 }, { "epoch": 0.29, "learning_rate": 8.094650535175992e-05, "loss": 2.2026, "step": 33770 }, { "epoch": 0.29, "learning_rate": 8.094123639985059e-05, "loss": 2.2948, "step": 33775 }, { "epoch": 0.29, "learning_rate": 8.093596689105375e-05, "loss": 2.3581, "step": 33780 }, { "epoch": 0.29, "learning_rate": 8.093069682546423e-05, "loss": 2.3758, "step": 33785 }, { "epoch": 0.29, "learning_rate": 8.092542620317692e-05, "loss": 2.3535, "step": 33790 }, { "epoch": 0.29, "learning_rate": 8.092015502428661e-05, "loss": 2.3595, "step": 33795 }, { "epoch": 0.29, "learning_rate": 8.091488328888824e-05, "loss": 2.3143, "step": 33800 }, { "epoch": 0.29, "learning_rate": 8.090961099707667e-05, "loss": 2.2938, "step": 33805 }, { "epoch": 0.29, "learning_rate": 8.090433814894677e-05, "loss": 2.3365, "step": 33810 }, { "epoch": 0.29, "learning_rate": 8.08990647445935e-05, "loss": 2.2864, "step": 33815 }, { "epoch": 0.29, "learning_rate": 8.089379078411171e-05, "loss": 2.3211, "step": 33820 }, { "epoch": 0.29, "learning_rate": 8.088851626759634e-05, "loss": 2.3151, "step": 33825 }, { "epoch": 0.29, "learning_rate": 8.088324119514235e-05, "loss": 2.3046, "step": 33830 }, { "epoch": 0.29, "learning_rate": 8.087796556684466e-05, "loss": 2.2651, "step": 33835 }, { "epoch": 0.29, "learning_rate": 8.08726893827982e-05, "loss": 2.3851, "step": 33840 }, { "epoch": 0.29, "learning_rate": 8.086741264309798e-05, "loss": 2.2878, "step": 33845 }, { "epoch": 0.29, "learning_rate": 8.086213534783892e-05, "loss": 2.3177, "step": 33850 }, { "epoch": 0.29, "learning_rate": 8.085685749711604e-05, "loss": 2.3241, "step": 33855 }, { "epoch": 0.29, "learning_rate": 8.085157909102431e-05, "loss": 2.3693, "step": 33860 }, { "epoch": 0.29, "learning_rate": 8.084630012965875e-05, "loss": 2.344, "step": 33865 }, { "epoch": 0.29, "learning_rate": 8.084102061311436e-05, "loss": 2.3375, "step": 33870 }, { "epoch": 0.29, "learning_rate": 8.083574054148617e-05, "loss": 2.3449, "step": 33875 }, { "epoch": 0.29, "learning_rate": 8.083045991486922e-05, "loss": 2.3783, "step": 33880 }, { "epoch": 0.29, "learning_rate": 8.082517873335852e-05, "loss": 2.3064, "step": 33885 }, { "epoch": 0.29, "learning_rate": 8.081989699704915e-05, "loss": 2.331, "step": 33890 }, { "epoch": 0.29, "learning_rate": 8.081461470603616e-05, "loss": 2.3353, "step": 33895 }, { "epoch": 0.29, "learning_rate": 8.080933186041464e-05, "loss": 2.2989, "step": 33900 }, { "epoch": 0.29, "learning_rate": 8.080404846027962e-05, "loss": 2.3153, "step": 33905 }, { "epoch": 0.29, "learning_rate": 8.079876450572627e-05, "loss": 2.3107, "step": 33910 }, { "epoch": 0.29, "learning_rate": 8.079347999684962e-05, "loss": 2.3784, "step": 33915 }, { "epoch": 0.29, "learning_rate": 8.078819493374483e-05, "loss": 2.3916, "step": 33920 }, { "epoch": 0.29, "learning_rate": 8.0782909316507e-05, "loss": 2.2643, "step": 33925 }, { "epoch": 0.29, "learning_rate": 8.077762314523127e-05, "loss": 2.3924, "step": 33930 }, { "epoch": 0.29, "learning_rate": 8.077233642001278e-05, "loss": 2.2662, "step": 33935 }, { "epoch": 0.29, "learning_rate": 8.076704914094668e-05, "loss": 2.3375, "step": 33940 }, { "epoch": 0.29, "learning_rate": 8.076176130812812e-05, "loss": 2.3565, "step": 33945 }, { "epoch": 0.29, "learning_rate": 8.075647292165229e-05, "loss": 2.3228, "step": 33950 }, { "epoch": 0.29, "learning_rate": 8.075118398161438e-05, "loss": 2.3591, "step": 33955 }, { "epoch": 0.29, "learning_rate": 8.074589448810955e-05, "loss": 2.3605, "step": 33960 }, { "epoch": 0.29, "learning_rate": 8.074060444123302e-05, "loss": 2.399, "step": 33965 }, { "epoch": 0.29, "learning_rate": 8.073531384107999e-05, "loss": 2.3345, "step": 33970 }, { "epoch": 0.29, "learning_rate": 8.073002268774569e-05, "loss": 2.2642, "step": 33975 }, { "epoch": 0.29, "learning_rate": 8.072473098132536e-05, "loss": 2.3052, "step": 33980 }, { "epoch": 0.29, "learning_rate": 8.071943872191424e-05, "loss": 2.2783, "step": 33985 }, { "epoch": 0.29, "learning_rate": 8.071414590960757e-05, "loss": 2.3836, "step": 33990 }, { "epoch": 0.29, "learning_rate": 8.070885254450063e-05, "loss": 2.2788, "step": 33995 }, { "epoch": 0.29, "learning_rate": 8.070355862668865e-05, "loss": 2.3466, "step": 34000 }, { "epoch": 0.29, "learning_rate": 8.069826415626696e-05, "loss": 2.2916, "step": 34005 }, { "epoch": 0.29, "learning_rate": 8.06929691333308e-05, "loss": 2.3395, "step": 34010 }, { "epoch": 0.29, "learning_rate": 8.068767355797553e-05, "loss": 2.2205, "step": 34015 }, { "epoch": 0.29, "learning_rate": 8.068237743029642e-05, "loss": 2.2781, "step": 34020 }, { "epoch": 0.29, "learning_rate": 8.06770807503888e-05, "loss": 2.3318, "step": 34025 }, { "epoch": 0.29, "learning_rate": 8.067178351834801e-05, "loss": 2.3796, "step": 34030 }, { "epoch": 0.29, "learning_rate": 8.066648573426938e-05, "loss": 2.2952, "step": 34035 }, { "epoch": 0.29, "learning_rate": 8.066118739824827e-05, "loss": 2.2828, "step": 34040 }, { "epoch": 0.29, "learning_rate": 8.065588851038002e-05, "loss": 2.3761, "step": 34045 }, { "epoch": 0.29, "learning_rate": 8.065058907076003e-05, "loss": 2.305, "step": 34050 }, { "epoch": 0.29, "learning_rate": 8.064528907948368e-05, "loss": 2.3135, "step": 34055 }, { "epoch": 0.29, "learning_rate": 8.063998853664631e-05, "loss": 2.3763, "step": 34060 }, { "epoch": 0.29, "learning_rate": 8.06346874423434e-05, "loss": 2.3012, "step": 34065 }, { "epoch": 0.29, "learning_rate": 8.062938579667028e-05, "loss": 2.3308, "step": 34070 }, { "epoch": 0.29, "learning_rate": 8.062408359972242e-05, "loss": 2.2927, "step": 34075 }, { "epoch": 0.29, "learning_rate": 8.061878085159525e-05, "loss": 2.3019, "step": 34080 }, { "epoch": 0.29, "learning_rate": 8.06134775523842e-05, "loss": 2.3004, "step": 34085 }, { "epoch": 0.29, "learning_rate": 8.06081737021847e-05, "loss": 2.3453, "step": 34090 }, { "epoch": 0.29, "learning_rate": 8.060286930109225e-05, "loss": 2.3076, "step": 34095 }, { "epoch": 0.29, "learning_rate": 8.059756434920227e-05, "loss": 2.3215, "step": 34100 }, { "epoch": 0.29, "learning_rate": 8.059225884661029e-05, "loss": 2.3004, "step": 34105 }, { "epoch": 0.29, "learning_rate": 8.058695279341176e-05, "loss": 2.3337, "step": 34110 }, { "epoch": 0.29, "learning_rate": 8.05816461897022e-05, "loss": 2.3481, "step": 34115 }, { "epoch": 0.29, "learning_rate": 8.057633903557713e-05, "loss": 2.4835, "step": 34120 }, { "epoch": 0.29, "learning_rate": 8.057103133113206e-05, "loss": 2.2763, "step": 34125 }, { "epoch": 0.29, "learning_rate": 8.05657230764625e-05, "loss": 2.4296, "step": 34130 }, { "epoch": 0.29, "learning_rate": 8.056041427166401e-05, "loss": 2.3312, "step": 34135 }, { "epoch": 0.29, "learning_rate": 8.055510491683213e-05, "loss": 2.3597, "step": 34140 }, { "epoch": 0.29, "learning_rate": 8.054979501206244e-05, "loss": 2.3511, "step": 34145 }, { "epoch": 0.29, "learning_rate": 8.054448455745047e-05, "loss": 2.3482, "step": 34150 }, { "epoch": 0.29, "learning_rate": 8.053917355309183e-05, "loss": 2.3723, "step": 34155 }, { "epoch": 0.29, "learning_rate": 8.053386199908208e-05, "loss": 2.2945, "step": 34160 }, { "epoch": 0.29, "learning_rate": 8.052854989551686e-05, "loss": 2.3039, "step": 34165 }, { "epoch": 0.29, "learning_rate": 8.052323724249174e-05, "loss": 2.3342, "step": 34170 }, { "epoch": 0.29, "learning_rate": 8.051792404010237e-05, "loss": 2.3091, "step": 34175 }, { "epoch": 0.29, "learning_rate": 8.051261028844435e-05, "loss": 2.3479, "step": 34180 }, { "epoch": 0.29, "learning_rate": 8.050729598761335e-05, "loss": 2.3957, "step": 34185 }, { "epoch": 0.29, "learning_rate": 8.050198113770497e-05, "loss": 2.3398, "step": 34190 }, { "epoch": 0.29, "learning_rate": 8.049666573881492e-05, "loss": 2.3753, "step": 34195 }, { "epoch": 0.29, "learning_rate": 8.049134979103882e-05, "loss": 2.2815, "step": 34200 }, { "epoch": 0.29, "learning_rate": 8.04860332944724e-05, "loss": 2.4361, "step": 34205 }, { "epoch": 0.29, "learning_rate": 8.048071624921132e-05, "loss": 2.3698, "step": 34210 }, { "epoch": 0.29, "learning_rate": 8.047539865535125e-05, "loss": 2.2853, "step": 34215 }, { "epoch": 0.29, "learning_rate": 8.047008051298794e-05, "loss": 2.3407, "step": 34220 }, { "epoch": 0.29, "learning_rate": 8.04647618222171e-05, "loss": 2.2371, "step": 34225 }, { "epoch": 0.29, "learning_rate": 8.045944258313443e-05, "loss": 2.3231, "step": 34230 }, { "epoch": 0.29, "learning_rate": 8.045412279583569e-05, "loss": 2.2884, "step": 34235 }, { "epoch": 0.29, "learning_rate": 8.044880246041661e-05, "loss": 2.2987, "step": 34240 }, { "epoch": 0.29, "learning_rate": 8.044348157697299e-05, "loss": 2.3645, "step": 34245 }, { "epoch": 0.29, "learning_rate": 8.043816014560053e-05, "loss": 2.3641, "step": 34250 }, { "epoch": 0.29, "learning_rate": 8.043283816639507e-05, "loss": 2.3172, "step": 34255 }, { "epoch": 0.29, "learning_rate": 8.042751563945237e-05, "loss": 2.3886, "step": 34260 }, { "epoch": 0.29, "learning_rate": 8.04221925648682e-05, "loss": 2.3683, "step": 34265 }, { "epoch": 0.29, "learning_rate": 8.041686894273839e-05, "loss": 2.3542, "step": 34270 }, { "epoch": 0.29, "learning_rate": 8.041154477315878e-05, "loss": 2.3248, "step": 34275 }, { "epoch": 0.29, "learning_rate": 8.040622005622514e-05, "loss": 2.3445, "step": 34280 }, { "epoch": 0.29, "learning_rate": 8.040089479203337e-05, "loss": 2.3255, "step": 34285 }, { "epoch": 0.29, "learning_rate": 8.039556898067925e-05, "loss": 2.2455, "step": 34290 }, { "epoch": 0.29, "learning_rate": 8.039024262225869e-05, "loss": 2.2876, "step": 34295 }, { "epoch": 0.29, "learning_rate": 8.038491571686752e-05, "loss": 2.2987, "step": 34300 }, { "epoch": 0.29, "learning_rate": 8.037958826460163e-05, "loss": 2.3667, "step": 34305 }, { "epoch": 0.29, "learning_rate": 8.03742602655569e-05, "loss": 2.3642, "step": 34310 }, { "epoch": 0.29, "learning_rate": 8.036893171982925e-05, "loss": 2.3477, "step": 34315 }, { "epoch": 0.29, "learning_rate": 8.036360262751452e-05, "loss": 2.3954, "step": 34320 }, { "epoch": 0.29, "learning_rate": 8.035827298870868e-05, "loss": 2.2681, "step": 34325 }, { "epoch": 0.29, "learning_rate": 8.035294280350765e-05, "loss": 2.3264, "step": 34330 }, { "epoch": 0.29, "learning_rate": 8.034761207200734e-05, "loss": 2.2695, "step": 34335 }, { "epoch": 0.29, "learning_rate": 8.034228079430371e-05, "loss": 2.4047, "step": 34340 }, { "epoch": 0.29, "learning_rate": 8.03369489704927e-05, "loss": 2.3439, "step": 34345 }, { "epoch": 0.29, "learning_rate": 8.033161660067032e-05, "loss": 2.3696, "step": 34350 }, { "epoch": 0.29, "learning_rate": 8.032628368493248e-05, "loss": 2.3029, "step": 34355 }, { "epoch": 0.29, "learning_rate": 8.03209502233752e-05, "loss": 2.3314, "step": 34360 }, { "epoch": 0.29, "learning_rate": 8.031561621609445e-05, "loss": 2.3384, "step": 34365 }, { "epoch": 0.29, "learning_rate": 8.031028166318623e-05, "loss": 2.365, "step": 34370 }, { "epoch": 0.29, "learning_rate": 8.03049465647466e-05, "loss": 2.276, "step": 34375 }, { "epoch": 0.29, "learning_rate": 8.029961092087153e-05, "loss": 2.2604, "step": 34380 }, { "epoch": 0.29, "learning_rate": 8.029427473165709e-05, "loss": 2.3711, "step": 34385 }, { "epoch": 0.29, "learning_rate": 8.02889379971993e-05, "loss": 2.2999, "step": 34390 }, { "epoch": 0.29, "learning_rate": 8.02836007175942e-05, "loss": 2.3173, "step": 34395 }, { "epoch": 0.29, "learning_rate": 8.027826289293788e-05, "loss": 2.2678, "step": 34400 }, { "epoch": 0.29, "learning_rate": 8.027292452332639e-05, "loss": 2.2627, "step": 34405 }, { "epoch": 0.29, "learning_rate": 8.026758560885584e-05, "loss": 2.2943, "step": 34410 }, { "epoch": 0.29, "learning_rate": 8.026224614962229e-05, "loss": 2.3876, "step": 34415 }, { "epoch": 0.29, "learning_rate": 8.025690614572184e-05, "loss": 2.3422, "step": 34420 }, { "epoch": 0.29, "learning_rate": 8.025156559725062e-05, "loss": 2.2131, "step": 34425 }, { "epoch": 0.29, "learning_rate": 8.024622450430476e-05, "loss": 2.3978, "step": 34430 }, { "epoch": 0.29, "learning_rate": 8.024088286698035e-05, "loss": 2.3617, "step": 34435 }, { "epoch": 0.29, "learning_rate": 8.023554068537358e-05, "loss": 2.284, "step": 34440 }, { "epoch": 0.29, "learning_rate": 8.023019795958055e-05, "loss": 2.3974, "step": 34445 }, { "epoch": 0.29, "learning_rate": 8.022485468969744e-05, "loss": 2.3346, "step": 34450 }, { "epoch": 0.29, "learning_rate": 8.021951087582045e-05, "loss": 2.3492, "step": 34455 }, { "epoch": 0.29, "learning_rate": 8.021416651804569e-05, "loss": 2.3087, "step": 34460 }, { "epoch": 0.29, "learning_rate": 8.020882161646943e-05, "loss": 2.3724, "step": 34465 }, { "epoch": 0.29, "learning_rate": 8.020347617118781e-05, "loss": 2.3772, "step": 34470 }, { "epoch": 0.29, "learning_rate": 8.019813018229705e-05, "loss": 2.3462, "step": 34475 }, { "epoch": 0.29, "learning_rate": 8.01927836498934e-05, "loss": 2.3585, "step": 34480 }, { "epoch": 0.29, "learning_rate": 8.018743657407303e-05, "loss": 2.3578, "step": 34485 }, { "epoch": 0.29, "learning_rate": 8.018208895493225e-05, "loss": 2.3626, "step": 34490 }, { "epoch": 0.29, "learning_rate": 8.017674079256725e-05, "loss": 2.2984, "step": 34495 }, { "epoch": 0.29, "learning_rate": 8.017139208707432e-05, "loss": 2.2797, "step": 34500 }, { "epoch": 0.29, "learning_rate": 8.016604283854969e-05, "loss": 2.3278, "step": 34505 }, { "epoch": 0.29, "learning_rate": 8.016069304708968e-05, "loss": 2.2503, "step": 34510 }, { "epoch": 0.29, "learning_rate": 8.015534271279055e-05, "loss": 2.3482, "step": 34515 }, { "epoch": 0.29, "learning_rate": 8.014999183574862e-05, "loss": 2.3709, "step": 34520 }, { "epoch": 0.29, "learning_rate": 8.014464041606016e-05, "loss": 2.3202, "step": 34525 }, { "epoch": 0.29, "learning_rate": 8.013928845382151e-05, "loss": 2.2964, "step": 34530 }, { "epoch": 0.29, "learning_rate": 8.013393594912902e-05, "loss": 2.4467, "step": 34535 }, { "epoch": 0.29, "learning_rate": 8.012858290207897e-05, "loss": 2.3619, "step": 34540 }, { "epoch": 0.29, "learning_rate": 8.012322931276774e-05, "loss": 2.3421, "step": 34545 }, { "epoch": 0.29, "learning_rate": 8.011787518129167e-05, "loss": 2.2125, "step": 34550 }, { "epoch": 0.29, "learning_rate": 8.011252050774715e-05, "loss": 2.3695, "step": 34555 }, { "epoch": 0.29, "learning_rate": 8.010716529223054e-05, "loss": 2.4198, "step": 34560 }, { "epoch": 0.29, "learning_rate": 8.010180953483824e-05, "loss": 2.3328, "step": 34565 }, { "epoch": 0.3, "learning_rate": 8.00964532356666e-05, "loss": 2.2698, "step": 34570 }, { "epoch": 0.3, "learning_rate": 8.009109639481204e-05, "loss": 2.3478, "step": 34575 }, { "epoch": 0.3, "learning_rate": 8.0085739012371e-05, "loss": 2.3535, "step": 34580 }, { "epoch": 0.3, "learning_rate": 8.008038108843989e-05, "loss": 2.3492, "step": 34585 }, { "epoch": 0.3, "learning_rate": 8.007502262311515e-05, "loss": 2.3411, "step": 34590 }, { "epoch": 0.3, "learning_rate": 8.00696636164932e-05, "loss": 2.3245, "step": 34595 }, { "epoch": 0.3, "learning_rate": 8.006430406867051e-05, "loss": 2.3147, "step": 34600 }, { "epoch": 0.3, "learning_rate": 8.005894397974355e-05, "loss": 2.2953, "step": 34605 }, { "epoch": 0.3, "learning_rate": 8.005358334980877e-05, "loss": 2.3062, "step": 34610 }, { "epoch": 0.3, "learning_rate": 8.004822217896268e-05, "loss": 2.2562, "step": 34615 }, { "epoch": 0.3, "learning_rate": 8.004286046730174e-05, "loss": 2.3446, "step": 34620 }, { "epoch": 0.3, "learning_rate": 8.003749821492246e-05, "loss": 2.2701, "step": 34625 }, { "epoch": 0.3, "learning_rate": 8.003213542192137e-05, "loss": 2.2463, "step": 34630 }, { "epoch": 0.3, "learning_rate": 8.002677208839496e-05, "loss": 2.3278, "step": 34635 }, { "epoch": 0.3, "learning_rate": 8.00214082144398e-05, "loss": 2.2889, "step": 34640 }, { "epoch": 0.3, "learning_rate": 8.001604380015239e-05, "loss": 2.2138, "step": 34645 }, { "epoch": 0.3, "learning_rate": 8.001067884562931e-05, "loss": 2.2499, "step": 34650 }, { "epoch": 0.3, "learning_rate": 8.000531335096711e-05, "loss": 2.3464, "step": 34655 }, { "epoch": 0.3, "learning_rate": 7.999994731626236e-05, "loss": 2.3088, "step": 34660 }, { "epoch": 0.3, "learning_rate": 7.999458074161164e-05, "loss": 2.3426, "step": 34665 }, { "epoch": 0.3, "learning_rate": 7.998921362711152e-05, "loss": 2.3335, "step": 34670 }, { "epoch": 0.3, "learning_rate": 7.998384597285862e-05, "loss": 2.3512, "step": 34675 }, { "epoch": 0.3, "learning_rate": 7.997847777894954e-05, "loss": 2.3365, "step": 34680 }, { "epoch": 0.3, "learning_rate": 7.997310904548091e-05, "loss": 2.3643, "step": 34685 }, { "epoch": 0.3, "learning_rate": 7.996773977254935e-05, "loss": 2.2933, "step": 34690 }, { "epoch": 0.3, "learning_rate": 7.996236996025148e-05, "loss": 2.3449, "step": 34695 }, { "epoch": 0.3, "learning_rate": 7.995699960868399e-05, "loss": 2.3714, "step": 34700 }, { "epoch": 0.3, "learning_rate": 7.995162871794348e-05, "loss": 2.3406, "step": 34705 }, { "epoch": 0.3, "learning_rate": 7.994625728812666e-05, "loss": 2.2151, "step": 34710 }, { "epoch": 0.3, "learning_rate": 7.99408853193302e-05, "loss": 2.2671, "step": 34715 }, { "epoch": 0.3, "learning_rate": 7.993551281165077e-05, "loss": 2.276, "step": 34720 }, { "epoch": 0.3, "learning_rate": 7.993013976518508e-05, "loss": 2.3383, "step": 34725 }, { "epoch": 0.3, "learning_rate": 7.992476618002982e-05, "loss": 2.3256, "step": 34730 }, { "epoch": 0.3, "learning_rate": 7.991939205628172e-05, "loss": 2.325, "step": 34735 }, { "epoch": 0.3, "learning_rate": 7.991401739403748e-05, "loss": 2.3707, "step": 34740 }, { "epoch": 0.3, "learning_rate": 7.990864219339388e-05, "loss": 2.3274, "step": 34745 }, { "epoch": 0.3, "learning_rate": 7.990326645444763e-05, "loss": 2.3191, "step": 34750 }, { "epoch": 0.3, "learning_rate": 7.989789017729548e-05, "loss": 2.3405, "step": 34755 }, { "epoch": 0.3, "learning_rate": 7.989251336203422e-05, "loss": 2.3276, "step": 34760 }, { "epoch": 0.3, "learning_rate": 7.988713600876061e-05, "loss": 2.2991, "step": 34765 }, { "epoch": 0.3, "learning_rate": 7.988175811757141e-05, "loss": 2.3071, "step": 34770 }, { "epoch": 0.3, "learning_rate": 7.987637968856346e-05, "loss": 2.3556, "step": 34775 }, { "epoch": 0.3, "learning_rate": 7.987100072183352e-05, "loss": 2.3397, "step": 34780 }, { "epoch": 0.3, "learning_rate": 7.986562121747843e-05, "loss": 2.3904, "step": 34785 }, { "epoch": 0.3, "learning_rate": 7.986024117559498e-05, "loss": 2.33, "step": 34790 }, { "epoch": 0.3, "learning_rate": 7.985486059628003e-05, "loss": 2.3053, "step": 34795 }, { "epoch": 0.3, "learning_rate": 7.984947947963041e-05, "loss": 2.3222, "step": 34800 }, { "epoch": 0.3, "learning_rate": 7.984409782574298e-05, "loss": 2.2684, "step": 34805 }, { "epoch": 0.3, "learning_rate": 7.983871563471459e-05, "loss": 2.3764, "step": 34810 }, { "epoch": 0.3, "learning_rate": 7.98333329066421e-05, "loss": 2.3531, "step": 34815 }, { "epoch": 0.3, "learning_rate": 7.982794964162241e-05, "loss": 2.4249, "step": 34820 }, { "epoch": 0.3, "learning_rate": 7.982256583975241e-05, "loss": 2.2677, "step": 34825 }, { "epoch": 0.3, "learning_rate": 7.981718150112896e-05, "loss": 2.3292, "step": 34830 }, { "epoch": 0.3, "learning_rate": 7.981179662584903e-05, "loss": 2.3452, "step": 34835 }, { "epoch": 0.3, "learning_rate": 7.980641121400949e-05, "loss": 2.2825, "step": 34840 }, { "epoch": 0.3, "learning_rate": 7.980102526570728e-05, "loss": 2.2626, "step": 34845 }, { "epoch": 0.3, "learning_rate": 7.979563878103935e-05, "loss": 2.3238, "step": 34850 }, { "epoch": 0.3, "learning_rate": 7.979025176010265e-05, "loss": 2.3012, "step": 34855 }, { "epoch": 0.3, "learning_rate": 7.978486420299411e-05, "loss": 2.342, "step": 34860 }, { "epoch": 0.3, "learning_rate": 7.977947610981073e-05, "loss": 2.3323, "step": 34865 }, { "epoch": 0.3, "learning_rate": 7.977408748064945e-05, "loss": 2.3146, "step": 34870 }, { "epoch": 0.3, "learning_rate": 7.976869831560728e-05, "loss": 2.3597, "step": 34875 }, { "epoch": 0.3, "learning_rate": 7.97633086147812e-05, "loss": 2.3924, "step": 34880 }, { "epoch": 0.3, "learning_rate": 7.975791837826825e-05, "loss": 2.4025, "step": 34885 }, { "epoch": 0.3, "learning_rate": 7.97525276061654e-05, "loss": 2.3788, "step": 34890 }, { "epoch": 0.3, "learning_rate": 7.97471362985697e-05, "loss": 2.2987, "step": 34895 }, { "epoch": 0.3, "learning_rate": 7.974174445557818e-05, "loss": 2.2636, "step": 34900 }, { "epoch": 0.3, "learning_rate": 7.973635207728788e-05, "loss": 2.361, "step": 34905 }, { "epoch": 0.3, "learning_rate": 7.973095916379586e-05, "loss": 2.3252, "step": 34910 }, { "epoch": 0.3, "learning_rate": 7.972556571519917e-05, "loss": 2.3759, "step": 34915 }, { "epoch": 0.3, "learning_rate": 7.972017173159489e-05, "loss": 2.3816, "step": 34920 }, { "epoch": 0.3, "learning_rate": 7.971477721308011e-05, "loss": 2.3453, "step": 34925 }, { "epoch": 0.3, "learning_rate": 7.970938215975192e-05, "loss": 2.3018, "step": 34930 }, { "epoch": 0.3, "learning_rate": 7.970398657170739e-05, "loss": 2.3749, "step": 34935 }, { "epoch": 0.3, "learning_rate": 7.969859044904367e-05, "loss": 2.2949, "step": 34940 }, { "epoch": 0.3, "learning_rate": 7.969319379185787e-05, "loss": 2.3082, "step": 34945 }, { "epoch": 0.3, "learning_rate": 7.968779660024712e-05, "loss": 2.3452, "step": 34950 }, { "epoch": 0.3, "learning_rate": 7.968239887430856e-05, "loss": 2.3989, "step": 34955 }, { "epoch": 0.3, "learning_rate": 7.967700061413933e-05, "loss": 2.3116, "step": 34960 }, { "epoch": 0.3, "learning_rate": 7.967160181983659e-05, "loss": 2.2972, "step": 34965 }, { "epoch": 0.3, "learning_rate": 7.966620249149753e-05, "loss": 2.3053, "step": 34970 }, { "epoch": 0.3, "learning_rate": 7.96608026292193e-05, "loss": 2.4291, "step": 34975 }, { "epoch": 0.3, "learning_rate": 7.965540223309912e-05, "loss": 2.3064, "step": 34980 }, { "epoch": 0.3, "learning_rate": 7.965000130323414e-05, "loss": 2.3019, "step": 34985 }, { "epoch": 0.3, "learning_rate": 7.964459983972162e-05, "loss": 2.3426, "step": 34990 }, { "epoch": 0.3, "learning_rate": 7.963919784265875e-05, "loss": 2.3178, "step": 34995 }, { "epoch": 0.3, "learning_rate": 7.963379531214275e-05, "loss": 2.2799, "step": 35000 }, { "epoch": 0.3, "learning_rate": 7.962839224827088e-05, "loss": 2.3568, "step": 35005 }, { "epoch": 0.3, "learning_rate": 7.962298865114036e-05, "loss": 2.3738, "step": 35010 }, { "epoch": 0.3, "learning_rate": 7.961758452084846e-05, "loss": 2.3912, "step": 35015 }, { "epoch": 0.3, "learning_rate": 7.961217985749243e-05, "loss": 2.2895, "step": 35020 }, { "epoch": 0.3, "learning_rate": 7.960677466116957e-05, "loss": 2.401, "step": 35025 }, { "epoch": 0.3, "learning_rate": 7.960136893197714e-05, "loss": 2.3956, "step": 35030 }, { "epoch": 0.3, "learning_rate": 7.959596267001243e-05, "loss": 2.3261, "step": 35035 }, { "epoch": 0.3, "learning_rate": 7.959055587537278e-05, "loss": 2.2959, "step": 35040 }, { "epoch": 0.3, "learning_rate": 7.958514854815547e-05, "loss": 2.3557, "step": 35045 }, { "epoch": 0.3, "learning_rate": 7.957974068845784e-05, "loss": 2.3024, "step": 35050 }, { "epoch": 0.3, "learning_rate": 7.957433229637719e-05, "loss": 2.2945, "step": 35055 }, { "epoch": 0.3, "learning_rate": 7.95689233720109e-05, "loss": 2.3979, "step": 35060 }, { "epoch": 0.3, "learning_rate": 7.956351391545632e-05, "loss": 2.2907, "step": 35065 }, { "epoch": 0.3, "learning_rate": 7.955810392681077e-05, "loss": 2.241, "step": 35070 }, { "epoch": 0.3, "learning_rate": 7.955269340617165e-05, "loss": 2.3211, "step": 35075 }, { "epoch": 0.3, "learning_rate": 7.954728235363634e-05, "loss": 2.3662, "step": 35080 }, { "epoch": 0.3, "learning_rate": 7.954187076930223e-05, "loss": 2.3185, "step": 35085 }, { "epoch": 0.3, "learning_rate": 7.953645865326671e-05, "loss": 2.2834, "step": 35090 }, { "epoch": 0.3, "learning_rate": 7.95310460056272e-05, "loss": 2.1969, "step": 35095 }, { "epoch": 0.3, "learning_rate": 7.95256328264811e-05, "loss": 2.281, "step": 35100 }, { "epoch": 0.3, "learning_rate": 7.952021911592587e-05, "loss": 2.3391, "step": 35105 }, { "epoch": 0.3, "learning_rate": 7.951480487405889e-05, "loss": 2.3646, "step": 35110 }, { "epoch": 0.3, "learning_rate": 7.950939010097767e-05, "loss": 2.3546, "step": 35115 }, { "epoch": 0.3, "learning_rate": 7.950397479677963e-05, "loss": 2.2806, "step": 35120 }, { "epoch": 0.3, "learning_rate": 7.949855896156225e-05, "loss": 2.26, "step": 35125 }, { "epoch": 0.3, "learning_rate": 7.9493142595423e-05, "loss": 2.2864, "step": 35130 }, { "epoch": 0.3, "learning_rate": 7.948772569845935e-05, "loss": 2.3176, "step": 35135 }, { "epoch": 0.3, "learning_rate": 7.948230827076881e-05, "loss": 2.2404, "step": 35140 }, { "epoch": 0.3, "learning_rate": 7.947689031244891e-05, "loss": 2.3519, "step": 35145 }, { "epoch": 0.3, "learning_rate": 7.947147182359712e-05, "loss": 2.2785, "step": 35150 }, { "epoch": 0.3, "learning_rate": 7.946605280431099e-05, "loss": 2.2865, "step": 35155 }, { "epoch": 0.3, "learning_rate": 7.946063325468803e-05, "loss": 2.2151, "step": 35160 }, { "epoch": 0.3, "learning_rate": 7.94552131748258e-05, "loss": 2.4294, "step": 35165 }, { "epoch": 0.3, "learning_rate": 7.944979256482185e-05, "loss": 2.2865, "step": 35170 }, { "epoch": 0.3, "learning_rate": 7.944437142477374e-05, "loss": 2.2944, "step": 35175 }, { "epoch": 0.3, "learning_rate": 7.943894975477906e-05, "loss": 2.3081, "step": 35180 }, { "epoch": 0.3, "learning_rate": 7.943352755493533e-05, "loss": 2.4051, "step": 35185 }, { "epoch": 0.3, "learning_rate": 7.94281048253402e-05, "loss": 2.3487, "step": 35190 }, { "epoch": 0.3, "learning_rate": 7.942268156609124e-05, "loss": 2.361, "step": 35195 }, { "epoch": 0.3, "learning_rate": 7.94172577772861e-05, "loss": 2.3496, "step": 35200 }, { "epoch": 0.3, "learning_rate": 7.941183345902234e-05, "loss": 2.2564, "step": 35205 }, { "epoch": 0.3, "learning_rate": 7.940640861139763e-05, "loss": 2.2035, "step": 35210 }, { "epoch": 0.3, "learning_rate": 7.940098323450959e-05, "loss": 2.3214, "step": 35215 }, { "epoch": 0.3, "learning_rate": 7.939555732845587e-05, "loss": 2.2964, "step": 35220 }, { "epoch": 0.3, "learning_rate": 7.939013089333412e-05, "loss": 2.4137, "step": 35225 }, { "epoch": 0.3, "learning_rate": 7.938470392924203e-05, "loss": 2.3407, "step": 35230 }, { "epoch": 0.3, "learning_rate": 7.937927643627724e-05, "loss": 2.3333, "step": 35235 }, { "epoch": 0.3, "learning_rate": 7.937384841453746e-05, "loss": 2.3171, "step": 35240 }, { "epoch": 0.3, "learning_rate": 7.936841986412039e-05, "loss": 2.3568, "step": 35245 }, { "epoch": 0.3, "learning_rate": 7.936299078512372e-05, "loss": 2.3817, "step": 35250 }, { "epoch": 0.3, "learning_rate": 7.935756117764517e-05, "loss": 2.2674, "step": 35255 }, { "epoch": 0.3, "learning_rate": 7.935213104178246e-05, "loss": 2.3362, "step": 35260 }, { "epoch": 0.3, "learning_rate": 7.934670037763331e-05, "loss": 2.2872, "step": 35265 }, { "epoch": 0.3, "learning_rate": 7.934126918529548e-05, "loss": 2.3101, "step": 35270 }, { "epoch": 0.3, "learning_rate": 7.933583746486673e-05, "loss": 2.316, "step": 35275 }, { "epoch": 0.3, "learning_rate": 7.93304052164448e-05, "loss": 2.3486, "step": 35280 }, { "epoch": 0.3, "learning_rate": 7.932497244012747e-05, "loss": 2.4009, "step": 35285 }, { "epoch": 0.3, "learning_rate": 7.931953913601253e-05, "loss": 2.3277, "step": 35290 }, { "epoch": 0.3, "learning_rate": 7.931410530419775e-05, "loss": 2.2942, "step": 35295 }, { "epoch": 0.3, "learning_rate": 7.930867094478094e-05, "loss": 2.3582, "step": 35300 }, { "epoch": 0.3, "learning_rate": 7.930323605785991e-05, "loss": 2.3152, "step": 35305 }, { "epoch": 0.3, "learning_rate": 7.92978006435325e-05, "loss": 2.2804, "step": 35310 }, { "epoch": 0.3, "learning_rate": 7.929236470189648e-05, "loss": 2.3158, "step": 35315 }, { "epoch": 0.3, "learning_rate": 7.928692823304974e-05, "loss": 2.317, "step": 35320 }, { "epoch": 0.3, "learning_rate": 7.92814912370901e-05, "loss": 2.3758, "step": 35325 }, { "epoch": 0.3, "learning_rate": 7.927605371411544e-05, "loss": 2.3713, "step": 35330 }, { "epoch": 0.3, "learning_rate": 7.92706156642236e-05, "loss": 2.3454, "step": 35335 }, { "epoch": 0.3, "learning_rate": 7.926517708751247e-05, "loss": 2.3688, "step": 35340 }, { "epoch": 0.3, "learning_rate": 7.925973798407991e-05, "loss": 2.319, "step": 35345 }, { "epoch": 0.3, "learning_rate": 7.925429835402387e-05, "loss": 2.3241, "step": 35350 }, { "epoch": 0.3, "learning_rate": 7.92488581974422e-05, "loss": 2.3151, "step": 35355 }, { "epoch": 0.3, "learning_rate": 7.924341751443284e-05, "loss": 2.3969, "step": 35360 }, { "epoch": 0.3, "learning_rate": 7.92379763050937e-05, "loss": 2.3112, "step": 35365 }, { "epoch": 0.3, "learning_rate": 7.923253456952271e-05, "loss": 2.2337, "step": 35370 }, { "epoch": 0.3, "learning_rate": 7.922709230781783e-05, "loss": 2.3728, "step": 35375 }, { "epoch": 0.3, "learning_rate": 7.9221649520077e-05, "loss": 2.2975, "step": 35380 }, { "epoch": 0.3, "learning_rate": 7.921620620639818e-05, "loss": 2.4118, "step": 35385 }, { "epoch": 0.3, "learning_rate": 7.921076236687934e-05, "loss": 2.2682, "step": 35390 }, { "epoch": 0.3, "learning_rate": 7.920531800161843e-05, "loss": 2.301, "step": 35395 }, { "epoch": 0.3, "learning_rate": 7.91998731107135e-05, "loss": 2.3736, "step": 35400 }, { "epoch": 0.3, "learning_rate": 7.919442769426252e-05, "loss": 2.3028, "step": 35405 }, { "epoch": 0.3, "learning_rate": 7.918898175236349e-05, "loss": 2.2898, "step": 35410 }, { "epoch": 0.3, "learning_rate": 7.918353528511443e-05, "loss": 2.3952, "step": 35415 }, { "epoch": 0.3, "learning_rate": 7.917808829261337e-05, "loss": 2.3568, "step": 35420 }, { "epoch": 0.3, "learning_rate": 7.917264077495834e-05, "loss": 2.2928, "step": 35425 }, { "epoch": 0.3, "learning_rate": 7.91671927322474e-05, "loss": 2.275, "step": 35430 }, { "epoch": 0.3, "learning_rate": 7.916174416457859e-05, "loss": 2.3156, "step": 35435 }, { "epoch": 0.3, "learning_rate": 7.915629507204998e-05, "loss": 2.2797, "step": 35440 }, { "epoch": 0.3, "learning_rate": 7.915084545475964e-05, "loss": 2.3338, "step": 35445 }, { "epoch": 0.3, "learning_rate": 7.914539531280567e-05, "loss": 2.3825, "step": 35450 }, { "epoch": 0.3, "learning_rate": 7.913994464628615e-05, "loss": 2.3792, "step": 35455 }, { "epoch": 0.3, "learning_rate": 7.913449345529917e-05, "loss": 2.3537, "step": 35460 }, { "epoch": 0.3, "learning_rate": 7.912904173994286e-05, "loss": 2.3442, "step": 35465 }, { "epoch": 0.3, "learning_rate": 7.912358950031535e-05, "loss": 2.3607, "step": 35470 }, { "epoch": 0.3, "learning_rate": 7.911813673651475e-05, "loss": 2.318, "step": 35475 }, { "epoch": 0.3, "learning_rate": 7.911268344863922e-05, "loss": 2.4121, "step": 35480 }, { "epoch": 0.3, "learning_rate": 7.910722963678687e-05, "loss": 2.3092, "step": 35485 }, { "epoch": 0.3, "learning_rate": 7.910177530105589e-05, "loss": 2.2544, "step": 35490 }, { "epoch": 0.3, "learning_rate": 7.909632044154446e-05, "loss": 2.345, "step": 35495 }, { "epoch": 0.3, "learning_rate": 7.909086505835073e-05, "loss": 2.3209, "step": 35500 }, { "epoch": 0.3, "learning_rate": 7.908540915157291e-05, "loss": 2.2381, "step": 35505 }, { "epoch": 0.3, "learning_rate": 7.907995272130917e-05, "loss": 2.3063, "step": 35510 }, { "epoch": 0.3, "learning_rate": 7.907449576765776e-05, "loss": 2.3783, "step": 35515 }, { "epoch": 0.3, "learning_rate": 7.906903829071684e-05, "loss": 2.4013, "step": 35520 }, { "epoch": 0.3, "learning_rate": 7.906358029058467e-05, "loss": 2.3093, "step": 35525 }, { "epoch": 0.3, "learning_rate": 7.905812176735948e-05, "loss": 2.2137, "step": 35530 }, { "epoch": 0.3, "learning_rate": 7.905266272113951e-05, "loss": 2.2566, "step": 35535 }, { "epoch": 0.3, "learning_rate": 7.904720315202301e-05, "loss": 2.2156, "step": 35540 }, { "epoch": 0.3, "learning_rate": 7.904174306010825e-05, "loss": 2.3606, "step": 35545 }, { "epoch": 0.3, "learning_rate": 7.903628244549349e-05, "loss": 2.2586, "step": 35550 }, { "epoch": 0.3, "learning_rate": 7.903082130827702e-05, "loss": 2.329, "step": 35555 }, { "epoch": 0.3, "learning_rate": 7.902535964855715e-05, "loss": 2.3424, "step": 35560 }, { "epoch": 0.3, "learning_rate": 7.901989746643214e-05, "loss": 2.3239, "step": 35565 }, { "epoch": 0.3, "learning_rate": 7.901443476200033e-05, "loss": 2.3482, "step": 35570 }, { "epoch": 0.3, "learning_rate": 7.900897153536003e-05, "loss": 2.3269, "step": 35575 }, { "epoch": 0.3, "learning_rate": 7.900350778660957e-05, "loss": 2.4106, "step": 35580 }, { "epoch": 0.3, "learning_rate": 7.899804351584728e-05, "loss": 2.1996, "step": 35585 }, { "epoch": 0.3, "learning_rate": 7.899257872317152e-05, "loss": 2.3037, "step": 35590 }, { "epoch": 0.3, "learning_rate": 7.898711340868062e-05, "loss": 2.327, "step": 35595 }, { "epoch": 0.3, "learning_rate": 7.898164757247298e-05, "loss": 2.2786, "step": 35600 }, { "epoch": 0.3, "learning_rate": 7.897618121464696e-05, "loss": 2.3332, "step": 35605 }, { "epoch": 0.3, "learning_rate": 7.897071433530094e-05, "loss": 2.2864, "step": 35610 }, { "epoch": 0.3, "learning_rate": 7.896524693453333e-05, "loss": 2.3267, "step": 35615 }, { "epoch": 0.3, "learning_rate": 7.895977901244251e-05, "loss": 2.2999, "step": 35620 }, { "epoch": 0.3, "learning_rate": 7.895431056912692e-05, "loss": 2.3173, "step": 35625 }, { "epoch": 0.3, "learning_rate": 7.894884160468497e-05, "loss": 2.3788, "step": 35630 }, { "epoch": 0.3, "learning_rate": 7.894337211921507e-05, "loss": 2.334, "step": 35635 }, { "epoch": 0.3, "learning_rate": 7.893790211281569e-05, "loss": 2.21, "step": 35640 }, { "epoch": 0.3, "learning_rate": 7.893243158558527e-05, "loss": 2.2476, "step": 35645 }, { "epoch": 0.3, "learning_rate": 7.892696053762227e-05, "loss": 2.3418, "step": 35650 }, { "epoch": 0.3, "learning_rate": 7.892148896902518e-05, "loss": 2.3747, "step": 35655 }, { "epoch": 0.3, "learning_rate": 7.891601687989244e-05, "loss": 2.3115, "step": 35660 }, { "epoch": 0.3, "learning_rate": 7.891054427032257e-05, "loss": 2.3397, "step": 35665 }, { "epoch": 0.3, "learning_rate": 7.890507114041404e-05, "loss": 2.2746, "step": 35670 }, { "epoch": 0.3, "learning_rate": 7.889959749026538e-05, "loss": 2.3721, "step": 35675 }, { "epoch": 0.3, "learning_rate": 7.88941233199751e-05, "loss": 2.311, "step": 35680 }, { "epoch": 0.3, "learning_rate": 7.888864862964172e-05, "loss": 2.4067, "step": 35685 }, { "epoch": 0.3, "learning_rate": 7.888317341936377e-05, "loss": 2.2308, "step": 35690 }, { "epoch": 0.3, "learning_rate": 7.887769768923981e-05, "loss": 2.3664, "step": 35695 }, { "epoch": 0.3, "learning_rate": 7.887222143936837e-05, "loss": 2.3437, "step": 35700 }, { "epoch": 0.3, "learning_rate": 7.886674466984804e-05, "loss": 2.329, "step": 35705 }, { "epoch": 0.3, "learning_rate": 7.886126738077737e-05, "loss": 2.3678, "step": 35710 }, { "epoch": 0.3, "learning_rate": 7.885578957225497e-05, "loss": 2.2823, "step": 35715 }, { "epoch": 0.3, "learning_rate": 7.885031124437941e-05, "loss": 2.34, "step": 35720 }, { "epoch": 0.3, "learning_rate": 7.884483239724927e-05, "loss": 2.2757, "step": 35725 }, { "epoch": 0.3, "learning_rate": 7.88393530309632e-05, "loss": 2.3055, "step": 35730 }, { "epoch": 0.3, "learning_rate": 7.88338731456198e-05, "loss": 2.309, "step": 35735 }, { "epoch": 0.3, "learning_rate": 7.88283927413177e-05, "loss": 2.258, "step": 35740 }, { "epoch": 0.31, "learning_rate": 7.882291181815552e-05, "loss": 2.3582, "step": 35745 }, { "epoch": 0.31, "learning_rate": 7.881743037623194e-05, "loss": 2.3554, "step": 35750 }, { "epoch": 0.31, "learning_rate": 7.881194841564558e-05, "loss": 2.3641, "step": 35755 }, { "epoch": 0.31, "learning_rate": 7.880646593649515e-05, "loss": 2.3986, "step": 35760 }, { "epoch": 0.31, "learning_rate": 7.880098293887929e-05, "loss": 2.3559, "step": 35765 }, { "epoch": 0.31, "learning_rate": 7.87954994228967e-05, "loss": 2.2945, "step": 35770 }, { "epoch": 0.31, "learning_rate": 7.879001538864606e-05, "loss": 2.3388, "step": 35775 }, { "epoch": 0.31, "learning_rate": 7.878453083622607e-05, "loss": 2.3201, "step": 35780 }, { "epoch": 0.31, "learning_rate": 7.877904576573547e-05, "loss": 2.3767, "step": 35785 }, { "epoch": 0.31, "learning_rate": 7.877356017727298e-05, "loss": 2.3492, "step": 35790 }, { "epoch": 0.31, "learning_rate": 7.876807407093729e-05, "loss": 2.3542, "step": 35795 }, { "epoch": 0.31, "learning_rate": 7.876258744682716e-05, "loss": 2.2961, "step": 35800 }, { "epoch": 0.31, "learning_rate": 7.875710030504135e-05, "loss": 2.301, "step": 35805 }, { "epoch": 0.31, "learning_rate": 7.875161264567863e-05, "loss": 2.403, "step": 35810 }, { "epoch": 0.31, "learning_rate": 7.874612446883775e-05, "loss": 2.3143, "step": 35815 }, { "epoch": 0.31, "learning_rate": 7.874063577461748e-05, "loss": 2.2636, "step": 35820 }, { "epoch": 0.31, "learning_rate": 7.873514656311662e-05, "loss": 2.3419, "step": 35825 }, { "epoch": 0.31, "learning_rate": 7.872965683443397e-05, "loss": 2.2771, "step": 35830 }, { "epoch": 0.31, "learning_rate": 7.872416658866833e-05, "loss": 2.33, "step": 35835 }, { "epoch": 0.31, "learning_rate": 7.87186758259185e-05, "loss": 2.3458, "step": 35840 }, { "epoch": 0.31, "learning_rate": 7.871318454628333e-05, "loss": 2.2679, "step": 35845 }, { "epoch": 0.31, "learning_rate": 7.870769274986163e-05, "loss": 2.3574, "step": 35850 }, { "epoch": 0.31, "learning_rate": 7.870220043675224e-05, "loss": 2.3427, "step": 35855 }, { "epoch": 0.31, "learning_rate": 7.869670760705404e-05, "loss": 2.326, "step": 35860 }, { "epoch": 0.31, "learning_rate": 7.869121426086588e-05, "loss": 2.2616, "step": 35865 }, { "epoch": 0.31, "learning_rate": 7.868572039828663e-05, "loss": 2.3821, "step": 35870 }, { "epoch": 0.31, "learning_rate": 7.868022601941516e-05, "loss": 2.3069, "step": 35875 }, { "epoch": 0.31, "learning_rate": 7.867473112435036e-05, "loss": 2.2798, "step": 35880 }, { "epoch": 0.31, "learning_rate": 7.866923571319114e-05, "loss": 2.2671, "step": 35885 }, { "epoch": 0.31, "learning_rate": 7.86637397860364e-05, "loss": 2.3618, "step": 35890 }, { "epoch": 0.31, "learning_rate": 7.865824334298506e-05, "loss": 2.3345, "step": 35895 }, { "epoch": 0.31, "learning_rate": 7.865274638413605e-05, "loss": 2.3084, "step": 35900 }, { "epoch": 0.31, "learning_rate": 7.864724890958827e-05, "loss": 2.2912, "step": 35905 }, { "epoch": 0.31, "learning_rate": 7.864175091944073e-05, "loss": 2.3048, "step": 35910 }, { "epoch": 0.31, "learning_rate": 7.863625241379234e-05, "loss": 2.3115, "step": 35915 }, { "epoch": 0.31, "learning_rate": 7.863075339274206e-05, "loss": 2.3696, "step": 35920 }, { "epoch": 0.31, "learning_rate": 7.862525385638889e-05, "loss": 2.3726, "step": 35925 }, { "epoch": 0.31, "learning_rate": 7.861975380483179e-05, "loss": 2.276, "step": 35930 }, { "epoch": 0.31, "learning_rate": 7.861425323816975e-05, "loss": 2.3883, "step": 35935 }, { "epoch": 0.31, "learning_rate": 7.86087521565018e-05, "loss": 2.3418, "step": 35940 }, { "epoch": 0.31, "learning_rate": 7.860325055992693e-05, "loss": 2.3338, "step": 35945 }, { "epoch": 0.31, "learning_rate": 7.859774844854413e-05, "loss": 2.3203, "step": 35950 }, { "epoch": 0.31, "learning_rate": 7.859224582245248e-05, "loss": 2.393, "step": 35955 }, { "epoch": 0.31, "learning_rate": 7.858674268175097e-05, "loss": 2.3015, "step": 35960 }, { "epoch": 0.31, "learning_rate": 7.858123902653869e-05, "loss": 2.3012, "step": 35965 }, { "epoch": 0.31, "learning_rate": 7.857573485691466e-05, "loss": 2.2851, "step": 35970 }, { "epoch": 0.31, "learning_rate": 7.857023017297798e-05, "loss": 2.2783, "step": 35975 }, { "epoch": 0.31, "learning_rate": 7.856472497482769e-05, "loss": 2.3205, "step": 35980 }, { "epoch": 0.31, "learning_rate": 7.85592192625629e-05, "loss": 2.3533, "step": 35985 }, { "epoch": 0.31, "learning_rate": 7.855371303628269e-05, "loss": 2.232, "step": 35990 }, { "epoch": 0.31, "learning_rate": 7.854820629608616e-05, "loss": 2.3408, "step": 35995 }, { "epoch": 0.31, "learning_rate": 7.854269904207243e-05, "loss": 2.3082, "step": 36000 }, { "epoch": 0.31, "learning_rate": 7.853719127434063e-05, "loss": 2.3347, "step": 36005 }, { "epoch": 0.31, "learning_rate": 7.853168299298985e-05, "loss": 2.3703, "step": 36010 }, { "epoch": 0.31, "learning_rate": 7.852617419811927e-05, "loss": 2.3822, "step": 36015 }, { "epoch": 0.31, "learning_rate": 7.852066488982804e-05, "loss": 2.3556, "step": 36020 }, { "epoch": 0.31, "learning_rate": 7.85151550682153e-05, "loss": 2.3336, "step": 36025 }, { "epoch": 0.31, "learning_rate": 7.85096447333802e-05, "loss": 2.2886, "step": 36030 }, { "epoch": 0.31, "learning_rate": 7.850413388542196e-05, "loss": 2.2827, "step": 36035 }, { "epoch": 0.31, "learning_rate": 7.849862252443973e-05, "loss": 2.3609, "step": 36040 }, { "epoch": 0.31, "learning_rate": 7.849311065053272e-05, "loss": 2.3134, "step": 36045 }, { "epoch": 0.31, "learning_rate": 7.848759826380014e-05, "loss": 2.3339, "step": 36050 }, { "epoch": 0.31, "learning_rate": 7.848208536434119e-05, "loss": 2.332, "step": 36055 }, { "epoch": 0.31, "learning_rate": 7.847657195225509e-05, "loss": 2.2666, "step": 36060 }, { "epoch": 0.31, "learning_rate": 7.847105802764107e-05, "loss": 2.3766, "step": 36065 }, { "epoch": 0.31, "learning_rate": 7.846554359059838e-05, "loss": 2.2746, "step": 36070 }, { "epoch": 0.31, "learning_rate": 7.846002864122628e-05, "loss": 2.271, "step": 36075 }, { "epoch": 0.31, "learning_rate": 7.845451317962402e-05, "loss": 2.3314, "step": 36080 }, { "epoch": 0.31, "learning_rate": 7.844899720589087e-05, "loss": 2.3322, "step": 36085 }, { "epoch": 0.31, "learning_rate": 7.844348072012608e-05, "loss": 2.2658, "step": 36090 }, { "epoch": 0.31, "learning_rate": 7.8437963722429e-05, "loss": 2.3326, "step": 36095 }, { "epoch": 0.31, "learning_rate": 7.843244621289886e-05, "loss": 2.3062, "step": 36100 }, { "epoch": 0.31, "learning_rate": 7.8426928191635e-05, "loss": 2.329, "step": 36105 }, { "epoch": 0.31, "learning_rate": 7.842140965873673e-05, "loss": 2.2122, "step": 36110 }, { "epoch": 0.31, "learning_rate": 7.841589061430336e-05, "loss": 2.2767, "step": 36115 }, { "epoch": 0.31, "learning_rate": 7.841037105843425e-05, "loss": 2.4462, "step": 36120 }, { "epoch": 0.31, "learning_rate": 7.840485099122873e-05, "loss": 2.3193, "step": 36125 }, { "epoch": 0.31, "learning_rate": 7.839933041278614e-05, "loss": 2.3155, "step": 36130 }, { "epoch": 0.31, "learning_rate": 7.839380932320586e-05, "loss": 2.2614, "step": 36135 }, { "epoch": 0.31, "learning_rate": 7.838828772258723e-05, "loss": 2.2913, "step": 36140 }, { "epoch": 0.31, "learning_rate": 7.838276561102966e-05, "loss": 2.359, "step": 36145 }, { "epoch": 0.31, "learning_rate": 7.837724298863254e-05, "loss": 2.2381, "step": 36150 }, { "epoch": 0.31, "learning_rate": 7.837171985549523e-05, "loss": 2.3721, "step": 36155 }, { "epoch": 0.31, "learning_rate": 7.836619621171716e-05, "loss": 2.3519, "step": 36160 }, { "epoch": 0.31, "learning_rate": 7.836067205739777e-05, "loss": 2.2831, "step": 36165 }, { "epoch": 0.31, "learning_rate": 7.835514739263646e-05, "loss": 2.2972, "step": 36170 }, { "epoch": 0.31, "learning_rate": 7.834962221753264e-05, "loss": 2.3335, "step": 36175 }, { "epoch": 0.31, "learning_rate": 7.834409653218579e-05, "loss": 2.3054, "step": 36180 }, { "epoch": 0.31, "learning_rate": 7.833857033669536e-05, "loss": 2.3589, "step": 36185 }, { "epoch": 0.31, "learning_rate": 7.833304363116079e-05, "loss": 2.3527, "step": 36190 }, { "epoch": 0.31, "learning_rate": 7.832751641568156e-05, "loss": 2.3286, "step": 36195 }, { "epoch": 0.31, "learning_rate": 7.832198869035719e-05, "loss": 2.3755, "step": 36200 }, { "epoch": 0.31, "learning_rate": 7.83164604552871e-05, "loss": 2.4046, "step": 36205 }, { "epoch": 0.31, "learning_rate": 7.831093171057082e-05, "loss": 2.349, "step": 36210 }, { "epoch": 0.31, "learning_rate": 7.830540245630787e-05, "loss": 2.3183, "step": 36215 }, { "epoch": 0.31, "learning_rate": 7.829987269259776e-05, "loss": 2.2552, "step": 36220 }, { "epoch": 0.31, "learning_rate": 7.829434241954001e-05, "loss": 2.3168, "step": 36225 }, { "epoch": 0.31, "learning_rate": 7.828881163723417e-05, "loss": 2.3914, "step": 36230 }, { "epoch": 0.31, "learning_rate": 7.828328034577974e-05, "loss": 2.2996, "step": 36235 }, { "epoch": 0.31, "learning_rate": 7.827774854527632e-05, "loss": 2.2599, "step": 36240 }, { "epoch": 0.31, "learning_rate": 7.827221623582348e-05, "loss": 2.2705, "step": 36245 }, { "epoch": 0.31, "learning_rate": 7.826668341752073e-05, "loss": 2.2802, "step": 36250 }, { "epoch": 0.31, "learning_rate": 7.826115009046773e-05, "loss": 2.3495, "step": 36255 }, { "epoch": 0.31, "learning_rate": 7.8255616254764e-05, "loss": 2.297, "step": 36260 }, { "epoch": 0.31, "learning_rate": 7.825008191050918e-05, "loss": 2.307, "step": 36265 }, { "epoch": 0.31, "learning_rate": 7.824454705780286e-05, "loss": 2.387, "step": 36270 }, { "epoch": 0.31, "learning_rate": 7.823901169674468e-05, "loss": 2.3788, "step": 36275 }, { "epoch": 0.31, "learning_rate": 7.823347582743425e-05, "loss": 2.3506, "step": 36280 }, { "epoch": 0.31, "learning_rate": 7.822793944997121e-05, "loss": 2.2144, "step": 36285 }, { "epoch": 0.31, "learning_rate": 7.82224025644552e-05, "loss": 2.323, "step": 36290 }, { "epoch": 0.31, "learning_rate": 7.821686517098588e-05, "loss": 2.3353, "step": 36295 }, { "epoch": 0.31, "learning_rate": 7.821132726966291e-05, "loss": 2.3841, "step": 36300 }, { "epoch": 0.31, "learning_rate": 7.820578886058596e-05, "loss": 2.3024, "step": 36305 }, { "epoch": 0.31, "learning_rate": 7.82002499438547e-05, "loss": 2.3312, "step": 36310 }, { "epoch": 0.31, "learning_rate": 7.819471051956887e-05, "loss": 2.3107, "step": 36315 }, { "epoch": 0.31, "learning_rate": 7.81891705878281e-05, "loss": 2.2526, "step": 36320 }, { "epoch": 0.31, "learning_rate": 7.818363014873215e-05, "loss": 2.2592, "step": 36325 }, { "epoch": 0.31, "learning_rate": 7.817808920238075e-05, "loss": 2.3569, "step": 36330 }, { "epoch": 0.31, "learning_rate": 7.817254774887356e-05, "loss": 2.3624, "step": 36335 }, { "epoch": 0.31, "learning_rate": 7.816700578831038e-05, "loss": 2.2771, "step": 36340 }, { "epoch": 0.31, "learning_rate": 7.816146332079091e-05, "loss": 2.3129, "step": 36345 }, { "epoch": 0.31, "learning_rate": 7.815592034641495e-05, "loss": 2.2245, "step": 36350 }, { "epoch": 0.31, "learning_rate": 7.815037686528222e-05, "loss": 2.3593, "step": 36355 }, { "epoch": 0.31, "learning_rate": 7.814483287749252e-05, "loss": 2.2817, "step": 36360 }, { "epoch": 0.31, "learning_rate": 7.813928838314563e-05, "loss": 2.4008, "step": 36365 }, { "epoch": 0.31, "learning_rate": 7.813374338234131e-05, "loss": 2.2876, "step": 36370 }, { "epoch": 0.31, "learning_rate": 7.812819787517943e-05, "loss": 2.3754, "step": 36375 }, { "epoch": 0.31, "learning_rate": 7.812265186175972e-05, "loss": 2.3793, "step": 36380 }, { "epoch": 0.31, "learning_rate": 7.811710534218204e-05, "loss": 2.368, "step": 36385 }, { "epoch": 0.31, "learning_rate": 7.811155831654622e-05, "loss": 2.3066, "step": 36390 }, { "epoch": 0.31, "learning_rate": 7.810601078495207e-05, "loss": 2.329, "step": 36395 }, { "epoch": 0.31, "learning_rate": 7.810046274749949e-05, "loss": 2.3033, "step": 36400 }, { "epoch": 0.31, "learning_rate": 7.809491420428827e-05, "loss": 2.3073, "step": 36405 }, { "epoch": 0.31, "learning_rate": 7.80893651554183e-05, "loss": 2.37, "step": 36410 }, { "epoch": 0.31, "learning_rate": 7.808381560098947e-05, "loss": 2.3686, "step": 36415 }, { "epoch": 0.31, "learning_rate": 7.807826554110163e-05, "loss": 2.3554, "step": 36420 }, { "epoch": 0.31, "learning_rate": 7.80727149758547e-05, "loss": 2.3592, "step": 36425 }, { "epoch": 0.31, "learning_rate": 7.806716390534859e-05, "loss": 2.2865, "step": 36430 }, { "epoch": 0.31, "learning_rate": 7.806161232968317e-05, "loss": 2.331, "step": 36435 }, { "epoch": 0.31, "learning_rate": 7.805606024895837e-05, "loss": 2.2212, "step": 36440 }, { "epoch": 0.31, "learning_rate": 7.805050766327413e-05, "loss": 2.3915, "step": 36445 }, { "epoch": 0.31, "learning_rate": 7.804495457273038e-05, "loss": 2.3597, "step": 36450 }, { "epoch": 0.31, "learning_rate": 7.803940097742707e-05, "loss": 2.3542, "step": 36455 }, { "epoch": 0.31, "learning_rate": 7.803384687746415e-05, "loss": 2.3873, "step": 36460 }, { "epoch": 0.31, "learning_rate": 7.80282922729416e-05, "loss": 2.2876, "step": 36465 }, { "epoch": 0.31, "learning_rate": 7.802273716395936e-05, "loss": 2.3261, "step": 36470 }, { "epoch": 0.31, "learning_rate": 7.801718155061743e-05, "loss": 2.3073, "step": 36475 }, { "epoch": 0.31, "learning_rate": 7.801162543301582e-05, "loss": 2.3332, "step": 36480 }, { "epoch": 0.31, "learning_rate": 7.80060688112545e-05, "loss": 2.2445, "step": 36485 }, { "epoch": 0.31, "learning_rate": 7.80005116854335e-05, "loss": 2.2675, "step": 36490 }, { "epoch": 0.31, "learning_rate": 7.799495405565284e-05, "loss": 2.2999, "step": 36495 }, { "epoch": 0.31, "learning_rate": 7.798939592201252e-05, "loss": 2.3055, "step": 36500 }, { "epoch": 0.31, "learning_rate": 7.79838372846126e-05, "loss": 2.3131, "step": 36505 }, { "epoch": 0.31, "learning_rate": 7.797827814355312e-05, "loss": 2.2029, "step": 36510 }, { "epoch": 0.31, "learning_rate": 7.797271849893416e-05, "loss": 2.2354, "step": 36515 }, { "epoch": 0.31, "learning_rate": 7.796715835085572e-05, "loss": 2.2875, "step": 36520 }, { "epoch": 0.31, "learning_rate": 7.796159769941792e-05, "loss": 2.2982, "step": 36525 }, { "epoch": 0.31, "learning_rate": 7.795603654472085e-05, "loss": 2.3599, "step": 36530 }, { "epoch": 0.31, "learning_rate": 7.795047488686457e-05, "loss": 2.2593, "step": 36535 }, { "epoch": 0.31, "learning_rate": 7.79449127259492e-05, "loss": 2.3285, "step": 36540 }, { "epoch": 0.31, "learning_rate": 7.793935006207484e-05, "loss": 2.4259, "step": 36545 }, { "epoch": 0.31, "learning_rate": 7.793378689534163e-05, "loss": 2.2346, "step": 36550 }, { "epoch": 0.31, "learning_rate": 7.792822322584965e-05, "loss": 2.3133, "step": 36555 }, { "epoch": 0.31, "learning_rate": 7.792265905369908e-05, "loss": 2.3729, "step": 36560 }, { "epoch": 0.31, "learning_rate": 7.791709437899006e-05, "loss": 2.2561, "step": 36565 }, { "epoch": 0.31, "learning_rate": 7.791152920182272e-05, "loss": 2.2703, "step": 36570 }, { "epoch": 0.31, "learning_rate": 7.790596352229725e-05, "loss": 2.2546, "step": 36575 }, { "epoch": 0.31, "learning_rate": 7.79003973405138e-05, "loss": 2.3769, "step": 36580 }, { "epoch": 0.31, "learning_rate": 7.789483065657258e-05, "loss": 2.3103, "step": 36585 }, { "epoch": 0.31, "learning_rate": 7.788926347057374e-05, "loss": 2.268, "step": 36590 }, { "epoch": 0.31, "learning_rate": 7.78836957826175e-05, "loss": 2.3503, "step": 36595 }, { "epoch": 0.31, "learning_rate": 7.787812759280408e-05, "loss": 2.3004, "step": 36600 }, { "epoch": 0.31, "learning_rate": 7.78725589012337e-05, "loss": 2.3538, "step": 36605 }, { "epoch": 0.31, "learning_rate": 7.786698970800655e-05, "loss": 2.3157, "step": 36610 }, { "epoch": 0.31, "learning_rate": 7.786142001322292e-05, "loss": 2.4203, "step": 36615 }, { "epoch": 0.31, "learning_rate": 7.7855849816983e-05, "loss": 2.3294, "step": 36620 }, { "epoch": 0.31, "learning_rate": 7.785027911938708e-05, "loss": 2.4385, "step": 36625 }, { "epoch": 0.31, "learning_rate": 7.784470792053539e-05, "loss": 2.2378, "step": 36630 }, { "epoch": 0.31, "learning_rate": 7.783913622052825e-05, "loss": 2.2768, "step": 36635 }, { "epoch": 0.31, "learning_rate": 7.783356401946591e-05, "loss": 2.2817, "step": 36640 }, { "epoch": 0.31, "learning_rate": 7.782799131744865e-05, "loss": 2.3597, "step": 36645 }, { "epoch": 0.31, "learning_rate": 7.782241811457679e-05, "loss": 2.3454, "step": 36650 }, { "epoch": 0.31, "learning_rate": 7.781684441095063e-05, "loss": 2.3672, "step": 36655 }, { "epoch": 0.31, "learning_rate": 7.781127020667049e-05, "loss": 2.2787, "step": 36660 }, { "epoch": 0.31, "learning_rate": 7.780569550183668e-05, "loss": 2.278, "step": 36665 }, { "epoch": 0.31, "learning_rate": 7.780012029654956e-05, "loss": 2.3858, "step": 36670 }, { "epoch": 0.31, "learning_rate": 7.779454459090946e-05, "loss": 2.3555, "step": 36675 }, { "epoch": 0.31, "learning_rate": 7.778896838501673e-05, "loss": 2.2964, "step": 36680 }, { "epoch": 0.31, "learning_rate": 7.778339167897172e-05, "loss": 2.4006, "step": 36685 }, { "epoch": 0.31, "learning_rate": 7.777781447287484e-05, "loss": 2.3173, "step": 36690 }, { "epoch": 0.31, "learning_rate": 7.777223676682645e-05, "loss": 2.3164, "step": 36695 }, { "epoch": 0.31, "learning_rate": 7.776665856092693e-05, "loss": 2.3817, "step": 36700 }, { "epoch": 0.31, "learning_rate": 7.776107985527668e-05, "loss": 2.3743, "step": 36705 }, { "epoch": 0.31, "learning_rate": 7.77555006499761e-05, "loss": 2.3213, "step": 36710 }, { "epoch": 0.31, "learning_rate": 7.774992094512564e-05, "loss": 2.3832, "step": 36715 }, { "epoch": 0.31, "learning_rate": 7.774434074082568e-05, "loss": 2.325, "step": 36720 }, { "epoch": 0.31, "learning_rate": 7.773876003717669e-05, "loss": 2.3143, "step": 36725 }, { "epoch": 0.31, "learning_rate": 7.773317883427906e-05, "loss": 2.3602, "step": 36730 }, { "epoch": 0.31, "learning_rate": 7.772759713223332e-05, "loss": 2.3323, "step": 36735 }, { "epoch": 0.31, "learning_rate": 7.772201493113986e-05, "loss": 2.3212, "step": 36740 }, { "epoch": 0.31, "learning_rate": 7.771643223109922e-05, "loss": 2.324, "step": 36745 }, { "epoch": 0.31, "learning_rate": 7.77108490322118e-05, "loss": 2.3727, "step": 36750 }, { "epoch": 0.31, "learning_rate": 7.770526533457815e-05, "loss": 2.3496, "step": 36755 }, { "epoch": 0.31, "learning_rate": 7.769968113829873e-05, "loss": 2.2859, "step": 36760 }, { "epoch": 0.31, "learning_rate": 7.769409644347406e-05, "loss": 2.3574, "step": 36765 }, { "epoch": 0.31, "learning_rate": 7.768851125020465e-05, "loss": 2.2514, "step": 36770 }, { "epoch": 0.31, "learning_rate": 7.768292555859105e-05, "loss": 2.3055, "step": 36775 }, { "epoch": 0.31, "learning_rate": 7.767733936873374e-05, "loss": 2.294, "step": 36780 }, { "epoch": 0.31, "learning_rate": 7.76717526807333e-05, "loss": 2.2816, "step": 36785 }, { "epoch": 0.31, "learning_rate": 7.766616549469027e-05, "loss": 2.3366, "step": 36790 }, { "epoch": 0.31, "learning_rate": 7.766057781070522e-05, "loss": 2.3788, "step": 36795 }, { "epoch": 0.31, "learning_rate": 7.76549896288787e-05, "loss": 2.2738, "step": 36800 }, { "epoch": 0.31, "learning_rate": 7.76494009493113e-05, "loss": 2.2658, "step": 36805 }, { "epoch": 0.31, "learning_rate": 7.764381177210359e-05, "loss": 2.2666, "step": 36810 }, { "epoch": 0.31, "learning_rate": 7.763822209735619e-05, "loss": 2.3494, "step": 36815 }, { "epoch": 0.31, "learning_rate": 7.76326319251697e-05, "loss": 2.3768, "step": 36820 }, { "epoch": 0.31, "learning_rate": 7.762704125564471e-05, "loss": 2.403, "step": 36825 }, { "epoch": 0.31, "learning_rate": 7.762145008888188e-05, "loss": 2.3042, "step": 36830 }, { "epoch": 0.31, "learning_rate": 7.761585842498178e-05, "loss": 2.3556, "step": 36835 }, { "epoch": 0.31, "learning_rate": 7.761026626404512e-05, "loss": 2.3252, "step": 36840 }, { "epoch": 0.31, "learning_rate": 7.760467360617252e-05, "loss": 2.3741, "step": 36845 }, { "epoch": 0.31, "learning_rate": 7.759908045146462e-05, "loss": 2.3054, "step": 36850 }, { "epoch": 0.31, "learning_rate": 7.759348680002211e-05, "loss": 2.3752, "step": 36855 }, { "epoch": 0.31, "learning_rate": 7.758789265194566e-05, "loss": 2.3529, "step": 36860 }, { "epoch": 0.31, "learning_rate": 7.758229800733595e-05, "loss": 2.3307, "step": 36865 }, { "epoch": 0.31, "learning_rate": 7.757670286629368e-05, "loss": 2.3104, "step": 36870 }, { "epoch": 0.31, "learning_rate": 7.757110722891954e-05, "loss": 2.2895, "step": 36875 }, { "epoch": 0.31, "learning_rate": 7.756551109531427e-05, "loss": 2.3613, "step": 36880 }, { "epoch": 0.31, "learning_rate": 7.755991446557856e-05, "loss": 2.4055, "step": 36885 }, { "epoch": 0.31, "learning_rate": 7.755431733981316e-05, "loss": 2.2083, "step": 36890 }, { "epoch": 0.31, "learning_rate": 7.754871971811879e-05, "loss": 2.1654, "step": 36895 }, { "epoch": 0.31, "learning_rate": 7.75431216005962e-05, "loss": 2.3365, "step": 36900 }, { "epoch": 0.31, "learning_rate": 7.753752298734615e-05, "loss": 2.4006, "step": 36905 }, { "epoch": 0.31, "learning_rate": 7.753192387846944e-05, "loss": 2.3421, "step": 36910 }, { "epoch": 0.32, "learning_rate": 7.752632427406679e-05, "loss": 2.3518, "step": 36915 }, { "epoch": 0.32, "learning_rate": 7.7520724174239e-05, "loss": 2.3237, "step": 36920 }, { "epoch": 0.32, "learning_rate": 7.751512357908688e-05, "loss": 2.2942, "step": 36925 }, { "epoch": 0.32, "learning_rate": 7.750952248871121e-05, "loss": 2.3466, "step": 36930 }, { "epoch": 0.32, "learning_rate": 7.75039209032128e-05, "loss": 2.2926, "step": 36935 }, { "epoch": 0.32, "learning_rate": 7.749831882269249e-05, "loss": 2.3056, "step": 36940 }, { "epoch": 0.32, "learning_rate": 7.74927162472511e-05, "loss": 2.3196, "step": 36945 }, { "epoch": 0.32, "learning_rate": 7.748711317698944e-05, "loss": 2.2989, "step": 36950 }, { "epoch": 0.32, "learning_rate": 7.748150961200838e-05, "loss": 2.3425, "step": 36955 }, { "epoch": 0.32, "learning_rate": 7.747590555240877e-05, "loss": 2.2767, "step": 36960 }, { "epoch": 0.32, "learning_rate": 7.747030099829149e-05, "loss": 2.3578, "step": 36965 }, { "epoch": 0.32, "learning_rate": 7.746469594975738e-05, "loss": 2.3055, "step": 36970 }, { "epoch": 0.32, "learning_rate": 7.745909040690735e-05, "loss": 2.3083, "step": 36975 }, { "epoch": 0.32, "learning_rate": 7.745348436984225e-05, "loss": 2.3225, "step": 36980 }, { "epoch": 0.32, "learning_rate": 7.744787783866303e-05, "loss": 2.3583, "step": 36985 }, { "epoch": 0.32, "learning_rate": 7.744227081347055e-05, "loss": 2.2988, "step": 36990 }, { "epoch": 0.32, "learning_rate": 7.743666329436576e-05, "loss": 2.3503, "step": 36995 }, { "epoch": 0.32, "learning_rate": 7.743105528144958e-05, "loss": 2.2924, "step": 37000 }, { "epoch": 0.32, "learning_rate": 7.742544677482293e-05, "loss": 2.2894, "step": 37005 }, { "epoch": 0.32, "learning_rate": 7.741983777458676e-05, "loss": 2.3569, "step": 37010 }, { "epoch": 0.32, "learning_rate": 7.741422828084204e-05, "loss": 2.3421, "step": 37015 }, { "epoch": 0.32, "learning_rate": 7.74086182936897e-05, "loss": 2.272, "step": 37020 }, { "epoch": 0.32, "learning_rate": 7.740300781323074e-05, "loss": 2.406, "step": 37025 }, { "epoch": 0.32, "learning_rate": 7.739739683956611e-05, "loss": 2.3031, "step": 37030 }, { "epoch": 0.32, "learning_rate": 7.73917853727968e-05, "loss": 2.31, "step": 37035 }, { "epoch": 0.32, "learning_rate": 7.738617341302383e-05, "loss": 2.3344, "step": 37040 }, { "epoch": 0.32, "learning_rate": 7.738056096034821e-05, "loss": 2.3134, "step": 37045 }, { "epoch": 0.32, "learning_rate": 7.73749480148709e-05, "loss": 2.255, "step": 37050 }, { "epoch": 0.32, "learning_rate": 7.736933457669298e-05, "loss": 2.3831, "step": 37055 }, { "epoch": 0.32, "learning_rate": 7.736372064591547e-05, "loss": 2.3588, "step": 37060 }, { "epoch": 0.32, "learning_rate": 7.73581062226394e-05, "loss": 2.3333, "step": 37065 }, { "epoch": 0.32, "learning_rate": 7.735249130696581e-05, "loss": 2.3201, "step": 37070 }, { "epoch": 0.32, "learning_rate": 7.734687589899579e-05, "loss": 2.2822, "step": 37075 }, { "epoch": 0.32, "learning_rate": 7.734125999883037e-05, "loss": 2.2982, "step": 37080 }, { "epoch": 0.32, "learning_rate": 7.733564360657066e-05, "loss": 2.2533, "step": 37085 }, { "epoch": 0.32, "learning_rate": 7.733002672231771e-05, "loss": 2.2702, "step": 37090 }, { "epoch": 0.32, "learning_rate": 7.732440934617265e-05, "loss": 2.3542, "step": 37095 }, { "epoch": 0.32, "learning_rate": 7.731879147823655e-05, "loss": 2.2784, "step": 37100 }, { "epoch": 0.32, "learning_rate": 7.731317311861055e-05, "loss": 2.2893, "step": 37105 }, { "epoch": 0.32, "learning_rate": 7.730755426739577e-05, "loss": 2.2958, "step": 37110 }, { "epoch": 0.32, "learning_rate": 7.730193492469331e-05, "loss": 2.3308, "step": 37115 }, { "epoch": 0.32, "learning_rate": 7.729631509060434e-05, "loss": 2.3773, "step": 37120 }, { "epoch": 0.32, "learning_rate": 7.729069476523e-05, "loss": 2.388, "step": 37125 }, { "epoch": 0.32, "learning_rate": 7.728507394867142e-05, "loss": 2.29, "step": 37130 }, { "epoch": 0.32, "learning_rate": 7.727945264102978e-05, "loss": 2.3313, "step": 37135 }, { "epoch": 0.32, "learning_rate": 7.727383084240626e-05, "loss": 2.3382, "step": 37140 }, { "epoch": 0.32, "learning_rate": 7.726820855290206e-05, "loss": 2.2985, "step": 37145 }, { "epoch": 0.32, "learning_rate": 7.726258577261834e-05, "loss": 2.3478, "step": 37150 }, { "epoch": 0.32, "learning_rate": 7.72569625016563e-05, "loss": 2.3304, "step": 37155 }, { "epoch": 0.32, "learning_rate": 7.725133874011718e-05, "loss": 2.3195, "step": 37160 }, { "epoch": 0.32, "learning_rate": 7.724571448810217e-05, "loss": 2.3365, "step": 37165 }, { "epoch": 0.32, "learning_rate": 7.72400897457125e-05, "loss": 2.4246, "step": 37170 }, { "epoch": 0.32, "learning_rate": 7.723446451304943e-05, "loss": 2.3091, "step": 37175 }, { "epoch": 0.32, "learning_rate": 7.722883879021417e-05, "loss": 2.4116, "step": 37180 }, { "epoch": 0.32, "learning_rate": 7.722321257730799e-05, "loss": 2.3392, "step": 37185 }, { "epoch": 0.32, "learning_rate": 7.721758587443213e-05, "loss": 2.2977, "step": 37190 }, { "epoch": 0.32, "learning_rate": 7.721195868168788e-05, "loss": 2.2685, "step": 37195 }, { "epoch": 0.32, "learning_rate": 7.720633099917656e-05, "loss": 2.3031, "step": 37200 }, { "epoch": 0.32, "learning_rate": 7.720070282699939e-05, "loss": 2.3664, "step": 37205 }, { "epoch": 0.32, "learning_rate": 7.719507416525771e-05, "loss": 2.3846, "step": 37210 }, { "epoch": 0.32, "learning_rate": 7.71894450140528e-05, "loss": 2.3494, "step": 37215 }, { "epoch": 0.32, "learning_rate": 7.718381537348598e-05, "loss": 2.2375, "step": 37220 }, { "epoch": 0.32, "learning_rate": 7.717818524365859e-05, "loss": 2.28, "step": 37225 }, { "epoch": 0.32, "learning_rate": 7.717255462467194e-05, "loss": 2.3012, "step": 37230 }, { "epoch": 0.32, "learning_rate": 7.71669235166274e-05, "loss": 2.333, "step": 37235 }, { "epoch": 0.32, "learning_rate": 7.716129191962629e-05, "loss": 2.4072, "step": 37240 }, { "epoch": 0.32, "learning_rate": 7.715565983377e-05, "loss": 2.3874, "step": 37245 }, { "epoch": 0.32, "learning_rate": 7.715002725915985e-05, "loss": 2.3175, "step": 37250 }, { "epoch": 0.32, "learning_rate": 7.714439419589727e-05, "loss": 2.3164, "step": 37255 }, { "epoch": 0.32, "learning_rate": 7.713876064408361e-05, "loss": 2.3483, "step": 37260 }, { "epoch": 0.32, "learning_rate": 7.713312660382028e-05, "loss": 2.2898, "step": 37265 }, { "epoch": 0.32, "learning_rate": 7.712749207520866e-05, "loss": 2.334, "step": 37270 }, { "epoch": 0.32, "learning_rate": 7.71218570583502e-05, "loss": 2.3379, "step": 37275 }, { "epoch": 0.32, "learning_rate": 7.71162215533463e-05, "loss": 2.2851, "step": 37280 }, { "epoch": 0.32, "learning_rate": 7.711058556029838e-05, "loss": 2.2247, "step": 37285 }, { "epoch": 0.32, "learning_rate": 7.710494907930789e-05, "loss": 2.3164, "step": 37290 }, { "epoch": 0.32, "learning_rate": 7.709931211047626e-05, "loss": 2.3124, "step": 37295 }, { "epoch": 0.32, "learning_rate": 7.709367465390498e-05, "loss": 2.2861, "step": 37300 }, { "epoch": 0.32, "learning_rate": 7.708803670969548e-05, "loss": 2.309, "step": 37305 }, { "epoch": 0.32, "learning_rate": 7.708239827794925e-05, "loss": 2.2579, "step": 37310 }, { "epoch": 0.32, "learning_rate": 7.707675935876777e-05, "loss": 2.3382, "step": 37315 }, { "epoch": 0.32, "learning_rate": 7.707111995225251e-05, "loss": 2.2698, "step": 37320 }, { "epoch": 0.32, "learning_rate": 7.706548005850501e-05, "loss": 2.2573, "step": 37325 }, { "epoch": 0.32, "learning_rate": 7.705983967762675e-05, "loss": 2.2659, "step": 37330 }, { "epoch": 0.32, "learning_rate": 7.705419880971924e-05, "loss": 2.3455, "step": 37335 }, { "epoch": 0.32, "learning_rate": 7.704855745488404e-05, "loss": 2.3515, "step": 37340 }, { "epoch": 0.32, "learning_rate": 7.704291561322265e-05, "loss": 2.2509, "step": 37345 }, { "epoch": 0.32, "learning_rate": 7.703727328483662e-05, "loss": 2.3169, "step": 37350 }, { "epoch": 0.32, "learning_rate": 7.703163046982751e-05, "loss": 2.2651, "step": 37355 }, { "epoch": 0.32, "learning_rate": 7.70259871682969e-05, "loss": 2.3321, "step": 37360 }, { "epoch": 0.32, "learning_rate": 7.702034338034631e-05, "loss": 2.2949, "step": 37365 }, { "epoch": 0.32, "learning_rate": 7.701469910607735e-05, "loss": 2.2866, "step": 37370 }, { "epoch": 0.32, "learning_rate": 7.700905434559162e-05, "loss": 2.3324, "step": 37375 }, { "epoch": 0.32, "learning_rate": 7.70034090989907e-05, "loss": 2.3167, "step": 37380 }, { "epoch": 0.32, "learning_rate": 7.699776336637617e-05, "loss": 2.2554, "step": 37385 }, { "epoch": 0.32, "learning_rate": 7.699211714784969e-05, "loss": 2.2884, "step": 37390 }, { "epoch": 0.32, "learning_rate": 7.698647044351284e-05, "loss": 2.2935, "step": 37395 }, { "epoch": 0.32, "learning_rate": 7.698082325346727e-05, "loss": 2.2728, "step": 37400 }, { "epoch": 0.32, "learning_rate": 7.697517557781462e-05, "loss": 2.2834, "step": 37405 }, { "epoch": 0.32, "learning_rate": 7.696952741665655e-05, "loss": 2.4147, "step": 37410 }, { "epoch": 0.32, "learning_rate": 7.696387877009468e-05, "loss": 2.3547, "step": 37415 }, { "epoch": 0.32, "learning_rate": 7.695822963823072e-05, "loss": 2.2992, "step": 37420 }, { "epoch": 0.32, "learning_rate": 7.695258002116631e-05, "loss": 2.3966, "step": 37425 }, { "epoch": 0.32, "learning_rate": 7.694692991900316e-05, "loss": 2.3031, "step": 37430 }, { "epoch": 0.32, "learning_rate": 7.694127933184294e-05, "loss": 2.3423, "step": 37435 }, { "epoch": 0.32, "learning_rate": 7.693562825978737e-05, "loss": 2.3451, "step": 37440 }, { "epoch": 0.32, "learning_rate": 7.692997670293814e-05, "loss": 2.3198, "step": 37445 }, { "epoch": 0.32, "learning_rate": 7.692432466139697e-05, "loss": 2.3939, "step": 37450 }, { "epoch": 0.32, "learning_rate": 7.69186721352656e-05, "loss": 2.3564, "step": 37455 }, { "epoch": 0.32, "learning_rate": 7.691301912464577e-05, "loss": 2.3311, "step": 37460 }, { "epoch": 0.32, "learning_rate": 7.690736562963918e-05, "loss": 2.2445, "step": 37465 }, { "epoch": 0.32, "learning_rate": 7.690171165034765e-05, "loss": 2.2893, "step": 37470 }, { "epoch": 0.32, "learning_rate": 7.689605718687289e-05, "loss": 2.3176, "step": 37475 }, { "epoch": 0.32, "learning_rate": 7.689040223931669e-05, "loss": 2.3028, "step": 37480 }, { "epoch": 0.32, "learning_rate": 7.688474680778082e-05, "loss": 2.2862, "step": 37485 }, { "epoch": 0.32, "learning_rate": 7.687909089236709e-05, "loss": 2.2647, "step": 37490 }, { "epoch": 0.32, "learning_rate": 7.687343449317727e-05, "loss": 2.3257, "step": 37495 }, { "epoch": 0.32, "learning_rate": 7.686777761031317e-05, "loss": 2.3245, "step": 37500 }, { "epoch": 0.32, "learning_rate": 7.686212024387662e-05, "loss": 2.2451, "step": 37505 }, { "epoch": 0.32, "learning_rate": 7.685646239396944e-05, "loss": 2.2281, "step": 37510 }, { "epoch": 0.32, "learning_rate": 7.685080406069344e-05, "loss": 2.3164, "step": 37515 }, { "epoch": 0.32, "learning_rate": 7.684514524415049e-05, "loss": 2.3159, "step": 37520 }, { "epoch": 0.32, "learning_rate": 7.683948594444241e-05, "loss": 2.3835, "step": 37525 }, { "epoch": 0.32, "learning_rate": 7.683382616167107e-05, "loss": 2.3253, "step": 37530 }, { "epoch": 0.32, "learning_rate": 7.682816589593835e-05, "loss": 2.2917, "step": 37535 }, { "epoch": 0.32, "learning_rate": 7.682250514734609e-05, "loss": 2.3737, "step": 37540 }, { "epoch": 0.32, "learning_rate": 7.68168439159962e-05, "loss": 2.3409, "step": 37545 }, { "epoch": 0.32, "learning_rate": 7.681118220199056e-05, "loss": 2.3013, "step": 37550 }, { "epoch": 0.32, "learning_rate": 7.680552000543108e-05, "loss": 2.2191, "step": 37555 }, { "epoch": 0.32, "learning_rate": 7.679985732641968e-05, "loss": 2.3638, "step": 37560 }, { "epoch": 0.32, "learning_rate": 7.679419416505827e-05, "loss": 2.3299, "step": 37565 }, { "epoch": 0.32, "learning_rate": 7.678853052144875e-05, "loss": 2.3113, "step": 37570 }, { "epoch": 0.32, "learning_rate": 7.678286639569309e-05, "loss": 2.3111, "step": 37575 }, { "epoch": 0.32, "learning_rate": 7.677720178789323e-05, "loss": 2.3449, "step": 37580 }, { "epoch": 0.32, "learning_rate": 7.677153669815109e-05, "loss": 2.3049, "step": 37585 }, { "epoch": 0.32, "learning_rate": 7.676587112656868e-05, "loss": 2.3488, "step": 37590 }, { "epoch": 0.32, "learning_rate": 7.676020507324792e-05, "loss": 2.3168, "step": 37595 }, { "epoch": 0.32, "learning_rate": 7.675453853829084e-05, "loss": 2.266, "step": 37600 }, { "epoch": 0.32, "learning_rate": 7.67488715217994e-05, "loss": 2.3928, "step": 37605 }, { "epoch": 0.32, "learning_rate": 7.674320402387559e-05, "loss": 2.417, "step": 37610 }, { "epoch": 0.32, "learning_rate": 7.673753604462142e-05, "loss": 2.3023, "step": 37615 }, { "epoch": 0.32, "learning_rate": 7.673186758413892e-05, "loss": 2.338, "step": 37620 }, { "epoch": 0.32, "learning_rate": 7.672619864253009e-05, "loss": 2.4472, "step": 37625 }, { "epoch": 0.32, "learning_rate": 7.672052921989699e-05, "loss": 2.3457, "step": 37630 }, { "epoch": 0.32, "learning_rate": 7.671485931634162e-05, "loss": 2.2435, "step": 37635 }, { "epoch": 0.32, "learning_rate": 7.670918893196605e-05, "loss": 2.3373, "step": 37640 }, { "epoch": 0.32, "learning_rate": 7.670351806687235e-05, "loss": 2.323, "step": 37645 }, { "epoch": 0.32, "learning_rate": 7.669784672116256e-05, "loss": 2.3236, "step": 37650 }, { "epoch": 0.32, "learning_rate": 7.669217489493876e-05, "loss": 2.3001, "step": 37655 }, { "epoch": 0.32, "learning_rate": 7.668650258830304e-05, "loss": 2.2795, "step": 37660 }, { "epoch": 0.32, "learning_rate": 7.66808298013575e-05, "loss": 2.2435, "step": 37665 }, { "epoch": 0.32, "learning_rate": 7.667515653420423e-05, "loss": 2.3175, "step": 37670 }, { "epoch": 0.32, "learning_rate": 7.666948278694533e-05, "loss": 2.3478, "step": 37675 }, { "epoch": 0.32, "learning_rate": 7.666380855968293e-05, "loss": 2.3027, "step": 37680 }, { "epoch": 0.32, "learning_rate": 7.665813385251915e-05, "loss": 2.2696, "step": 37685 }, { "epoch": 0.32, "learning_rate": 7.665245866555612e-05, "loss": 2.3081, "step": 37690 }, { "epoch": 0.32, "learning_rate": 7.664678299889601e-05, "loss": 2.31, "step": 37695 }, { "epoch": 0.32, "learning_rate": 7.664110685264094e-05, "loss": 2.3098, "step": 37700 }, { "epoch": 0.32, "learning_rate": 7.663543022689308e-05, "loss": 2.2908, "step": 37705 }, { "epoch": 0.32, "learning_rate": 7.66297531217546e-05, "loss": 2.3754, "step": 37710 }, { "epoch": 0.32, "learning_rate": 7.662407553732768e-05, "loss": 2.3998, "step": 37715 }, { "epoch": 0.32, "learning_rate": 7.661839747371451e-05, "loss": 2.2752, "step": 37720 }, { "epoch": 0.32, "learning_rate": 7.661271893101729e-05, "loss": 2.3928, "step": 37725 }, { "epoch": 0.32, "learning_rate": 7.660703990933821e-05, "loss": 2.3581, "step": 37730 }, { "epoch": 0.32, "learning_rate": 7.660136040877947e-05, "loss": 2.3029, "step": 37735 }, { "epoch": 0.32, "learning_rate": 7.659568042944333e-05, "loss": 2.312, "step": 37740 }, { "epoch": 0.32, "learning_rate": 7.658999997143199e-05, "loss": 2.3806, "step": 37745 }, { "epoch": 0.32, "learning_rate": 7.658431903484769e-05, "loss": 2.3328, "step": 37750 }, { "epoch": 0.32, "learning_rate": 7.65786376197927e-05, "loss": 2.3691, "step": 37755 }, { "epoch": 0.32, "learning_rate": 7.657295572636925e-05, "loss": 2.3439, "step": 37760 }, { "epoch": 0.32, "learning_rate": 7.65672733546796e-05, "loss": 2.2961, "step": 37765 }, { "epoch": 0.32, "learning_rate": 7.656159050482604e-05, "loss": 2.2658, "step": 37770 }, { "epoch": 0.32, "learning_rate": 7.655590717691086e-05, "loss": 2.3532, "step": 37775 }, { "epoch": 0.32, "learning_rate": 7.655022337103633e-05, "loss": 2.2539, "step": 37780 }, { "epoch": 0.32, "learning_rate": 7.654453908730475e-05, "loss": 2.2913, "step": 37785 }, { "epoch": 0.32, "learning_rate": 7.653885432581843e-05, "loss": 2.3145, "step": 37790 }, { "epoch": 0.32, "learning_rate": 7.65331690866797e-05, "loss": 2.3123, "step": 37795 }, { "epoch": 0.32, "learning_rate": 7.652748336999085e-05, "loss": 2.2545, "step": 37800 }, { "epoch": 0.32, "learning_rate": 7.652179717585424e-05, "loss": 2.2888, "step": 37805 }, { "epoch": 0.32, "learning_rate": 7.651611050437221e-05, "loss": 2.2924, "step": 37810 }, { "epoch": 0.32, "learning_rate": 7.65104233556471e-05, "loss": 2.356, "step": 37815 }, { "epoch": 0.32, "learning_rate": 7.650473572978128e-05, "loss": 2.234, "step": 37820 }, { "epoch": 0.32, "learning_rate": 7.649904762687712e-05, "loss": 2.3071, "step": 37825 }, { "epoch": 0.32, "learning_rate": 7.649335904703698e-05, "loss": 2.2509, "step": 37830 }, { "epoch": 0.32, "learning_rate": 7.648766999036325e-05, "loss": 2.3505, "step": 37835 }, { "epoch": 0.32, "learning_rate": 7.648198045695834e-05, "loss": 2.2931, "step": 37840 }, { "epoch": 0.32, "learning_rate": 7.64762904469246e-05, "loss": 2.3741, "step": 37845 }, { "epoch": 0.32, "learning_rate": 7.64705999603645e-05, "loss": 2.3774, "step": 37850 }, { "epoch": 0.32, "learning_rate": 7.646490899738044e-05, "loss": 2.2751, "step": 37855 }, { "epoch": 0.32, "learning_rate": 7.645921755807483e-05, "loss": 2.3424, "step": 37860 }, { "epoch": 0.32, "learning_rate": 7.645352564255012e-05, "loss": 2.3123, "step": 37865 }, { "epoch": 0.32, "learning_rate": 7.644783325090876e-05, "loss": 2.3335, "step": 37870 }, { "epoch": 0.32, "learning_rate": 7.64421403832532e-05, "loss": 2.3228, "step": 37875 }, { "epoch": 0.32, "learning_rate": 7.643644703968588e-05, "loss": 2.3092, "step": 37880 }, { "epoch": 0.32, "learning_rate": 7.64307532203093e-05, "loss": 2.283, "step": 37885 }, { "epoch": 0.32, "learning_rate": 7.642505892522592e-05, "loss": 2.396, "step": 37890 }, { "epoch": 0.32, "learning_rate": 7.641936415453823e-05, "loss": 2.3067, "step": 37895 }, { "epoch": 0.32, "learning_rate": 7.641366890834873e-05, "loss": 2.3473, "step": 37900 }, { "epoch": 0.32, "learning_rate": 7.640797318675994e-05, "loss": 2.3941, "step": 37905 }, { "epoch": 0.32, "learning_rate": 7.640227698987433e-05, "loss": 2.3576, "step": 37910 }, { "epoch": 0.32, "learning_rate": 7.639658031779446e-05, "loss": 2.2713, "step": 37915 }, { "epoch": 0.32, "learning_rate": 7.639088317062285e-05, "loss": 2.4128, "step": 37920 }, { "epoch": 0.32, "learning_rate": 7.638518554846203e-05, "loss": 2.3228, "step": 37925 }, { "epoch": 0.32, "learning_rate": 7.637948745141455e-05, "loss": 2.3243, "step": 37930 }, { "epoch": 0.32, "learning_rate": 7.637378887958299e-05, "loss": 2.3258, "step": 37935 }, { "epoch": 0.32, "learning_rate": 7.636808983306988e-05, "loss": 2.2828, "step": 37940 }, { "epoch": 0.32, "learning_rate": 7.63623903119778e-05, "loss": 2.3228, "step": 37945 }, { "epoch": 0.32, "learning_rate": 7.635669031640935e-05, "loss": 2.2748, "step": 37950 }, { "epoch": 0.32, "learning_rate": 7.635098984646709e-05, "loss": 2.1883, "step": 37955 }, { "epoch": 0.32, "learning_rate": 7.634528890225363e-05, "loss": 2.4058, "step": 37960 }, { "epoch": 0.32, "learning_rate": 7.63395874838716e-05, "loss": 2.28, "step": 37965 }, { "epoch": 0.32, "learning_rate": 7.63338855914236e-05, "loss": 2.3533, "step": 37970 }, { "epoch": 0.32, "learning_rate": 7.632818322501225e-05, "loss": 2.362, "step": 37975 }, { "epoch": 0.32, "learning_rate": 7.632248038474018e-05, "loss": 2.2969, "step": 37980 }, { "epoch": 0.32, "learning_rate": 7.631677707071003e-05, "loss": 2.4145, "step": 37985 }, { "epoch": 0.32, "learning_rate": 7.631107328302447e-05, "loss": 2.2893, "step": 37990 }, { "epoch": 0.32, "learning_rate": 7.630536902178613e-05, "loss": 2.2899, "step": 37995 }, { "epoch": 0.32, "learning_rate": 7.62996642870977e-05, "loss": 2.3279, "step": 38000 }, { "epoch": 0.32, "learning_rate": 7.629395907906182e-05, "loss": 2.3491, "step": 38005 }, { "epoch": 0.32, "learning_rate": 7.628825339778123e-05, "loss": 2.3916, "step": 38010 }, { "epoch": 0.32, "learning_rate": 7.628254724335856e-05, "loss": 2.3284, "step": 38015 }, { "epoch": 0.32, "learning_rate": 7.627684061589657e-05, "loss": 2.2882, "step": 38020 }, { "epoch": 0.32, "learning_rate": 7.627113351549792e-05, "loss": 2.2911, "step": 38025 }, { "epoch": 0.32, "learning_rate": 7.626542594226536e-05, "loss": 2.3226, "step": 38030 }, { "epoch": 0.32, "learning_rate": 7.625971789630161e-05, "loss": 2.2423, "step": 38035 }, { "epoch": 0.32, "learning_rate": 7.625400937770938e-05, "loss": 2.3569, "step": 38040 }, { "epoch": 0.32, "learning_rate": 7.624830038659145e-05, "loss": 2.3227, "step": 38045 }, { "epoch": 0.32, "learning_rate": 7.624259092305056e-05, "loss": 2.2999, "step": 38050 }, { "epoch": 0.32, "learning_rate": 7.623688098718943e-05, "loss": 2.3275, "step": 38055 }, { "epoch": 0.32, "learning_rate": 7.623117057911089e-05, "loss": 2.3796, "step": 38060 }, { "epoch": 0.32, "learning_rate": 7.622545969891768e-05, "loss": 2.3573, "step": 38065 }, { "epoch": 0.32, "learning_rate": 7.62197483467126e-05, "loss": 2.3539, "step": 38070 }, { "epoch": 0.32, "learning_rate": 7.621403652259842e-05, "loss": 2.3575, "step": 38075 }, { "epoch": 0.32, "learning_rate": 7.620832422667799e-05, "loss": 2.3435, "step": 38080 }, { "epoch": 0.32, "learning_rate": 7.62026114590541e-05, "loss": 2.3327, "step": 38085 }, { "epoch": 0.33, "learning_rate": 7.619689821982954e-05, "loss": 2.2311, "step": 38090 }, { "epoch": 0.33, "learning_rate": 7.619118450910717e-05, "loss": 2.3508, "step": 38095 }, { "epoch": 0.33, "learning_rate": 7.618547032698981e-05, "loss": 2.3132, "step": 38100 }, { "epoch": 0.33, "learning_rate": 7.617975567358033e-05, "loss": 2.2912, "step": 38105 }, { "epoch": 0.33, "learning_rate": 7.617404054898156e-05, "loss": 2.3195, "step": 38110 }, { "epoch": 0.33, "learning_rate": 7.616832495329637e-05, "loss": 2.3049, "step": 38115 }, { "epoch": 0.33, "learning_rate": 7.616260888662763e-05, "loss": 2.3124, "step": 38120 }, { "epoch": 0.33, "learning_rate": 7.615689234907822e-05, "loss": 2.3116, "step": 38125 }, { "epoch": 0.33, "learning_rate": 7.615117534075103e-05, "loss": 2.3144, "step": 38130 }, { "epoch": 0.33, "learning_rate": 7.614545786174896e-05, "loss": 2.374, "step": 38135 }, { "epoch": 0.33, "learning_rate": 7.613973991217489e-05, "loss": 2.2761, "step": 38140 }, { "epoch": 0.33, "learning_rate": 7.613402149213176e-05, "loss": 2.2794, "step": 38145 }, { "epoch": 0.33, "learning_rate": 7.612830260172247e-05, "loss": 2.3533, "step": 38150 }, { "epoch": 0.33, "learning_rate": 7.612258324105e-05, "loss": 2.3488, "step": 38155 }, { "epoch": 0.33, "learning_rate": 7.611686341021722e-05, "loss": 2.2667, "step": 38160 }, { "epoch": 0.33, "learning_rate": 7.61111431093271e-05, "loss": 2.2696, "step": 38165 }, { "epoch": 0.33, "learning_rate": 7.610542233848262e-05, "loss": 2.2607, "step": 38170 }, { "epoch": 0.33, "learning_rate": 7.60997010977867e-05, "loss": 2.3604, "step": 38175 }, { "epoch": 0.33, "learning_rate": 7.609397938734238e-05, "loss": 2.3602, "step": 38180 }, { "epoch": 0.33, "learning_rate": 7.608825720725256e-05, "loss": 2.3457, "step": 38185 }, { "epoch": 0.33, "learning_rate": 7.608253455762029e-05, "loss": 2.3808, "step": 38190 }, { "epoch": 0.33, "learning_rate": 7.607681143854854e-05, "loss": 2.3621, "step": 38195 }, { "epoch": 0.33, "learning_rate": 7.607108785014031e-05, "loss": 2.3705, "step": 38200 }, { "epoch": 0.33, "learning_rate": 7.606536379249865e-05, "loss": 2.3128, "step": 38205 }, { "epoch": 0.33, "learning_rate": 7.605963926572655e-05, "loss": 2.2852, "step": 38210 }, { "epoch": 0.33, "learning_rate": 7.605391426992703e-05, "loss": 2.3194, "step": 38215 }, { "epoch": 0.33, "learning_rate": 7.604818880520316e-05, "loss": 2.3701, "step": 38220 }, { "epoch": 0.33, "learning_rate": 7.6042462871658e-05, "loss": 2.2899, "step": 38225 }, { "epoch": 0.33, "learning_rate": 7.603673646939457e-05, "loss": 2.3305, "step": 38230 }, { "epoch": 0.33, "learning_rate": 7.603100959851594e-05, "loss": 2.3105, "step": 38235 }, { "epoch": 0.33, "learning_rate": 7.60252822591252e-05, "loss": 2.2788, "step": 38240 }, { "epoch": 0.33, "learning_rate": 7.601955445132543e-05, "loss": 2.4431, "step": 38245 }, { "epoch": 0.33, "learning_rate": 7.601382617521971e-05, "loss": 2.351, "step": 38250 }, { "epoch": 0.33, "learning_rate": 7.600809743091117e-05, "loss": 2.4059, "step": 38255 }, { "epoch": 0.33, "learning_rate": 7.600236821850286e-05, "loss": 2.3079, "step": 38260 }, { "epoch": 0.33, "learning_rate": 7.599663853809795e-05, "loss": 2.3175, "step": 38265 }, { "epoch": 0.33, "learning_rate": 7.599090838979952e-05, "loss": 2.3712, "step": 38270 }, { "epoch": 0.33, "learning_rate": 7.598517777371074e-05, "loss": 2.3296, "step": 38275 }, { "epoch": 0.33, "learning_rate": 7.597944668993473e-05, "loss": 2.2915, "step": 38280 }, { "epoch": 0.33, "learning_rate": 7.597371513857465e-05, "loss": 2.3278, "step": 38285 }, { "epoch": 0.33, "learning_rate": 7.596798311973365e-05, "loss": 2.3519, "step": 38290 }, { "epoch": 0.33, "learning_rate": 7.59622506335149e-05, "loss": 2.2866, "step": 38295 }, { "epoch": 0.33, "learning_rate": 7.595651768002156e-05, "loss": 2.2896, "step": 38300 }, { "epoch": 0.33, "learning_rate": 7.595078425935684e-05, "loss": 2.346, "step": 38305 }, { "epoch": 0.33, "learning_rate": 7.594505037162391e-05, "loss": 2.2699, "step": 38310 }, { "epoch": 0.33, "learning_rate": 7.5939316016926e-05, "loss": 2.2956, "step": 38315 }, { "epoch": 0.33, "learning_rate": 7.593358119536627e-05, "loss": 2.3424, "step": 38320 }, { "epoch": 0.33, "learning_rate": 7.592784590704797e-05, "loss": 2.3555, "step": 38325 }, { "epoch": 0.33, "learning_rate": 7.592211015207432e-05, "loss": 2.3627, "step": 38330 }, { "epoch": 0.33, "learning_rate": 7.591637393054856e-05, "loss": 2.3528, "step": 38335 }, { "epoch": 0.33, "learning_rate": 7.591063724257392e-05, "loss": 2.3115, "step": 38340 }, { "epoch": 0.33, "learning_rate": 7.590490008825364e-05, "loss": 2.3183, "step": 38345 }, { "epoch": 0.33, "learning_rate": 7.589916246769099e-05, "loss": 2.4059, "step": 38350 }, { "epoch": 0.33, "learning_rate": 7.589342438098927e-05, "loss": 2.3386, "step": 38355 }, { "epoch": 0.33, "learning_rate": 7.58876858282517e-05, "loss": 2.2196, "step": 38360 }, { "epoch": 0.33, "learning_rate": 7.588194680958158e-05, "loss": 2.3345, "step": 38365 }, { "epoch": 0.33, "learning_rate": 7.587620732508222e-05, "loss": 2.2913, "step": 38370 }, { "epoch": 0.33, "learning_rate": 7.587046737485692e-05, "loss": 2.3514, "step": 38375 }, { "epoch": 0.33, "learning_rate": 7.586472695900896e-05, "loss": 2.3767, "step": 38380 }, { "epoch": 0.33, "learning_rate": 7.585898607764168e-05, "loss": 2.3705, "step": 38385 }, { "epoch": 0.33, "learning_rate": 7.585324473085842e-05, "loss": 2.3558, "step": 38390 }, { "epoch": 0.33, "learning_rate": 7.584750291876248e-05, "loss": 2.263, "step": 38395 }, { "epoch": 0.33, "learning_rate": 7.584176064145723e-05, "loss": 2.3067, "step": 38400 }, { "epoch": 0.33, "learning_rate": 7.583601789904603e-05, "loss": 2.3725, "step": 38405 }, { "epoch": 0.33, "learning_rate": 7.583027469163218e-05, "loss": 2.3308, "step": 38410 }, { "epoch": 0.33, "learning_rate": 7.58245310193191e-05, "loss": 2.2977, "step": 38415 }, { "epoch": 0.33, "learning_rate": 7.581878688221016e-05, "loss": 2.3098, "step": 38420 }, { "epoch": 0.33, "learning_rate": 7.581304228040871e-05, "loss": 2.3037, "step": 38425 }, { "epoch": 0.33, "learning_rate": 7.580729721401821e-05, "loss": 2.2636, "step": 38430 }, { "epoch": 0.33, "learning_rate": 7.5801551683142e-05, "loss": 2.3653, "step": 38435 }, { "epoch": 0.33, "learning_rate": 7.579580568788352e-05, "loss": 2.3613, "step": 38440 }, { "epoch": 0.33, "learning_rate": 7.579005922834616e-05, "loss": 2.3014, "step": 38445 }, { "epoch": 0.33, "learning_rate": 7.578431230463339e-05, "loss": 2.283, "step": 38450 }, { "epoch": 0.33, "learning_rate": 7.577856491684859e-05, "loss": 2.3808, "step": 38455 }, { "epoch": 0.33, "learning_rate": 7.577281706509525e-05, "loss": 2.3371, "step": 38460 }, { "epoch": 0.33, "learning_rate": 7.57670687494768e-05, "loss": 2.4061, "step": 38465 }, { "epoch": 0.33, "learning_rate": 7.57613199700967e-05, "loss": 2.2813, "step": 38470 }, { "epoch": 0.33, "learning_rate": 7.575557072705841e-05, "loss": 2.3289, "step": 38475 }, { "epoch": 0.33, "learning_rate": 7.574982102046542e-05, "loss": 2.3791, "step": 38480 }, { "epoch": 0.33, "learning_rate": 7.574407085042123e-05, "loss": 2.312, "step": 38485 }, { "epoch": 0.33, "learning_rate": 7.57383202170293e-05, "loss": 2.3482, "step": 38490 }, { "epoch": 0.33, "learning_rate": 7.573256912039315e-05, "loss": 2.3355, "step": 38495 }, { "epoch": 0.33, "learning_rate": 7.572681756061628e-05, "loss": 2.2466, "step": 38500 }, { "epoch": 0.33, "learning_rate": 7.572106553780221e-05, "loss": 2.4176, "step": 38505 }, { "epoch": 0.33, "learning_rate": 7.571531305205446e-05, "loss": 2.2566, "step": 38510 }, { "epoch": 0.33, "learning_rate": 7.570956010347658e-05, "loss": 2.3458, "step": 38515 }, { "epoch": 0.33, "learning_rate": 7.570380669217212e-05, "loss": 2.287, "step": 38520 }, { "epoch": 0.33, "learning_rate": 7.569805281824459e-05, "loss": 2.3076, "step": 38525 }, { "epoch": 0.33, "learning_rate": 7.56922984817976e-05, "loss": 2.2274, "step": 38530 }, { "epoch": 0.33, "learning_rate": 7.568654368293468e-05, "loss": 2.3232, "step": 38535 }, { "epoch": 0.33, "learning_rate": 7.568078842175943e-05, "loss": 2.2449, "step": 38540 }, { "epoch": 0.33, "learning_rate": 7.567503269837543e-05, "loss": 2.3382, "step": 38545 }, { "epoch": 0.33, "learning_rate": 7.566927651288625e-05, "loss": 2.3618, "step": 38550 }, { "epoch": 0.33, "learning_rate": 7.566351986539552e-05, "loss": 2.3145, "step": 38555 }, { "epoch": 0.33, "learning_rate": 7.565776275600684e-05, "loss": 2.3386, "step": 38560 }, { "epoch": 0.33, "learning_rate": 7.565200518482383e-05, "loss": 2.3516, "step": 38565 }, { "epoch": 0.33, "learning_rate": 7.56462471519501e-05, "loss": 2.2712, "step": 38570 }, { "epoch": 0.33, "learning_rate": 7.564048865748931e-05, "loss": 2.2696, "step": 38575 }, { "epoch": 0.33, "learning_rate": 7.563472970154508e-05, "loss": 2.3075, "step": 38580 }, { "epoch": 0.33, "learning_rate": 7.562897028422107e-05, "loss": 2.2436, "step": 38585 }, { "epoch": 0.33, "learning_rate": 7.562321040562095e-05, "loss": 2.3573, "step": 38590 }, { "epoch": 0.33, "learning_rate": 7.561745006584838e-05, "loss": 2.3107, "step": 38595 }, { "epoch": 0.33, "learning_rate": 7.561168926500701e-05, "loss": 2.2309, "step": 38600 }, { "epoch": 0.33, "learning_rate": 7.560592800320058e-05, "loss": 2.3284, "step": 38605 }, { "epoch": 0.33, "learning_rate": 7.560016628053274e-05, "loss": 2.293, "step": 38610 }, { "epoch": 0.33, "learning_rate": 7.559440409710718e-05, "loss": 2.3687, "step": 38615 }, { "epoch": 0.33, "learning_rate": 7.558864145302767e-05, "loss": 2.3277, "step": 38620 }, { "epoch": 0.33, "learning_rate": 7.558287834839786e-05, "loss": 2.3166, "step": 38625 }, { "epoch": 0.33, "learning_rate": 7.55771147833215e-05, "loss": 2.2552, "step": 38630 }, { "epoch": 0.33, "learning_rate": 7.557135075790232e-05, "loss": 2.3282, "step": 38635 }, { "epoch": 0.33, "learning_rate": 7.556558627224409e-05, "loss": 2.3704, "step": 38640 }, { "epoch": 0.33, "learning_rate": 7.555982132645054e-05, "loss": 2.2531, "step": 38645 }, { "epoch": 0.33, "learning_rate": 7.55540559206254e-05, "loss": 2.3392, "step": 38650 }, { "epoch": 0.33, "learning_rate": 7.554829005487251e-05, "loss": 2.3283, "step": 38655 }, { "epoch": 0.33, "learning_rate": 7.554252372929558e-05, "loss": 2.3224, "step": 38660 }, { "epoch": 0.33, "learning_rate": 7.553675694399842e-05, "loss": 2.2667, "step": 38665 }, { "epoch": 0.33, "learning_rate": 7.553098969908481e-05, "loss": 2.3591, "step": 38670 }, { "epoch": 0.33, "learning_rate": 7.552522199465857e-05, "loss": 2.2637, "step": 38675 }, { "epoch": 0.33, "learning_rate": 7.551945383082346e-05, "loss": 2.3291, "step": 38680 }, { "epoch": 0.33, "learning_rate": 7.551368520768337e-05, "loss": 2.3267, "step": 38685 }, { "epoch": 0.33, "learning_rate": 7.550791612534207e-05, "loss": 2.3825, "step": 38690 }, { "epoch": 0.33, "learning_rate": 7.550214658390342e-05, "loss": 2.2666, "step": 38695 }, { "epoch": 0.33, "learning_rate": 7.549637658347124e-05, "loss": 2.3892, "step": 38700 }, { "epoch": 0.33, "learning_rate": 7.54906061241494e-05, "loss": 2.3528, "step": 38705 }, { "epoch": 0.33, "learning_rate": 7.548483520604175e-05, "loss": 2.3023, "step": 38710 }, { "epoch": 0.33, "learning_rate": 7.547906382925216e-05, "loss": 2.3144, "step": 38715 }, { "epoch": 0.33, "learning_rate": 7.547329199388452e-05, "loss": 2.3288, "step": 38720 }, { "epoch": 0.33, "learning_rate": 7.546751970004266e-05, "loss": 2.2757, "step": 38725 }, { "epoch": 0.33, "learning_rate": 7.546174694783051e-05, "loss": 2.3041, "step": 38730 }, { "epoch": 0.33, "learning_rate": 7.545597373735197e-05, "loss": 2.3584, "step": 38735 }, { "epoch": 0.33, "learning_rate": 7.545020006871095e-05, "loss": 2.2665, "step": 38740 }, { "epoch": 0.33, "learning_rate": 7.544442594201134e-05, "loss": 2.2936, "step": 38745 }, { "epoch": 0.33, "learning_rate": 7.54386513573571e-05, "loss": 2.2809, "step": 38750 }, { "epoch": 0.33, "learning_rate": 7.543287631485214e-05, "loss": 2.3026, "step": 38755 }, { "epoch": 0.33, "learning_rate": 7.542710081460038e-05, "loss": 2.3505, "step": 38760 }, { "epoch": 0.33, "learning_rate": 7.542132485670583e-05, "loss": 2.3111, "step": 38765 }, { "epoch": 0.33, "learning_rate": 7.541554844127239e-05, "loss": 2.2914, "step": 38770 }, { "epoch": 0.33, "learning_rate": 7.540977156840405e-05, "loss": 2.3519, "step": 38775 }, { "epoch": 0.33, "learning_rate": 7.540399423820478e-05, "loss": 2.3546, "step": 38780 }, { "epoch": 0.33, "learning_rate": 7.539821645077856e-05, "loss": 2.3232, "step": 38785 }, { "epoch": 0.33, "learning_rate": 7.539243820622939e-05, "loss": 2.2939, "step": 38790 }, { "epoch": 0.33, "learning_rate": 7.538665950466124e-05, "loss": 2.2627, "step": 38795 }, { "epoch": 0.33, "learning_rate": 7.538088034617814e-05, "loss": 2.286, "step": 38800 }, { "epoch": 0.33, "learning_rate": 7.537510073088411e-05, "loss": 2.329, "step": 38805 }, { "epoch": 0.33, "learning_rate": 7.536932065888316e-05, "loss": 2.3531, "step": 38810 }, { "epoch": 0.33, "learning_rate": 7.536354013027932e-05, "loss": 2.3895, "step": 38815 }, { "epoch": 0.33, "learning_rate": 7.535775914517664e-05, "loss": 2.3705, "step": 38820 }, { "epoch": 0.33, "learning_rate": 7.535197770367914e-05, "loss": 2.3282, "step": 38825 }, { "epoch": 0.33, "learning_rate": 7.534619580589093e-05, "loss": 2.3339, "step": 38830 }, { "epoch": 0.33, "learning_rate": 7.534041345191601e-05, "loss": 2.3911, "step": 38835 }, { "epoch": 0.33, "learning_rate": 7.533463064185848e-05, "loss": 2.3132, "step": 38840 }, { "epoch": 0.33, "learning_rate": 7.532884737582245e-05, "loss": 2.3767, "step": 38845 }, { "epoch": 0.33, "learning_rate": 7.532306365391197e-05, "loss": 2.3327, "step": 38850 }, { "epoch": 0.33, "learning_rate": 7.531727947623115e-05, "loss": 2.2577, "step": 38855 }, { "epoch": 0.33, "learning_rate": 7.531149484288409e-05, "loss": 2.2963, "step": 38860 }, { "epoch": 0.33, "learning_rate": 7.530570975397491e-05, "loss": 2.2889, "step": 38865 }, { "epoch": 0.33, "learning_rate": 7.529992420960771e-05, "loss": 2.3173, "step": 38870 }, { "epoch": 0.33, "learning_rate": 7.529413820988667e-05, "loss": 2.3684, "step": 38875 }, { "epoch": 0.33, "learning_rate": 7.528835175491586e-05, "loss": 2.2475, "step": 38880 }, { "epoch": 0.33, "learning_rate": 7.528256484479948e-05, "loss": 2.3482, "step": 38885 }, { "epoch": 0.33, "learning_rate": 7.527677747964166e-05, "loss": 2.3307, "step": 38890 }, { "epoch": 0.33, "learning_rate": 7.527098965954658e-05, "loss": 2.3364, "step": 38895 }, { "epoch": 0.33, "learning_rate": 7.526520138461839e-05, "loss": 2.3702, "step": 38900 }, { "epoch": 0.33, "learning_rate": 7.525941265496126e-05, "loss": 2.3484, "step": 38905 }, { "epoch": 0.33, "learning_rate": 7.525362347067941e-05, "loss": 2.3594, "step": 38910 }, { "epoch": 0.33, "learning_rate": 7.524783383187702e-05, "loss": 2.3149, "step": 38915 }, { "epoch": 0.33, "learning_rate": 7.524204373865828e-05, "loss": 2.362, "step": 38920 }, { "epoch": 0.33, "learning_rate": 7.523625319112744e-05, "loss": 2.3088, "step": 38925 }, { "epoch": 0.33, "learning_rate": 7.523046218938867e-05, "loss": 2.3559, "step": 38930 }, { "epoch": 0.33, "learning_rate": 7.522467073354622e-05, "loss": 2.3376, "step": 38935 }, { "epoch": 0.33, "learning_rate": 7.521887882370433e-05, "loss": 2.2644, "step": 38940 }, { "epoch": 0.33, "learning_rate": 7.521308645996724e-05, "loss": 2.3229, "step": 38945 }, { "epoch": 0.33, "learning_rate": 7.520729364243921e-05, "loss": 2.2936, "step": 38950 }, { "epoch": 0.33, "learning_rate": 7.520150037122449e-05, "loss": 2.3542, "step": 38955 }, { "epoch": 0.33, "learning_rate": 7.519570664642734e-05, "loss": 2.3278, "step": 38960 }, { "epoch": 0.33, "learning_rate": 7.518991246815206e-05, "loss": 2.2877, "step": 38965 }, { "epoch": 0.33, "learning_rate": 7.518411783650292e-05, "loss": 2.2537, "step": 38970 }, { "epoch": 0.33, "learning_rate": 7.517832275158422e-05, "loss": 2.323, "step": 38975 }, { "epoch": 0.33, "learning_rate": 7.517252721350028e-05, "loss": 2.3289, "step": 38980 }, { "epoch": 0.33, "learning_rate": 7.516673122235536e-05, "loss": 2.3468, "step": 38985 }, { "epoch": 0.33, "learning_rate": 7.51609347782538e-05, "loss": 2.2727, "step": 38990 }, { "epoch": 0.33, "learning_rate": 7.515513788129996e-05, "loss": 2.284, "step": 38995 }, { "epoch": 0.33, "learning_rate": 7.514934053159813e-05, "loss": 2.3311, "step": 39000 }, { "epoch": 0.33, "learning_rate": 7.514354272925266e-05, "loss": 2.365, "step": 39005 }, { "epoch": 0.33, "learning_rate": 7.51377444743679e-05, "loss": 2.3309, "step": 39010 }, { "epoch": 0.33, "learning_rate": 7.513194576704822e-05, "loss": 2.3439, "step": 39015 }, { "epoch": 0.33, "learning_rate": 7.5126146607398e-05, "loss": 2.2854, "step": 39020 }, { "epoch": 0.33, "learning_rate": 7.512034699552159e-05, "loss": 2.3283, "step": 39025 }, { "epoch": 0.33, "learning_rate": 7.511454693152337e-05, "loss": 2.3723, "step": 39030 }, { "epoch": 0.33, "learning_rate": 7.510874641550776e-05, "loss": 2.2993, "step": 39035 }, { "epoch": 0.33, "learning_rate": 7.510294544757913e-05, "loss": 2.3657, "step": 39040 }, { "epoch": 0.33, "learning_rate": 7.509714402784187e-05, "loss": 2.3662, "step": 39045 }, { "epoch": 0.33, "learning_rate": 7.509134215640045e-05, "loss": 2.2766, "step": 39050 }, { "epoch": 0.33, "learning_rate": 7.508553983335927e-05, "loss": 2.3223, "step": 39055 }, { "epoch": 0.33, "learning_rate": 7.507973705882274e-05, "loss": 2.3202, "step": 39060 }, { "epoch": 0.33, "learning_rate": 7.507393383289532e-05, "loss": 2.3122, "step": 39065 }, { "epoch": 0.33, "learning_rate": 7.506813015568146e-05, "loss": 2.3646, "step": 39070 }, { "epoch": 0.33, "learning_rate": 7.506232602728561e-05, "loss": 2.3794, "step": 39075 }, { "epoch": 0.33, "learning_rate": 7.505652144781221e-05, "loss": 2.3492, "step": 39080 }, { "epoch": 0.33, "learning_rate": 7.505071641736579e-05, "loss": 2.3064, "step": 39085 }, { "epoch": 0.33, "learning_rate": 7.504491093605077e-05, "loss": 2.2709, "step": 39090 }, { "epoch": 0.33, "learning_rate": 7.503910500397169e-05, "loss": 2.2505, "step": 39095 }, { "epoch": 0.33, "learning_rate": 7.5033298621233e-05, "loss": 2.4101, "step": 39100 }, { "epoch": 0.33, "learning_rate": 7.502749178793924e-05, "loss": 2.2932, "step": 39105 }, { "epoch": 0.33, "learning_rate": 7.502168450419492e-05, "loss": 2.2855, "step": 39110 }, { "epoch": 0.33, "learning_rate": 7.501587677010452e-05, "loss": 2.3206, "step": 39115 }, { "epoch": 0.33, "learning_rate": 7.501006858577262e-05, "loss": 2.3091, "step": 39120 }, { "epoch": 0.33, "learning_rate": 7.500425995130373e-05, "loss": 2.3591, "step": 39125 }, { "epoch": 0.33, "learning_rate": 7.499845086680238e-05, "loss": 2.2975, "step": 39130 }, { "epoch": 0.33, "learning_rate": 7.499264133237317e-05, "loss": 2.3989, "step": 39135 }, { "epoch": 0.33, "learning_rate": 7.498683134812064e-05, "loss": 2.3244, "step": 39140 }, { "epoch": 0.33, "learning_rate": 7.498102091414931e-05, "loss": 2.3454, "step": 39145 }, { "epoch": 0.33, "learning_rate": 7.497521003056384e-05, "loss": 2.2584, "step": 39150 }, { "epoch": 0.33, "learning_rate": 7.496939869746879e-05, "loss": 2.3064, "step": 39155 }, { "epoch": 0.33, "learning_rate": 7.496358691496871e-05, "loss": 2.3116, "step": 39160 }, { "epoch": 0.33, "learning_rate": 7.495777468316826e-05, "loss": 2.2937, "step": 39165 }, { "epoch": 0.33, "learning_rate": 7.495196200217201e-05, "loss": 2.2647, "step": 39170 }, { "epoch": 0.33, "learning_rate": 7.494614887208459e-05, "loss": 2.3031, "step": 39175 }, { "epoch": 0.33, "learning_rate": 7.494033529301064e-05, "loss": 2.3515, "step": 39180 }, { "epoch": 0.33, "learning_rate": 7.493452126505477e-05, "loss": 2.3229, "step": 39185 }, { "epoch": 0.33, "learning_rate": 7.492870678832162e-05, "loss": 2.3358, "step": 39190 }, { "epoch": 0.33, "learning_rate": 7.492289186291586e-05, "loss": 2.3819, "step": 39195 }, { "epoch": 0.33, "learning_rate": 7.491707648894216e-05, "loss": 2.3263, "step": 39200 }, { "epoch": 0.33, "learning_rate": 7.491126066650517e-05, "loss": 2.4043, "step": 39205 }, { "epoch": 0.33, "learning_rate": 7.490544439570955e-05, "loss": 2.2367, "step": 39210 }, { "epoch": 0.33, "learning_rate": 7.489962767666e-05, "loss": 2.2655, "step": 39215 }, { "epoch": 0.33, "learning_rate": 7.48938105094612e-05, "loss": 2.2735, "step": 39220 }, { "epoch": 0.33, "learning_rate": 7.488799289421786e-05, "loss": 2.3982, "step": 39225 }, { "epoch": 0.33, "learning_rate": 7.488217483103469e-05, "loss": 2.2757, "step": 39230 }, { "epoch": 0.33, "learning_rate": 7.48763563200164e-05, "loss": 2.3229, "step": 39235 }, { "epoch": 0.33, "learning_rate": 7.487053736126769e-05, "loss": 2.3319, "step": 39240 }, { "epoch": 0.33, "learning_rate": 7.486471795489331e-05, "loss": 2.2886, "step": 39245 }, { "epoch": 0.33, "learning_rate": 7.485889810099802e-05, "loss": 2.3172, "step": 39250 }, { "epoch": 0.33, "learning_rate": 7.485307779968653e-05, "loss": 2.2467, "step": 39255 }, { "epoch": 0.34, "learning_rate": 7.484725705106362e-05, "loss": 2.3159, "step": 39260 }, { "epoch": 0.34, "learning_rate": 7.484143585523405e-05, "loss": 2.2861, "step": 39265 }, { "epoch": 0.34, "learning_rate": 7.483561421230257e-05, "loss": 2.3591, "step": 39270 }, { "epoch": 0.34, "learning_rate": 7.4829792122374e-05, "loss": 2.3043, "step": 39275 }, { "epoch": 0.34, "learning_rate": 7.482396958555309e-05, "loss": 2.2905, "step": 39280 }, { "epoch": 0.34, "learning_rate": 7.481814660194464e-05, "loss": 2.2975, "step": 39285 }, { "epoch": 0.34, "learning_rate": 7.481232317165347e-05, "loss": 2.2725, "step": 39290 }, { "epoch": 0.34, "learning_rate": 7.480649929478438e-05, "loss": 2.3685, "step": 39295 }, { "epoch": 0.34, "learning_rate": 7.48006749714422e-05, "loss": 2.3487, "step": 39300 }, { "epoch": 0.34, "learning_rate": 7.479485020173173e-05, "loss": 2.327, "step": 39305 }, { "epoch": 0.34, "learning_rate": 7.478902498575787e-05, "loss": 2.3142, "step": 39310 }, { "epoch": 0.34, "learning_rate": 7.478319932362539e-05, "loss": 2.2743, "step": 39315 }, { "epoch": 0.34, "learning_rate": 7.477737321543916e-05, "loss": 2.2944, "step": 39320 }, { "epoch": 0.34, "learning_rate": 7.477154666130405e-05, "loss": 2.3554, "step": 39325 }, { "epoch": 0.34, "learning_rate": 7.476571966132495e-05, "loss": 2.2908, "step": 39330 }, { "epoch": 0.34, "learning_rate": 7.475989221560671e-05, "loss": 2.3711, "step": 39335 }, { "epoch": 0.34, "learning_rate": 7.475406432425421e-05, "loss": 2.2223, "step": 39340 }, { "epoch": 0.34, "learning_rate": 7.474823598737235e-05, "loss": 2.298, "step": 39345 }, { "epoch": 0.34, "learning_rate": 7.474240720506602e-05, "loss": 2.3469, "step": 39350 }, { "epoch": 0.34, "learning_rate": 7.473657797744014e-05, "loss": 2.261, "step": 39355 }, { "epoch": 0.34, "learning_rate": 7.473074830459964e-05, "loss": 2.305, "step": 39360 }, { "epoch": 0.34, "learning_rate": 7.472491818664943e-05, "loss": 2.2827, "step": 39365 }, { "epoch": 0.34, "learning_rate": 7.471908762369442e-05, "loss": 2.3482, "step": 39370 }, { "epoch": 0.34, "learning_rate": 7.471325661583957e-05, "loss": 2.2977, "step": 39375 }, { "epoch": 0.34, "learning_rate": 7.470742516318983e-05, "loss": 2.2596, "step": 39380 }, { "epoch": 0.34, "learning_rate": 7.470159326585014e-05, "loss": 2.4306, "step": 39385 }, { "epoch": 0.34, "learning_rate": 7.46957609239255e-05, "loss": 2.3544, "step": 39390 }, { "epoch": 0.34, "learning_rate": 7.468992813752085e-05, "loss": 2.3574, "step": 39395 }, { "epoch": 0.34, "learning_rate": 7.468409490674115e-05, "loss": 2.2585, "step": 39400 }, { "epoch": 0.34, "learning_rate": 7.467826123169144e-05, "loss": 2.2561, "step": 39405 }, { "epoch": 0.34, "learning_rate": 7.467242711247669e-05, "loss": 2.3708, "step": 39410 }, { "epoch": 0.34, "learning_rate": 7.466659254920189e-05, "loss": 2.306, "step": 39415 }, { "epoch": 0.34, "learning_rate": 7.466075754197208e-05, "loss": 2.3817, "step": 39420 }, { "epoch": 0.34, "learning_rate": 7.465492209089228e-05, "loss": 2.3062, "step": 39425 }, { "epoch": 0.34, "learning_rate": 7.464908619606748e-05, "loss": 2.2783, "step": 39430 }, { "epoch": 0.34, "learning_rate": 7.464324985760274e-05, "loss": 2.2693, "step": 39435 }, { "epoch": 0.34, "learning_rate": 7.463741307560313e-05, "loss": 2.2425, "step": 39440 }, { "epoch": 0.34, "learning_rate": 7.463157585017364e-05, "loss": 2.3812, "step": 39445 }, { "epoch": 0.34, "learning_rate": 7.462573818141938e-05, "loss": 2.2307, "step": 39450 }, { "epoch": 0.34, "learning_rate": 7.461990006944542e-05, "loss": 2.3509, "step": 39455 }, { "epoch": 0.34, "learning_rate": 7.46140615143568e-05, "loss": 2.298, "step": 39460 }, { "epoch": 0.34, "learning_rate": 7.460822251625862e-05, "loss": 2.361, "step": 39465 }, { "epoch": 0.34, "learning_rate": 7.460238307525598e-05, "loss": 2.2511, "step": 39470 }, { "epoch": 0.34, "learning_rate": 7.459654319145398e-05, "loss": 2.3172, "step": 39475 }, { "epoch": 0.34, "learning_rate": 7.459070286495771e-05, "loss": 2.3101, "step": 39480 }, { "epoch": 0.34, "learning_rate": 7.45848620958723e-05, "loss": 2.3692, "step": 39485 }, { "epoch": 0.34, "learning_rate": 7.457902088430289e-05, "loss": 2.3311, "step": 39490 }, { "epoch": 0.34, "learning_rate": 7.457317923035456e-05, "loss": 2.2723, "step": 39495 }, { "epoch": 0.34, "learning_rate": 7.45673371341325e-05, "loss": 2.4034, "step": 39500 }, { "epoch": 0.34, "learning_rate": 7.456149459574182e-05, "loss": 2.2344, "step": 39505 }, { "epoch": 0.34, "learning_rate": 7.455565161528771e-05, "loss": 2.228, "step": 39510 }, { "epoch": 0.34, "learning_rate": 7.454980819287532e-05, "loss": 2.3505, "step": 39515 }, { "epoch": 0.34, "learning_rate": 7.454396432860981e-05, "loss": 2.3374, "step": 39520 }, { "epoch": 0.34, "learning_rate": 7.453812002259636e-05, "loss": 2.3433, "step": 39525 }, { "epoch": 0.34, "learning_rate": 7.453227527494018e-05, "loss": 2.2795, "step": 39530 }, { "epoch": 0.34, "learning_rate": 7.452643008574645e-05, "loss": 2.3582, "step": 39535 }, { "epoch": 0.34, "learning_rate": 7.452058445512035e-05, "loss": 2.3756, "step": 39540 }, { "epoch": 0.34, "learning_rate": 7.451473838316713e-05, "loss": 2.2958, "step": 39545 }, { "epoch": 0.34, "learning_rate": 7.4508891869992e-05, "loss": 2.2824, "step": 39550 }, { "epoch": 0.34, "learning_rate": 7.450304491570018e-05, "loss": 2.4007, "step": 39555 }, { "epoch": 0.34, "learning_rate": 7.449719752039688e-05, "loss": 2.3769, "step": 39560 }, { "epoch": 0.34, "learning_rate": 7.44913496841874e-05, "loss": 2.2566, "step": 39565 }, { "epoch": 0.34, "learning_rate": 7.448550140717694e-05, "loss": 2.2306, "step": 39570 }, { "epoch": 0.34, "learning_rate": 7.447965268947076e-05, "loss": 2.3632, "step": 39575 }, { "epoch": 0.34, "learning_rate": 7.447380353117418e-05, "loss": 2.336, "step": 39580 }, { "epoch": 0.34, "learning_rate": 7.446795393239242e-05, "loss": 2.2689, "step": 39585 }, { "epoch": 0.34, "learning_rate": 7.446210389323079e-05, "loss": 2.2816, "step": 39590 }, { "epoch": 0.34, "learning_rate": 7.445625341379455e-05, "loss": 2.3027, "step": 39595 }, { "epoch": 0.34, "learning_rate": 7.445040249418904e-05, "loss": 2.3293, "step": 39600 }, { "epoch": 0.34, "learning_rate": 7.444455113451953e-05, "loss": 2.3596, "step": 39605 }, { "epoch": 0.34, "learning_rate": 7.443869933489136e-05, "loss": 2.3432, "step": 39610 }, { "epoch": 0.34, "learning_rate": 7.443284709540983e-05, "loss": 2.3889, "step": 39615 }, { "epoch": 0.34, "learning_rate": 7.442699441618028e-05, "loss": 2.2584, "step": 39620 }, { "epoch": 0.34, "learning_rate": 7.442114129730807e-05, "loss": 2.3257, "step": 39625 }, { "epoch": 0.34, "learning_rate": 7.44152877388985e-05, "loss": 2.3003, "step": 39630 }, { "epoch": 0.34, "learning_rate": 7.440943374105697e-05, "loss": 2.3491, "step": 39635 }, { "epoch": 0.34, "learning_rate": 7.44035793038888e-05, "loss": 2.292, "step": 39640 }, { "epoch": 0.34, "learning_rate": 7.439772442749939e-05, "loss": 2.3541, "step": 39645 }, { "epoch": 0.34, "learning_rate": 7.439186911199411e-05, "loss": 2.4239, "step": 39650 }, { "epoch": 0.34, "learning_rate": 7.438601335747833e-05, "loss": 2.3806, "step": 39655 }, { "epoch": 0.34, "learning_rate": 7.438015716405746e-05, "loss": 2.2674, "step": 39660 }, { "epoch": 0.34, "learning_rate": 7.43743005318369e-05, "loss": 2.2817, "step": 39665 }, { "epoch": 0.34, "learning_rate": 7.436844346092207e-05, "loss": 2.2794, "step": 39670 }, { "epoch": 0.34, "learning_rate": 7.436258595141834e-05, "loss": 2.3079, "step": 39675 }, { "epoch": 0.34, "learning_rate": 7.43567280034312e-05, "loss": 2.2919, "step": 39680 }, { "epoch": 0.34, "learning_rate": 7.435086961706604e-05, "loss": 2.3177, "step": 39685 }, { "epoch": 0.34, "learning_rate": 7.434501079242829e-05, "loss": 2.3356, "step": 39690 }, { "epoch": 0.34, "learning_rate": 7.433915152962345e-05, "loss": 2.3282, "step": 39695 }, { "epoch": 0.34, "learning_rate": 7.433329182875693e-05, "loss": 2.2818, "step": 39700 }, { "epoch": 0.34, "learning_rate": 7.432743168993421e-05, "loss": 2.3462, "step": 39705 }, { "epoch": 0.34, "learning_rate": 7.432157111326076e-05, "loss": 2.3267, "step": 39710 }, { "epoch": 0.34, "learning_rate": 7.431571009884207e-05, "loss": 2.2944, "step": 39715 }, { "epoch": 0.34, "learning_rate": 7.430984864678361e-05, "loss": 2.3185, "step": 39720 }, { "epoch": 0.34, "learning_rate": 7.430398675719089e-05, "loss": 2.3623, "step": 39725 }, { "epoch": 0.34, "learning_rate": 7.429812443016941e-05, "loss": 2.3302, "step": 39730 }, { "epoch": 0.34, "learning_rate": 7.429226166582468e-05, "loss": 2.3526, "step": 39735 }, { "epoch": 0.34, "learning_rate": 7.428639846426222e-05, "loss": 2.2903, "step": 39740 }, { "epoch": 0.34, "learning_rate": 7.428053482558757e-05, "loss": 2.3045, "step": 39745 }, { "epoch": 0.34, "learning_rate": 7.427467074990623e-05, "loss": 2.3879, "step": 39750 }, { "epoch": 0.34, "learning_rate": 7.426880623732378e-05, "loss": 2.3114, "step": 39755 }, { "epoch": 0.34, "learning_rate": 7.426294128794576e-05, "loss": 2.3613, "step": 39760 }, { "epoch": 0.34, "learning_rate": 7.425707590187771e-05, "loss": 2.2646, "step": 39765 }, { "epoch": 0.34, "learning_rate": 7.425121007922522e-05, "loss": 2.3631, "step": 39770 }, { "epoch": 0.34, "learning_rate": 7.424534382009385e-05, "loss": 2.3186, "step": 39775 }, { "epoch": 0.34, "learning_rate": 7.42394771245892e-05, "loss": 2.3691, "step": 39780 }, { "epoch": 0.34, "learning_rate": 7.423360999281683e-05, "loss": 2.3156, "step": 39785 }, { "epoch": 0.34, "learning_rate": 7.422774242488239e-05, "loss": 2.35, "step": 39790 }, { "epoch": 0.34, "learning_rate": 7.422187442089143e-05, "loss": 2.3485, "step": 39795 }, { "epoch": 0.34, "learning_rate": 7.421600598094958e-05, "loss": 2.3527, "step": 39800 }, { "epoch": 0.34, "learning_rate": 7.421013710516248e-05, "loss": 2.3932, "step": 39805 }, { "epoch": 0.34, "learning_rate": 7.420426779363575e-05, "loss": 2.397, "step": 39810 }, { "epoch": 0.34, "learning_rate": 7.419839804647501e-05, "loss": 2.2996, "step": 39815 }, { "epoch": 0.34, "learning_rate": 7.419252786378591e-05, "loss": 2.2987, "step": 39820 }, { "epoch": 0.34, "learning_rate": 7.418665724567413e-05, "loss": 2.2725, "step": 39825 }, { "epoch": 0.34, "learning_rate": 7.418078619224532e-05, "loss": 2.3916, "step": 39830 }, { "epoch": 0.34, "learning_rate": 7.417491470360512e-05, "loss": 2.3246, "step": 39835 }, { "epoch": 0.34, "learning_rate": 7.416904277985925e-05, "loss": 2.3737, "step": 39840 }, { "epoch": 0.34, "learning_rate": 7.416317042111335e-05, "loss": 2.237, "step": 39845 }, { "epoch": 0.34, "learning_rate": 7.415729762747315e-05, "loss": 2.396, "step": 39850 }, { "epoch": 0.34, "learning_rate": 7.415142439904434e-05, "loss": 2.3048, "step": 39855 }, { "epoch": 0.34, "learning_rate": 7.41455507359326e-05, "loss": 2.3068, "step": 39860 }, { "epoch": 0.34, "learning_rate": 7.413967663824367e-05, "loss": 2.3242, "step": 39865 }, { "epoch": 0.34, "learning_rate": 7.41338021060833e-05, "loss": 2.3367, "step": 39870 }, { "epoch": 0.34, "learning_rate": 7.412792713955716e-05, "loss": 2.3116, "step": 39875 }, { "epoch": 0.34, "learning_rate": 7.412205173877103e-05, "loss": 2.325, "step": 39880 }, { "epoch": 0.34, "learning_rate": 7.411617590383065e-05, "loss": 2.3894, "step": 39885 }, { "epoch": 0.34, "learning_rate": 7.411029963484178e-05, "loss": 2.3085, "step": 39890 }, { "epoch": 0.34, "learning_rate": 7.410442293191015e-05, "loss": 2.3172, "step": 39895 }, { "epoch": 0.34, "learning_rate": 7.409854579514158e-05, "loss": 2.3016, "step": 39900 }, { "epoch": 0.34, "learning_rate": 7.409266822464182e-05, "loss": 2.3896, "step": 39905 }, { "epoch": 0.34, "learning_rate": 7.408679022051666e-05, "loss": 2.3697, "step": 39910 }, { "epoch": 0.34, "learning_rate": 7.408091178287187e-05, "loss": 2.2952, "step": 39915 }, { "epoch": 0.34, "learning_rate": 7.40750329118133e-05, "loss": 2.2512, "step": 39920 }, { "epoch": 0.34, "learning_rate": 7.406915360744673e-05, "loss": 2.2972, "step": 39925 }, { "epoch": 0.34, "learning_rate": 7.406327386987797e-05, "loss": 2.3958, "step": 39930 }, { "epoch": 0.34, "learning_rate": 7.405739369921286e-05, "loss": 2.3161, "step": 39935 }, { "epoch": 0.34, "learning_rate": 7.405151309555724e-05, "loss": 2.3366, "step": 39940 }, { "epoch": 0.34, "learning_rate": 7.404563205901691e-05, "loss": 2.2833, "step": 39945 }, { "epoch": 0.34, "learning_rate": 7.403975058969776e-05, "loss": 2.4115, "step": 39950 }, { "epoch": 0.34, "learning_rate": 7.403386868770566e-05, "loss": 2.3552, "step": 39955 }, { "epoch": 0.34, "learning_rate": 7.40279863531464e-05, "loss": 2.3513, "step": 39960 }, { "epoch": 0.34, "learning_rate": 7.402210358612591e-05, "loss": 2.2887, "step": 39965 }, { "epoch": 0.34, "learning_rate": 7.401622038675007e-05, "loss": 2.3747, "step": 39970 }, { "epoch": 0.34, "learning_rate": 7.401033675512477e-05, "loss": 2.3123, "step": 39975 }, { "epoch": 0.34, "learning_rate": 7.400445269135587e-05, "loss": 2.351, "step": 39980 }, { "epoch": 0.34, "learning_rate": 7.399856819554929e-05, "loss": 2.3913, "step": 39985 }, { "epoch": 0.34, "learning_rate": 7.399268326781096e-05, "loss": 2.3532, "step": 39990 }, { "epoch": 0.34, "learning_rate": 7.398679790824676e-05, "loss": 2.2863, "step": 39995 }, { "epoch": 0.34, "learning_rate": 7.398091211696265e-05, "loss": 2.3508, "step": 40000 }, { "epoch": 0.34, "learning_rate": 7.397502589406456e-05, "loss": 2.3226, "step": 40005 }, { "epoch": 0.34, "learning_rate": 7.39691392396584e-05, "loss": 2.3568, "step": 40010 }, { "epoch": 0.34, "learning_rate": 7.396325215385014e-05, "loss": 2.4091, "step": 40015 }, { "epoch": 0.34, "learning_rate": 7.395736463674576e-05, "loss": 2.2863, "step": 40020 }, { "epoch": 0.34, "learning_rate": 7.395147668845119e-05, "loss": 2.3782, "step": 40025 }, { "epoch": 0.34, "learning_rate": 7.394558830907242e-05, "loss": 2.2855, "step": 40030 }, { "epoch": 0.34, "learning_rate": 7.393969949871545e-05, "loss": 2.3141, "step": 40035 }, { "epoch": 0.34, "learning_rate": 7.393381025748621e-05, "loss": 2.2821, "step": 40040 }, { "epoch": 0.34, "learning_rate": 7.392792058549074e-05, "loss": 2.3109, "step": 40045 }, { "epoch": 0.34, "learning_rate": 7.392203048283506e-05, "loss": 2.3433, "step": 40050 }, { "epoch": 0.34, "learning_rate": 7.391613994962513e-05, "loss": 2.3609, "step": 40055 }, { "epoch": 0.34, "learning_rate": 7.391024898596702e-05, "loss": 2.3449, "step": 40060 }, { "epoch": 0.34, "learning_rate": 7.39043575919667e-05, "loss": 2.3082, "step": 40065 }, { "epoch": 0.34, "learning_rate": 7.389846576773025e-05, "loss": 2.3601, "step": 40070 }, { "epoch": 0.34, "learning_rate": 7.389257351336369e-05, "loss": 2.3883, "step": 40075 }, { "epoch": 0.34, "learning_rate": 7.38866808289731e-05, "loss": 2.3515, "step": 40080 }, { "epoch": 0.34, "learning_rate": 7.388078771466452e-05, "loss": 2.3482, "step": 40085 }, { "epoch": 0.34, "learning_rate": 7.3874894170544e-05, "loss": 2.2601, "step": 40090 }, { "epoch": 0.34, "learning_rate": 7.386900019671764e-05, "loss": 2.3013, "step": 40095 }, { "epoch": 0.34, "learning_rate": 7.386310579329149e-05, "loss": 2.3631, "step": 40100 }, { "epoch": 0.34, "learning_rate": 7.385721096037166e-05, "loss": 2.2916, "step": 40105 }, { "epoch": 0.34, "learning_rate": 7.385131569806424e-05, "loss": 2.2643, "step": 40110 }, { "epoch": 0.34, "learning_rate": 7.384542000647537e-05, "loss": 2.3182, "step": 40115 }, { "epoch": 0.34, "learning_rate": 7.383952388571108e-05, "loss": 2.2621, "step": 40120 }, { "epoch": 0.34, "learning_rate": 7.383362733587758e-05, "loss": 2.3264, "step": 40125 }, { "epoch": 0.34, "learning_rate": 7.382773035708092e-05, "loss": 2.2643, "step": 40130 }, { "epoch": 0.34, "learning_rate": 7.382183294942731e-05, "loss": 2.2377, "step": 40135 }, { "epoch": 0.34, "learning_rate": 7.381593511302283e-05, "loss": 2.3315, "step": 40140 }, { "epoch": 0.34, "learning_rate": 7.381003684797366e-05, "loss": 2.3886, "step": 40145 }, { "epoch": 0.34, "learning_rate": 7.380413815438596e-05, "loss": 2.2851, "step": 40150 }, { "epoch": 0.34, "learning_rate": 7.37982390323659e-05, "loss": 2.3179, "step": 40155 }, { "epoch": 0.34, "learning_rate": 7.379233948201962e-05, "loss": 2.3626, "step": 40160 }, { "epoch": 0.34, "learning_rate": 7.378643950345331e-05, "loss": 2.3563, "step": 40165 }, { "epoch": 0.34, "learning_rate": 7.37805390967732e-05, "loss": 2.38, "step": 40170 }, { "epoch": 0.34, "learning_rate": 7.377463826208547e-05, "loss": 2.2446, "step": 40175 }, { "epoch": 0.34, "learning_rate": 7.376873699949632e-05, "loss": 2.342, "step": 40180 }, { "epoch": 0.34, "learning_rate": 7.376283530911192e-05, "loss": 2.2015, "step": 40185 }, { "epoch": 0.34, "learning_rate": 7.375693319103855e-05, "loss": 2.3045, "step": 40190 }, { "epoch": 0.34, "learning_rate": 7.375103064538242e-05, "loss": 2.3531, "step": 40195 }, { "epoch": 0.34, "learning_rate": 7.374512767224976e-05, "loss": 2.3361, "step": 40200 }, { "epoch": 0.34, "learning_rate": 7.373922427174681e-05, "loss": 2.2564, "step": 40205 }, { "epoch": 0.34, "learning_rate": 7.373332044397983e-05, "loss": 2.3139, "step": 40210 }, { "epoch": 0.34, "learning_rate": 7.372741618905507e-05, "loss": 2.3728, "step": 40215 }, { "epoch": 0.34, "learning_rate": 7.37215115070788e-05, "loss": 2.2683, "step": 40220 }, { "epoch": 0.34, "learning_rate": 7.371560639815728e-05, "loss": 2.3529, "step": 40225 }, { "epoch": 0.34, "learning_rate": 7.370970086239683e-05, "loss": 2.3013, "step": 40230 }, { "epoch": 0.34, "learning_rate": 7.37037948999037e-05, "loss": 2.2872, "step": 40235 }, { "epoch": 0.34, "learning_rate": 7.369788851078419e-05, "loss": 2.2717, "step": 40240 }, { "epoch": 0.34, "learning_rate": 7.369198169514463e-05, "loss": 2.3328, "step": 40245 }, { "epoch": 0.34, "learning_rate": 7.36860744530913e-05, "loss": 2.3181, "step": 40250 }, { "epoch": 0.34, "learning_rate": 7.368016678473057e-05, "loss": 2.2415, "step": 40255 }, { "epoch": 0.34, "learning_rate": 7.36742586901687e-05, "loss": 2.3029, "step": 40260 }, { "epoch": 0.34, "learning_rate": 7.366835016951208e-05, "loss": 2.2832, "step": 40265 }, { "epoch": 0.34, "learning_rate": 7.366244122286703e-05, "loss": 2.3196, "step": 40270 }, { "epoch": 0.34, "learning_rate": 7.36565318503399e-05, "loss": 2.3777, "step": 40275 }, { "epoch": 0.34, "learning_rate": 7.365062205203705e-05, "loss": 2.3446, "step": 40280 }, { "epoch": 0.34, "learning_rate": 7.364471182806486e-05, "loss": 2.2648, "step": 40285 }, { "epoch": 0.34, "learning_rate": 7.363880117852968e-05, "loss": 2.3793, "step": 40290 }, { "epoch": 0.34, "learning_rate": 7.363289010353792e-05, "loss": 2.2702, "step": 40295 }, { "epoch": 0.34, "learning_rate": 7.362697860319593e-05, "loss": 2.3076, "step": 40300 }, { "epoch": 0.34, "learning_rate": 7.362106667761013e-05, "loss": 2.347, "step": 40305 }, { "epoch": 0.34, "learning_rate": 7.361515432688694e-05, "loss": 2.3113, "step": 40310 }, { "epoch": 0.34, "learning_rate": 7.360924155113274e-05, "loss": 2.2955, "step": 40315 }, { "epoch": 0.34, "learning_rate": 7.360332835045397e-05, "loss": 2.3129, "step": 40320 }, { "epoch": 0.34, "learning_rate": 7.359741472495705e-05, "loss": 2.3475, "step": 40325 }, { "epoch": 0.34, "learning_rate": 7.35915006747484e-05, "loss": 2.4418, "step": 40330 }, { "epoch": 0.34, "learning_rate": 7.35855861999345e-05, "loss": 2.3338, "step": 40335 }, { "epoch": 0.34, "learning_rate": 7.357967130062177e-05, "loss": 2.3387, "step": 40340 }, { "epoch": 0.34, "learning_rate": 7.357375597691667e-05, "loss": 2.4333, "step": 40345 }, { "epoch": 0.34, "learning_rate": 7.356784022892568e-05, "loss": 2.3015, "step": 40350 }, { "epoch": 0.34, "learning_rate": 7.356192405675528e-05, "loss": 2.3601, "step": 40355 }, { "epoch": 0.34, "learning_rate": 7.35560074605119e-05, "loss": 2.2993, "step": 40360 }, { "epoch": 0.34, "learning_rate": 7.355009044030208e-05, "loss": 2.3772, "step": 40365 }, { "epoch": 0.34, "learning_rate": 7.35441729962323e-05, "loss": 2.299, "step": 40370 }, { "epoch": 0.34, "learning_rate": 7.353825512840907e-05, "loss": 2.3285, "step": 40375 }, { "epoch": 0.34, "learning_rate": 7.353233683693888e-05, "loss": 2.3118, "step": 40380 }, { "epoch": 0.34, "learning_rate": 7.352641812192826e-05, "loss": 2.3932, "step": 40385 }, { "epoch": 0.34, "learning_rate": 7.352049898348376e-05, "loss": 2.3666, "step": 40390 }, { "epoch": 0.34, "learning_rate": 7.351457942171186e-05, "loss": 2.3441, "step": 40395 }, { "epoch": 0.34, "learning_rate": 7.350865943671918e-05, "loss": 2.329, "step": 40400 }, { "epoch": 0.34, "learning_rate": 7.35027390286122e-05, "loss": 2.3055, "step": 40405 }, { "epoch": 0.34, "learning_rate": 7.349681819749748e-05, "loss": 2.2412, "step": 40410 }, { "epoch": 0.34, "learning_rate": 7.349089694348163e-05, "loss": 2.4238, "step": 40415 }, { "epoch": 0.34, "learning_rate": 7.348497526667119e-05, "loss": 2.2486, "step": 40420 }, { "epoch": 0.34, "learning_rate": 7.347905316717274e-05, "loss": 2.3259, "step": 40425 }, { "epoch": 0.35, "learning_rate": 7.34731306450929e-05, "loss": 2.4032, "step": 40430 }, { "epoch": 0.35, "learning_rate": 7.346720770053823e-05, "loss": 2.3559, "step": 40435 }, { "epoch": 0.35, "learning_rate": 7.346128433361532e-05, "loss": 2.3623, "step": 40440 }, { "epoch": 0.35, "learning_rate": 7.345536054443081e-05, "loss": 2.3697, "step": 40445 }, { "epoch": 0.35, "learning_rate": 7.344943633309133e-05, "loss": 2.3436, "step": 40450 }, { "epoch": 0.35, "learning_rate": 7.344351169970346e-05, "loss": 2.3587, "step": 40455 }, { "epoch": 0.35, "learning_rate": 7.343758664437386e-05, "loss": 2.3711, "step": 40460 }, { "epoch": 0.35, "learning_rate": 7.343166116720919e-05, "loss": 2.2827, "step": 40465 }, { "epoch": 0.35, "learning_rate": 7.342573526831606e-05, "loss": 2.3074, "step": 40470 }, { "epoch": 0.35, "learning_rate": 7.341980894780114e-05, "loss": 2.3383, "step": 40475 }, { "epoch": 0.35, "learning_rate": 7.34138822057711e-05, "loss": 2.2203, "step": 40480 }, { "epoch": 0.35, "learning_rate": 7.340795504233261e-05, "loss": 2.2537, "step": 40485 }, { "epoch": 0.35, "learning_rate": 7.340202745759234e-05, "loss": 2.3092, "step": 40490 }, { "epoch": 0.35, "learning_rate": 7.339609945165698e-05, "loss": 2.3417, "step": 40495 }, { "epoch": 0.35, "learning_rate": 7.339017102463323e-05, "loss": 2.295, "step": 40500 }, { "epoch": 0.35, "learning_rate": 7.338424217662778e-05, "loss": 2.2574, "step": 40505 }, { "epoch": 0.35, "learning_rate": 7.337831290774735e-05, "loss": 2.3225, "step": 40510 }, { "epoch": 0.35, "learning_rate": 7.337238321809865e-05, "loss": 2.3121, "step": 40515 }, { "epoch": 0.35, "learning_rate": 7.33664531077884e-05, "loss": 2.2843, "step": 40520 }, { "epoch": 0.35, "learning_rate": 7.336052257692335e-05, "loss": 2.3736, "step": 40525 }, { "epoch": 0.35, "learning_rate": 7.33545916256102e-05, "loss": 2.3907, "step": 40530 }, { "epoch": 0.35, "learning_rate": 7.334866025395575e-05, "loss": 2.27, "step": 40535 }, { "epoch": 0.35, "learning_rate": 7.33427284620667e-05, "loss": 2.2661, "step": 40540 }, { "epoch": 0.35, "learning_rate": 7.333679625004985e-05, "loss": 2.3556, "step": 40545 }, { "epoch": 0.35, "learning_rate": 7.333086361801196e-05, "loss": 2.2139, "step": 40550 }, { "epoch": 0.35, "learning_rate": 7.33249305660598e-05, "loss": 2.369, "step": 40555 }, { "epoch": 0.35, "learning_rate": 7.331899709430016e-05, "loss": 2.3392, "step": 40560 }, { "epoch": 0.35, "learning_rate": 7.331306320283983e-05, "loss": 2.3532, "step": 40565 }, { "epoch": 0.35, "learning_rate": 7.33071288917856e-05, "loss": 2.3979, "step": 40570 }, { "epoch": 0.35, "learning_rate": 7.33011941612443e-05, "loss": 2.3299, "step": 40575 }, { "epoch": 0.35, "learning_rate": 7.329525901132272e-05, "loss": 2.3386, "step": 40580 }, { "epoch": 0.35, "learning_rate": 7.32893234421277e-05, "loss": 2.3456, "step": 40585 }, { "epoch": 0.35, "learning_rate": 7.328338745376607e-05, "loss": 2.2713, "step": 40590 }, { "epoch": 0.35, "learning_rate": 7.327745104634467e-05, "loss": 2.3366, "step": 40595 }, { "epoch": 0.35, "learning_rate": 7.327151421997031e-05, "loss": 2.2671, "step": 40600 }, { "epoch": 0.35, "learning_rate": 7.326557697474989e-05, "loss": 2.3622, "step": 40605 }, { "epoch": 0.35, "learning_rate": 7.325963931079024e-05, "loss": 2.3164, "step": 40610 }, { "epoch": 0.35, "learning_rate": 7.325370122819824e-05, "loss": 2.2919, "step": 40615 }, { "epoch": 0.35, "learning_rate": 7.324776272708075e-05, "loss": 2.3012, "step": 40620 }, { "epoch": 0.35, "learning_rate": 7.324182380754467e-05, "loss": 2.3889, "step": 40625 }, { "epoch": 0.35, "learning_rate": 7.323588446969686e-05, "loss": 2.3513, "step": 40630 }, { "epoch": 0.35, "learning_rate": 7.322994471364427e-05, "loss": 2.241, "step": 40635 }, { "epoch": 0.35, "learning_rate": 7.322400453949377e-05, "loss": 2.2978, "step": 40640 }, { "epoch": 0.35, "learning_rate": 7.321806394735227e-05, "loss": 2.2848, "step": 40645 }, { "epoch": 0.35, "learning_rate": 7.32121229373267e-05, "loss": 2.367, "step": 40650 }, { "epoch": 0.35, "learning_rate": 7.320618150952401e-05, "loss": 2.3449, "step": 40655 }, { "epoch": 0.35, "learning_rate": 7.32002396640511e-05, "loss": 2.2855, "step": 40660 }, { "epoch": 0.35, "learning_rate": 7.31942974010149e-05, "loss": 2.3197, "step": 40665 }, { "epoch": 0.35, "learning_rate": 7.31883547205224e-05, "loss": 2.3296, "step": 40670 }, { "epoch": 0.35, "learning_rate": 7.318241162268055e-05, "loss": 2.3505, "step": 40675 }, { "epoch": 0.35, "learning_rate": 7.31764681075963e-05, "loss": 2.357, "step": 40680 }, { "epoch": 0.35, "learning_rate": 7.317052417537663e-05, "loss": 2.2554, "step": 40685 }, { "epoch": 0.35, "learning_rate": 7.316457982612851e-05, "loss": 2.3094, "step": 40690 }, { "epoch": 0.35, "learning_rate": 7.315863505995895e-05, "loss": 2.3397, "step": 40695 }, { "epoch": 0.35, "learning_rate": 7.315268987697492e-05, "loss": 2.319, "step": 40700 }, { "epoch": 0.35, "learning_rate": 7.314674427728346e-05, "loss": 2.3024, "step": 40705 }, { "epoch": 0.35, "learning_rate": 7.314079826099155e-05, "loss": 2.3299, "step": 40710 }, { "epoch": 0.35, "learning_rate": 7.313485182820619e-05, "loss": 2.2997, "step": 40715 }, { "epoch": 0.35, "learning_rate": 7.312890497903447e-05, "loss": 2.327, "step": 40720 }, { "epoch": 0.35, "learning_rate": 7.312295771358335e-05, "loss": 2.3693, "step": 40725 }, { "epoch": 0.35, "learning_rate": 7.311701003195991e-05, "loss": 2.2136, "step": 40730 }, { "epoch": 0.35, "learning_rate": 7.311106193427119e-05, "loss": 2.3195, "step": 40735 }, { "epoch": 0.35, "learning_rate": 7.310511342062425e-05, "loss": 2.291, "step": 40740 }, { "epoch": 0.35, "learning_rate": 7.309916449112614e-05, "loss": 2.3678, "step": 40745 }, { "epoch": 0.35, "learning_rate": 7.309321514588394e-05, "loss": 2.2547, "step": 40750 }, { "epoch": 0.35, "learning_rate": 7.308726538500474e-05, "loss": 2.3252, "step": 40755 }, { "epoch": 0.35, "learning_rate": 7.30813152085956e-05, "loss": 2.3731, "step": 40760 }, { "epoch": 0.35, "learning_rate": 7.307536461676362e-05, "loss": 2.3015, "step": 40765 }, { "epoch": 0.35, "learning_rate": 7.306941360961592e-05, "loss": 2.3054, "step": 40770 }, { "epoch": 0.35, "learning_rate": 7.306346218725956e-05, "loss": 2.3341, "step": 40775 }, { "epoch": 0.35, "learning_rate": 7.305751034980173e-05, "loss": 2.316, "step": 40780 }, { "epoch": 0.35, "learning_rate": 7.305155809734946e-05, "loss": 2.3382, "step": 40785 }, { "epoch": 0.35, "learning_rate": 7.304560543000997e-05, "loss": 2.3818, "step": 40790 }, { "epoch": 0.35, "learning_rate": 7.303965234789034e-05, "loss": 2.203, "step": 40795 }, { "epoch": 0.35, "learning_rate": 7.303369885109774e-05, "loss": 2.3419, "step": 40800 }, { "epoch": 0.35, "learning_rate": 7.30277449397393e-05, "loss": 2.3097, "step": 40805 }, { "epoch": 0.35, "learning_rate": 7.302179061392221e-05, "loss": 2.2941, "step": 40810 }, { "epoch": 0.35, "learning_rate": 7.301583587375361e-05, "loss": 2.4096, "step": 40815 }, { "epoch": 0.35, "learning_rate": 7.30098807193407e-05, "loss": 2.3243, "step": 40820 }, { "epoch": 0.35, "learning_rate": 7.300392515079063e-05, "loss": 2.3419, "step": 40825 }, { "epoch": 0.35, "learning_rate": 7.299796916821062e-05, "loss": 2.3514, "step": 40830 }, { "epoch": 0.35, "learning_rate": 7.299201277170784e-05, "loss": 2.2575, "step": 40835 }, { "epoch": 0.35, "learning_rate": 7.298605596138952e-05, "loss": 2.3288, "step": 40840 }, { "epoch": 0.35, "learning_rate": 7.298009873736287e-05, "loss": 2.3148, "step": 40845 }, { "epoch": 0.35, "learning_rate": 7.297414109973508e-05, "loss": 2.3323, "step": 40850 }, { "epoch": 0.35, "learning_rate": 7.296818304861341e-05, "loss": 2.3208, "step": 40855 }, { "epoch": 0.35, "learning_rate": 7.29622245841051e-05, "loss": 2.3355, "step": 40860 }, { "epoch": 0.35, "learning_rate": 7.295626570631735e-05, "loss": 2.3656, "step": 40865 }, { "epoch": 0.35, "learning_rate": 7.295030641535744e-05, "loss": 2.2288, "step": 40870 }, { "epoch": 0.35, "learning_rate": 7.294434671133263e-05, "loss": 2.2421, "step": 40875 }, { "epoch": 0.35, "learning_rate": 7.293838659435017e-05, "loss": 2.3561, "step": 40880 }, { "epoch": 0.35, "learning_rate": 7.293242606451732e-05, "loss": 2.3218, "step": 40885 }, { "epoch": 0.35, "learning_rate": 7.29264651219414e-05, "loss": 2.3087, "step": 40890 }, { "epoch": 0.35, "learning_rate": 7.292050376672965e-05, "loss": 2.2942, "step": 40895 }, { "epoch": 0.35, "learning_rate": 7.291454199898939e-05, "loss": 2.348, "step": 40900 }, { "epoch": 0.35, "learning_rate": 7.290857981882792e-05, "loss": 2.3322, "step": 40905 }, { "epoch": 0.35, "learning_rate": 7.290261722635255e-05, "loss": 2.3616, "step": 40910 }, { "epoch": 0.35, "learning_rate": 7.28966542216706e-05, "loss": 2.3402, "step": 40915 }, { "epoch": 0.35, "learning_rate": 7.289069080488937e-05, "loss": 2.2827, "step": 40920 }, { "epoch": 0.35, "learning_rate": 7.288472697611622e-05, "loss": 2.3167, "step": 40925 }, { "epoch": 0.35, "learning_rate": 7.287876273545847e-05, "loss": 2.4165, "step": 40930 }, { "epoch": 0.35, "learning_rate": 7.287279808302344e-05, "loss": 2.2491, "step": 40935 }, { "epoch": 0.35, "learning_rate": 7.286683301891854e-05, "loss": 2.3372, "step": 40940 }, { "epoch": 0.35, "learning_rate": 7.28608675432511e-05, "loss": 2.4063, "step": 40945 }, { "epoch": 0.35, "learning_rate": 7.28549016561285e-05, "loss": 2.2615, "step": 40950 }, { "epoch": 0.35, "learning_rate": 7.284893535765809e-05, "loss": 2.3349, "step": 40955 }, { "epoch": 0.35, "learning_rate": 7.284296864794727e-05, "loss": 2.3399, "step": 40960 }, { "epoch": 0.35, "learning_rate": 7.283700152710344e-05, "loss": 2.3428, "step": 40965 }, { "epoch": 0.35, "learning_rate": 7.283103399523399e-05, "loss": 2.2827, "step": 40970 }, { "epoch": 0.35, "learning_rate": 7.282506605244632e-05, "loss": 2.3134, "step": 40975 }, { "epoch": 0.35, "learning_rate": 7.281909769884785e-05, "loss": 2.3593, "step": 40980 }, { "epoch": 0.35, "learning_rate": 7.281312893454599e-05, "loss": 2.2514, "step": 40985 }, { "epoch": 0.35, "learning_rate": 7.280715975964817e-05, "loss": 2.2999, "step": 40990 }, { "epoch": 0.35, "learning_rate": 7.280119017426183e-05, "loss": 2.3178, "step": 40995 }, { "epoch": 0.35, "learning_rate": 7.279522017849441e-05, "loss": 2.3195, "step": 41000 }, { "epoch": 0.35, "learning_rate": 7.278924977245335e-05, "loss": 2.3769, "step": 41005 }, { "epoch": 0.35, "learning_rate": 7.278327895624612e-05, "loss": 2.32, "step": 41010 }, { "epoch": 0.35, "learning_rate": 7.277730772998018e-05, "loss": 2.3625, "step": 41015 }, { "epoch": 0.35, "learning_rate": 7.277133609376301e-05, "loss": 2.3156, "step": 41020 }, { "epoch": 0.35, "learning_rate": 7.276536404770207e-05, "loss": 2.2503, "step": 41025 }, { "epoch": 0.35, "learning_rate": 7.275939159190486e-05, "loss": 2.3064, "step": 41030 }, { "epoch": 0.35, "learning_rate": 7.275341872647886e-05, "loss": 2.3136, "step": 41035 }, { "epoch": 0.35, "learning_rate": 7.274744545153159e-05, "loss": 2.3119, "step": 41040 }, { "epoch": 0.35, "learning_rate": 7.274147176717055e-05, "loss": 2.3778, "step": 41045 }, { "epoch": 0.35, "learning_rate": 7.273549767350323e-05, "loss": 2.3306, "step": 41050 }, { "epoch": 0.35, "learning_rate": 7.27295231706372e-05, "loss": 2.2899, "step": 41055 }, { "epoch": 0.35, "learning_rate": 7.272354825867998e-05, "loss": 2.3279, "step": 41060 }, { "epoch": 0.35, "learning_rate": 7.271757293773907e-05, "loss": 2.2792, "step": 41065 }, { "epoch": 0.35, "learning_rate": 7.271159720792206e-05, "loss": 2.3531, "step": 41070 }, { "epoch": 0.35, "learning_rate": 7.270562106933647e-05, "loss": 2.3357, "step": 41075 }, { "epoch": 0.35, "learning_rate": 7.269964452208988e-05, "loss": 2.379, "step": 41080 }, { "epoch": 0.35, "learning_rate": 7.269366756628986e-05, "loss": 2.3058, "step": 41085 }, { "epoch": 0.35, "learning_rate": 7.268769020204397e-05, "loss": 2.3445, "step": 41090 }, { "epoch": 0.35, "learning_rate": 7.268171242945978e-05, "loss": 2.3206, "step": 41095 }, { "epoch": 0.35, "learning_rate": 7.267573424864491e-05, "loss": 2.3325, "step": 41100 }, { "epoch": 0.35, "learning_rate": 7.266975565970695e-05, "loss": 2.3822, "step": 41105 }, { "epoch": 0.35, "learning_rate": 7.26637766627535e-05, "loss": 2.3472, "step": 41110 }, { "epoch": 0.35, "learning_rate": 7.265779725789214e-05, "loss": 2.3724, "step": 41115 }, { "epoch": 0.35, "learning_rate": 7.265181744523056e-05, "loss": 2.293, "step": 41120 }, { "epoch": 0.35, "learning_rate": 7.26458372248763e-05, "loss": 2.2634, "step": 41125 }, { "epoch": 0.35, "learning_rate": 7.263985659693707e-05, "loss": 2.3117, "step": 41130 }, { "epoch": 0.35, "learning_rate": 7.263387556152047e-05, "loss": 2.2824, "step": 41135 }, { "epoch": 0.35, "learning_rate": 7.262789411873415e-05, "loss": 2.3033, "step": 41140 }, { "epoch": 0.35, "learning_rate": 7.262191226868576e-05, "loss": 2.3212, "step": 41145 }, { "epoch": 0.35, "learning_rate": 7.2615930011483e-05, "loss": 2.285, "step": 41150 }, { "epoch": 0.35, "learning_rate": 7.260994734723349e-05, "loss": 2.323, "step": 41155 }, { "epoch": 0.35, "learning_rate": 7.260396427604494e-05, "loss": 2.3035, "step": 41160 }, { "epoch": 0.35, "learning_rate": 7.259798079802504e-05, "loss": 2.3022, "step": 41165 }, { "epoch": 0.35, "learning_rate": 7.259199691328146e-05, "loss": 2.3693, "step": 41170 }, { "epoch": 0.35, "learning_rate": 7.25860126219219e-05, "loss": 2.2572, "step": 41175 }, { "epoch": 0.35, "learning_rate": 7.258002792405409e-05, "loss": 2.2867, "step": 41180 }, { "epoch": 0.35, "learning_rate": 7.257404281978571e-05, "loss": 2.3044, "step": 41185 }, { "epoch": 0.35, "learning_rate": 7.25680573092245e-05, "loss": 2.2926, "step": 41190 }, { "epoch": 0.35, "learning_rate": 7.256207139247819e-05, "loss": 2.4007, "step": 41195 }, { "epoch": 0.35, "learning_rate": 7.255608506965453e-05, "loss": 2.2798, "step": 41200 }, { "epoch": 0.35, "learning_rate": 7.255009834086124e-05, "loss": 2.2808, "step": 41205 }, { "epoch": 0.35, "learning_rate": 7.254411120620606e-05, "loss": 2.2898, "step": 41210 }, { "epoch": 0.35, "learning_rate": 7.253812366579678e-05, "loss": 2.4164, "step": 41215 }, { "epoch": 0.35, "learning_rate": 7.253213571974115e-05, "loss": 2.3187, "step": 41220 }, { "epoch": 0.35, "learning_rate": 7.252614736814693e-05, "loss": 2.2827, "step": 41225 }, { "epoch": 0.35, "learning_rate": 7.252015861112193e-05, "loss": 2.3794, "step": 41230 }, { "epoch": 0.35, "learning_rate": 7.251416944877393e-05, "loss": 2.2968, "step": 41235 }, { "epoch": 0.35, "learning_rate": 7.25081798812107e-05, "loss": 2.3861, "step": 41240 }, { "epoch": 0.35, "learning_rate": 7.250218990854006e-05, "loss": 2.3487, "step": 41245 }, { "epoch": 0.35, "learning_rate": 7.249619953086979e-05, "loss": 2.276, "step": 41250 }, { "epoch": 0.35, "learning_rate": 7.249020874830775e-05, "loss": 2.3274, "step": 41255 }, { "epoch": 0.35, "learning_rate": 7.248421756096174e-05, "loss": 2.2047, "step": 41260 }, { "epoch": 0.35, "learning_rate": 7.247822596893961e-05, "loss": 2.3423, "step": 41265 }, { "epoch": 0.35, "learning_rate": 7.247223397234917e-05, "loss": 2.3126, "step": 41270 }, { "epoch": 0.35, "learning_rate": 7.246624157129828e-05, "loss": 2.3198, "step": 41275 }, { "epoch": 0.35, "learning_rate": 7.246024876589479e-05, "loss": 2.3399, "step": 41280 }, { "epoch": 0.35, "learning_rate": 7.245425555624657e-05, "loss": 2.3258, "step": 41285 }, { "epoch": 0.35, "learning_rate": 7.244826194246146e-05, "loss": 2.3879, "step": 41290 }, { "epoch": 0.35, "learning_rate": 7.244226792464736e-05, "loss": 2.3703, "step": 41295 }, { "epoch": 0.35, "learning_rate": 7.243627350291215e-05, "loss": 2.3536, "step": 41300 }, { "epoch": 0.35, "learning_rate": 7.24302786773637e-05, "loss": 2.3648, "step": 41305 }, { "epoch": 0.35, "learning_rate": 7.242428344810994e-05, "loss": 2.2762, "step": 41310 }, { "epoch": 0.35, "learning_rate": 7.241828781525875e-05, "loss": 2.4215, "step": 41315 }, { "epoch": 0.35, "learning_rate": 7.241229177891803e-05, "loss": 2.3346, "step": 41320 }, { "epoch": 0.35, "learning_rate": 7.240629533919572e-05, "loss": 2.3144, "step": 41325 }, { "epoch": 0.35, "learning_rate": 7.240029849619973e-05, "loss": 2.3535, "step": 41330 }, { "epoch": 0.35, "learning_rate": 7.239430125003802e-05, "loss": 2.4043, "step": 41335 }, { "epoch": 0.35, "learning_rate": 7.238830360081849e-05, "loss": 2.2215, "step": 41340 }, { "epoch": 0.35, "learning_rate": 7.238230554864911e-05, "loss": 2.3452, "step": 41345 }, { "epoch": 0.35, "learning_rate": 7.237630709363783e-05, "loss": 2.339, "step": 41350 }, { "epoch": 0.35, "learning_rate": 7.237030823589262e-05, "loss": 2.2885, "step": 41355 }, { "epoch": 0.35, "learning_rate": 7.236430897552144e-05, "loss": 2.3507, "step": 41360 }, { "epoch": 0.35, "learning_rate": 7.235830931263227e-05, "loss": 2.401, "step": 41365 }, { "epoch": 0.35, "learning_rate": 7.235230924733308e-05, "loss": 2.3034, "step": 41370 }, { "epoch": 0.35, "learning_rate": 7.234630877973187e-05, "loss": 2.2641, "step": 41375 }, { "epoch": 0.35, "learning_rate": 7.234030790993666e-05, "loss": 2.3095, "step": 41380 }, { "epoch": 0.35, "learning_rate": 7.23343066380554e-05, "loss": 2.1968, "step": 41385 }, { "epoch": 0.35, "learning_rate": 7.232830496419617e-05, "loss": 2.3099, "step": 41390 }, { "epoch": 0.35, "learning_rate": 7.232230288846694e-05, "loss": 2.3499, "step": 41395 }, { "epoch": 0.35, "learning_rate": 7.231630041097576e-05, "loss": 2.2522, "step": 41400 }, { "epoch": 0.35, "learning_rate": 7.231029753183064e-05, "loss": 2.1972, "step": 41405 }, { "epoch": 0.35, "learning_rate": 7.230429425113965e-05, "loss": 2.2733, "step": 41410 }, { "epoch": 0.35, "learning_rate": 7.229829056901083e-05, "loss": 2.2887, "step": 41415 }, { "epoch": 0.35, "learning_rate": 7.229228648555222e-05, "loss": 2.2833, "step": 41420 }, { "epoch": 0.35, "learning_rate": 7.22862820008719e-05, "loss": 2.2407, "step": 41425 }, { "epoch": 0.35, "learning_rate": 7.228027711507796e-05, "loss": 2.2966, "step": 41430 }, { "epoch": 0.35, "learning_rate": 7.227427182827841e-05, "loss": 2.3463, "step": 41435 }, { "epoch": 0.35, "learning_rate": 7.226826614058141e-05, "loss": 2.3616, "step": 41440 }, { "epoch": 0.35, "learning_rate": 7.2262260052095e-05, "loss": 2.3194, "step": 41445 }, { "epoch": 0.35, "learning_rate": 7.225625356292731e-05, "loss": 2.3978, "step": 41450 }, { "epoch": 0.35, "learning_rate": 7.225024667318642e-05, "loss": 2.3322, "step": 41455 }, { "epoch": 0.35, "learning_rate": 7.224423938298046e-05, "loss": 2.3583, "step": 41460 }, { "epoch": 0.35, "learning_rate": 7.223823169241755e-05, "loss": 2.3065, "step": 41465 }, { "epoch": 0.35, "learning_rate": 7.223222360160581e-05, "loss": 2.3656, "step": 41470 }, { "epoch": 0.35, "learning_rate": 7.222621511065341e-05, "loss": 2.3786, "step": 41475 }, { "epoch": 0.35, "learning_rate": 7.222020621966843e-05, "loss": 2.2479, "step": 41480 }, { "epoch": 0.35, "learning_rate": 7.221419692875906e-05, "loss": 2.291, "step": 41485 }, { "epoch": 0.35, "learning_rate": 7.220818723803345e-05, "loss": 2.2638, "step": 41490 }, { "epoch": 0.35, "learning_rate": 7.220217714759976e-05, "loss": 2.3571, "step": 41495 }, { "epoch": 0.35, "learning_rate": 7.219616665756618e-05, "loss": 2.2582, "step": 41500 }, { "epoch": 0.35, "learning_rate": 7.219015576804085e-05, "loss": 2.284, "step": 41505 }, { "epoch": 0.35, "learning_rate": 7.218414447913199e-05, "loss": 2.3131, "step": 41510 }, { "epoch": 0.35, "learning_rate": 7.217813279094777e-05, "loss": 2.3171, "step": 41515 }, { "epoch": 0.35, "learning_rate": 7.21721207035964e-05, "loss": 2.3594, "step": 41520 }, { "epoch": 0.35, "learning_rate": 7.216610821718611e-05, "loss": 2.248, "step": 41525 }, { "epoch": 0.35, "learning_rate": 7.216009533182506e-05, "loss": 2.3094, "step": 41530 }, { "epoch": 0.35, "learning_rate": 7.21540820476215e-05, "loss": 2.3514, "step": 41535 }, { "epoch": 0.35, "learning_rate": 7.214806836468368e-05, "loss": 2.3342, "step": 41540 }, { "epoch": 0.35, "learning_rate": 7.214205428311982e-05, "loss": 2.3306, "step": 41545 }, { "epoch": 0.35, "learning_rate": 7.213603980303815e-05, "loss": 2.3108, "step": 41550 }, { "epoch": 0.35, "learning_rate": 7.213002492454691e-05, "loss": 2.3355, "step": 41555 }, { "epoch": 0.35, "learning_rate": 7.212400964775439e-05, "loss": 2.362, "step": 41560 }, { "epoch": 0.35, "learning_rate": 7.211799397276885e-05, "loss": 2.2106, "step": 41565 }, { "epoch": 0.35, "learning_rate": 7.211197789969854e-05, "loss": 2.2199, "step": 41570 }, { "epoch": 0.35, "learning_rate": 7.210596142865175e-05, "loss": 2.3043, "step": 41575 }, { "epoch": 0.35, "learning_rate": 7.209994455973678e-05, "loss": 2.3436, "step": 41580 }, { "epoch": 0.35, "learning_rate": 7.20939272930619e-05, "loss": 2.4151, "step": 41585 }, { "epoch": 0.35, "learning_rate": 7.208790962873542e-05, "loss": 2.3194, "step": 41590 }, { "epoch": 0.35, "learning_rate": 7.208189156686564e-05, "loss": 2.2862, "step": 41595 }, { "epoch": 0.35, "learning_rate": 7.20758731075609e-05, "loss": 2.3993, "step": 41600 }, { "epoch": 0.36, "learning_rate": 7.206985425092949e-05, "loss": 2.3829, "step": 41605 }, { "epoch": 0.36, "learning_rate": 7.206383499707974e-05, "loss": 2.306, "step": 41610 }, { "epoch": 0.36, "learning_rate": 7.205781534612001e-05, "loss": 2.3008, "step": 41615 }, { "epoch": 0.36, "learning_rate": 7.205179529815865e-05, "loss": 2.3029, "step": 41620 }, { "epoch": 0.36, "learning_rate": 7.204577485330395e-05, "loss": 2.314, "step": 41625 }, { "epoch": 0.36, "learning_rate": 7.203975401166434e-05, "loss": 2.2788, "step": 41630 }, { "epoch": 0.36, "learning_rate": 7.203373277334814e-05, "loss": 2.2849, "step": 41635 }, { "epoch": 0.36, "learning_rate": 7.202771113846373e-05, "loss": 2.3204, "step": 41640 }, { "epoch": 0.36, "learning_rate": 7.20216891071195e-05, "loss": 2.3275, "step": 41645 }, { "epoch": 0.36, "learning_rate": 7.201566667942383e-05, "loss": 2.2605, "step": 41650 }, { "epoch": 0.36, "learning_rate": 7.20096438554851e-05, "loss": 2.3416, "step": 41655 }, { "epoch": 0.36, "learning_rate": 7.200362063541172e-05, "loss": 2.3756, "step": 41660 }, { "epoch": 0.36, "learning_rate": 7.199759701931213e-05, "loss": 2.296, "step": 41665 }, { "epoch": 0.36, "learning_rate": 7.199157300729468e-05, "loss": 2.3573, "step": 41670 }, { "epoch": 0.36, "learning_rate": 7.198554859946785e-05, "loss": 2.2877, "step": 41675 }, { "epoch": 0.36, "learning_rate": 7.197952379594004e-05, "loss": 2.3147, "step": 41680 }, { "epoch": 0.36, "learning_rate": 7.197349859681967e-05, "loss": 2.3608, "step": 41685 }, { "epoch": 0.36, "learning_rate": 7.196747300221522e-05, "loss": 2.3685, "step": 41690 }, { "epoch": 0.36, "learning_rate": 7.196144701223513e-05, "loss": 2.3432, "step": 41695 }, { "epoch": 0.36, "learning_rate": 7.195542062698783e-05, "loss": 2.3352, "step": 41700 }, { "epoch": 0.36, "learning_rate": 7.194939384658181e-05, "loss": 2.3134, "step": 41705 }, { "epoch": 0.36, "learning_rate": 7.194336667112554e-05, "loss": 2.3464, "step": 41710 }, { "epoch": 0.36, "learning_rate": 7.193733910072749e-05, "loss": 2.3886, "step": 41715 }, { "epoch": 0.36, "learning_rate": 7.193131113549616e-05, "loss": 2.2499, "step": 41720 }, { "epoch": 0.36, "learning_rate": 7.192528277554003e-05, "loss": 2.3268, "step": 41725 }, { "epoch": 0.36, "learning_rate": 7.191925402096759e-05, "loss": 2.2537, "step": 41730 }, { "epoch": 0.36, "learning_rate": 7.191322487188736e-05, "loss": 2.3875, "step": 41735 }, { "epoch": 0.36, "learning_rate": 7.190719532840787e-05, "loss": 2.212, "step": 41740 }, { "epoch": 0.36, "learning_rate": 7.190116539063763e-05, "loss": 2.2807, "step": 41745 }, { "epoch": 0.36, "learning_rate": 7.189513505868513e-05, "loss": 2.3482, "step": 41750 }, { "epoch": 0.36, "learning_rate": 7.188910433265897e-05, "loss": 2.2815, "step": 41755 }, { "epoch": 0.36, "learning_rate": 7.188307321266763e-05, "loss": 2.261, "step": 41760 }, { "epoch": 0.36, "learning_rate": 7.187704169881972e-05, "loss": 2.3403, "step": 41765 }, { "epoch": 0.36, "learning_rate": 7.187100979122374e-05, "loss": 2.3508, "step": 41770 }, { "epoch": 0.36, "learning_rate": 7.18649774899883e-05, "loss": 2.27, "step": 41775 }, { "epoch": 0.36, "learning_rate": 7.185894479522193e-05, "loss": 2.3411, "step": 41780 }, { "epoch": 0.36, "learning_rate": 7.185291170703325e-05, "loss": 2.3885, "step": 41785 }, { "epoch": 0.36, "learning_rate": 7.184687822553081e-05, "loss": 2.2978, "step": 41790 }, { "epoch": 0.36, "learning_rate": 7.184084435082322e-05, "loss": 2.2547, "step": 41795 }, { "epoch": 0.36, "learning_rate": 7.183481008301907e-05, "loss": 2.3483, "step": 41800 }, { "epoch": 0.36, "learning_rate": 7.182877542222698e-05, "loss": 2.3621, "step": 41805 }, { "epoch": 0.36, "learning_rate": 7.182274036855556e-05, "loss": 2.3607, "step": 41810 }, { "epoch": 0.36, "learning_rate": 7.18167049221134e-05, "loss": 2.3213, "step": 41815 }, { "epoch": 0.36, "learning_rate": 7.181066908300916e-05, "loss": 2.2976, "step": 41820 }, { "epoch": 0.36, "learning_rate": 7.180463285135147e-05, "loss": 2.3032, "step": 41825 }, { "epoch": 0.36, "learning_rate": 7.179859622724899e-05, "loss": 2.3259, "step": 41830 }, { "epoch": 0.36, "learning_rate": 7.17925592108103e-05, "loss": 2.3077, "step": 41835 }, { "epoch": 0.36, "learning_rate": 7.178652180214413e-05, "loss": 2.2756, "step": 41840 }, { "epoch": 0.36, "learning_rate": 7.178048400135911e-05, "loss": 2.2361, "step": 41845 }, { "epoch": 0.36, "learning_rate": 7.177444580856391e-05, "loss": 2.2359, "step": 41850 }, { "epoch": 0.36, "learning_rate": 7.176840722386722e-05, "loss": 2.4047, "step": 41855 }, { "epoch": 0.36, "learning_rate": 7.176236824737772e-05, "loss": 2.3207, "step": 41860 }, { "epoch": 0.36, "learning_rate": 7.175632887920407e-05, "loss": 2.2519, "step": 41865 }, { "epoch": 0.36, "learning_rate": 7.1750289119455e-05, "loss": 2.3672, "step": 41870 }, { "epoch": 0.36, "learning_rate": 7.174424896823924e-05, "loss": 2.2514, "step": 41875 }, { "epoch": 0.36, "learning_rate": 7.173820842566544e-05, "loss": 2.358, "step": 41880 }, { "epoch": 0.36, "learning_rate": 7.173216749184235e-05, "loss": 2.3083, "step": 41885 }, { "epoch": 0.36, "learning_rate": 7.172612616687871e-05, "loss": 2.3357, "step": 41890 }, { "epoch": 0.36, "learning_rate": 7.172008445088323e-05, "loss": 2.2896, "step": 41895 }, { "epoch": 0.36, "learning_rate": 7.171404234396466e-05, "loss": 2.3583, "step": 41900 }, { "epoch": 0.36, "learning_rate": 7.170799984623175e-05, "loss": 2.3047, "step": 41905 }, { "epoch": 0.36, "learning_rate": 7.170195695779325e-05, "loss": 2.3077, "step": 41910 }, { "epoch": 0.36, "learning_rate": 7.169591367875791e-05, "loss": 2.3238, "step": 41915 }, { "epoch": 0.36, "learning_rate": 7.168987000923453e-05, "loss": 2.3127, "step": 41920 }, { "epoch": 0.36, "learning_rate": 7.168382594933185e-05, "loss": 2.3237, "step": 41925 }, { "epoch": 0.36, "learning_rate": 7.167778149915867e-05, "loss": 2.2937, "step": 41930 }, { "epoch": 0.36, "learning_rate": 7.167173665882378e-05, "loss": 2.2708, "step": 41935 }, { "epoch": 0.36, "learning_rate": 7.166569142843598e-05, "loss": 2.2874, "step": 41940 }, { "epoch": 0.36, "learning_rate": 7.165964580810406e-05, "loss": 2.3387, "step": 41945 }, { "epoch": 0.36, "learning_rate": 7.165359979793685e-05, "loss": 2.3445, "step": 41950 }, { "epoch": 0.36, "learning_rate": 7.164755339804314e-05, "loss": 2.2852, "step": 41955 }, { "epoch": 0.36, "learning_rate": 7.164150660853178e-05, "loss": 2.2628, "step": 41960 }, { "epoch": 0.36, "learning_rate": 7.163545942951158e-05, "loss": 2.3015, "step": 41965 }, { "epoch": 0.36, "learning_rate": 7.162941186109139e-05, "loss": 2.391, "step": 41970 }, { "epoch": 0.36, "learning_rate": 7.162336390338007e-05, "loss": 2.3106, "step": 41975 }, { "epoch": 0.36, "learning_rate": 7.161731555648643e-05, "loss": 2.3593, "step": 41980 }, { "epoch": 0.36, "learning_rate": 7.161126682051939e-05, "loss": 2.2749, "step": 41985 }, { "epoch": 0.36, "learning_rate": 7.160521769558777e-05, "loss": 2.1789, "step": 41990 }, { "epoch": 0.36, "learning_rate": 7.159916818180045e-05, "loss": 2.3568, "step": 41995 }, { "epoch": 0.36, "learning_rate": 7.159311827926634e-05, "loss": 2.2828, "step": 42000 }, { "epoch": 0.36, "learning_rate": 7.158706798809428e-05, "loss": 2.339, "step": 42005 }, { "epoch": 0.36, "learning_rate": 7.15810173083932e-05, "loss": 2.3507, "step": 42010 }, { "epoch": 0.36, "learning_rate": 7.1574966240272e-05, "loss": 2.3151, "step": 42015 }, { "epoch": 0.36, "learning_rate": 7.156891478383956e-05, "loss": 2.3107, "step": 42020 }, { "epoch": 0.36, "learning_rate": 7.156286293920482e-05, "loss": 2.4188, "step": 42025 }, { "epoch": 0.36, "learning_rate": 7.155681070647671e-05, "loss": 2.3446, "step": 42030 }, { "epoch": 0.36, "learning_rate": 7.155075808576414e-05, "loss": 2.296, "step": 42035 }, { "epoch": 0.36, "learning_rate": 7.154470507717607e-05, "loss": 2.2894, "step": 42040 }, { "epoch": 0.36, "learning_rate": 7.153865168082141e-05, "loss": 2.4053, "step": 42045 }, { "epoch": 0.36, "learning_rate": 7.153259789680914e-05, "loss": 2.3351, "step": 42050 }, { "epoch": 0.36, "learning_rate": 7.15265437252482e-05, "loss": 2.3446, "step": 42055 }, { "epoch": 0.36, "learning_rate": 7.152048916624755e-05, "loss": 2.3367, "step": 42060 }, { "epoch": 0.36, "learning_rate": 7.151443421991619e-05, "loss": 2.3505, "step": 42065 }, { "epoch": 0.36, "learning_rate": 7.150837888636306e-05, "loss": 2.288, "step": 42070 }, { "epoch": 0.36, "learning_rate": 7.150232316569717e-05, "loss": 2.2847, "step": 42075 }, { "epoch": 0.36, "learning_rate": 7.149626705802751e-05, "loss": 2.2628, "step": 42080 }, { "epoch": 0.36, "learning_rate": 7.149021056346308e-05, "loss": 2.3232, "step": 42085 }, { "epoch": 0.36, "learning_rate": 7.148415368211288e-05, "loss": 2.2773, "step": 42090 }, { "epoch": 0.36, "learning_rate": 7.147809641408593e-05, "loss": 2.3523, "step": 42095 }, { "epoch": 0.36, "learning_rate": 7.147203875949125e-05, "loss": 2.3252, "step": 42100 }, { "epoch": 0.36, "learning_rate": 7.146598071843784e-05, "loss": 2.3468, "step": 42105 }, { "epoch": 0.36, "learning_rate": 7.145992229103476e-05, "loss": 2.3315, "step": 42110 }, { "epoch": 0.36, "learning_rate": 7.145386347739106e-05, "loss": 2.3669, "step": 42115 }, { "epoch": 0.36, "learning_rate": 7.144780427761578e-05, "loss": 2.3249, "step": 42120 }, { "epoch": 0.36, "learning_rate": 7.144174469181795e-05, "loss": 2.3321, "step": 42125 }, { "epoch": 0.36, "learning_rate": 7.143568472010666e-05, "loss": 2.3613, "step": 42130 }, { "epoch": 0.36, "learning_rate": 7.1429624362591e-05, "loss": 2.2607, "step": 42135 }, { "epoch": 0.36, "learning_rate": 7.142356361937998e-05, "loss": 2.3347, "step": 42140 }, { "epoch": 0.36, "learning_rate": 7.141750249058274e-05, "loss": 2.3074, "step": 42145 }, { "epoch": 0.36, "learning_rate": 7.141144097630834e-05, "loss": 2.306, "step": 42150 }, { "epoch": 0.36, "learning_rate": 7.140537907666588e-05, "loss": 2.2965, "step": 42155 }, { "epoch": 0.36, "learning_rate": 7.139931679176448e-05, "loss": 2.2926, "step": 42160 }, { "epoch": 0.36, "learning_rate": 7.139325412171324e-05, "loss": 2.2504, "step": 42165 }, { "epoch": 0.36, "learning_rate": 7.138719106662126e-05, "loss": 2.2441, "step": 42170 }, { "epoch": 0.36, "learning_rate": 7.13811276265977e-05, "loss": 2.348, "step": 42175 }, { "epoch": 0.36, "learning_rate": 7.137506380175166e-05, "loss": 2.3624, "step": 42180 }, { "epoch": 0.36, "learning_rate": 7.13689995921923e-05, "loss": 2.4073, "step": 42185 }, { "epoch": 0.36, "learning_rate": 7.136293499802875e-05, "loss": 2.3896, "step": 42190 }, { "epoch": 0.36, "learning_rate": 7.135687001937017e-05, "loss": 2.3517, "step": 42195 }, { "epoch": 0.36, "learning_rate": 7.135080465632571e-05, "loss": 2.3254, "step": 42200 }, { "epoch": 0.36, "learning_rate": 7.134473890900455e-05, "loss": 2.2904, "step": 42205 }, { "epoch": 0.36, "learning_rate": 7.133867277751584e-05, "loss": 2.3048, "step": 42210 }, { "epoch": 0.36, "learning_rate": 7.13326062619688e-05, "loss": 2.2996, "step": 42215 }, { "epoch": 0.36, "learning_rate": 7.132653936247257e-05, "loss": 2.3407, "step": 42220 }, { "epoch": 0.36, "learning_rate": 7.132047207913636e-05, "loss": 2.3362, "step": 42225 }, { "epoch": 0.36, "learning_rate": 7.13144044120694e-05, "loss": 2.3442, "step": 42230 }, { "epoch": 0.36, "learning_rate": 7.130833636138086e-05, "loss": 2.3517, "step": 42235 }, { "epoch": 0.36, "learning_rate": 7.130226792717996e-05, "loss": 2.2859, "step": 42240 }, { "epoch": 0.36, "learning_rate": 7.129619910957593e-05, "loss": 2.3373, "step": 42245 }, { "epoch": 0.36, "learning_rate": 7.129012990867799e-05, "loss": 2.2776, "step": 42250 }, { "epoch": 0.36, "learning_rate": 7.12840603245954e-05, "loss": 2.331, "step": 42255 }, { "epoch": 0.36, "learning_rate": 7.127799035743736e-05, "loss": 2.3012, "step": 42260 }, { "epoch": 0.36, "learning_rate": 7.127192000731316e-05, "loss": 2.2889, "step": 42265 }, { "epoch": 0.36, "learning_rate": 7.126584927433202e-05, "loss": 2.3894, "step": 42270 }, { "epoch": 0.36, "learning_rate": 7.125977815860322e-05, "loss": 2.3938, "step": 42275 }, { "epoch": 0.36, "learning_rate": 7.125370666023601e-05, "loss": 2.3909, "step": 42280 }, { "epoch": 0.36, "learning_rate": 7.124763477933972e-05, "loss": 2.3317, "step": 42285 }, { "epoch": 0.36, "learning_rate": 7.124156251602358e-05, "loss": 2.3753, "step": 42290 }, { "epoch": 0.36, "learning_rate": 7.12354898703969e-05, "loss": 2.2606, "step": 42295 }, { "epoch": 0.36, "learning_rate": 7.122941684256899e-05, "loss": 2.3522, "step": 42300 }, { "epoch": 0.36, "learning_rate": 7.122334343264912e-05, "loss": 2.34, "step": 42305 }, { "epoch": 0.36, "learning_rate": 7.121726964074661e-05, "loss": 2.3197, "step": 42310 }, { "epoch": 0.36, "learning_rate": 7.121119546697081e-05, "loss": 2.3316, "step": 42315 }, { "epoch": 0.36, "learning_rate": 7.120512091143101e-05, "loss": 2.3436, "step": 42320 }, { "epoch": 0.36, "learning_rate": 7.119904597423655e-05, "loss": 2.3169, "step": 42325 }, { "epoch": 0.36, "learning_rate": 7.119297065549675e-05, "loss": 2.3646, "step": 42330 }, { "epoch": 0.36, "learning_rate": 7.1186894955321e-05, "loss": 2.2811, "step": 42335 }, { "epoch": 0.36, "learning_rate": 7.118081887381863e-05, "loss": 2.2549, "step": 42340 }, { "epoch": 0.36, "learning_rate": 7.117474241109897e-05, "loss": 2.3778, "step": 42345 }, { "epoch": 0.36, "learning_rate": 7.116866556727143e-05, "loss": 2.2702, "step": 42350 }, { "epoch": 0.36, "learning_rate": 7.116258834244537e-05, "loss": 2.2315, "step": 42355 }, { "epoch": 0.36, "learning_rate": 7.115651073673014e-05, "loss": 2.227, "step": 42360 }, { "epoch": 0.36, "learning_rate": 7.115043275023516e-05, "loss": 2.3649, "step": 42365 }, { "epoch": 0.36, "learning_rate": 7.114435438306983e-05, "loss": 2.3322, "step": 42370 }, { "epoch": 0.36, "learning_rate": 7.11382756353435e-05, "loss": 2.3705, "step": 42375 }, { "epoch": 0.36, "learning_rate": 7.113219650716562e-05, "loss": 2.3249, "step": 42380 }, { "epoch": 0.36, "learning_rate": 7.11261169986456e-05, "loss": 2.2566, "step": 42385 }, { "epoch": 0.36, "learning_rate": 7.112003710989286e-05, "loss": 2.321, "step": 42390 }, { "epoch": 0.36, "learning_rate": 7.111395684101679e-05, "loss": 2.37, "step": 42395 }, { "epoch": 0.36, "learning_rate": 7.110787619212688e-05, "loss": 2.3029, "step": 42400 }, { "epoch": 0.36, "learning_rate": 7.110179516333253e-05, "loss": 2.2521, "step": 42405 }, { "epoch": 0.36, "learning_rate": 7.109571375474321e-05, "loss": 2.3568, "step": 42410 }, { "epoch": 0.36, "learning_rate": 7.108963196646836e-05, "loss": 2.3179, "step": 42415 }, { "epoch": 0.36, "learning_rate": 7.108354979861746e-05, "loss": 2.2701, "step": 42420 }, { "epoch": 0.36, "learning_rate": 7.107746725129996e-05, "loss": 2.258, "step": 42425 }, { "epoch": 0.36, "learning_rate": 7.107138432462533e-05, "loss": 2.2815, "step": 42430 }, { "epoch": 0.36, "learning_rate": 7.106530101870309e-05, "loss": 2.3405, "step": 42435 }, { "epoch": 0.36, "learning_rate": 7.105921733364267e-05, "loss": 2.3482, "step": 42440 }, { "epoch": 0.36, "learning_rate": 7.105313326955362e-05, "loss": 2.3287, "step": 42445 }, { "epoch": 0.36, "learning_rate": 7.104704882654541e-05, "loss": 2.4036, "step": 42450 }, { "epoch": 0.36, "learning_rate": 7.104096400472758e-05, "loss": 2.2561, "step": 42455 }, { "epoch": 0.36, "learning_rate": 7.10348788042096e-05, "loss": 2.3488, "step": 42460 }, { "epoch": 0.36, "learning_rate": 7.102879322510103e-05, "loss": 2.3772, "step": 42465 }, { "epoch": 0.36, "learning_rate": 7.102270726751139e-05, "loss": 2.2824, "step": 42470 }, { "epoch": 0.36, "learning_rate": 7.101662093155022e-05, "loss": 2.2465, "step": 42475 }, { "epoch": 0.36, "learning_rate": 7.101053421732703e-05, "loss": 2.3482, "step": 42480 }, { "epoch": 0.36, "learning_rate": 7.100444712495143e-05, "loss": 2.3364, "step": 42485 }, { "epoch": 0.36, "learning_rate": 7.099835965453292e-05, "loss": 2.3502, "step": 42490 }, { "epoch": 0.36, "learning_rate": 7.099227180618109e-05, "loss": 2.1931, "step": 42495 }, { "epoch": 0.36, "learning_rate": 7.098618358000554e-05, "loss": 2.2464, "step": 42500 }, { "epoch": 0.36, "learning_rate": 7.098009497611579e-05, "loss": 2.4108, "step": 42505 }, { "epoch": 0.36, "learning_rate": 7.097400599462145e-05, "loss": 2.3307, "step": 42510 }, { "epoch": 0.36, "learning_rate": 7.096791663563213e-05, "loss": 2.3163, "step": 42515 }, { "epoch": 0.36, "learning_rate": 7.096182689925739e-05, "loss": 2.3005, "step": 42520 }, { "epoch": 0.36, "learning_rate": 7.095573678560685e-05, "loss": 2.3177, "step": 42525 }, { "epoch": 0.36, "learning_rate": 7.094964629479013e-05, "loss": 2.3425, "step": 42530 }, { "epoch": 0.36, "learning_rate": 7.094355542691686e-05, "loss": 2.2923, "step": 42535 }, { "epoch": 0.36, "learning_rate": 7.093746418209662e-05, "loss": 2.3904, "step": 42540 }, { "epoch": 0.36, "learning_rate": 7.093137256043909e-05, "loss": 2.3203, "step": 42545 }, { "epoch": 0.36, "learning_rate": 7.092528056205388e-05, "loss": 2.2875, "step": 42550 }, { "epoch": 0.36, "learning_rate": 7.091918818705065e-05, "loss": 2.2847, "step": 42555 }, { "epoch": 0.36, "learning_rate": 7.091309543553903e-05, "loss": 2.2833, "step": 42560 }, { "epoch": 0.36, "learning_rate": 7.090700230762873e-05, "loss": 2.3207, "step": 42565 }, { "epoch": 0.36, "learning_rate": 7.090090880342934e-05, "loss": 2.3127, "step": 42570 }, { "epoch": 0.36, "learning_rate": 7.089481492305058e-05, "loss": 2.3936, "step": 42575 }, { "epoch": 0.36, "learning_rate": 7.088872066660212e-05, "loss": 2.2744, "step": 42580 }, { "epoch": 0.36, "learning_rate": 7.088262603419365e-05, "loss": 2.3423, "step": 42585 }, { "epoch": 0.36, "learning_rate": 7.087653102593486e-05, "loss": 2.3586, "step": 42590 }, { "epoch": 0.36, "learning_rate": 7.087043564193544e-05, "loss": 2.3522, "step": 42595 }, { "epoch": 0.36, "learning_rate": 7.086433988230511e-05, "loss": 2.2433, "step": 42600 }, { "epoch": 0.36, "learning_rate": 7.085824374715357e-05, "loss": 2.2988, "step": 42605 }, { "epoch": 0.36, "learning_rate": 7.085214723659057e-05, "loss": 2.3321, "step": 42610 }, { "epoch": 0.36, "learning_rate": 7.084605035072579e-05, "loss": 2.3545, "step": 42615 }, { "epoch": 0.36, "learning_rate": 7.0839953089669e-05, "loss": 2.3387, "step": 42620 }, { "epoch": 0.36, "learning_rate": 7.083385545352993e-05, "loss": 2.3134, "step": 42625 }, { "epoch": 0.36, "learning_rate": 7.082775744241831e-05, "loss": 2.291, "step": 42630 }, { "epoch": 0.36, "learning_rate": 7.08216590564439e-05, "loss": 2.3335, "step": 42635 }, { "epoch": 0.36, "learning_rate": 7.081556029571647e-05, "loss": 2.2392, "step": 42640 }, { "epoch": 0.36, "learning_rate": 7.08094611603458e-05, "loss": 2.2206, "step": 42645 }, { "epoch": 0.36, "learning_rate": 7.080336165044163e-05, "loss": 2.3128, "step": 42650 }, { "epoch": 0.36, "learning_rate": 7.079726176611377e-05, "loss": 2.2669, "step": 42655 }, { "epoch": 0.36, "learning_rate": 7.079116150747201e-05, "loss": 2.2136, "step": 42660 }, { "epoch": 0.36, "learning_rate": 7.07850608746261e-05, "loss": 2.2246, "step": 42665 }, { "epoch": 0.36, "learning_rate": 7.077895986768588e-05, "loss": 2.252, "step": 42670 }, { "epoch": 0.36, "learning_rate": 7.077285848676114e-05, "loss": 2.3215, "step": 42675 }, { "epoch": 0.36, "learning_rate": 7.07667567319617e-05, "loss": 2.3083, "step": 42680 }, { "epoch": 0.36, "learning_rate": 7.076065460339739e-05, "loss": 2.3229, "step": 42685 }, { "epoch": 0.36, "learning_rate": 7.075455210117803e-05, "loss": 2.3053, "step": 42690 }, { "epoch": 0.36, "learning_rate": 7.074844922541345e-05, "loss": 2.2056, "step": 42695 }, { "epoch": 0.36, "learning_rate": 7.074234597621348e-05, "loss": 2.2585, "step": 42700 }, { "epoch": 0.36, "learning_rate": 7.0736242353688e-05, "loss": 2.3145, "step": 42705 }, { "epoch": 0.36, "learning_rate": 7.073013835794684e-05, "loss": 2.3331, "step": 42710 }, { "epoch": 0.36, "learning_rate": 7.072403398909986e-05, "loss": 2.3156, "step": 42715 }, { "epoch": 0.36, "learning_rate": 7.071792924725695e-05, "loss": 2.3099, "step": 42720 }, { "epoch": 0.36, "learning_rate": 7.071182413252798e-05, "loss": 2.2966, "step": 42725 }, { "epoch": 0.36, "learning_rate": 7.070571864502278e-05, "loss": 2.362, "step": 42730 }, { "epoch": 0.36, "learning_rate": 7.06996127848513e-05, "loss": 2.3058, "step": 42735 }, { "epoch": 0.36, "learning_rate": 7.069350655212342e-05, "loss": 2.3118, "step": 42740 }, { "epoch": 0.36, "learning_rate": 7.068739994694902e-05, "loss": 2.223, "step": 42745 }, { "epoch": 0.36, "learning_rate": 7.068129296943804e-05, "loss": 2.3032, "step": 42750 }, { "epoch": 0.36, "learning_rate": 7.067518561970037e-05, "loss": 2.279, "step": 42755 }, { "epoch": 0.36, "learning_rate": 7.066907789784594e-05, "loss": 2.2535, "step": 42760 }, { "epoch": 0.36, "learning_rate": 7.066296980398469e-05, "loss": 2.3646, "step": 42765 }, { "epoch": 0.36, "learning_rate": 7.065686133822651e-05, "loss": 2.3454, "step": 42770 }, { "epoch": 0.37, "learning_rate": 7.06507525006814e-05, "loss": 2.3064, "step": 42775 }, { "epoch": 0.37, "learning_rate": 7.064464329145928e-05, "loss": 2.208, "step": 42780 }, { "epoch": 0.37, "learning_rate": 7.063853371067011e-05, "loss": 2.3078, "step": 42785 }, { "epoch": 0.37, "learning_rate": 7.063242375842384e-05, "loss": 2.4373, "step": 42790 }, { "epoch": 0.37, "learning_rate": 7.062631343483044e-05, "loss": 2.2966, "step": 42795 }, { "epoch": 0.37, "learning_rate": 7.06202027399999e-05, "loss": 2.3009, "step": 42800 }, { "epoch": 0.37, "learning_rate": 7.06140916740422e-05, "loss": 2.2831, "step": 42805 }, { "epoch": 0.37, "learning_rate": 7.060798023706732e-05, "loss": 2.351, "step": 42810 }, { "epoch": 0.37, "learning_rate": 7.060186842918526e-05, "loss": 2.2467, "step": 42815 }, { "epoch": 0.37, "learning_rate": 7.059575625050602e-05, "loss": 2.3326, "step": 42820 }, { "epoch": 0.37, "learning_rate": 7.058964370113959e-05, "loss": 2.3048, "step": 42825 }, { "epoch": 0.37, "learning_rate": 7.058353078119601e-05, "loss": 2.2665, "step": 42830 }, { "epoch": 0.37, "learning_rate": 7.057741749078531e-05, "loss": 2.3494, "step": 42835 }, { "epoch": 0.37, "learning_rate": 7.057130383001749e-05, "loss": 2.2026, "step": 42840 }, { "epoch": 0.37, "learning_rate": 7.056518979900259e-05, "loss": 2.312, "step": 42845 }, { "epoch": 0.37, "learning_rate": 7.055907539785067e-05, "loss": 2.3179, "step": 42850 }, { "epoch": 0.37, "learning_rate": 7.055296062667177e-05, "loss": 2.2285, "step": 42855 }, { "epoch": 0.37, "learning_rate": 7.054684548557593e-05, "loss": 2.3459, "step": 42860 }, { "epoch": 0.37, "learning_rate": 7.054072997467325e-05, "loss": 2.2615, "step": 42865 }, { "epoch": 0.37, "learning_rate": 7.053461409407374e-05, "loss": 2.3299, "step": 42870 }, { "epoch": 0.37, "learning_rate": 7.052849784388753e-05, "loss": 2.3148, "step": 42875 }, { "epoch": 0.37, "learning_rate": 7.052238122422467e-05, "loss": 2.2688, "step": 42880 }, { "epoch": 0.37, "learning_rate": 7.051626423519528e-05, "loss": 2.3241, "step": 42885 }, { "epoch": 0.37, "learning_rate": 7.05101468769094e-05, "loss": 2.2744, "step": 42890 }, { "epoch": 0.37, "learning_rate": 7.050402914947719e-05, "loss": 2.3351, "step": 42895 }, { "epoch": 0.37, "learning_rate": 7.049791105300871e-05, "loss": 2.387, "step": 42900 }, { "epoch": 0.37, "learning_rate": 7.049179258761411e-05, "loss": 2.3927, "step": 42905 }, { "epoch": 0.37, "learning_rate": 7.04856737534035e-05, "loss": 2.4157, "step": 42910 }, { "epoch": 0.37, "learning_rate": 7.047955455048702e-05, "loss": 2.4037, "step": 42915 }, { "epoch": 0.37, "learning_rate": 7.047343497897477e-05, "loss": 2.3442, "step": 42920 }, { "epoch": 0.37, "learning_rate": 7.046731503897694e-05, "loss": 2.3654, "step": 42925 }, { "epoch": 0.37, "learning_rate": 7.046119473060363e-05, "loss": 2.3315, "step": 42930 }, { "epoch": 0.37, "learning_rate": 7.045507405396502e-05, "loss": 2.3111, "step": 42935 }, { "epoch": 0.37, "learning_rate": 7.044895300917125e-05, "loss": 2.2665, "step": 42940 }, { "epoch": 0.37, "learning_rate": 7.044283159633254e-05, "loss": 2.2842, "step": 42945 }, { "epoch": 0.37, "learning_rate": 7.043670981555902e-05, "loss": 2.3328, "step": 42950 }, { "epoch": 0.37, "learning_rate": 7.043058766696089e-05, "loss": 2.3714, "step": 42955 }, { "epoch": 0.37, "learning_rate": 7.042446515064831e-05, "loss": 2.2075, "step": 42960 }, { "epoch": 0.37, "learning_rate": 7.04183422667315e-05, "loss": 2.3473, "step": 42965 }, { "epoch": 0.37, "learning_rate": 7.041221901532065e-05, "loss": 2.3926, "step": 42970 }, { "epoch": 0.37, "learning_rate": 7.0406095396526e-05, "loss": 2.3513, "step": 42975 }, { "epoch": 0.37, "learning_rate": 7.039997141045772e-05, "loss": 2.2736, "step": 42980 }, { "epoch": 0.37, "learning_rate": 7.039384705722604e-05, "loss": 2.3515, "step": 42985 }, { "epoch": 0.37, "learning_rate": 7.038772233694121e-05, "loss": 2.3317, "step": 42990 }, { "epoch": 0.37, "learning_rate": 7.038159724971343e-05, "loss": 2.2747, "step": 42995 }, { "epoch": 0.37, "learning_rate": 7.037547179565298e-05, "loss": 2.3242, "step": 43000 }, { "epoch": 0.37, "learning_rate": 7.036934597487007e-05, "loss": 2.2716, "step": 43005 }, { "epoch": 0.37, "learning_rate": 7.0363219787475e-05, "loss": 2.2639, "step": 43010 }, { "epoch": 0.37, "learning_rate": 7.035709323357798e-05, "loss": 2.2807, "step": 43015 }, { "epoch": 0.37, "learning_rate": 7.03509663132893e-05, "loss": 2.2606, "step": 43020 }, { "epoch": 0.37, "learning_rate": 7.034483902671924e-05, "loss": 2.3787, "step": 43025 }, { "epoch": 0.37, "learning_rate": 7.033871137397808e-05, "loss": 2.3304, "step": 43030 }, { "epoch": 0.37, "learning_rate": 7.033258335517607e-05, "loss": 2.3063, "step": 43035 }, { "epoch": 0.37, "learning_rate": 7.032645497042358e-05, "loss": 2.2689, "step": 43040 }, { "epoch": 0.37, "learning_rate": 7.032032621983083e-05, "loss": 2.3829, "step": 43045 }, { "epoch": 0.37, "learning_rate": 7.031419710350815e-05, "loss": 2.3365, "step": 43050 }, { "epoch": 0.37, "learning_rate": 7.03080676215659e-05, "loss": 2.3114, "step": 43055 }, { "epoch": 0.37, "learning_rate": 7.030193777411435e-05, "loss": 2.3787, "step": 43060 }, { "epoch": 0.37, "learning_rate": 7.029580756126382e-05, "loss": 2.2811, "step": 43065 }, { "epoch": 0.37, "learning_rate": 7.02896769831247e-05, "loss": 2.2749, "step": 43070 }, { "epoch": 0.37, "learning_rate": 7.028354603980727e-05, "loss": 2.2689, "step": 43075 }, { "epoch": 0.37, "learning_rate": 7.02774147314219e-05, "loss": 2.2801, "step": 43080 }, { "epoch": 0.37, "learning_rate": 7.027128305807893e-05, "loss": 2.2604, "step": 43085 }, { "epoch": 0.37, "learning_rate": 7.026515101988877e-05, "loss": 2.3246, "step": 43090 }, { "epoch": 0.37, "learning_rate": 7.025901861696171e-05, "loss": 2.3138, "step": 43095 }, { "epoch": 0.37, "learning_rate": 7.025288584940817e-05, "loss": 2.3585, "step": 43100 }, { "epoch": 0.37, "learning_rate": 7.024675271733851e-05, "loss": 2.2939, "step": 43105 }, { "epoch": 0.37, "learning_rate": 7.024061922086313e-05, "loss": 2.3414, "step": 43110 }, { "epoch": 0.37, "learning_rate": 7.023448536009241e-05, "loss": 2.295, "step": 43115 }, { "epoch": 0.37, "learning_rate": 7.022835113513677e-05, "loss": 2.2277, "step": 43120 }, { "epoch": 0.37, "learning_rate": 7.02222165461066e-05, "loss": 2.3546, "step": 43125 }, { "epoch": 0.37, "learning_rate": 7.02160815931123e-05, "loss": 2.3336, "step": 43130 }, { "epoch": 0.37, "learning_rate": 7.02099462762643e-05, "loss": 2.2595, "step": 43135 }, { "epoch": 0.37, "learning_rate": 7.020381059567304e-05, "loss": 2.3047, "step": 43140 }, { "epoch": 0.37, "learning_rate": 7.01976745514489e-05, "loss": 2.3494, "step": 43145 }, { "epoch": 0.37, "learning_rate": 7.019153814370239e-05, "loss": 2.3898, "step": 43150 }, { "epoch": 0.37, "learning_rate": 7.01854013725439e-05, "loss": 2.3503, "step": 43155 }, { "epoch": 0.37, "learning_rate": 7.01792642380839e-05, "loss": 2.3245, "step": 43160 }, { "epoch": 0.37, "learning_rate": 7.017312674043285e-05, "loss": 2.1623, "step": 43165 }, { "epoch": 0.37, "learning_rate": 7.016698887970121e-05, "loss": 2.3056, "step": 43170 }, { "epoch": 0.37, "learning_rate": 7.016085065599945e-05, "loss": 2.3889, "step": 43175 }, { "epoch": 0.37, "learning_rate": 7.015471206943806e-05, "loss": 2.3174, "step": 43180 }, { "epoch": 0.37, "learning_rate": 7.014857312012751e-05, "loss": 2.2636, "step": 43185 }, { "epoch": 0.37, "learning_rate": 7.014243380817827e-05, "loss": 2.2509, "step": 43190 }, { "epoch": 0.37, "learning_rate": 7.013629413370087e-05, "loss": 2.388, "step": 43195 }, { "epoch": 0.37, "learning_rate": 7.013015409680581e-05, "loss": 2.4244, "step": 43200 }, { "epoch": 0.37, "learning_rate": 7.012401369760359e-05, "loss": 2.2961, "step": 43205 }, { "epoch": 0.37, "learning_rate": 7.011787293620473e-05, "loss": 2.3359, "step": 43210 }, { "epoch": 0.37, "learning_rate": 7.011173181271975e-05, "loss": 2.356, "step": 43215 }, { "epoch": 0.37, "learning_rate": 7.010559032725918e-05, "loss": 2.2876, "step": 43220 }, { "epoch": 0.37, "learning_rate": 7.009944847993356e-05, "loss": 2.3955, "step": 43225 }, { "epoch": 0.37, "learning_rate": 7.009330627085343e-05, "loss": 2.3108, "step": 43230 }, { "epoch": 0.37, "learning_rate": 7.008716370012933e-05, "loss": 2.2587, "step": 43235 }, { "epoch": 0.37, "learning_rate": 7.008102076787183e-05, "loss": 2.3213, "step": 43240 }, { "epoch": 0.37, "learning_rate": 7.007487747419149e-05, "loss": 2.2514, "step": 43245 }, { "epoch": 0.37, "learning_rate": 7.006873381919887e-05, "loss": 2.3427, "step": 43250 }, { "epoch": 0.37, "learning_rate": 7.006258980300454e-05, "loss": 2.3497, "step": 43255 }, { "epoch": 0.37, "learning_rate": 7.00564454257191e-05, "loss": 2.3693, "step": 43260 }, { "epoch": 0.37, "learning_rate": 7.005030068745312e-05, "loss": 2.1948, "step": 43265 }, { "epoch": 0.37, "learning_rate": 7.004415558831721e-05, "loss": 2.3412, "step": 43270 }, { "epoch": 0.37, "learning_rate": 7.003801012842195e-05, "loss": 2.2416, "step": 43275 }, { "epoch": 0.37, "learning_rate": 7.003186430787797e-05, "loss": 2.3456, "step": 43280 }, { "epoch": 0.37, "learning_rate": 7.00257181267959e-05, "loss": 2.3615, "step": 43285 }, { "epoch": 0.37, "learning_rate": 7.001957158528629e-05, "loss": 2.3287, "step": 43290 }, { "epoch": 0.37, "learning_rate": 7.001342468345983e-05, "loss": 2.3302, "step": 43295 }, { "epoch": 0.37, "learning_rate": 7.000727742142715e-05, "loss": 2.3472, "step": 43300 }, { "epoch": 0.37, "learning_rate": 7.000112979929884e-05, "loss": 2.2546, "step": 43305 }, { "epoch": 0.37, "learning_rate": 6.999498181718563e-05, "loss": 2.3018, "step": 43310 }, { "epoch": 0.37, "learning_rate": 6.99888334751981e-05, "loss": 2.4166, "step": 43315 }, { "epoch": 0.37, "learning_rate": 6.998268477344693e-05, "loss": 2.2883, "step": 43320 }, { "epoch": 0.37, "learning_rate": 6.99765357120428e-05, "loss": 2.2849, "step": 43325 }, { "epoch": 0.37, "learning_rate": 6.997038629109636e-05, "loss": 2.3272, "step": 43330 }, { "epoch": 0.37, "learning_rate": 6.99642365107183e-05, "loss": 2.3646, "step": 43335 }, { "epoch": 0.37, "learning_rate": 6.99580863710193e-05, "loss": 2.337, "step": 43340 }, { "epoch": 0.37, "learning_rate": 6.995193587211008e-05, "loss": 2.274, "step": 43345 }, { "epoch": 0.37, "learning_rate": 6.99457850141013e-05, "loss": 2.2888, "step": 43350 }, { "epoch": 0.37, "learning_rate": 6.993963379710366e-05, "loss": 2.3301, "step": 43355 }, { "epoch": 0.37, "learning_rate": 6.993348222122792e-05, "loss": 2.2801, "step": 43360 }, { "epoch": 0.37, "learning_rate": 6.992733028658477e-05, "loss": 2.2347, "step": 43365 }, { "epoch": 0.37, "learning_rate": 6.992117799328492e-05, "loss": 2.2737, "step": 43370 }, { "epoch": 0.37, "learning_rate": 6.991502534143912e-05, "loss": 2.3031, "step": 43375 }, { "epoch": 0.37, "learning_rate": 6.99088723311581e-05, "loss": 2.3136, "step": 43380 }, { "epoch": 0.37, "learning_rate": 6.990271896255259e-05, "loss": 2.3688, "step": 43385 }, { "epoch": 0.37, "learning_rate": 6.989656523573336e-05, "loss": 2.2899, "step": 43390 }, { "epoch": 0.37, "learning_rate": 6.989041115081116e-05, "loss": 2.3234, "step": 43395 }, { "epoch": 0.37, "learning_rate": 6.988425670789674e-05, "loss": 2.3398, "step": 43400 }, { "epoch": 0.37, "learning_rate": 6.987810190710089e-05, "loss": 2.2971, "step": 43405 }, { "epoch": 0.37, "learning_rate": 6.987194674853438e-05, "loss": 2.3256, "step": 43410 }, { "epoch": 0.37, "learning_rate": 6.986579123230798e-05, "loss": 2.3687, "step": 43415 }, { "epoch": 0.37, "learning_rate": 6.985963535853248e-05, "loss": 2.3059, "step": 43420 }, { "epoch": 0.37, "learning_rate": 6.98534791273187e-05, "loss": 2.3242, "step": 43425 }, { "epoch": 0.37, "learning_rate": 6.984732253877742e-05, "loss": 2.3662, "step": 43430 }, { "epoch": 0.37, "learning_rate": 6.984116559301944e-05, "loss": 2.3616, "step": 43435 }, { "epoch": 0.37, "learning_rate": 6.983500829015559e-05, "loss": 2.2699, "step": 43440 }, { "epoch": 0.37, "learning_rate": 6.982885063029668e-05, "loss": 2.2583, "step": 43445 }, { "epoch": 0.37, "learning_rate": 6.982269261355354e-05, "loss": 2.3615, "step": 43450 }, { "epoch": 0.37, "learning_rate": 6.9816534240037e-05, "loss": 2.3501, "step": 43455 }, { "epoch": 0.37, "learning_rate": 6.981037550985792e-05, "loss": 2.3095, "step": 43460 }, { "epoch": 0.37, "learning_rate": 6.980421642312711e-05, "loss": 2.3254, "step": 43465 }, { "epoch": 0.37, "learning_rate": 6.979805697995547e-05, "loss": 2.3261, "step": 43470 }, { "epoch": 0.37, "learning_rate": 6.979189718045383e-05, "loss": 2.2475, "step": 43475 }, { "epoch": 0.37, "learning_rate": 6.978573702473303e-05, "loss": 2.294, "step": 43480 }, { "epoch": 0.37, "learning_rate": 6.9779576512904e-05, "loss": 2.3468, "step": 43485 }, { "epoch": 0.37, "learning_rate": 6.977341564507757e-05, "loss": 2.2777, "step": 43490 }, { "epoch": 0.37, "learning_rate": 6.976725442136466e-05, "loss": 2.2785, "step": 43495 }, { "epoch": 0.37, "learning_rate": 6.976109284187614e-05, "loss": 2.3392, "step": 43500 }, { "epoch": 0.37, "learning_rate": 6.97549309067229e-05, "loss": 2.3519, "step": 43505 }, { "epoch": 0.37, "learning_rate": 6.974876861601587e-05, "loss": 2.3423, "step": 43510 }, { "epoch": 0.37, "learning_rate": 6.974260596986593e-05, "loss": 2.2848, "step": 43515 }, { "epoch": 0.37, "learning_rate": 6.973644296838403e-05, "loss": 2.3059, "step": 43520 }, { "epoch": 0.37, "learning_rate": 6.973027961168108e-05, "loss": 2.2967, "step": 43525 }, { "epoch": 0.37, "learning_rate": 6.972411589986798e-05, "loss": 2.2811, "step": 43530 }, { "epoch": 0.37, "learning_rate": 6.971795183305572e-05, "loss": 2.4061, "step": 43535 }, { "epoch": 0.37, "learning_rate": 6.97117874113552e-05, "loss": 2.363, "step": 43540 }, { "epoch": 0.37, "learning_rate": 6.970562263487738e-05, "loss": 2.4045, "step": 43545 }, { "epoch": 0.37, "learning_rate": 6.969945750373322e-05, "loss": 2.2573, "step": 43550 }, { "epoch": 0.37, "learning_rate": 6.96932920180337e-05, "loss": 2.2761, "step": 43555 }, { "epoch": 0.37, "learning_rate": 6.968712617788972e-05, "loss": 2.3837, "step": 43560 }, { "epoch": 0.37, "learning_rate": 6.968095998341233e-05, "loss": 2.3567, "step": 43565 }, { "epoch": 0.37, "learning_rate": 6.967479343471249e-05, "loss": 2.3212, "step": 43570 }, { "epoch": 0.37, "learning_rate": 6.966862653190117e-05, "loss": 2.3471, "step": 43575 }, { "epoch": 0.37, "learning_rate": 6.966245927508937e-05, "loss": 2.355, "step": 43580 }, { "epoch": 0.37, "learning_rate": 6.965629166438809e-05, "loss": 2.1659, "step": 43585 }, { "epoch": 0.37, "learning_rate": 6.965012369990835e-05, "loss": 2.3609, "step": 43590 }, { "epoch": 0.37, "learning_rate": 6.964395538176113e-05, "loss": 2.2417, "step": 43595 }, { "epoch": 0.37, "learning_rate": 6.963778671005747e-05, "loss": 2.35, "step": 43600 }, { "epoch": 0.37, "learning_rate": 6.963161768490843e-05, "loss": 2.4102, "step": 43605 }, { "epoch": 0.37, "learning_rate": 6.962544830642494e-05, "loss": 2.2666, "step": 43610 }, { "epoch": 0.37, "learning_rate": 6.961927857471816e-05, "loss": 2.333, "step": 43615 }, { "epoch": 0.37, "learning_rate": 6.961310848989906e-05, "loss": 2.3242, "step": 43620 }, { "epoch": 0.37, "learning_rate": 6.96069380520787e-05, "loss": 2.2917, "step": 43625 }, { "epoch": 0.37, "learning_rate": 6.960076726136817e-05, "loss": 2.2369, "step": 43630 }, { "epoch": 0.37, "learning_rate": 6.959459611787849e-05, "loss": 2.3185, "step": 43635 }, { "epoch": 0.37, "learning_rate": 6.958842462172075e-05, "loss": 2.3267, "step": 43640 }, { "epoch": 0.37, "learning_rate": 6.958225277300603e-05, "loss": 2.3539, "step": 43645 }, { "epoch": 0.37, "learning_rate": 6.95760805718454e-05, "loss": 2.2788, "step": 43650 }, { "epoch": 0.37, "learning_rate": 6.956990801834996e-05, "loss": 2.3428, "step": 43655 }, { "epoch": 0.37, "learning_rate": 6.956373511263079e-05, "loss": 2.3902, "step": 43660 }, { "epoch": 0.37, "learning_rate": 6.955756185479901e-05, "loss": 2.3339, "step": 43665 }, { "epoch": 0.37, "learning_rate": 6.955138824496573e-05, "loss": 2.2709, "step": 43670 }, { "epoch": 0.37, "learning_rate": 6.954521428324203e-05, "loss": 2.2784, "step": 43675 }, { "epoch": 0.37, "learning_rate": 6.953903996973908e-05, "loss": 2.3112, "step": 43680 }, { "epoch": 0.37, "learning_rate": 6.953286530456797e-05, "loss": 2.3487, "step": 43685 }, { "epoch": 0.37, "learning_rate": 6.952669028783984e-05, "loss": 2.3372, "step": 43690 }, { "epoch": 0.37, "learning_rate": 6.952051491966585e-05, "loss": 2.2584, "step": 43695 }, { "epoch": 0.37, "learning_rate": 6.951433920015711e-05, "loss": 2.3397, "step": 43700 }, { "epoch": 0.37, "learning_rate": 6.95081631294248e-05, "loss": 2.2558, "step": 43705 }, { "epoch": 0.37, "learning_rate": 6.950198670758006e-05, "loss": 2.4365, "step": 43710 }, { "epoch": 0.37, "learning_rate": 6.949580993473407e-05, "loss": 2.3263, "step": 43715 }, { "epoch": 0.37, "learning_rate": 6.948963281099799e-05, "loss": 2.3519, "step": 43720 }, { "epoch": 0.37, "learning_rate": 6.948345533648301e-05, "loss": 2.3434, "step": 43725 }, { "epoch": 0.37, "learning_rate": 6.947727751130032e-05, "loss": 2.3817, "step": 43730 }, { "epoch": 0.37, "learning_rate": 6.947109933556106e-05, "loss": 2.3836, "step": 43735 }, { "epoch": 0.37, "learning_rate": 6.946492080937647e-05, "loss": 2.2296, "step": 43740 }, { "epoch": 0.37, "learning_rate": 6.945874193285777e-05, "loss": 2.3545, "step": 43745 }, { "epoch": 0.37, "learning_rate": 6.945256270611613e-05, "loss": 2.3832, "step": 43750 }, { "epoch": 0.37, "learning_rate": 6.944638312926277e-05, "loss": 2.3116, "step": 43755 }, { "epoch": 0.37, "learning_rate": 6.944020320240893e-05, "loss": 2.3391, "step": 43760 }, { "epoch": 0.37, "learning_rate": 6.943402292566583e-05, "loss": 2.3267, "step": 43765 }, { "epoch": 0.37, "learning_rate": 6.942784229914468e-05, "loss": 2.3502, "step": 43770 }, { "epoch": 0.37, "learning_rate": 6.942166132295678e-05, "loss": 2.2787, "step": 43775 }, { "epoch": 0.37, "learning_rate": 6.941547999721332e-05, "loss": 2.2874, "step": 43780 }, { "epoch": 0.37, "learning_rate": 6.940929832202556e-05, "loss": 2.3403, "step": 43785 }, { "epoch": 0.37, "learning_rate": 6.940311629750477e-05, "loss": 2.3768, "step": 43790 }, { "epoch": 0.37, "learning_rate": 6.939693392376224e-05, "loss": 2.2546, "step": 43795 }, { "epoch": 0.37, "learning_rate": 6.939075120090921e-05, "loss": 2.3553, "step": 43800 }, { "epoch": 0.37, "learning_rate": 6.938456812905695e-05, "loss": 2.3004, "step": 43805 }, { "epoch": 0.37, "learning_rate": 6.93783847083168e-05, "loss": 2.4162, "step": 43810 }, { "epoch": 0.37, "learning_rate": 6.937220093879997e-05, "loss": 2.3154, "step": 43815 }, { "epoch": 0.37, "learning_rate": 6.93660168206178e-05, "loss": 2.273, "step": 43820 }, { "epoch": 0.37, "learning_rate": 6.93598323538816e-05, "loss": 2.3508, "step": 43825 }, { "epoch": 0.37, "learning_rate": 6.935364753870268e-05, "loss": 2.3635, "step": 43830 }, { "epoch": 0.37, "learning_rate": 6.934746237519235e-05, "loss": 2.2246, "step": 43835 }, { "epoch": 0.37, "learning_rate": 6.934127686346191e-05, "loss": 2.3883, "step": 43840 }, { "epoch": 0.37, "learning_rate": 6.933509100362271e-05, "loss": 2.392, "step": 43845 }, { "epoch": 0.37, "learning_rate": 6.93289047957861e-05, "loss": 2.3301, "step": 43850 }, { "epoch": 0.37, "learning_rate": 6.932271824006338e-05, "loss": 2.3579, "step": 43855 }, { "epoch": 0.37, "learning_rate": 6.931653133656594e-05, "loss": 2.2974, "step": 43860 }, { "epoch": 0.37, "learning_rate": 6.931034408540509e-05, "loss": 2.2611, "step": 43865 }, { "epoch": 0.37, "learning_rate": 6.930415648669223e-05, "loss": 2.2887, "step": 43870 }, { "epoch": 0.37, "learning_rate": 6.929796854053869e-05, "loss": 2.3162, "step": 43875 }, { "epoch": 0.37, "learning_rate": 6.929178024705587e-05, "loss": 2.3739, "step": 43880 }, { "epoch": 0.37, "learning_rate": 6.928559160635514e-05, "loss": 2.2776, "step": 43885 }, { "epoch": 0.37, "learning_rate": 6.927940261854789e-05, "loss": 2.3288, "step": 43890 }, { "epoch": 0.37, "learning_rate": 6.92732132837455e-05, "loss": 2.2509, "step": 43895 }, { "epoch": 0.37, "learning_rate": 6.926702360205937e-05, "loss": 2.2714, "step": 43900 }, { "epoch": 0.37, "learning_rate": 6.92608335736009e-05, "loss": 2.2304, "step": 43905 }, { "epoch": 0.37, "learning_rate": 6.925464319848151e-05, "loss": 2.3564, "step": 43910 }, { "epoch": 0.37, "learning_rate": 6.92484524768126e-05, "loss": 2.3534, "step": 43915 }, { "epoch": 0.37, "learning_rate": 6.92422614087056e-05, "loss": 2.2597, "step": 43920 }, { "epoch": 0.37, "learning_rate": 6.923606999427196e-05, "loss": 2.3984, "step": 43925 }, { "epoch": 0.37, "learning_rate": 6.922987823362307e-05, "loss": 2.333, "step": 43930 }, { "epoch": 0.37, "learning_rate": 6.92236861268704e-05, "loss": 2.3529, "step": 43935 }, { "epoch": 0.37, "learning_rate": 6.921749367412541e-05, "loss": 2.2788, "step": 43940 }, { "epoch": 0.38, "learning_rate": 6.921130087549952e-05, "loss": 2.4015, "step": 43945 }, { "epoch": 0.38, "learning_rate": 6.920510773110421e-05, "loss": 2.2081, "step": 43950 }, { "epoch": 0.38, "learning_rate": 6.919891424105094e-05, "loss": 2.2484, "step": 43955 }, { "epoch": 0.38, "learning_rate": 6.919272040545118e-05, "loss": 2.2708, "step": 43960 }, { "epoch": 0.38, "learning_rate": 6.918652622441642e-05, "loss": 2.2812, "step": 43965 }, { "epoch": 0.38, "learning_rate": 6.918033169805811e-05, "loss": 2.361, "step": 43970 }, { "epoch": 0.38, "learning_rate": 6.917413682648779e-05, "loss": 2.3159, "step": 43975 }, { "epoch": 0.38, "learning_rate": 6.916794160981692e-05, "loss": 2.3815, "step": 43980 }, { "epoch": 0.38, "learning_rate": 6.916174604815702e-05, "loss": 2.3295, "step": 43985 }, { "epoch": 0.38, "learning_rate": 6.915555014161958e-05, "loss": 2.2889, "step": 43990 }, { "epoch": 0.38, "learning_rate": 6.914935389031614e-05, "loss": 2.1851, "step": 43995 }, { "epoch": 0.38, "learning_rate": 6.91431572943582e-05, "loss": 2.2409, "step": 44000 }, { "epoch": 0.38, "learning_rate": 6.913696035385733e-05, "loss": 2.2183, "step": 44005 }, { "epoch": 0.38, "learning_rate": 6.913076306892499e-05, "loss": 2.2736, "step": 44010 }, { "epoch": 0.38, "learning_rate": 6.912456543967281e-05, "loss": 2.3325, "step": 44015 }, { "epoch": 0.38, "learning_rate": 6.911836746621226e-05, "loss": 2.3526, "step": 44020 }, { "epoch": 0.38, "learning_rate": 6.91121691486549e-05, "loss": 2.2949, "step": 44025 }, { "epoch": 0.38, "learning_rate": 6.910597048711235e-05, "loss": 2.2912, "step": 44030 }, { "epoch": 0.38, "learning_rate": 6.909977148169612e-05, "loss": 2.3405, "step": 44035 }, { "epoch": 0.38, "learning_rate": 6.909357213251779e-05, "loss": 2.3484, "step": 44040 }, { "epoch": 0.38, "learning_rate": 6.908737243968896e-05, "loss": 2.337, "step": 44045 }, { "epoch": 0.38, "learning_rate": 6.908117240332119e-05, "loss": 2.259, "step": 44050 }, { "epoch": 0.38, "learning_rate": 6.907497202352606e-05, "loss": 2.3002, "step": 44055 }, { "epoch": 0.38, "learning_rate": 6.90687713004152e-05, "loss": 2.3109, "step": 44060 }, { "epoch": 0.38, "learning_rate": 6.906257023410021e-05, "loss": 2.3483, "step": 44065 }, { "epoch": 0.38, "learning_rate": 6.905636882469265e-05, "loss": 2.2394, "step": 44070 }, { "epoch": 0.38, "learning_rate": 6.905016707230418e-05, "loss": 2.366, "step": 44075 }, { "epoch": 0.38, "learning_rate": 6.904396497704641e-05, "loss": 2.2961, "step": 44080 }, { "epoch": 0.38, "learning_rate": 6.903776253903098e-05, "loss": 2.2677, "step": 44085 }, { "epoch": 0.38, "learning_rate": 6.903155975836948e-05, "loss": 2.361, "step": 44090 }, { "epoch": 0.38, "learning_rate": 6.902535663517359e-05, "loss": 2.2894, "step": 44095 }, { "epoch": 0.38, "learning_rate": 6.901915316955495e-05, "loss": 2.3392, "step": 44100 }, { "epoch": 0.38, "learning_rate": 6.901294936162518e-05, "loss": 2.3133, "step": 44105 }, { "epoch": 0.38, "learning_rate": 6.9006745211496e-05, "loss": 2.3838, "step": 44110 }, { "epoch": 0.38, "learning_rate": 6.900054071927901e-05, "loss": 2.2921, "step": 44115 }, { "epoch": 0.38, "learning_rate": 6.899433588508591e-05, "loss": 2.3151, "step": 44120 }, { "epoch": 0.38, "learning_rate": 6.898813070902836e-05, "loss": 2.2821, "step": 44125 }, { "epoch": 0.38, "learning_rate": 6.898192519121805e-05, "loss": 2.3131, "step": 44130 }, { "epoch": 0.38, "learning_rate": 6.897571933176669e-05, "loss": 2.3297, "step": 44135 }, { "epoch": 0.38, "learning_rate": 6.896951313078593e-05, "loss": 2.3013, "step": 44140 }, { "epoch": 0.38, "learning_rate": 6.896330658838753e-05, "loss": 2.3051, "step": 44145 }, { "epoch": 0.38, "learning_rate": 6.895709970468315e-05, "loss": 2.3947, "step": 44150 }, { "epoch": 0.38, "learning_rate": 6.89508924797845e-05, "loss": 2.3047, "step": 44155 }, { "epoch": 0.38, "learning_rate": 6.894468491380332e-05, "loss": 2.3769, "step": 44160 }, { "epoch": 0.38, "learning_rate": 6.893847700685136e-05, "loss": 2.3666, "step": 44165 }, { "epoch": 0.38, "learning_rate": 6.893226875904029e-05, "loss": 2.3753, "step": 44170 }, { "epoch": 0.38, "learning_rate": 6.892606017048188e-05, "loss": 2.2971, "step": 44175 }, { "epoch": 0.38, "learning_rate": 6.891985124128788e-05, "loss": 2.313, "step": 44180 }, { "epoch": 0.38, "learning_rate": 6.891364197157002e-05, "loss": 2.2858, "step": 44185 }, { "epoch": 0.38, "learning_rate": 6.890743236144009e-05, "loss": 2.3193, "step": 44190 }, { "epoch": 0.38, "learning_rate": 6.890122241100983e-05, "loss": 2.3337, "step": 44195 }, { "epoch": 0.38, "learning_rate": 6.889501212039099e-05, "loss": 2.3626, "step": 44200 }, { "epoch": 0.38, "learning_rate": 6.888880148969538e-05, "loss": 2.3133, "step": 44205 }, { "epoch": 0.38, "learning_rate": 6.888259051903475e-05, "loss": 2.3324, "step": 44210 }, { "epoch": 0.38, "learning_rate": 6.88763792085209e-05, "loss": 2.2834, "step": 44215 }, { "epoch": 0.38, "learning_rate": 6.887016755826563e-05, "loss": 2.3016, "step": 44220 }, { "epoch": 0.38, "learning_rate": 6.886395556838072e-05, "loss": 2.283, "step": 44225 }, { "epoch": 0.38, "learning_rate": 6.885774323897801e-05, "loss": 2.3259, "step": 44230 }, { "epoch": 0.38, "learning_rate": 6.885153057016926e-05, "loss": 2.3483, "step": 44235 }, { "epoch": 0.38, "learning_rate": 6.884531756206632e-05, "loss": 2.2994, "step": 44240 }, { "epoch": 0.38, "learning_rate": 6.883910421478102e-05, "loss": 2.4195, "step": 44245 }, { "epoch": 0.38, "learning_rate": 6.883289052842515e-05, "loss": 2.2871, "step": 44250 }, { "epoch": 0.38, "learning_rate": 6.88266765031106e-05, "loss": 2.2734, "step": 44255 }, { "epoch": 0.38, "learning_rate": 6.882046213894917e-05, "loss": 2.3055, "step": 44260 }, { "epoch": 0.38, "learning_rate": 6.881424743605271e-05, "loss": 2.3353, "step": 44265 }, { "epoch": 0.38, "learning_rate": 6.880803239453311e-05, "loss": 2.2782, "step": 44270 }, { "epoch": 0.38, "learning_rate": 6.880181701450218e-05, "loss": 2.3267, "step": 44275 }, { "epoch": 0.38, "learning_rate": 6.879560129607182e-05, "loss": 2.2299, "step": 44280 }, { "epoch": 0.38, "learning_rate": 6.87893852393539e-05, "loss": 2.3926, "step": 44285 }, { "epoch": 0.38, "learning_rate": 6.878316884446027e-05, "loss": 2.2689, "step": 44290 }, { "epoch": 0.38, "learning_rate": 6.877695211150285e-05, "loss": 2.3296, "step": 44295 }, { "epoch": 0.38, "learning_rate": 6.87707350405935e-05, "loss": 2.3415, "step": 44300 }, { "epoch": 0.38, "learning_rate": 6.876451763184413e-05, "loss": 2.4213, "step": 44305 }, { "epoch": 0.38, "learning_rate": 6.875829988536666e-05, "loss": 2.3707, "step": 44310 }, { "epoch": 0.38, "learning_rate": 6.875208180127297e-05, "loss": 2.3972, "step": 44315 }, { "epoch": 0.38, "learning_rate": 6.874586337967498e-05, "loss": 2.3004, "step": 44320 }, { "epoch": 0.38, "learning_rate": 6.873964462068462e-05, "loss": 2.3292, "step": 44325 }, { "epoch": 0.38, "learning_rate": 6.873342552441382e-05, "loss": 2.3166, "step": 44330 }, { "epoch": 0.38, "learning_rate": 6.87272060909745e-05, "loss": 2.385, "step": 44335 }, { "epoch": 0.38, "learning_rate": 6.872098632047861e-05, "loss": 2.352, "step": 44340 }, { "epoch": 0.38, "learning_rate": 6.871476621303808e-05, "loss": 2.2949, "step": 44345 }, { "epoch": 0.38, "learning_rate": 6.870854576876488e-05, "loss": 2.3228, "step": 44350 }, { "epoch": 0.38, "learning_rate": 6.870232498777095e-05, "loss": 2.3266, "step": 44355 }, { "epoch": 0.38, "learning_rate": 6.869610387016825e-05, "loss": 2.3467, "step": 44360 }, { "epoch": 0.38, "learning_rate": 6.868988241606877e-05, "loss": 2.3125, "step": 44365 }, { "epoch": 0.38, "learning_rate": 6.868366062558449e-05, "loss": 2.2763, "step": 44370 }, { "epoch": 0.38, "learning_rate": 6.867743849882736e-05, "loss": 2.4054, "step": 44375 }, { "epoch": 0.38, "learning_rate": 6.867121603590937e-05, "loss": 2.2653, "step": 44380 }, { "epoch": 0.38, "learning_rate": 6.866499323694254e-05, "loss": 2.2913, "step": 44385 }, { "epoch": 0.38, "learning_rate": 6.865877010203887e-05, "loss": 2.3216, "step": 44390 }, { "epoch": 0.38, "learning_rate": 6.865254663131032e-05, "loss": 2.4273, "step": 44395 }, { "epoch": 0.38, "learning_rate": 6.864632282486896e-05, "loss": 2.2789, "step": 44400 }, { "epoch": 0.38, "learning_rate": 6.864009868282677e-05, "loss": 2.3837, "step": 44405 }, { "epoch": 0.38, "learning_rate": 6.863387420529578e-05, "loss": 2.2934, "step": 44410 }, { "epoch": 0.38, "learning_rate": 6.862764939238803e-05, "loss": 2.2842, "step": 44415 }, { "epoch": 0.38, "learning_rate": 6.862142424421554e-05, "loss": 2.3318, "step": 44420 }, { "epoch": 0.38, "learning_rate": 6.861519876089036e-05, "loss": 2.3738, "step": 44425 }, { "epoch": 0.38, "learning_rate": 6.860897294252454e-05, "loss": 2.2729, "step": 44430 }, { "epoch": 0.38, "learning_rate": 6.860274678923014e-05, "loss": 2.2807, "step": 44435 }, { "epoch": 0.38, "learning_rate": 6.859652030111921e-05, "loss": 2.4004, "step": 44440 }, { "epoch": 0.38, "learning_rate": 6.85902934783038e-05, "loss": 2.3385, "step": 44445 }, { "epoch": 0.38, "learning_rate": 6.858406632089602e-05, "loss": 2.3063, "step": 44450 }, { "epoch": 0.38, "learning_rate": 6.857783882900793e-05, "loss": 2.2657, "step": 44455 }, { "epoch": 0.38, "learning_rate": 6.857161100275159e-05, "loss": 2.3639, "step": 44460 }, { "epoch": 0.38, "learning_rate": 6.856538284223912e-05, "loss": 2.2179, "step": 44465 }, { "epoch": 0.38, "learning_rate": 6.855915434758261e-05, "loss": 2.3565, "step": 44470 }, { "epoch": 0.38, "learning_rate": 6.855292551889415e-05, "loss": 2.2476, "step": 44475 }, { "epoch": 0.38, "learning_rate": 6.854669635628586e-05, "loss": 2.2895, "step": 44480 }, { "epoch": 0.38, "learning_rate": 6.854046685986986e-05, "loss": 2.3576, "step": 44485 }, { "epoch": 0.38, "learning_rate": 6.853423702975823e-05, "loss": 2.4017, "step": 44490 }, { "epoch": 0.38, "learning_rate": 6.852800686606316e-05, "loss": 2.2658, "step": 44495 }, { "epoch": 0.38, "learning_rate": 6.852177636889675e-05, "loss": 2.244, "step": 44500 }, { "epoch": 0.38, "learning_rate": 6.85155455383711e-05, "loss": 2.2957, "step": 44505 }, { "epoch": 0.38, "learning_rate": 6.850931437459842e-05, "loss": 2.3209, "step": 44510 }, { "epoch": 0.38, "learning_rate": 6.850308287769083e-05, "loss": 2.2192, "step": 44515 }, { "epoch": 0.38, "learning_rate": 6.849685104776047e-05, "loss": 2.2339, "step": 44520 }, { "epoch": 0.38, "learning_rate": 6.849061888491953e-05, "loss": 2.2724, "step": 44525 }, { "epoch": 0.38, "learning_rate": 6.848438638928015e-05, "loss": 2.3799, "step": 44530 }, { "epoch": 0.38, "learning_rate": 6.847815356095452e-05, "loss": 2.3534, "step": 44535 }, { "epoch": 0.38, "learning_rate": 6.847192040005483e-05, "loss": 2.3486, "step": 44540 }, { "epoch": 0.38, "learning_rate": 6.846568690669324e-05, "loss": 2.3784, "step": 44545 }, { "epoch": 0.38, "learning_rate": 6.845945308098198e-05, "loss": 2.3069, "step": 44550 }, { "epoch": 0.38, "learning_rate": 6.845321892303322e-05, "loss": 2.361, "step": 44555 }, { "epoch": 0.38, "learning_rate": 6.844698443295916e-05, "loss": 2.2849, "step": 44560 }, { "epoch": 0.38, "learning_rate": 6.844074961087202e-05, "loss": 2.3005, "step": 44565 }, { "epoch": 0.38, "learning_rate": 6.843451445688401e-05, "loss": 2.326, "step": 44570 }, { "epoch": 0.38, "learning_rate": 6.842827897110738e-05, "loss": 2.3374, "step": 44575 }, { "epoch": 0.38, "learning_rate": 6.84220431536543e-05, "loss": 2.3587, "step": 44580 }, { "epoch": 0.38, "learning_rate": 6.841580700463704e-05, "loss": 2.3358, "step": 44585 }, { "epoch": 0.38, "learning_rate": 6.840957052416785e-05, "loss": 2.3711, "step": 44590 }, { "epoch": 0.38, "learning_rate": 6.840333371235898e-05, "loss": 2.3891, "step": 44595 }, { "epoch": 0.38, "learning_rate": 6.839709656932262e-05, "loss": 2.3036, "step": 44600 }, { "epoch": 0.38, "learning_rate": 6.839085909517111e-05, "loss": 2.2813, "step": 44605 }, { "epoch": 0.38, "learning_rate": 6.838462129001667e-05, "loss": 2.3176, "step": 44610 }, { "epoch": 0.38, "learning_rate": 6.837838315397156e-05, "loss": 2.2767, "step": 44615 }, { "epoch": 0.38, "learning_rate": 6.837214468714807e-05, "loss": 2.3396, "step": 44620 }, { "epoch": 0.38, "learning_rate": 6.83659058896585e-05, "loss": 2.3378, "step": 44625 }, { "epoch": 0.38, "learning_rate": 6.835966676161509e-05, "loss": 2.2773, "step": 44630 }, { "epoch": 0.38, "learning_rate": 6.835342730313018e-05, "loss": 2.318, "step": 44635 }, { "epoch": 0.38, "learning_rate": 6.834718751431606e-05, "loss": 2.3525, "step": 44640 }, { "epoch": 0.38, "learning_rate": 6.834094739528501e-05, "loss": 2.2451, "step": 44645 }, { "epoch": 0.38, "learning_rate": 6.833470694614937e-05, "loss": 2.3314, "step": 44650 }, { "epoch": 0.38, "learning_rate": 6.832846616702143e-05, "loss": 2.27, "step": 44655 }, { "epoch": 0.38, "learning_rate": 6.832222505801354e-05, "loss": 2.3348, "step": 44660 }, { "epoch": 0.38, "learning_rate": 6.8315983619238e-05, "loss": 2.4192, "step": 44665 }, { "epoch": 0.38, "learning_rate": 6.830974185080718e-05, "loss": 2.2405, "step": 44670 }, { "epoch": 0.38, "learning_rate": 6.83034997528334e-05, "loss": 2.2537, "step": 44675 }, { "epoch": 0.38, "learning_rate": 6.8297257325429e-05, "loss": 2.3301, "step": 44680 }, { "epoch": 0.38, "learning_rate": 6.829101456870634e-05, "loss": 2.4187, "step": 44685 }, { "epoch": 0.38, "learning_rate": 6.82847714827778e-05, "loss": 2.271, "step": 44690 }, { "epoch": 0.38, "learning_rate": 6.82785280677557e-05, "loss": 2.3675, "step": 44695 }, { "epoch": 0.38, "learning_rate": 6.827228432375243e-05, "loss": 2.3434, "step": 44700 }, { "epoch": 0.38, "learning_rate": 6.826604025088039e-05, "loss": 2.2395, "step": 44705 }, { "epoch": 0.38, "learning_rate": 6.825979584925195e-05, "loss": 2.2482, "step": 44710 }, { "epoch": 0.38, "learning_rate": 6.825355111897947e-05, "loss": 2.3286, "step": 44715 }, { "epoch": 0.38, "learning_rate": 6.824730606017537e-05, "loss": 2.3908, "step": 44720 }, { "epoch": 0.38, "learning_rate": 6.824106067295207e-05, "loss": 2.3095, "step": 44725 }, { "epoch": 0.38, "learning_rate": 6.823481495742192e-05, "loss": 2.3759, "step": 44730 }, { "epoch": 0.38, "learning_rate": 6.822856891369739e-05, "loss": 2.2629, "step": 44735 }, { "epoch": 0.38, "learning_rate": 6.822232254189085e-05, "loss": 2.3363, "step": 44740 }, { "epoch": 0.38, "learning_rate": 6.821607584211475e-05, "loss": 2.2682, "step": 44745 }, { "epoch": 0.38, "learning_rate": 6.820982881448151e-05, "loss": 2.3757, "step": 44750 }, { "epoch": 0.38, "learning_rate": 6.820358145910359e-05, "loss": 2.281, "step": 44755 }, { "epoch": 0.38, "learning_rate": 6.819733377609339e-05, "loss": 2.2762, "step": 44760 }, { "epoch": 0.38, "learning_rate": 6.819108576556339e-05, "loss": 2.3153, "step": 44765 }, { "epoch": 0.38, "learning_rate": 6.818483742762602e-05, "loss": 2.2861, "step": 44770 }, { "epoch": 0.38, "learning_rate": 6.817858876239376e-05, "loss": 2.3498, "step": 44775 }, { "epoch": 0.38, "learning_rate": 6.817233976997908e-05, "loss": 2.3409, "step": 44780 }, { "epoch": 0.38, "learning_rate": 6.816609045049441e-05, "loss": 2.3984, "step": 44785 }, { "epoch": 0.38, "learning_rate": 6.815984080405226e-05, "loss": 2.3328, "step": 44790 }, { "epoch": 0.38, "learning_rate": 6.815359083076511e-05, "loss": 2.2444, "step": 44795 }, { "epoch": 0.38, "learning_rate": 6.814734053074546e-05, "loss": 2.3454, "step": 44800 }, { "epoch": 0.38, "learning_rate": 6.814108990410576e-05, "loss": 2.3372, "step": 44805 }, { "epoch": 0.38, "learning_rate": 6.813483895095854e-05, "loss": 2.375, "step": 44810 }, { "epoch": 0.38, "learning_rate": 6.812858767141633e-05, "loss": 2.3848, "step": 44815 }, { "epoch": 0.38, "learning_rate": 6.81223360655916e-05, "loss": 2.2725, "step": 44820 }, { "epoch": 0.38, "learning_rate": 6.811608413359688e-05, "loss": 2.2607, "step": 44825 }, { "epoch": 0.38, "learning_rate": 6.810983187554472e-05, "loss": 2.2838, "step": 44830 }, { "epoch": 0.38, "learning_rate": 6.81035792915476e-05, "loss": 2.3586, "step": 44835 }, { "epoch": 0.38, "learning_rate": 6.80973263817181e-05, "loss": 2.24, "step": 44840 }, { "epoch": 0.38, "learning_rate": 6.809107314616872e-05, "loss": 2.3102, "step": 44845 }, { "epoch": 0.38, "learning_rate": 6.808481958501207e-05, "loss": 2.284, "step": 44850 }, { "epoch": 0.38, "learning_rate": 6.807856569836065e-05, "loss": 2.2952, "step": 44855 }, { "epoch": 0.38, "learning_rate": 6.807231148632703e-05, "loss": 2.3424, "step": 44860 }, { "epoch": 0.38, "learning_rate": 6.806605694902377e-05, "loss": 2.2857, "step": 44865 }, { "epoch": 0.38, "learning_rate": 6.805980208656346e-05, "loss": 2.284, "step": 44870 }, { "epoch": 0.38, "learning_rate": 6.805354689905867e-05, "loss": 2.3124, "step": 44875 }, { "epoch": 0.38, "learning_rate": 6.804729138662197e-05, "loss": 2.2747, "step": 44880 }, { "epoch": 0.38, "learning_rate": 6.804103554936596e-05, "loss": 2.3463, "step": 44885 }, { "epoch": 0.38, "learning_rate": 6.803477938740323e-05, "loss": 2.3206, "step": 44890 }, { "epoch": 0.38, "learning_rate": 6.802852290084637e-05, "loss": 2.2869, "step": 44895 }, { "epoch": 0.38, "learning_rate": 6.8022266089808e-05, "loss": 2.3043, "step": 44900 }, { "epoch": 0.38, "learning_rate": 6.801600895440072e-05, "loss": 2.3186, "step": 44905 }, { "epoch": 0.38, "learning_rate": 6.800975149473717e-05, "loss": 2.3426, "step": 44910 }, { "epoch": 0.38, "learning_rate": 6.800349371092996e-05, "loss": 2.3072, "step": 44915 }, { "epoch": 0.38, "learning_rate": 6.79972356030917e-05, "loss": 2.2301, "step": 44920 }, { "epoch": 0.38, "learning_rate": 6.799097717133506e-05, "loss": 2.3743, "step": 44925 }, { "epoch": 0.38, "learning_rate": 6.798471841577265e-05, "loss": 2.3163, "step": 44930 }, { "epoch": 0.38, "learning_rate": 6.797845933651712e-05, "loss": 2.269, "step": 44935 }, { "epoch": 0.38, "learning_rate": 6.797219993368116e-05, "loss": 2.3032, "step": 44940 }, { "epoch": 0.38, "learning_rate": 6.796594020737737e-05, "loss": 2.2467, "step": 44945 }, { "epoch": 0.38, "learning_rate": 6.795968015771847e-05, "loss": 2.3058, "step": 44950 }, { "epoch": 0.38, "learning_rate": 6.795341978481707e-05, "loss": 2.3533, "step": 44955 }, { "epoch": 0.38, "learning_rate": 6.79471590887859e-05, "loss": 2.3045, "step": 44960 }, { "epoch": 0.38, "learning_rate": 6.794089806973763e-05, "loss": 2.2921, "step": 44965 }, { "epoch": 0.38, "learning_rate": 6.793463672778492e-05, "loss": 2.2356, "step": 44970 }, { "epoch": 0.38, "learning_rate": 6.792837506304048e-05, "loss": 2.3051, "step": 44975 }, { "epoch": 0.38, "learning_rate": 6.792211307561702e-05, "loss": 2.3027, "step": 44980 }, { "epoch": 0.38, "learning_rate": 6.791585076562722e-05, "loss": 2.2984, "step": 44985 }, { "epoch": 0.38, "learning_rate": 6.790958813318383e-05, "loss": 2.321, "step": 44990 }, { "epoch": 0.38, "learning_rate": 6.79033251783995e-05, "loss": 2.3479, "step": 44995 }, { "epoch": 0.38, "learning_rate": 6.789706190138703e-05, "loss": 2.2883, "step": 45000 }, { "epoch": 0.38, "learning_rate": 6.789079830225908e-05, "loss": 2.3224, "step": 45005 }, { "epoch": 0.38, "learning_rate": 6.788453438112845e-05, "loss": 2.37, "step": 45010 }, { "epoch": 0.38, "learning_rate": 6.787827013810782e-05, "loss": 2.3147, "step": 45015 }, { "epoch": 0.38, "learning_rate": 6.787200557330996e-05, "loss": 2.3819, "step": 45020 }, { "epoch": 0.38, "learning_rate": 6.786574068684763e-05, "loss": 2.3201, "step": 45025 }, { "epoch": 0.38, "learning_rate": 6.78594754788336e-05, "loss": 2.3006, "step": 45030 }, { "epoch": 0.38, "learning_rate": 6.785320994938056e-05, "loss": 2.318, "step": 45035 }, { "epoch": 0.38, "learning_rate": 6.784694409860137e-05, "loss": 2.349, "step": 45040 }, { "epoch": 0.38, "learning_rate": 6.784067792660873e-05, "loss": 2.3704, "step": 45045 }, { "epoch": 0.38, "learning_rate": 6.783441143351546e-05, "loss": 2.3487, "step": 45050 }, { "epoch": 0.38, "learning_rate": 6.782814461943435e-05, "loss": 2.302, "step": 45055 }, { "epoch": 0.38, "learning_rate": 6.782187748447819e-05, "loss": 2.292, "step": 45060 }, { "epoch": 0.38, "learning_rate": 6.781561002875974e-05, "loss": 2.3337, "step": 45065 }, { "epoch": 0.38, "learning_rate": 6.780934225239185e-05, "loss": 2.31, "step": 45070 }, { "epoch": 0.38, "learning_rate": 6.78030741554873e-05, "loss": 2.2505, "step": 45075 }, { "epoch": 0.38, "learning_rate": 6.779680573815892e-05, "loss": 2.2834, "step": 45080 }, { "epoch": 0.38, "learning_rate": 6.779053700051953e-05, "loss": 2.2594, "step": 45085 }, { "epoch": 0.38, "learning_rate": 6.778426794268194e-05, "loss": 2.3918, "step": 45090 }, { "epoch": 0.38, "learning_rate": 6.7777998564759e-05, "loss": 2.3522, "step": 45095 }, { "epoch": 0.38, "learning_rate": 6.777172886686351e-05, "loss": 2.3192, "step": 45100 }, { "epoch": 0.38, "learning_rate": 6.77654588491084e-05, "loss": 2.2673, "step": 45105 }, { "epoch": 0.38, "learning_rate": 6.775918851160642e-05, "loss": 2.3152, "step": 45110 }, { "epoch": 0.38, "learning_rate": 6.775291785447047e-05, "loss": 2.3311, "step": 45115 }, { "epoch": 0.39, "learning_rate": 6.774664687781343e-05, "loss": 2.2198, "step": 45120 }, { "epoch": 0.39, "learning_rate": 6.774037558174814e-05, "loss": 2.3366, "step": 45125 }, { "epoch": 0.39, "learning_rate": 6.773410396638746e-05, "loss": 2.2887, "step": 45130 }, { "epoch": 0.39, "learning_rate": 6.772783203184431e-05, "loss": 2.2728, "step": 45135 }, { "epoch": 0.39, "learning_rate": 6.772155977823154e-05, "loss": 2.3525, "step": 45140 }, { "epoch": 0.39, "learning_rate": 6.771528720566204e-05, "loss": 2.3216, "step": 45145 }, { "epoch": 0.39, "learning_rate": 6.77090143142487e-05, "loss": 2.2408, "step": 45150 }, { "epoch": 0.39, "learning_rate": 6.770274110410446e-05, "loss": 2.4194, "step": 45155 }, { "epoch": 0.39, "learning_rate": 6.76964675753422e-05, "loss": 2.3963, "step": 45160 }, { "epoch": 0.39, "learning_rate": 6.769019372807483e-05, "loss": 2.3247, "step": 45165 }, { "epoch": 0.39, "learning_rate": 6.768391956241528e-05, "loss": 2.3442, "step": 45170 }, { "epoch": 0.39, "learning_rate": 6.767764507847644e-05, "loss": 2.3086, "step": 45175 }, { "epoch": 0.39, "learning_rate": 6.767137027637129e-05, "loss": 2.345, "step": 45180 }, { "epoch": 0.39, "learning_rate": 6.766509515621273e-05, "loss": 2.3027, "step": 45185 }, { "epoch": 0.39, "learning_rate": 6.765881971811374e-05, "loss": 2.3093, "step": 45190 }, { "epoch": 0.39, "learning_rate": 6.765254396218719e-05, "loss": 2.2266, "step": 45195 }, { "epoch": 0.39, "learning_rate": 6.764626788854611e-05, "loss": 2.2935, "step": 45200 }, { "epoch": 0.39, "learning_rate": 6.763999149730343e-05, "loss": 2.3835, "step": 45205 }, { "epoch": 0.39, "learning_rate": 6.76337147885721e-05, "loss": 2.333, "step": 45210 }, { "epoch": 0.39, "learning_rate": 6.762743776246512e-05, "loss": 2.3749, "step": 45215 }, { "epoch": 0.39, "learning_rate": 6.762116041909543e-05, "loss": 2.3029, "step": 45220 }, { "epoch": 0.39, "learning_rate": 6.761488275857604e-05, "loss": 2.3365, "step": 45225 }, { "epoch": 0.39, "learning_rate": 6.760860478101992e-05, "loss": 2.2987, "step": 45230 }, { "epoch": 0.39, "learning_rate": 6.760232648654008e-05, "loss": 2.3119, "step": 45235 }, { "epoch": 0.39, "learning_rate": 6.759604787524951e-05, "loss": 2.3356, "step": 45240 }, { "epoch": 0.39, "learning_rate": 6.75897689472612e-05, "loss": 2.2272, "step": 45245 }, { "epoch": 0.39, "learning_rate": 6.758348970268817e-05, "loss": 2.3887, "step": 45250 }, { "epoch": 0.39, "learning_rate": 6.757721014164343e-05, "loss": 2.2801, "step": 45255 }, { "epoch": 0.39, "learning_rate": 6.757093026424002e-05, "loss": 2.2311, "step": 45260 }, { "epoch": 0.39, "learning_rate": 6.756465007059094e-05, "loss": 2.2651, "step": 45265 }, { "epoch": 0.39, "learning_rate": 6.755836956080925e-05, "loss": 2.3576, "step": 45270 }, { "epoch": 0.39, "learning_rate": 6.755208873500795e-05, "loss": 2.3414, "step": 45275 }, { "epoch": 0.39, "learning_rate": 6.754580759330014e-05, "loss": 2.3069, "step": 45280 }, { "epoch": 0.39, "learning_rate": 6.753952613579882e-05, "loss": 2.2941, "step": 45285 }, { "epoch": 0.39, "learning_rate": 6.753324436261706e-05, "loss": 2.2928, "step": 45290 }, { "epoch": 0.39, "learning_rate": 6.752696227386795e-05, "loss": 2.2705, "step": 45295 }, { "epoch": 0.39, "learning_rate": 6.75206798696645e-05, "loss": 2.2943, "step": 45300 }, { "epoch": 0.39, "learning_rate": 6.751439715011982e-05, "loss": 2.2906, "step": 45305 }, { "epoch": 0.39, "learning_rate": 6.750811411534696e-05, "loss": 2.2869, "step": 45310 }, { "epoch": 0.39, "learning_rate": 6.750183076545905e-05, "loss": 2.3438, "step": 45315 }, { "epoch": 0.39, "learning_rate": 6.749554710056914e-05, "loss": 2.2449, "step": 45320 }, { "epoch": 0.39, "learning_rate": 6.748926312079034e-05, "loss": 2.4072, "step": 45325 }, { "epoch": 0.39, "learning_rate": 6.748297882623574e-05, "loss": 2.3004, "step": 45330 }, { "epoch": 0.39, "learning_rate": 6.747669421701848e-05, "loss": 2.3092, "step": 45335 }, { "epoch": 0.39, "learning_rate": 6.747040929325161e-05, "loss": 2.2939, "step": 45340 }, { "epoch": 0.39, "learning_rate": 6.74641240550483e-05, "loss": 2.3583, "step": 45345 }, { "epoch": 0.39, "learning_rate": 6.745783850252166e-05, "loss": 2.2658, "step": 45350 }, { "epoch": 0.39, "learning_rate": 6.745155263578479e-05, "loss": 2.285, "step": 45355 }, { "epoch": 0.39, "learning_rate": 6.744526645495088e-05, "loss": 2.3709, "step": 45360 }, { "epoch": 0.39, "learning_rate": 6.743897996013303e-05, "loss": 2.2867, "step": 45365 }, { "epoch": 0.39, "learning_rate": 6.743269315144439e-05, "loss": 2.27, "step": 45370 }, { "epoch": 0.39, "learning_rate": 6.742640602899812e-05, "loss": 2.2683, "step": 45375 }, { "epoch": 0.39, "learning_rate": 6.742011859290739e-05, "loss": 2.304, "step": 45380 }, { "epoch": 0.39, "learning_rate": 6.741383084328532e-05, "loss": 2.2932, "step": 45385 }, { "epoch": 0.39, "learning_rate": 6.740754278024512e-05, "loss": 2.3333, "step": 45390 }, { "epoch": 0.39, "learning_rate": 6.740125440389995e-05, "loss": 2.3226, "step": 45395 }, { "epoch": 0.39, "learning_rate": 6.739496571436298e-05, "loss": 2.2727, "step": 45400 }, { "epoch": 0.39, "learning_rate": 6.73886767117474e-05, "loss": 2.2793, "step": 45405 }, { "epoch": 0.39, "learning_rate": 6.738238739616643e-05, "loss": 2.3434, "step": 45410 }, { "epoch": 0.39, "learning_rate": 6.737609776773321e-05, "loss": 2.2715, "step": 45415 }, { "epoch": 0.39, "learning_rate": 6.736980782656099e-05, "loss": 2.3419, "step": 45420 }, { "epoch": 0.39, "learning_rate": 6.736351757276295e-05, "loss": 2.314, "step": 45425 }, { "epoch": 0.39, "learning_rate": 6.735722700645234e-05, "loss": 2.4185, "step": 45430 }, { "epoch": 0.39, "learning_rate": 6.735093612774234e-05, "loss": 2.3412, "step": 45435 }, { "epoch": 0.39, "learning_rate": 6.734464493674619e-05, "loss": 2.4183, "step": 45440 }, { "epoch": 0.39, "learning_rate": 6.733835343357712e-05, "loss": 2.2854, "step": 45445 }, { "epoch": 0.39, "learning_rate": 6.733206161834835e-05, "loss": 2.3148, "step": 45450 }, { "epoch": 0.39, "learning_rate": 6.732576949117314e-05, "loss": 2.3527, "step": 45455 }, { "epoch": 0.39, "learning_rate": 6.731947705216475e-05, "loss": 2.3117, "step": 45460 }, { "epoch": 0.39, "learning_rate": 6.731318430143639e-05, "loss": 2.3557, "step": 45465 }, { "epoch": 0.39, "learning_rate": 6.730689123910137e-05, "loss": 2.2247, "step": 45470 }, { "epoch": 0.39, "learning_rate": 6.730059786527292e-05, "loss": 2.2555, "step": 45475 }, { "epoch": 0.39, "learning_rate": 6.729430418006431e-05, "loss": 2.3456, "step": 45480 }, { "epoch": 0.39, "learning_rate": 6.728801018358885e-05, "loss": 2.345, "step": 45485 }, { "epoch": 0.39, "learning_rate": 6.728171587595977e-05, "loss": 2.2897, "step": 45490 }, { "epoch": 0.39, "learning_rate": 6.727542125729038e-05, "loss": 2.2742, "step": 45495 }, { "epoch": 0.39, "learning_rate": 6.726912632769399e-05, "loss": 2.2781, "step": 45500 }, { "epoch": 0.39, "learning_rate": 6.726283108728388e-05, "loss": 2.2792, "step": 45505 }, { "epoch": 0.39, "learning_rate": 6.725653553617333e-05, "loss": 2.3725, "step": 45510 }, { "epoch": 0.39, "learning_rate": 6.725023967447568e-05, "loss": 2.276, "step": 45515 }, { "epoch": 0.39, "learning_rate": 6.724394350230425e-05, "loss": 2.3384, "step": 45520 }, { "epoch": 0.39, "learning_rate": 6.723764701977233e-05, "loss": 2.278, "step": 45525 }, { "epoch": 0.39, "learning_rate": 6.723135022699327e-05, "loss": 2.3143, "step": 45530 }, { "epoch": 0.39, "learning_rate": 6.72250531240804e-05, "loss": 2.3434, "step": 45535 }, { "epoch": 0.39, "learning_rate": 6.721875571114705e-05, "loss": 2.274, "step": 45540 }, { "epoch": 0.39, "learning_rate": 6.721245798830656e-05, "loss": 2.2839, "step": 45545 }, { "epoch": 0.39, "learning_rate": 6.720615995567226e-05, "loss": 2.3227, "step": 45550 }, { "epoch": 0.39, "learning_rate": 6.719986161335756e-05, "loss": 2.2987, "step": 45555 }, { "epoch": 0.39, "learning_rate": 6.719356296147574e-05, "loss": 2.3798, "step": 45560 }, { "epoch": 0.39, "learning_rate": 6.718726400014024e-05, "loss": 2.3565, "step": 45565 }, { "epoch": 0.39, "learning_rate": 6.718096472946438e-05, "loss": 2.3117, "step": 45570 }, { "epoch": 0.39, "learning_rate": 6.717466514956157e-05, "loss": 2.3132, "step": 45575 }, { "epoch": 0.39, "learning_rate": 6.716836526054515e-05, "loss": 2.2503, "step": 45580 }, { "epoch": 0.39, "learning_rate": 6.716206506252856e-05, "loss": 2.3474, "step": 45585 }, { "epoch": 0.39, "learning_rate": 6.715576455562514e-05, "loss": 2.3633, "step": 45590 }, { "epoch": 0.39, "learning_rate": 6.714946373994833e-05, "loss": 2.3372, "step": 45595 }, { "epoch": 0.39, "learning_rate": 6.71431626156115e-05, "loss": 2.2909, "step": 45600 }, { "epoch": 0.39, "learning_rate": 6.713686118272808e-05, "loss": 2.2981, "step": 45605 }, { "epoch": 0.39, "learning_rate": 6.713055944141147e-05, "loss": 2.3453, "step": 45610 }, { "epoch": 0.39, "learning_rate": 6.71242573917751e-05, "loss": 2.3107, "step": 45615 }, { "epoch": 0.39, "learning_rate": 6.711795503393242e-05, "loss": 2.3497, "step": 45620 }, { "epoch": 0.39, "learning_rate": 6.71116523679968e-05, "loss": 2.3638, "step": 45625 }, { "epoch": 0.39, "learning_rate": 6.710534939408174e-05, "loss": 2.3329, "step": 45630 }, { "epoch": 0.39, "learning_rate": 6.709904611230064e-05, "loss": 2.2474, "step": 45635 }, { "epoch": 0.39, "learning_rate": 6.709274252276697e-05, "loss": 2.2446, "step": 45640 }, { "epoch": 0.39, "learning_rate": 6.708643862559418e-05, "loss": 2.3153, "step": 45645 }, { "epoch": 0.39, "learning_rate": 6.708013442089573e-05, "loss": 2.313, "step": 45650 }, { "epoch": 0.39, "learning_rate": 6.707382990878507e-05, "loss": 2.3214, "step": 45655 }, { "epoch": 0.39, "learning_rate": 6.706752508937568e-05, "loss": 2.326, "step": 45660 }, { "epoch": 0.39, "learning_rate": 6.706121996278104e-05, "loss": 2.3087, "step": 45665 }, { "epoch": 0.39, "learning_rate": 6.705491452911463e-05, "loss": 2.3092, "step": 45670 }, { "epoch": 0.39, "learning_rate": 6.704860878848992e-05, "loss": 2.3167, "step": 45675 }, { "epoch": 0.39, "learning_rate": 6.704230274102043e-05, "loss": 2.3303, "step": 45680 }, { "epoch": 0.39, "learning_rate": 6.703599638681963e-05, "loss": 2.337, "step": 45685 }, { "epoch": 0.39, "learning_rate": 6.702968972600104e-05, "loss": 2.3199, "step": 45690 }, { "epoch": 0.39, "learning_rate": 6.702338275867819e-05, "loss": 2.3793, "step": 45695 }, { "epoch": 0.39, "learning_rate": 6.701707548496454e-05, "loss": 2.3361, "step": 45700 }, { "epoch": 0.39, "learning_rate": 6.701076790497364e-05, "loss": 2.3789, "step": 45705 }, { "epoch": 0.39, "learning_rate": 6.700446001881904e-05, "loss": 2.3479, "step": 45710 }, { "epoch": 0.39, "learning_rate": 6.699815182661421e-05, "loss": 2.3339, "step": 45715 }, { "epoch": 0.39, "learning_rate": 6.699184332847275e-05, "loss": 2.3079, "step": 45720 }, { "epoch": 0.39, "learning_rate": 6.698553452450816e-05, "loss": 2.3728, "step": 45725 }, { "epoch": 0.39, "learning_rate": 6.697922541483401e-05, "loss": 2.2962, "step": 45730 }, { "epoch": 0.39, "learning_rate": 6.697291599956386e-05, "loss": 2.3839, "step": 45735 }, { "epoch": 0.39, "learning_rate": 6.696660627881122e-05, "loss": 2.3823, "step": 45740 }, { "epoch": 0.39, "learning_rate": 6.69602962526897e-05, "loss": 2.2885, "step": 45745 }, { "epoch": 0.39, "learning_rate": 6.695398592131286e-05, "loss": 2.3405, "step": 45750 }, { "epoch": 0.39, "learning_rate": 6.694767528479425e-05, "loss": 2.3353, "step": 45755 }, { "epoch": 0.39, "learning_rate": 6.694136434324749e-05, "loss": 2.3065, "step": 45760 }, { "epoch": 0.39, "learning_rate": 6.693505309678613e-05, "loss": 2.3122, "step": 45765 }, { "epoch": 0.39, "learning_rate": 6.692874154552378e-05, "loss": 2.2821, "step": 45770 }, { "epoch": 0.39, "learning_rate": 6.692242968957405e-05, "loss": 2.2887, "step": 45775 }, { "epoch": 0.39, "learning_rate": 6.691611752905052e-05, "loss": 2.3069, "step": 45780 }, { "epoch": 0.39, "learning_rate": 6.690980506406678e-05, "loss": 2.3025, "step": 45785 }, { "epoch": 0.39, "learning_rate": 6.690349229473652e-05, "loss": 2.3526, "step": 45790 }, { "epoch": 0.39, "learning_rate": 6.689717922117327e-05, "loss": 2.3515, "step": 45795 }, { "epoch": 0.39, "learning_rate": 6.689086584349067e-05, "loss": 2.3905, "step": 45800 }, { "epoch": 0.39, "learning_rate": 6.688455216180241e-05, "loss": 2.3315, "step": 45805 }, { "epoch": 0.39, "learning_rate": 6.687823817622208e-05, "loss": 2.2945, "step": 45810 }, { "epoch": 0.39, "learning_rate": 6.68719238868633e-05, "loss": 2.2768, "step": 45815 }, { "epoch": 0.39, "learning_rate": 6.686560929383976e-05, "loss": 2.361, "step": 45820 }, { "epoch": 0.39, "learning_rate": 6.685929439726509e-05, "loss": 2.3439, "step": 45825 }, { "epoch": 0.39, "learning_rate": 6.685297919725295e-05, "loss": 2.2983, "step": 45830 }, { "epoch": 0.39, "learning_rate": 6.6846663693917e-05, "loss": 2.2678, "step": 45835 }, { "epoch": 0.39, "learning_rate": 6.68403478873709e-05, "loss": 2.3405, "step": 45840 }, { "epoch": 0.39, "learning_rate": 6.683403177772836e-05, "loss": 2.3475, "step": 45845 }, { "epoch": 0.39, "learning_rate": 6.6827715365103e-05, "loss": 2.3742, "step": 45850 }, { "epoch": 0.39, "learning_rate": 6.682139864960857e-05, "loss": 2.2259, "step": 45855 }, { "epoch": 0.39, "learning_rate": 6.681508163135871e-05, "loss": 2.2995, "step": 45860 }, { "epoch": 0.39, "learning_rate": 6.680876431046712e-05, "loss": 2.3453, "step": 45865 }, { "epoch": 0.39, "learning_rate": 6.680244668704751e-05, "loss": 2.3505, "step": 45870 }, { "epoch": 0.39, "learning_rate": 6.679612876121362e-05, "loss": 2.2481, "step": 45875 }, { "epoch": 0.39, "learning_rate": 6.678981053307912e-05, "loss": 2.3376, "step": 45880 }, { "epoch": 0.39, "learning_rate": 6.678349200275771e-05, "loss": 2.37, "step": 45885 }, { "epoch": 0.39, "learning_rate": 6.677717317036316e-05, "loss": 2.3624, "step": 45890 }, { "epoch": 0.39, "learning_rate": 6.677085403600918e-05, "loss": 2.3322, "step": 45895 }, { "epoch": 0.39, "learning_rate": 6.676453459980949e-05, "loss": 2.3803, "step": 45900 }, { "epoch": 0.39, "learning_rate": 6.675821486187784e-05, "loss": 2.3238, "step": 45905 }, { "epoch": 0.39, "learning_rate": 6.675189482232798e-05, "loss": 2.4036, "step": 45910 }, { "epoch": 0.39, "learning_rate": 6.674557448127364e-05, "loss": 2.3661, "step": 45915 }, { "epoch": 0.39, "learning_rate": 6.673925383882859e-05, "loss": 2.342, "step": 45920 }, { "epoch": 0.39, "learning_rate": 6.67329328951066e-05, "loss": 2.3225, "step": 45925 }, { "epoch": 0.39, "learning_rate": 6.672661165022141e-05, "loss": 2.3626, "step": 45930 }, { "epoch": 0.39, "learning_rate": 6.672029010428681e-05, "loss": 2.3112, "step": 45935 }, { "epoch": 0.39, "learning_rate": 6.671396825741657e-05, "loss": 2.2693, "step": 45940 }, { "epoch": 0.39, "learning_rate": 6.670764610972446e-05, "loss": 2.2927, "step": 45945 }, { "epoch": 0.39, "learning_rate": 6.670132366132432e-05, "loss": 2.4061, "step": 45950 }, { "epoch": 0.39, "learning_rate": 6.669500091232986e-05, "loss": 2.3186, "step": 45955 }, { "epoch": 0.39, "learning_rate": 6.668867786285494e-05, "loss": 2.3083, "step": 45960 }, { "epoch": 0.39, "learning_rate": 6.668235451301334e-05, "loss": 2.3287, "step": 45965 }, { "epoch": 0.39, "learning_rate": 6.667603086291888e-05, "loss": 2.2836, "step": 45970 }, { "epoch": 0.39, "learning_rate": 6.666970691268538e-05, "loss": 2.4037, "step": 45975 }, { "epoch": 0.39, "learning_rate": 6.666338266242663e-05, "loss": 2.3383, "step": 45980 }, { "epoch": 0.39, "learning_rate": 6.665705811225648e-05, "loss": 2.3413, "step": 45985 }, { "epoch": 0.39, "learning_rate": 6.665073326228877e-05, "loss": 2.2173, "step": 45990 }, { "epoch": 0.39, "learning_rate": 6.66444081126373e-05, "loss": 2.264, "step": 45995 }, { "epoch": 0.39, "learning_rate": 6.663808266341594e-05, "loss": 2.2874, "step": 46000 }, { "epoch": 0.39, "learning_rate": 6.663175691473855e-05, "loss": 2.2764, "step": 46005 }, { "epoch": 0.39, "learning_rate": 6.662543086671892e-05, "loss": 2.2997, "step": 46010 }, { "epoch": 0.39, "learning_rate": 6.661910451947099e-05, "loss": 2.3058, "step": 46015 }, { "epoch": 0.39, "learning_rate": 6.661277787310856e-05, "loss": 2.329, "step": 46020 }, { "epoch": 0.39, "learning_rate": 6.660645092774553e-05, "loss": 2.2804, "step": 46025 }, { "epoch": 0.39, "learning_rate": 6.660012368349576e-05, "loss": 2.3611, "step": 46030 }, { "epoch": 0.39, "learning_rate": 6.659379614047315e-05, "loss": 2.3425, "step": 46035 }, { "epoch": 0.39, "learning_rate": 6.658746829879154e-05, "loss": 2.3417, "step": 46040 }, { "epoch": 0.39, "learning_rate": 6.658114015856487e-05, "loss": 2.3235, "step": 46045 }, { "epoch": 0.39, "learning_rate": 6.6574811719907e-05, "loss": 2.3665, "step": 46050 }, { "epoch": 0.39, "learning_rate": 6.656848298293186e-05, "loss": 2.3366, "step": 46055 }, { "epoch": 0.39, "learning_rate": 6.656215394775334e-05, "loss": 2.3197, "step": 46060 }, { "epoch": 0.39, "learning_rate": 6.655582461448535e-05, "loss": 2.3232, "step": 46065 }, { "epoch": 0.39, "learning_rate": 6.654949498324182e-05, "loss": 2.2809, "step": 46070 }, { "epoch": 0.39, "learning_rate": 6.654316505413661e-05, "loss": 2.2607, "step": 46075 }, { "epoch": 0.39, "learning_rate": 6.653683482728375e-05, "loss": 2.3915, "step": 46080 }, { "epoch": 0.39, "learning_rate": 6.65305043027971e-05, "loss": 2.2801, "step": 46085 }, { "epoch": 0.39, "learning_rate": 6.652417348079063e-05, "loss": 2.2717, "step": 46090 }, { "epoch": 0.39, "learning_rate": 6.651784236137827e-05, "loss": 2.3739, "step": 46095 }, { "epoch": 0.39, "learning_rate": 6.651151094467398e-05, "loss": 2.2997, "step": 46100 }, { "epoch": 0.39, "learning_rate": 6.65051792307917e-05, "loss": 2.2824, "step": 46105 }, { "epoch": 0.39, "learning_rate": 6.649884721984539e-05, "loss": 2.291, "step": 46110 }, { "epoch": 0.39, "learning_rate": 6.649251491194903e-05, "loss": 2.3116, "step": 46115 }, { "epoch": 0.39, "learning_rate": 6.648618230721658e-05, "loss": 2.3419, "step": 46120 }, { "epoch": 0.39, "learning_rate": 6.647984940576199e-05, "loss": 2.2103, "step": 46125 }, { "epoch": 0.39, "learning_rate": 6.64735162076993e-05, "loss": 2.3379, "step": 46130 }, { "epoch": 0.39, "learning_rate": 6.646718271314247e-05, "loss": 2.3679, "step": 46135 }, { "epoch": 0.39, "learning_rate": 6.646084892220548e-05, "loss": 2.3118, "step": 46140 }, { "epoch": 0.39, "learning_rate": 6.645451483500232e-05, "loss": 2.342, "step": 46145 }, { "epoch": 0.39, "learning_rate": 6.644818045164702e-05, "loss": 2.3284, "step": 46150 }, { "epoch": 0.39, "learning_rate": 6.644184577225357e-05, "loss": 2.2823, "step": 46155 }, { "epoch": 0.39, "learning_rate": 6.643551079693598e-05, "loss": 2.3053, "step": 46160 }, { "epoch": 0.39, "learning_rate": 6.642917552580828e-05, "loss": 2.304, "step": 46165 }, { "epoch": 0.39, "learning_rate": 6.642283995898448e-05, "loss": 2.355, "step": 46170 }, { "epoch": 0.39, "learning_rate": 6.641650409657863e-05, "loss": 2.2874, "step": 46175 }, { "epoch": 0.39, "learning_rate": 6.641016793870475e-05, "loss": 2.2679, "step": 46180 }, { "epoch": 0.39, "learning_rate": 6.640383148547687e-05, "loss": 2.3083, "step": 46185 }, { "epoch": 0.39, "learning_rate": 6.639749473700907e-05, "loss": 2.3242, "step": 46190 }, { "epoch": 0.39, "learning_rate": 6.639115769341537e-05, "loss": 2.2501, "step": 46195 }, { "epoch": 0.39, "learning_rate": 6.63848203548098e-05, "loss": 2.2944, "step": 46200 }, { "epoch": 0.39, "learning_rate": 6.637848272130648e-05, "loss": 2.3357, "step": 46205 }, { "epoch": 0.39, "learning_rate": 6.637214479301946e-05, "loss": 2.326, "step": 46210 }, { "epoch": 0.39, "learning_rate": 6.636580657006278e-05, "loss": 2.3021, "step": 46215 }, { "epoch": 0.39, "learning_rate": 6.635946805255055e-05, "loss": 2.3047, "step": 46220 }, { "epoch": 0.39, "learning_rate": 6.635312924059683e-05, "loss": 2.3226, "step": 46225 }, { "epoch": 0.39, "learning_rate": 6.634679013431573e-05, "loss": 2.2777, "step": 46230 }, { "epoch": 0.39, "learning_rate": 6.634045073382131e-05, "loss": 2.2643, "step": 46235 }, { "epoch": 0.39, "learning_rate": 6.63341110392277e-05, "loss": 2.2869, "step": 46240 }, { "epoch": 0.39, "learning_rate": 6.6327771050649e-05, "loss": 2.3537, "step": 46245 }, { "epoch": 0.39, "learning_rate": 6.63214307681993e-05, "loss": 2.3308, "step": 46250 }, { "epoch": 0.39, "learning_rate": 6.631509019199273e-05, "loss": 2.3194, "step": 46255 }, { "epoch": 0.39, "learning_rate": 6.63087493221434e-05, "loss": 2.3627, "step": 46260 }, { "epoch": 0.39, "learning_rate": 6.630240815876543e-05, "loss": 2.2308, "step": 46265 }, { "epoch": 0.39, "learning_rate": 6.629606670197296e-05, "loss": 2.383, "step": 46270 }, { "epoch": 0.39, "learning_rate": 6.628972495188013e-05, "loss": 2.37, "step": 46275 }, { "epoch": 0.39, "learning_rate": 6.628338290860106e-05, "loss": 2.3114, "step": 46280 }, { "epoch": 0.39, "learning_rate": 6.627704057224991e-05, "loss": 2.3002, "step": 46285 }, { "epoch": 0.4, "learning_rate": 6.627069794294083e-05, "loss": 2.2307, "step": 46290 }, { "epoch": 0.4, "learning_rate": 6.626435502078798e-05, "loss": 2.3166, "step": 46295 }, { "epoch": 0.4, "learning_rate": 6.625801180590551e-05, "loss": 2.3512, "step": 46300 }, { "epoch": 0.4, "learning_rate": 6.62516682984076e-05, "loss": 2.3266, "step": 46305 }, { "epoch": 0.4, "learning_rate": 6.624532449840841e-05, "loss": 2.3529, "step": 46310 }, { "epoch": 0.4, "learning_rate": 6.623898040602211e-05, "loss": 2.3269, "step": 46315 }, { "epoch": 0.4, "learning_rate": 6.623263602136292e-05, "loss": 2.2978, "step": 46320 }, { "epoch": 0.4, "learning_rate": 6.622629134454499e-05, "loss": 2.3438, "step": 46325 }, { "epoch": 0.4, "learning_rate": 6.62199463756825e-05, "loss": 2.2754, "step": 46330 }, { "epoch": 0.4, "learning_rate": 6.62136011148897e-05, "loss": 2.232, "step": 46335 }, { "epoch": 0.4, "learning_rate": 6.620725556228077e-05, "loss": 2.2478, "step": 46340 }, { "epoch": 0.4, "learning_rate": 6.62009097179699e-05, "loss": 2.3349, "step": 46345 }, { "epoch": 0.4, "learning_rate": 6.619456358207132e-05, "loss": 2.2507, "step": 46350 }, { "epoch": 0.4, "learning_rate": 6.618821715469928e-05, "loss": 2.3315, "step": 46355 }, { "epoch": 0.4, "learning_rate": 6.618187043596793e-05, "loss": 2.2361, "step": 46360 }, { "epoch": 0.4, "learning_rate": 6.617552342599156e-05, "loss": 2.3248, "step": 46365 }, { "epoch": 0.4, "learning_rate": 6.61691761248844e-05, "loss": 2.3033, "step": 46370 }, { "epoch": 0.4, "learning_rate": 6.616282853276065e-05, "loss": 2.3611, "step": 46375 }, { "epoch": 0.4, "learning_rate": 6.61564806497346e-05, "loss": 2.2543, "step": 46380 }, { "epoch": 0.4, "learning_rate": 6.615013247592047e-05, "loss": 2.2469, "step": 46385 }, { "epoch": 0.4, "learning_rate": 6.614378401143256e-05, "loss": 2.3998, "step": 46390 }, { "epoch": 0.4, "learning_rate": 6.613743525638507e-05, "loss": 2.2798, "step": 46395 }, { "epoch": 0.4, "learning_rate": 6.613108621089233e-05, "loss": 2.3245, "step": 46400 }, { "epoch": 0.4, "learning_rate": 6.612473687506856e-05, "loss": 2.2767, "step": 46405 }, { "epoch": 0.4, "learning_rate": 6.611838724902804e-05, "loss": 2.3971, "step": 46410 }, { "epoch": 0.4, "learning_rate": 6.61120373328851e-05, "loss": 2.274, "step": 46415 }, { "epoch": 0.4, "learning_rate": 6.610568712675398e-05, "loss": 2.2778, "step": 46420 }, { "epoch": 0.4, "learning_rate": 6.609933663074897e-05, "loss": 2.1955, "step": 46425 }, { "epoch": 0.4, "learning_rate": 6.60929858449844e-05, "loss": 2.3044, "step": 46430 }, { "epoch": 0.4, "learning_rate": 6.608663476957457e-05, "loss": 2.3094, "step": 46435 }, { "epoch": 0.4, "learning_rate": 6.608028340463376e-05, "loss": 2.3642, "step": 46440 }, { "epoch": 0.4, "learning_rate": 6.60739317502763e-05, "loss": 2.268, "step": 46445 }, { "epoch": 0.4, "learning_rate": 6.606757980661651e-05, "loss": 2.3645, "step": 46450 }, { "epoch": 0.4, "learning_rate": 6.606122757376871e-05, "loss": 2.2649, "step": 46455 }, { "epoch": 0.4, "learning_rate": 6.605487505184724e-05, "loss": 2.3036, "step": 46460 }, { "epoch": 0.4, "learning_rate": 6.604852224096642e-05, "loss": 2.3387, "step": 46465 }, { "epoch": 0.4, "learning_rate": 6.60421691412406e-05, "loss": 2.3522, "step": 46470 }, { "epoch": 0.4, "learning_rate": 6.60358157527841e-05, "loss": 2.346, "step": 46475 }, { "epoch": 0.4, "learning_rate": 6.60294620757113e-05, "loss": 2.2945, "step": 46480 }, { "epoch": 0.4, "learning_rate": 6.602310811013654e-05, "loss": 2.3459, "step": 46485 }, { "epoch": 0.4, "learning_rate": 6.601675385617418e-05, "loss": 2.3042, "step": 46490 }, { "epoch": 0.4, "learning_rate": 6.60103993139386e-05, "loss": 2.2512, "step": 46495 }, { "epoch": 0.4, "learning_rate": 6.600404448354417e-05, "loss": 2.3772, "step": 46500 }, { "epoch": 0.4, "learning_rate": 6.599768936510523e-05, "loss": 2.3505, "step": 46505 }, { "epoch": 0.4, "learning_rate": 6.59913339587362e-05, "loss": 2.397, "step": 46510 }, { "epoch": 0.4, "learning_rate": 6.598497826455146e-05, "loss": 2.3155, "step": 46515 }, { "epoch": 0.4, "learning_rate": 6.597862228266538e-05, "loss": 2.2939, "step": 46520 }, { "epoch": 0.4, "learning_rate": 6.597226601319237e-05, "loss": 2.2651, "step": 46525 }, { "epoch": 0.4, "learning_rate": 6.596590945624684e-05, "loss": 2.334, "step": 46530 }, { "epoch": 0.4, "learning_rate": 6.595955261194318e-05, "loss": 2.3021, "step": 46535 }, { "epoch": 0.4, "learning_rate": 6.59531954803958e-05, "loss": 2.2275, "step": 46540 }, { "epoch": 0.4, "learning_rate": 6.594683806171914e-05, "loss": 2.3227, "step": 46545 }, { "epoch": 0.4, "learning_rate": 6.594048035602761e-05, "loss": 2.3015, "step": 46550 }, { "epoch": 0.4, "learning_rate": 6.593412236343564e-05, "loss": 2.2999, "step": 46555 }, { "epoch": 0.4, "learning_rate": 6.592776408405766e-05, "loss": 2.2329, "step": 46560 }, { "epoch": 0.4, "learning_rate": 6.59214055180081e-05, "loss": 2.3276, "step": 46565 }, { "epoch": 0.4, "learning_rate": 6.591504666540141e-05, "loss": 2.2606, "step": 46570 }, { "epoch": 0.4, "learning_rate": 6.590868752635205e-05, "loss": 2.2962, "step": 46575 }, { "epoch": 0.4, "learning_rate": 6.590232810097446e-05, "loss": 2.2822, "step": 46580 }, { "epoch": 0.4, "learning_rate": 6.589596838938308e-05, "loss": 2.3689, "step": 46585 }, { "epoch": 0.4, "learning_rate": 6.588960839169239e-05, "loss": 2.2453, "step": 46590 }, { "epoch": 0.4, "learning_rate": 6.58832481080169e-05, "loss": 2.3087, "step": 46595 }, { "epoch": 0.4, "learning_rate": 6.587688753847103e-05, "loss": 2.2799, "step": 46600 }, { "epoch": 0.4, "learning_rate": 6.587052668316925e-05, "loss": 2.3408, "step": 46605 }, { "epoch": 0.4, "learning_rate": 6.586416554222609e-05, "loss": 2.2668, "step": 46610 }, { "epoch": 0.4, "learning_rate": 6.585780411575603e-05, "loss": 2.3729, "step": 46615 }, { "epoch": 0.4, "learning_rate": 6.585144240387353e-05, "loss": 2.3224, "step": 46620 }, { "epoch": 0.4, "learning_rate": 6.584508040669312e-05, "loss": 2.2407, "step": 46625 }, { "epoch": 0.4, "learning_rate": 6.583871812432932e-05, "loss": 2.3295, "step": 46630 }, { "epoch": 0.4, "learning_rate": 6.583235555689659e-05, "loss": 2.2825, "step": 46635 }, { "epoch": 0.4, "learning_rate": 6.582599270450947e-05, "loss": 2.3099, "step": 46640 }, { "epoch": 0.4, "learning_rate": 6.581962956728249e-05, "loss": 2.3472, "step": 46645 }, { "epoch": 0.4, "learning_rate": 6.581326614533017e-05, "loss": 2.3674, "step": 46650 }, { "epoch": 0.4, "learning_rate": 6.580690243876704e-05, "loss": 2.2931, "step": 46655 }, { "epoch": 0.4, "learning_rate": 6.580053844770763e-05, "loss": 2.3703, "step": 46660 }, { "epoch": 0.4, "learning_rate": 6.579417417226648e-05, "loss": 2.3093, "step": 46665 }, { "epoch": 0.4, "learning_rate": 6.578780961255815e-05, "loss": 2.3611, "step": 46670 }, { "epoch": 0.4, "learning_rate": 6.578144476869719e-05, "loss": 2.3271, "step": 46675 }, { "epoch": 0.4, "learning_rate": 6.577507964079812e-05, "loss": 2.2142, "step": 46680 }, { "epoch": 0.4, "learning_rate": 6.576871422897553e-05, "loss": 2.2541, "step": 46685 }, { "epoch": 0.4, "learning_rate": 6.5762348533344e-05, "loss": 2.2519, "step": 46690 }, { "epoch": 0.4, "learning_rate": 6.575598255401807e-05, "loss": 2.294, "step": 46695 }, { "epoch": 0.4, "learning_rate": 6.574961629111234e-05, "loss": 2.3492, "step": 46700 }, { "epoch": 0.4, "learning_rate": 6.574324974474138e-05, "loss": 2.2859, "step": 46705 }, { "epoch": 0.4, "learning_rate": 6.573688291501978e-05, "loss": 2.3113, "step": 46710 }, { "epoch": 0.4, "learning_rate": 6.573051580206212e-05, "loss": 2.3667, "step": 46715 }, { "epoch": 0.4, "learning_rate": 6.572414840598301e-05, "loss": 2.3881, "step": 46720 }, { "epoch": 0.4, "learning_rate": 6.571778072689707e-05, "loss": 2.248, "step": 46725 }, { "epoch": 0.4, "learning_rate": 6.571141276491885e-05, "loss": 2.2291, "step": 46730 }, { "epoch": 0.4, "learning_rate": 6.570504452016304e-05, "loss": 2.3951, "step": 46735 }, { "epoch": 0.4, "learning_rate": 6.569867599274418e-05, "loss": 2.2692, "step": 46740 }, { "epoch": 0.4, "learning_rate": 6.569230718277694e-05, "loss": 2.3291, "step": 46745 }, { "epoch": 0.4, "learning_rate": 6.568593809037595e-05, "loss": 2.2532, "step": 46750 }, { "epoch": 0.4, "learning_rate": 6.567956871565582e-05, "loss": 2.3596, "step": 46755 }, { "epoch": 0.4, "learning_rate": 6.567319905873119e-05, "loss": 2.3079, "step": 46760 }, { "epoch": 0.4, "learning_rate": 6.56668291197167e-05, "loss": 2.4228, "step": 46765 }, { "epoch": 0.4, "learning_rate": 6.566045889872702e-05, "loss": 2.2851, "step": 46770 }, { "epoch": 0.4, "learning_rate": 6.565408839587678e-05, "loss": 2.2701, "step": 46775 }, { "epoch": 0.4, "learning_rate": 6.564771761128064e-05, "loss": 2.3974, "step": 46780 }, { "epoch": 0.4, "learning_rate": 6.564134654505328e-05, "loss": 2.4157, "step": 46785 }, { "epoch": 0.4, "learning_rate": 6.563497519730934e-05, "loss": 2.3577, "step": 46790 }, { "epoch": 0.4, "learning_rate": 6.562860356816351e-05, "loss": 2.3026, "step": 46795 }, { "epoch": 0.4, "learning_rate": 6.562223165773049e-05, "loss": 2.3343, "step": 46800 }, { "epoch": 0.4, "learning_rate": 6.561585946612493e-05, "loss": 2.2855, "step": 46805 }, { "epoch": 0.4, "learning_rate": 6.560948699346152e-05, "loss": 2.3446, "step": 46810 }, { "epoch": 0.4, "learning_rate": 6.560311423985496e-05, "loss": 2.3068, "step": 46815 }, { "epoch": 0.4, "learning_rate": 6.559674120541997e-05, "loss": 2.2955, "step": 46820 }, { "epoch": 0.4, "learning_rate": 6.559036789027123e-05, "loss": 2.3141, "step": 46825 }, { "epoch": 0.4, "learning_rate": 6.558399429452344e-05, "loss": 2.3355, "step": 46830 }, { "epoch": 0.4, "learning_rate": 6.557762041829133e-05, "loss": 2.2728, "step": 46835 }, { "epoch": 0.4, "learning_rate": 6.557124626168962e-05, "loss": 2.2744, "step": 46840 }, { "epoch": 0.4, "learning_rate": 6.556487182483301e-05, "loss": 2.3195, "step": 46845 }, { "epoch": 0.4, "learning_rate": 6.555849710783626e-05, "loss": 2.3311, "step": 46850 }, { "epoch": 0.4, "learning_rate": 6.555212211081408e-05, "loss": 2.3248, "step": 46855 }, { "epoch": 0.4, "learning_rate": 6.554574683388122e-05, "loss": 2.3215, "step": 46860 }, { "epoch": 0.4, "learning_rate": 6.553937127715244e-05, "loss": 2.311, "step": 46865 }, { "epoch": 0.4, "learning_rate": 6.553299544074244e-05, "loss": 2.2465, "step": 46870 }, { "epoch": 0.4, "learning_rate": 6.552661932476603e-05, "loss": 2.3291, "step": 46875 }, { "epoch": 0.4, "learning_rate": 6.552024292933794e-05, "loss": 2.4024, "step": 46880 }, { "epoch": 0.4, "learning_rate": 6.551386625457294e-05, "loss": 2.279, "step": 46885 }, { "epoch": 0.4, "learning_rate": 6.550748930058577e-05, "loss": 2.3247, "step": 46890 }, { "epoch": 0.4, "learning_rate": 6.550111206749125e-05, "loss": 2.3564, "step": 46895 }, { "epoch": 0.4, "learning_rate": 6.549473455540414e-05, "loss": 2.306, "step": 46900 }, { "epoch": 0.4, "learning_rate": 6.54883567644392e-05, "loss": 2.3159, "step": 46905 }, { "epoch": 0.4, "learning_rate": 6.548197869471127e-05, "loss": 2.2291, "step": 46910 }, { "epoch": 0.4, "learning_rate": 6.547560034633512e-05, "loss": 2.3571, "step": 46915 }, { "epoch": 0.4, "learning_rate": 6.546922171942553e-05, "loss": 2.272, "step": 46920 }, { "epoch": 0.4, "learning_rate": 6.546284281409731e-05, "loss": 2.3296, "step": 46925 }, { "epoch": 0.4, "learning_rate": 6.54564636304653e-05, "loss": 2.334, "step": 46930 }, { "epoch": 0.4, "learning_rate": 6.545008416864427e-05, "loss": 2.2677, "step": 46935 }, { "epoch": 0.4, "learning_rate": 6.544370442874907e-05, "loss": 2.2931, "step": 46940 }, { "epoch": 0.4, "learning_rate": 6.543732441089451e-05, "loss": 2.2641, "step": 46945 }, { "epoch": 0.4, "learning_rate": 6.543094411519543e-05, "loss": 2.276, "step": 46950 }, { "epoch": 0.4, "learning_rate": 6.542456354176665e-05, "loss": 2.3308, "step": 46955 }, { "epoch": 0.4, "learning_rate": 6.541818269072304e-05, "loss": 2.3442, "step": 46960 }, { "epoch": 0.4, "learning_rate": 6.54118015621794e-05, "loss": 2.3834, "step": 46965 }, { "epoch": 0.4, "learning_rate": 6.54054201562506e-05, "loss": 2.3513, "step": 46970 }, { "epoch": 0.4, "learning_rate": 6.53990384730515e-05, "loss": 2.2837, "step": 46975 }, { "epoch": 0.4, "learning_rate": 6.539265651269696e-05, "loss": 2.3778, "step": 46980 }, { "epoch": 0.4, "learning_rate": 6.538627427530181e-05, "loss": 2.3303, "step": 46985 }, { "epoch": 0.4, "learning_rate": 6.537989176098098e-05, "loss": 2.3522, "step": 46990 }, { "epoch": 0.4, "learning_rate": 6.537350896984928e-05, "loss": 2.2792, "step": 46995 }, { "epoch": 0.4, "learning_rate": 6.536712590202164e-05, "loss": 2.2241, "step": 47000 }, { "epoch": 0.4, "learning_rate": 6.53607425576129e-05, "loss": 2.3917, "step": 47005 }, { "epoch": 0.4, "learning_rate": 6.5354358936738e-05, "loss": 2.3361, "step": 47010 }, { "epoch": 0.4, "learning_rate": 6.534797503951179e-05, "loss": 2.3198, "step": 47015 }, { "epoch": 0.4, "learning_rate": 6.534159086604919e-05, "loss": 2.3193, "step": 47020 }, { "epoch": 0.4, "learning_rate": 6.53352064164651e-05, "loss": 2.2526, "step": 47025 }, { "epoch": 0.4, "learning_rate": 6.532882169087442e-05, "loss": 2.2743, "step": 47030 }, { "epoch": 0.4, "learning_rate": 6.532243668939207e-05, "loss": 2.3413, "step": 47035 }, { "epoch": 0.4, "learning_rate": 6.531605141213297e-05, "loss": 2.3843, "step": 47040 }, { "epoch": 0.4, "learning_rate": 6.530966585921204e-05, "loss": 2.3335, "step": 47045 }, { "epoch": 0.4, "learning_rate": 6.53032800307442e-05, "loss": 2.3093, "step": 47050 }, { "epoch": 0.4, "learning_rate": 6.529689392684442e-05, "loss": 2.2542, "step": 47055 }, { "epoch": 0.4, "learning_rate": 6.529050754762762e-05, "loss": 2.3312, "step": 47060 }, { "epoch": 0.4, "learning_rate": 6.528412089320871e-05, "loss": 2.2878, "step": 47065 }, { "epoch": 0.4, "learning_rate": 6.527773396370269e-05, "loss": 2.3398, "step": 47070 }, { "epoch": 0.4, "learning_rate": 6.527134675922448e-05, "loss": 2.374, "step": 47075 }, { "epoch": 0.4, "learning_rate": 6.526495927988903e-05, "loss": 2.4058, "step": 47080 }, { "epoch": 0.4, "learning_rate": 6.525857152581135e-05, "loss": 2.3856, "step": 47085 }, { "epoch": 0.4, "learning_rate": 6.525218349710636e-05, "loss": 2.2518, "step": 47090 }, { "epoch": 0.4, "learning_rate": 6.524579519388906e-05, "loss": 2.269, "step": 47095 }, { "epoch": 0.4, "learning_rate": 6.523940661627441e-05, "loss": 2.3993, "step": 47100 }, { "epoch": 0.4, "learning_rate": 6.523301776437743e-05, "loss": 2.2278, "step": 47105 }, { "epoch": 0.4, "learning_rate": 6.522662863831306e-05, "loss": 2.2949, "step": 47110 }, { "epoch": 0.4, "learning_rate": 6.522023923819633e-05, "loss": 2.2685, "step": 47115 }, { "epoch": 0.4, "learning_rate": 6.521384956414221e-05, "loss": 2.3115, "step": 47120 }, { "epoch": 0.4, "learning_rate": 6.520745961626572e-05, "loss": 2.2861, "step": 47125 }, { "epoch": 0.4, "learning_rate": 6.520106939468186e-05, "loss": 2.3031, "step": 47130 }, { "epoch": 0.4, "learning_rate": 6.519467889950566e-05, "loss": 2.262, "step": 47135 }, { "epoch": 0.4, "learning_rate": 6.518828813085212e-05, "loss": 2.2458, "step": 47140 }, { "epoch": 0.4, "learning_rate": 6.518189708883624e-05, "loss": 2.296, "step": 47145 }, { "epoch": 0.4, "learning_rate": 6.517550577357309e-05, "loss": 2.3131, "step": 47150 }, { "epoch": 0.4, "learning_rate": 6.51691141851777e-05, "loss": 2.2753, "step": 47155 }, { "epoch": 0.4, "learning_rate": 6.516272232376508e-05, "loss": 2.3716, "step": 47160 }, { "epoch": 0.4, "learning_rate": 6.515633018945028e-05, "loss": 2.3123, "step": 47165 }, { "epoch": 0.4, "learning_rate": 6.514993778234837e-05, "loss": 2.381, "step": 47170 }, { "epoch": 0.4, "learning_rate": 6.514354510257438e-05, "loss": 2.2494, "step": 47175 }, { "epoch": 0.4, "learning_rate": 6.513715215024336e-05, "loss": 2.3352, "step": 47180 }, { "epoch": 0.4, "learning_rate": 6.513075892547038e-05, "loss": 2.2792, "step": 47185 }, { "epoch": 0.4, "learning_rate": 6.512436542837053e-05, "loss": 2.3047, "step": 47190 }, { "epoch": 0.4, "learning_rate": 6.511797165905884e-05, "loss": 2.3281, "step": 47195 }, { "epoch": 0.4, "learning_rate": 6.511157761765043e-05, "loss": 2.369, "step": 47200 }, { "epoch": 0.4, "learning_rate": 6.510518330426034e-05, "loss": 2.3732, "step": 47205 }, { "epoch": 0.4, "learning_rate": 6.509878871900367e-05, "loss": 2.3636, "step": 47210 }, { "epoch": 0.4, "learning_rate": 6.509239386199556e-05, "loss": 2.325, "step": 47215 }, { "epoch": 0.4, "learning_rate": 6.508599873335103e-05, "loss": 2.3021, "step": 47220 }, { "epoch": 0.4, "learning_rate": 6.507960333318522e-05, "loss": 2.2316, "step": 47225 }, { "epoch": 0.4, "learning_rate": 6.507320766161323e-05, "loss": 2.2805, "step": 47230 }, { "epoch": 0.4, "learning_rate": 6.506681171875018e-05, "loss": 2.3193, "step": 47235 }, { "epoch": 0.4, "learning_rate": 6.506041550471115e-05, "loss": 2.2549, "step": 47240 }, { "epoch": 0.4, "learning_rate": 6.505401901961132e-05, "loss": 2.3892, "step": 47245 }, { "epoch": 0.4, "learning_rate": 6.504762226356576e-05, "loss": 2.3494, "step": 47250 }, { "epoch": 0.4, "learning_rate": 6.504122523668963e-05, "loss": 2.3621, "step": 47255 }, { "epoch": 0.4, "learning_rate": 6.503482793909806e-05, "loss": 2.3272, "step": 47260 }, { "epoch": 0.4, "learning_rate": 6.502843037090618e-05, "loss": 2.3599, "step": 47265 }, { "epoch": 0.4, "learning_rate": 6.502203253222916e-05, "loss": 2.3201, "step": 47270 }, { "epoch": 0.4, "learning_rate": 6.501563442318212e-05, "loss": 2.3141, "step": 47275 }, { "epoch": 0.4, "learning_rate": 6.500923604388023e-05, "loss": 2.344, "step": 47280 }, { "epoch": 0.4, "learning_rate": 6.500283739443865e-05, "loss": 2.2831, "step": 47285 }, { "epoch": 0.4, "learning_rate": 6.499643847497253e-05, "loss": 2.3954, "step": 47290 }, { "epoch": 0.4, "learning_rate": 6.499003928559706e-05, "loss": 2.378, "step": 47295 }, { "epoch": 0.4, "learning_rate": 6.49836398264274e-05, "loss": 2.3185, "step": 47300 }, { "epoch": 0.4, "learning_rate": 6.497724009757874e-05, "loss": 2.3738, "step": 47305 }, { "epoch": 0.4, "learning_rate": 6.497084009916625e-05, "loss": 2.355, "step": 47310 }, { "epoch": 0.4, "learning_rate": 6.496443983130514e-05, "loss": 2.3204, "step": 47315 }, { "epoch": 0.4, "learning_rate": 6.495803929411058e-05, "loss": 2.293, "step": 47320 }, { "epoch": 0.4, "learning_rate": 6.495163848769778e-05, "loss": 2.3416, "step": 47325 }, { "epoch": 0.4, "learning_rate": 6.494523741218194e-05, "loss": 2.3327, "step": 47330 }, { "epoch": 0.4, "learning_rate": 6.493883606767827e-05, "loss": 2.2898, "step": 47335 }, { "epoch": 0.4, "learning_rate": 6.493243445430197e-05, "loss": 2.3223, "step": 47340 }, { "epoch": 0.4, "learning_rate": 6.492603257216828e-05, "loss": 2.2993, "step": 47345 }, { "epoch": 0.4, "learning_rate": 6.491963042139242e-05, "loss": 2.2796, "step": 47350 }, { "epoch": 0.4, "learning_rate": 6.491322800208959e-05, "loss": 2.3643, "step": 47355 }, { "epoch": 0.4, "learning_rate": 6.490682531437505e-05, "loss": 2.2924, "step": 47360 }, { "epoch": 0.4, "learning_rate": 6.490042235836404e-05, "loss": 2.2968, "step": 47365 }, { "epoch": 0.4, "learning_rate": 6.489401913417178e-05, "loss": 2.3106, "step": 47370 }, { "epoch": 0.4, "learning_rate": 6.488761564191354e-05, "loss": 2.2419, "step": 47375 }, { "epoch": 0.4, "learning_rate": 6.488121188170456e-05, "loss": 2.3415, "step": 47380 }, { "epoch": 0.4, "learning_rate": 6.487480785366007e-05, "loss": 2.2949, "step": 47385 }, { "epoch": 0.4, "learning_rate": 6.486840355789537e-05, "loss": 2.3296, "step": 47390 }, { "epoch": 0.4, "learning_rate": 6.486199899452572e-05, "loss": 2.3261, "step": 47395 }, { "epoch": 0.4, "learning_rate": 6.485559416366636e-05, "loss": 2.3106, "step": 47400 }, { "epoch": 0.4, "learning_rate": 6.484918906543262e-05, "loss": 2.2507, "step": 47405 }, { "epoch": 0.4, "learning_rate": 6.484278369993973e-05, "loss": 2.3094, "step": 47410 }, { "epoch": 0.4, "learning_rate": 6.483637806730301e-05, "loss": 2.3043, "step": 47415 }, { "epoch": 0.4, "learning_rate": 6.48299721676377e-05, "loss": 2.2802, "step": 47420 }, { "epoch": 0.4, "learning_rate": 6.482356600105917e-05, "loss": 2.262, "step": 47425 }, { "epoch": 0.4, "learning_rate": 6.481715956768268e-05, "loss": 2.309, "step": 47430 }, { "epoch": 0.4, "learning_rate": 6.48107528676235e-05, "loss": 2.2246, "step": 47435 }, { "epoch": 0.4, "learning_rate": 6.4804345900997e-05, "loss": 2.2914, "step": 47440 }, { "epoch": 0.4, "learning_rate": 6.479793866791845e-05, "loss": 2.3205, "step": 47445 }, { "epoch": 0.4, "learning_rate": 6.47915311685032e-05, "loss": 2.2194, "step": 47450 }, { "epoch": 0.4, "learning_rate": 6.478512340286655e-05, "loss": 2.2938, "step": 47455 }, { "epoch": 0.4, "learning_rate": 6.477871537112384e-05, "loss": 2.2424, "step": 47460 }, { "epoch": 0.41, "learning_rate": 6.47723070733904e-05, "loss": 2.332, "step": 47465 }, { "epoch": 0.41, "learning_rate": 6.476589850978156e-05, "loss": 2.2533, "step": 47470 }, { "epoch": 0.41, "learning_rate": 6.475948968041268e-05, "loss": 2.2342, "step": 47475 }, { "epoch": 0.41, "learning_rate": 6.475308058539912e-05, "loss": 2.3333, "step": 47480 }, { "epoch": 0.41, "learning_rate": 6.474667122485618e-05, "loss": 2.2576, "step": 47485 }, { "epoch": 0.41, "learning_rate": 6.474026159889927e-05, "loss": 2.3207, "step": 47490 }, { "epoch": 0.41, "learning_rate": 6.473385170764373e-05, "loss": 2.2615, "step": 47495 }, { "epoch": 0.41, "learning_rate": 6.472744155120492e-05, "loss": 2.2539, "step": 47500 }, { "epoch": 0.41, "learning_rate": 6.472103112969823e-05, "loss": 2.3422, "step": 47505 }, { "epoch": 0.41, "learning_rate": 6.4714620443239e-05, "loss": 2.3045, "step": 47510 }, { "epoch": 0.41, "learning_rate": 6.470820949194265e-05, "loss": 2.2966, "step": 47515 }, { "epoch": 0.41, "learning_rate": 6.470179827592456e-05, "loss": 2.3686, "step": 47520 }, { "epoch": 0.41, "learning_rate": 6.469538679530011e-05, "loss": 2.3178, "step": 47525 }, { "epoch": 0.41, "learning_rate": 6.468897505018469e-05, "loss": 2.3499, "step": 47530 }, { "epoch": 0.41, "learning_rate": 6.468256304069373e-05, "loss": 2.3533, "step": 47535 }, { "epoch": 0.41, "learning_rate": 6.46761507669426e-05, "loss": 2.4631, "step": 47540 }, { "epoch": 0.41, "learning_rate": 6.466973822904671e-05, "loss": 2.3727, "step": 47545 }, { "epoch": 0.41, "learning_rate": 6.466332542712152e-05, "loss": 2.3394, "step": 47550 }, { "epoch": 0.41, "learning_rate": 6.465691236128239e-05, "loss": 2.2694, "step": 47555 }, { "epoch": 0.41, "learning_rate": 6.465049903164476e-05, "loss": 2.4134, "step": 47560 }, { "epoch": 0.41, "learning_rate": 6.464408543832407e-05, "loss": 2.3739, "step": 47565 }, { "epoch": 0.41, "learning_rate": 6.463767158143578e-05, "loss": 2.3349, "step": 47570 }, { "epoch": 0.41, "learning_rate": 6.463125746109529e-05, "loss": 2.3049, "step": 47575 }, { "epoch": 0.41, "learning_rate": 6.462484307741804e-05, "loss": 2.2719, "step": 47580 }, { "epoch": 0.41, "learning_rate": 6.461842843051949e-05, "loss": 2.3013, "step": 47585 }, { "epoch": 0.41, "learning_rate": 6.461201352051511e-05, "loss": 2.2903, "step": 47590 }, { "epoch": 0.41, "learning_rate": 6.460559834752033e-05, "loss": 2.3232, "step": 47595 }, { "epoch": 0.41, "learning_rate": 6.459918291165061e-05, "loss": 2.3037, "step": 47600 }, { "epoch": 0.41, "learning_rate": 6.459276721302146e-05, "loss": 2.329, "step": 47605 }, { "epoch": 0.41, "learning_rate": 6.458635125174828e-05, "loss": 2.3051, "step": 47610 }, { "epoch": 0.41, "learning_rate": 6.45799350279466e-05, "loss": 2.2345, "step": 47615 }, { "epoch": 0.41, "learning_rate": 6.45735185417319e-05, "loss": 2.3908, "step": 47620 }, { "epoch": 0.41, "learning_rate": 6.456710179321963e-05, "loss": 2.3617, "step": 47625 }, { "epoch": 0.41, "learning_rate": 6.45606847825253e-05, "loss": 2.325, "step": 47630 }, { "epoch": 0.41, "learning_rate": 6.455426750976443e-05, "loss": 2.3363, "step": 47635 }, { "epoch": 0.41, "learning_rate": 6.454784997505248e-05, "loss": 2.3092, "step": 47640 }, { "epoch": 0.41, "learning_rate": 6.454143217850497e-05, "loss": 2.2481, "step": 47645 }, { "epoch": 0.41, "learning_rate": 6.453501412023741e-05, "loss": 2.345, "step": 47650 }, { "epoch": 0.41, "learning_rate": 6.45285958003653e-05, "loss": 2.3073, "step": 47655 }, { "epoch": 0.41, "learning_rate": 6.45221772190042e-05, "loss": 2.3311, "step": 47660 }, { "epoch": 0.41, "learning_rate": 6.451575837626958e-05, "loss": 2.2528, "step": 47665 }, { "epoch": 0.41, "learning_rate": 6.450933927227701e-05, "loss": 2.3584, "step": 47670 }, { "epoch": 0.41, "learning_rate": 6.450291990714198e-05, "loss": 2.2929, "step": 47675 }, { "epoch": 0.41, "learning_rate": 6.449650028098007e-05, "loss": 2.2788, "step": 47680 }, { "epoch": 0.41, "learning_rate": 6.449008039390681e-05, "loss": 2.2783, "step": 47685 }, { "epoch": 0.41, "learning_rate": 6.448366024603772e-05, "loss": 2.2461, "step": 47690 }, { "epoch": 0.41, "learning_rate": 6.447723983748838e-05, "loss": 2.3185, "step": 47695 }, { "epoch": 0.41, "learning_rate": 6.447081916837434e-05, "loss": 2.2827, "step": 47700 }, { "epoch": 0.41, "learning_rate": 6.446439823881115e-05, "loss": 2.3554, "step": 47705 }, { "epoch": 0.41, "learning_rate": 6.44579770489144e-05, "loss": 2.3166, "step": 47710 }, { "epoch": 0.41, "learning_rate": 6.445155559879963e-05, "loss": 2.2743, "step": 47715 }, { "epoch": 0.41, "learning_rate": 6.444513388858243e-05, "loss": 2.3049, "step": 47720 }, { "epoch": 0.41, "learning_rate": 6.443871191837838e-05, "loss": 2.3356, "step": 47725 }, { "epoch": 0.41, "learning_rate": 6.443228968830306e-05, "loss": 2.2967, "step": 47730 }, { "epoch": 0.41, "learning_rate": 6.442586719847207e-05, "loss": 2.3136, "step": 47735 }, { "epoch": 0.41, "learning_rate": 6.441944444900098e-05, "loss": 2.2987, "step": 47740 }, { "epoch": 0.41, "learning_rate": 6.44130214400054e-05, "loss": 2.2653, "step": 47745 }, { "epoch": 0.41, "learning_rate": 6.440659817160095e-05, "loss": 2.2932, "step": 47750 }, { "epoch": 0.41, "learning_rate": 6.440017464390321e-05, "loss": 2.2501, "step": 47755 }, { "epoch": 0.41, "learning_rate": 6.439375085702782e-05, "loss": 2.308, "step": 47760 }, { "epoch": 0.41, "learning_rate": 6.438732681109036e-05, "loss": 2.3248, "step": 47765 }, { "epoch": 0.41, "learning_rate": 6.438090250620648e-05, "loss": 2.3641, "step": 47770 }, { "epoch": 0.41, "learning_rate": 6.437447794249181e-05, "loss": 2.2943, "step": 47775 }, { "epoch": 0.41, "learning_rate": 6.436805312006196e-05, "loss": 2.2664, "step": 47780 }, { "epoch": 0.41, "learning_rate": 6.436162803903258e-05, "loss": 2.2992, "step": 47785 }, { "epoch": 0.41, "learning_rate": 6.43552026995193e-05, "loss": 2.3301, "step": 47790 }, { "epoch": 0.41, "learning_rate": 6.434877710163777e-05, "loss": 2.3129, "step": 47795 }, { "epoch": 0.41, "learning_rate": 6.434235124550364e-05, "loss": 2.4242, "step": 47800 }, { "epoch": 0.41, "learning_rate": 6.433592513123257e-05, "loss": 2.265, "step": 47805 }, { "epoch": 0.41, "learning_rate": 6.432949875894021e-05, "loss": 2.2953, "step": 47810 }, { "epoch": 0.41, "learning_rate": 6.432307212874223e-05, "loss": 2.3073, "step": 47815 }, { "epoch": 0.41, "learning_rate": 6.431664524075427e-05, "loss": 2.307, "step": 47820 }, { "epoch": 0.41, "learning_rate": 6.431021809509205e-05, "loss": 2.3599, "step": 47825 }, { "epoch": 0.41, "learning_rate": 6.430379069187121e-05, "loss": 2.2446, "step": 47830 }, { "epoch": 0.41, "learning_rate": 6.429736303120744e-05, "loss": 2.3129, "step": 47835 }, { "epoch": 0.41, "learning_rate": 6.429093511321646e-05, "loss": 2.2303, "step": 47840 }, { "epoch": 0.41, "learning_rate": 6.428450693801392e-05, "loss": 2.3517, "step": 47845 }, { "epoch": 0.41, "learning_rate": 6.427807850571552e-05, "loss": 2.3345, "step": 47850 }, { "epoch": 0.41, "learning_rate": 6.427164981643697e-05, "loss": 2.2969, "step": 47855 }, { "epoch": 0.41, "learning_rate": 6.426522087029399e-05, "loss": 2.3589, "step": 47860 }, { "epoch": 0.41, "learning_rate": 6.425879166740225e-05, "loss": 2.2988, "step": 47865 }, { "epoch": 0.41, "learning_rate": 6.42523622078775e-05, "loss": 2.417, "step": 47870 }, { "epoch": 0.41, "learning_rate": 6.424593249183544e-05, "loss": 2.3213, "step": 47875 }, { "epoch": 0.41, "learning_rate": 6.423950251939181e-05, "loss": 2.3185, "step": 47880 }, { "epoch": 0.41, "learning_rate": 6.423307229066231e-05, "loss": 2.3553, "step": 47885 }, { "epoch": 0.41, "learning_rate": 6.422664180576272e-05, "loss": 2.348, "step": 47890 }, { "epoch": 0.41, "learning_rate": 6.422021106480873e-05, "loss": 2.3388, "step": 47895 }, { "epoch": 0.41, "learning_rate": 6.42137800679161e-05, "loss": 2.2422, "step": 47900 }, { "epoch": 0.41, "learning_rate": 6.420734881520059e-05, "loss": 2.3164, "step": 47905 }, { "epoch": 0.41, "learning_rate": 6.420091730677793e-05, "loss": 2.2554, "step": 47910 }, { "epoch": 0.41, "learning_rate": 6.419448554276389e-05, "loss": 2.3365, "step": 47915 }, { "epoch": 0.41, "learning_rate": 6.418805352327421e-05, "loss": 2.3333, "step": 47920 }, { "epoch": 0.41, "learning_rate": 6.418162124842467e-05, "loss": 2.3255, "step": 47925 }, { "epoch": 0.41, "learning_rate": 6.417518871833104e-05, "loss": 2.3054, "step": 47930 }, { "epoch": 0.41, "learning_rate": 6.416875593310912e-05, "loss": 2.3069, "step": 47935 }, { "epoch": 0.41, "learning_rate": 6.416232289287464e-05, "loss": 2.3229, "step": 47940 }, { "epoch": 0.41, "learning_rate": 6.41558895977434e-05, "loss": 2.3375, "step": 47945 }, { "epoch": 0.41, "learning_rate": 6.41494560478312e-05, "loss": 2.3284, "step": 47950 }, { "epoch": 0.41, "learning_rate": 6.414302224325384e-05, "loss": 2.2834, "step": 47955 }, { "epoch": 0.41, "learning_rate": 6.413658818412708e-05, "loss": 2.2825, "step": 47960 }, { "epoch": 0.41, "learning_rate": 6.413015387056676e-05, "loss": 2.3338, "step": 47965 }, { "epoch": 0.41, "learning_rate": 6.412371930268866e-05, "loss": 2.2538, "step": 47970 }, { "epoch": 0.41, "learning_rate": 6.41172844806086e-05, "loss": 2.2599, "step": 47975 }, { "epoch": 0.41, "learning_rate": 6.411084940444239e-05, "loss": 2.2827, "step": 47980 }, { "epoch": 0.41, "learning_rate": 6.410441407430587e-05, "loss": 2.3188, "step": 47985 }, { "epoch": 0.41, "learning_rate": 6.409797849031488e-05, "loss": 2.3109, "step": 47990 }, { "epoch": 0.41, "learning_rate": 6.409154265258517e-05, "loss": 2.3348, "step": 47995 }, { "epoch": 0.41, "learning_rate": 6.408510656123265e-05, "loss": 2.3632, "step": 48000 } ], "logging_steps": 5, "max_steps": 117186, "num_train_epochs": 1, "save_steps": 1000, "total_flos": 6.461462616735744e+18, "trial_name": null, "trial_params": null }