|
{ |
|
"best_metric": 0.30745795369148254, |
|
"best_model_checkpoint": "asd_pronunciation_w2v_xlsr-reg/checkpoint-99", |
|
"epoch": 49.977777777777774, |
|
"global_step": 550, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.98, |
|
"eval_loss": 0.8269791603088379, |
|
"eval_mse": 0.8274638056755066, |
|
"eval_runtime": 67.3404, |
|
"eval_samples_per_second": 31.497, |
|
"eval_steps_per_second": 0.995, |
|
"step": 11 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"eval_loss": 0.4631172716617584, |
|
"eval_mse": 0.46300947666168213, |
|
"eval_runtime": 67.2163, |
|
"eval_samples_per_second": 31.555, |
|
"eval_steps_per_second": 0.997, |
|
"step": 22 |
|
}, |
|
{ |
|
"epoch": 2.98, |
|
"eval_loss": 0.351409912109375, |
|
"eval_mse": 0.3515050709247589, |
|
"eval_runtime": 67.5563, |
|
"eval_samples_per_second": 31.396, |
|
"eval_steps_per_second": 0.992, |
|
"step": 33 |
|
}, |
|
{ |
|
"epoch": 3.98, |
|
"eval_loss": 0.3585782051086426, |
|
"eval_mse": 0.35852691531181335, |
|
"eval_runtime": 69.7976, |
|
"eval_samples_per_second": 30.388, |
|
"eval_steps_per_second": 0.96, |
|
"step": 44 |
|
}, |
|
{ |
|
"epoch": 4.98, |
|
"eval_loss": 0.4412296712398529, |
|
"eval_mse": 0.4412075877189636, |
|
"eval_runtime": 79.1138, |
|
"eval_samples_per_second": 26.809, |
|
"eval_steps_per_second": 0.847, |
|
"step": 55 |
|
}, |
|
{ |
|
"epoch": 5.98, |
|
"eval_loss": 0.430486798286438, |
|
"eval_mse": 0.43049314618110657, |
|
"eval_runtime": 72.5547, |
|
"eval_samples_per_second": 29.233, |
|
"eval_steps_per_second": 0.923, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 6.98, |
|
"eval_loss": 0.42916765809059143, |
|
"eval_mse": 0.4291659891605377, |
|
"eval_runtime": 95.5528, |
|
"eval_samples_per_second": 22.197, |
|
"eval_steps_per_second": 0.701, |
|
"step": 77 |
|
}, |
|
{ |
|
"epoch": 7.98, |
|
"eval_loss": 0.4343053996562958, |
|
"eval_mse": 0.43428245186805725, |
|
"eval_runtime": 66.5007, |
|
"eval_samples_per_second": 31.894, |
|
"eval_steps_per_second": 1.008, |
|
"step": 88 |
|
}, |
|
{ |
|
"epoch": 8.98, |
|
"eval_loss": 0.30745795369148254, |
|
"eval_mse": 0.3074318766593933, |
|
"eval_runtime": 66.2359, |
|
"eval_samples_per_second": 32.022, |
|
"eval_steps_per_second": 1.012, |
|
"step": 99 |
|
}, |
|
{ |
|
"epoch": 9.98, |
|
"eval_loss": 0.42939332127571106, |
|
"eval_mse": 0.4293690323829651, |
|
"eval_runtime": 66.3865, |
|
"eval_samples_per_second": 31.949, |
|
"eval_steps_per_second": 1.009, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 10.98, |
|
"eval_loss": 0.3727492094039917, |
|
"eval_mse": 0.3727482855319977, |
|
"eval_runtime": 66.8857, |
|
"eval_samples_per_second": 31.711, |
|
"eval_steps_per_second": 1.002, |
|
"step": 121 |
|
}, |
|
{ |
|
"epoch": 11.98, |
|
"eval_loss": 0.42278197407722473, |
|
"eval_mse": 0.42277276515960693, |
|
"eval_runtime": 65.5197, |
|
"eval_samples_per_second": 32.372, |
|
"eval_steps_per_second": 1.023, |
|
"step": 132 |
|
}, |
|
{ |
|
"epoch": 12.98, |
|
"eval_loss": 0.4014572203159332, |
|
"eval_mse": 0.40141549706459045, |
|
"eval_runtime": 65.6627, |
|
"eval_samples_per_second": 32.301, |
|
"eval_steps_per_second": 1.02, |
|
"step": 143 |
|
}, |
|
{ |
|
"epoch": 13.98, |
|
"eval_loss": 0.37818050384521484, |
|
"eval_mse": 0.37818947434425354, |
|
"eval_runtime": 66.0031, |
|
"eval_samples_per_second": 32.135, |
|
"eval_steps_per_second": 1.015, |
|
"step": 154 |
|
}, |
|
{ |
|
"epoch": 14.98, |
|
"eval_loss": 0.4358225166797638, |
|
"eval_mse": 0.43578916788101196, |
|
"eval_runtime": 65.7571, |
|
"eval_samples_per_second": 32.255, |
|
"eval_steps_per_second": 1.019, |
|
"step": 165 |
|
}, |
|
{ |
|
"epoch": 15.98, |
|
"eval_loss": 0.36039263010025024, |
|
"eval_mse": 0.3603877127170563, |
|
"eval_runtime": 67.6323, |
|
"eval_samples_per_second": 31.361, |
|
"eval_steps_per_second": 0.991, |
|
"step": 176 |
|
}, |
|
{ |
|
"epoch": 16.98, |
|
"eval_loss": 0.40446653962135315, |
|
"eval_mse": 0.40447959303855896, |
|
"eval_runtime": 66.1021, |
|
"eval_samples_per_second": 32.087, |
|
"eval_steps_per_second": 1.014, |
|
"step": 187 |
|
}, |
|
{ |
|
"epoch": 17.98, |
|
"eval_loss": 0.3638509213924408, |
|
"eval_mse": 0.3638397455215454, |
|
"eval_runtime": 66.1765, |
|
"eval_samples_per_second": 32.051, |
|
"eval_steps_per_second": 1.012, |
|
"step": 198 |
|
}, |
|
{ |
|
"epoch": 18.98, |
|
"eval_loss": 0.4001483619213104, |
|
"eval_mse": 0.400104284286499, |
|
"eval_runtime": 66.5235, |
|
"eval_samples_per_second": 31.883, |
|
"eval_steps_per_second": 1.007, |
|
"step": 209 |
|
}, |
|
{ |
|
"epoch": 19.98, |
|
"eval_loss": 0.3836788535118103, |
|
"eval_mse": 0.38362112641334534, |
|
"eval_runtime": 65.5397, |
|
"eval_samples_per_second": 32.362, |
|
"eval_steps_per_second": 1.022, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 20.98, |
|
"eval_loss": 0.3813478350639343, |
|
"eval_mse": 0.3813202679157257, |
|
"eval_runtime": 67.0847, |
|
"eval_samples_per_second": 31.617, |
|
"eval_steps_per_second": 0.999, |
|
"step": 231 |
|
}, |
|
{ |
|
"epoch": 21.98, |
|
"eval_loss": 0.3911483883857727, |
|
"eval_mse": 0.39113306999206543, |
|
"eval_runtime": 66.4329, |
|
"eval_samples_per_second": 31.927, |
|
"eval_steps_per_second": 1.009, |
|
"step": 242 |
|
}, |
|
{ |
|
"epoch": 22.98, |
|
"eval_loss": 0.43994417786598206, |
|
"eval_mse": 0.4399244487285614, |
|
"eval_runtime": 66.1358, |
|
"eval_samples_per_second": 32.07, |
|
"eval_steps_per_second": 1.013, |
|
"step": 253 |
|
}, |
|
{ |
|
"epoch": 23.98, |
|
"eval_loss": 0.4228975772857666, |
|
"eval_mse": 0.42288002371788025, |
|
"eval_runtime": 66.6907, |
|
"eval_samples_per_second": 31.804, |
|
"eval_steps_per_second": 1.005, |
|
"step": 264 |
|
}, |
|
{ |
|
"epoch": 24.98, |
|
"eval_loss": 0.4192221462726593, |
|
"eval_mse": 0.4191807508468628, |
|
"eval_runtime": 65.8241, |
|
"eval_samples_per_second": 32.222, |
|
"eval_steps_per_second": 1.018, |
|
"step": 275 |
|
}, |
|
{ |
|
"epoch": 25.98, |
|
"eval_loss": 0.40975797176361084, |
|
"eval_mse": 0.4097472131252289, |
|
"eval_runtime": 67.5766, |
|
"eval_samples_per_second": 31.387, |
|
"eval_steps_per_second": 0.991, |
|
"step": 286 |
|
}, |
|
{ |
|
"epoch": 26.98, |
|
"eval_loss": 0.3760901093482971, |
|
"eval_mse": 0.37607377767562866, |
|
"eval_runtime": 65.9157, |
|
"eval_samples_per_second": 32.177, |
|
"eval_steps_per_second": 1.016, |
|
"step": 297 |
|
}, |
|
{ |
|
"epoch": 27.98, |
|
"eval_loss": 0.389096200466156, |
|
"eval_mse": 0.3890584111213684, |
|
"eval_runtime": 65.956, |
|
"eval_samples_per_second": 32.158, |
|
"eval_steps_per_second": 1.016, |
|
"step": 308 |
|
}, |
|
{ |
|
"epoch": 28.98, |
|
"eval_loss": 0.4243176579475403, |
|
"eval_mse": 0.4242975115776062, |
|
"eval_runtime": 66.4794, |
|
"eval_samples_per_second": 31.905, |
|
"eval_steps_per_second": 1.008, |
|
"step": 319 |
|
}, |
|
{ |
|
"epoch": 29.98, |
|
"eval_loss": 0.4235914349555969, |
|
"eval_mse": 0.4235744774341583, |
|
"eval_runtime": 66.2277, |
|
"eval_samples_per_second": 32.026, |
|
"eval_steps_per_second": 1.012, |
|
"step": 330 |
|
}, |
|
{ |
|
"epoch": 30.98, |
|
"eval_loss": 0.4235081076622009, |
|
"eval_mse": 0.42347782850265503, |
|
"eval_runtime": 66.6381, |
|
"eval_samples_per_second": 31.829, |
|
"eval_steps_per_second": 1.005, |
|
"step": 341 |
|
}, |
|
{ |
|
"epoch": 31.98, |
|
"eval_loss": 0.4236636757850647, |
|
"eval_mse": 0.4236546456813812, |
|
"eval_runtime": 65.6032, |
|
"eval_samples_per_second": 32.331, |
|
"eval_steps_per_second": 1.021, |
|
"step": 352 |
|
}, |
|
{ |
|
"epoch": 32.98, |
|
"eval_loss": 0.4269878566265106, |
|
"eval_mse": 0.4269687533378601, |
|
"eval_runtime": 65.9665, |
|
"eval_samples_per_second": 32.153, |
|
"eval_steps_per_second": 1.016, |
|
"step": 363 |
|
}, |
|
{ |
|
"epoch": 33.98, |
|
"eval_loss": 0.39142194390296936, |
|
"eval_mse": 0.3913804888725281, |
|
"eval_runtime": 66.6217, |
|
"eval_samples_per_second": 31.836, |
|
"eval_steps_per_second": 1.006, |
|
"step": 374 |
|
}, |
|
{ |
|
"epoch": 34.98, |
|
"eval_loss": 0.3899790942668915, |
|
"eval_mse": 0.38995301723480225, |
|
"eval_runtime": 65.771, |
|
"eval_samples_per_second": 32.248, |
|
"eval_steps_per_second": 1.019, |
|
"step": 385 |
|
}, |
|
{ |
|
"epoch": 35.98, |
|
"eval_loss": 0.4031297564506531, |
|
"eval_mse": 0.4031302034854889, |
|
"eval_runtime": 68.033, |
|
"eval_samples_per_second": 31.176, |
|
"eval_steps_per_second": 0.985, |
|
"step": 396 |
|
}, |
|
{ |
|
"epoch": 36.98, |
|
"eval_loss": 0.373826265335083, |
|
"eval_mse": 0.3738201856613159, |
|
"eval_runtime": 66.1644, |
|
"eval_samples_per_second": 32.057, |
|
"eval_steps_per_second": 1.013, |
|
"step": 407 |
|
}, |
|
{ |
|
"epoch": 37.98, |
|
"eval_loss": 0.37409740686416626, |
|
"eval_mse": 0.37407544255256653, |
|
"eval_runtime": 65.7007, |
|
"eval_samples_per_second": 32.283, |
|
"eval_steps_per_second": 1.02, |
|
"step": 418 |
|
}, |
|
{ |
|
"epoch": 38.98, |
|
"eval_loss": 0.41098639369010925, |
|
"eval_mse": 0.4109634459018707, |
|
"eval_runtime": 65.8334, |
|
"eval_samples_per_second": 32.218, |
|
"eval_steps_per_second": 1.018, |
|
"step": 429 |
|
}, |
|
{ |
|
"epoch": 39.98, |
|
"eval_loss": 0.38580140471458435, |
|
"eval_mse": 0.3857785165309906, |
|
"eval_runtime": 65.912, |
|
"eval_samples_per_second": 32.179, |
|
"eval_steps_per_second": 1.017, |
|
"step": 440 |
|
}, |
|
{ |
|
"epoch": 40.98, |
|
"eval_loss": 0.40168315172195435, |
|
"eval_mse": 0.4016563296318054, |
|
"eval_runtime": 67.322, |
|
"eval_samples_per_second": 31.505, |
|
"eval_steps_per_second": 0.995, |
|
"step": 451 |
|
}, |
|
{ |
|
"epoch": 41.98, |
|
"eval_loss": 0.3875749111175537, |
|
"eval_mse": 0.3875587284564972, |
|
"eval_runtime": 65.9445, |
|
"eval_samples_per_second": 32.163, |
|
"eval_steps_per_second": 1.016, |
|
"step": 462 |
|
}, |
|
{ |
|
"epoch": 42.98, |
|
"eval_loss": 0.401607483625412, |
|
"eval_mse": 0.4015834629535675, |
|
"eval_runtime": 66.235, |
|
"eval_samples_per_second": 32.022, |
|
"eval_steps_per_second": 1.012, |
|
"step": 473 |
|
}, |
|
{ |
|
"epoch": 43.98, |
|
"eval_loss": 0.3939042389392853, |
|
"eval_mse": 0.3938945233821869, |
|
"eval_runtime": 66.0054, |
|
"eval_samples_per_second": 32.134, |
|
"eval_steps_per_second": 1.015, |
|
"step": 484 |
|
}, |
|
{ |
|
"epoch": 44.98, |
|
"eval_loss": 0.40803390741348267, |
|
"eval_mse": 0.40802931785583496, |
|
"eval_runtime": 66.0842, |
|
"eval_samples_per_second": 32.095, |
|
"eval_steps_per_second": 1.014, |
|
"step": 495 |
|
}, |
|
{ |
|
"epoch": 45.44, |
|
"learning_rate": 3.03030303030303e-05, |
|
"loss": 0.4034, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 45.98, |
|
"eval_loss": 0.38819119334220886, |
|
"eval_mse": 0.38818415999412537, |
|
"eval_runtime": 67.7262, |
|
"eval_samples_per_second": 31.317, |
|
"eval_steps_per_second": 0.989, |
|
"step": 506 |
|
}, |
|
{ |
|
"epoch": 46.98, |
|
"eval_loss": 0.4062108099460602, |
|
"eval_mse": 0.4061962068080902, |
|
"eval_runtime": 63.6037, |
|
"eval_samples_per_second": 33.347, |
|
"eval_steps_per_second": 1.053, |
|
"step": 517 |
|
}, |
|
{ |
|
"epoch": 47.98, |
|
"eval_loss": 0.38834279775619507, |
|
"eval_mse": 0.38832658529281616, |
|
"eval_runtime": 64.2256, |
|
"eval_samples_per_second": 33.024, |
|
"eval_steps_per_second": 1.043, |
|
"step": 528 |
|
}, |
|
{ |
|
"epoch": 48.98, |
|
"eval_loss": 0.3969601094722748, |
|
"eval_mse": 0.3969435691833496, |
|
"eval_runtime": 63.6409, |
|
"eval_samples_per_second": 33.328, |
|
"eval_steps_per_second": 1.053, |
|
"step": 539 |
|
}, |
|
{ |
|
"epoch": 49.98, |
|
"eval_loss": 0.3963707685470581, |
|
"eval_mse": 0.3963526785373688, |
|
"eval_runtime": 63.4841, |
|
"eval_samples_per_second": 33.41, |
|
"eval_steps_per_second": 1.055, |
|
"step": 550 |
|
} |
|
], |
|
"max_steps": 550, |
|
"num_train_epochs": 50, |
|
"total_flos": 1.603121844978697e+20, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|