|
{ |
|
"best_metric": 0.027737604454159737, |
|
"best_model_checkpoint": "/home/cloudwalker/ASVmodel/wavlm-base_5/checkpoint-100", |
|
"epoch": 9.98109640831758, |
|
"eval_steps": 100, |
|
"global_step": 3960, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.25, |
|
"learning_rate": 7.575757575757576e-05, |
|
"loss": 0.3764, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"eval_accuracy": 0.9947673482530993, |
|
"eval_loss": 0.027737604454159737, |
|
"eval_runtime": 497.2467, |
|
"eval_samples_per_second": 49.963, |
|
"eval_steps_per_second": 24.982, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"learning_rate": 0.00015151515151515152, |
|
"loss": 0.1211, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_accuracy": 0.998108195137659, |
|
"eval_loss": 0.02966056950390339, |
|
"eval_runtime": 498.935, |
|
"eval_samples_per_second": 49.794, |
|
"eval_steps_per_second": 24.897, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.76, |
|
"learning_rate": 0.00022727272727272725, |
|
"loss": 0.2525, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 0.76, |
|
"eval_accuracy": 0.9168008372242795, |
|
"eval_loss": 1.283957839012146, |
|
"eval_runtime": 499.0992, |
|
"eval_samples_per_second": 49.778, |
|
"eval_steps_per_second": 24.889, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"learning_rate": 0.00029966329966329963, |
|
"loss": 0.784, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.34426796436309814, |
|
"eval_runtime": 499.2746, |
|
"eval_samples_per_second": 49.76, |
|
"eval_steps_per_second": 24.88, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.26, |
|
"learning_rate": 0.00029124579124579125, |
|
"loss": 0.6053, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.26, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.3957619071006775, |
|
"eval_runtime": 499.3187, |
|
"eval_samples_per_second": 49.756, |
|
"eval_steps_per_second": 24.878, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.51, |
|
"learning_rate": 0.0002828282828282828, |
|
"loss": 0.6038, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.51, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4848286509513855, |
|
"eval_runtime": 499.175, |
|
"eval_samples_per_second": 49.77, |
|
"eval_steps_per_second": 24.885, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"learning_rate": 0.0002744107744107744, |
|
"loss": 0.5996, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.39541468024253845, |
|
"eval_runtime": 499.7897, |
|
"eval_samples_per_second": 49.709, |
|
"eval_steps_per_second": 24.854, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 2.02, |
|
"learning_rate": 0.00026599326599326595, |
|
"loss": 0.5914, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 2.02, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.3970233201980591, |
|
"eval_runtime": 499.6888, |
|
"eval_samples_per_second": 49.719, |
|
"eval_steps_per_second": 24.859, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 2.27, |
|
"learning_rate": 0.00025757575757575756, |
|
"loss": 0.6077, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 2.27, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4722130298614502, |
|
"eval_runtime": 499.722, |
|
"eval_samples_per_second": 49.716, |
|
"eval_steps_per_second": 24.858, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 2.52, |
|
"learning_rate": 0.00024915824915824913, |
|
"loss": 0.5991, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.52, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.43623748421669006, |
|
"eval_runtime": 499.9532, |
|
"eval_samples_per_second": 49.693, |
|
"eval_steps_per_second": 24.846, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.77, |
|
"learning_rate": 0.00024074074074074072, |
|
"loss": 0.5813, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 2.77, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.38707101345062256, |
|
"eval_runtime": 499.9678, |
|
"eval_samples_per_second": 49.691, |
|
"eval_steps_per_second": 24.846, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 3.02, |
|
"learning_rate": 0.0002323232323232323, |
|
"loss": 0.5953, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 3.02, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.40134623646736145, |
|
"eval_runtime": 499.6897, |
|
"eval_samples_per_second": 49.719, |
|
"eval_steps_per_second": 24.859, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 3.28, |
|
"learning_rate": 0.0002239057239057239, |
|
"loss": 0.5957, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 3.28, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.46927762031555176, |
|
"eval_runtime": 499.7933, |
|
"eval_samples_per_second": 49.709, |
|
"eval_steps_per_second": 24.854, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 3.53, |
|
"learning_rate": 0.00021548821548821544, |
|
"loss": 0.5852, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 3.53, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.387899786233902, |
|
"eval_runtime": 499.9294, |
|
"eval_samples_per_second": 49.695, |
|
"eval_steps_per_second": 24.848, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 3.78, |
|
"learning_rate": 0.00020707070707070703, |
|
"loss": 0.6066, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 3.78, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.42799168825149536, |
|
"eval_runtime": 499.9481, |
|
"eval_samples_per_second": 49.693, |
|
"eval_steps_per_second": 24.847, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 4.03, |
|
"learning_rate": 0.00019865319865319862, |
|
"loss": 0.6085, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 4.03, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4358781576156616, |
|
"eval_runtime": 499.7505, |
|
"eval_samples_per_second": 49.713, |
|
"eval_steps_per_second": 24.856, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 4.28, |
|
"learning_rate": 0.00019023569023569022, |
|
"loss": 0.5944, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 4.28, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.41665858030319214, |
|
"eval_runtime": 499.6545, |
|
"eval_samples_per_second": 49.722, |
|
"eval_steps_per_second": 24.861, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 4.54, |
|
"learning_rate": 0.0001818181818181818, |
|
"loss": 0.5994, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 4.54, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4139242172241211, |
|
"eval_runtime": 499.4729, |
|
"eval_samples_per_second": 49.74, |
|
"eval_steps_per_second": 24.87, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 4.79, |
|
"learning_rate": 0.0001734006734006734, |
|
"loss": 0.5953, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 4.79, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.42556148767471313, |
|
"eval_runtime": 499.5722, |
|
"eval_samples_per_second": 49.731, |
|
"eval_steps_per_second": 24.865, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 5.04, |
|
"learning_rate": 0.000164983164983165, |
|
"loss": 0.5929, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.04, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4370674192905426, |
|
"eval_runtime": 499.6245, |
|
"eval_samples_per_second": 49.725, |
|
"eval_steps_per_second": 24.863, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.29, |
|
"learning_rate": 0.00015656565656565653, |
|
"loss": 0.6067, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 5.29, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4254782199859619, |
|
"eval_runtime": 499.8266, |
|
"eval_samples_per_second": 49.705, |
|
"eval_steps_per_second": 24.853, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 5.55, |
|
"learning_rate": 0.00014814814814814812, |
|
"loss": 0.5944, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 5.55, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.41206374764442444, |
|
"eval_runtime": 499.9874, |
|
"eval_samples_per_second": 49.689, |
|
"eval_steps_per_second": 24.845, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 5.8, |
|
"learning_rate": 0.0001397306397306397, |
|
"loss": 0.5926, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 5.8, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.42098236083984375, |
|
"eval_runtime": 499.6375, |
|
"eval_samples_per_second": 49.724, |
|
"eval_steps_per_second": 24.862, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 6.05, |
|
"learning_rate": 0.0001313131313131313, |
|
"loss": 0.594, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 6.05, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.40572819113731384, |
|
"eval_runtime": 499.6473, |
|
"eval_samples_per_second": 49.723, |
|
"eval_steps_per_second": 24.862, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 6.3, |
|
"learning_rate": 0.0001228956228956229, |
|
"loss": 0.6042, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 6.3, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.42515799403190613, |
|
"eval_runtime": 499.6019, |
|
"eval_samples_per_second": 49.728, |
|
"eval_steps_per_second": 24.864, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 6.55, |
|
"learning_rate": 0.00011447811447811446, |
|
"loss": 0.5971, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 6.55, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.395828515291214, |
|
"eval_runtime": 500.1612, |
|
"eval_samples_per_second": 49.672, |
|
"eval_steps_per_second": 24.836, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 6.81, |
|
"learning_rate": 0.00010606060606060605, |
|
"loss": 0.597, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 6.81, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.41235631704330444, |
|
"eval_runtime": 499.5804, |
|
"eval_samples_per_second": 49.73, |
|
"eval_steps_per_second": 24.865, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 7.06, |
|
"learning_rate": 9.764309764309764e-05, |
|
"loss": 0.5816, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 7.06, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.41006505489349365, |
|
"eval_runtime": 499.6536, |
|
"eval_samples_per_second": 49.722, |
|
"eval_steps_per_second": 24.861, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 7.31, |
|
"learning_rate": 8.92255892255892e-05, |
|
"loss": 0.5944, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 7.31, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.42578616738319397, |
|
"eval_runtime": 499.7205, |
|
"eval_samples_per_second": 49.716, |
|
"eval_steps_per_second": 24.858, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 7.56, |
|
"learning_rate": 8.08080808080808e-05, |
|
"loss": 0.6053, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 7.56, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4414595365524292, |
|
"eval_runtime": 499.6011, |
|
"eval_samples_per_second": 49.728, |
|
"eval_steps_per_second": 24.864, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 7.81, |
|
"learning_rate": 7.239057239057239e-05, |
|
"loss": 0.5894, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 7.81, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.40666893124580383, |
|
"eval_runtime": 499.6727, |
|
"eval_samples_per_second": 49.721, |
|
"eval_steps_per_second": 24.86, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 8.07, |
|
"learning_rate": 6.397306397306397e-05, |
|
"loss": 0.5987, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 8.07, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.41087645292282104, |
|
"eval_runtime": 499.5755, |
|
"eval_samples_per_second": 49.73, |
|
"eval_steps_per_second": 24.865, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 8.32, |
|
"learning_rate": 5.5555555555555545e-05, |
|
"loss": 0.5846, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 8.32, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4095437824726105, |
|
"eval_runtime": 499.7301, |
|
"eval_samples_per_second": 49.715, |
|
"eval_steps_per_second": 24.857, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 8.57, |
|
"learning_rate": 4.7138047138047136e-05, |
|
"loss": 0.5982, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 8.57, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.41868552565574646, |
|
"eval_runtime": 499.638, |
|
"eval_samples_per_second": 49.724, |
|
"eval_steps_per_second": 24.862, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 8.82, |
|
"learning_rate": 3.8720538720538714e-05, |
|
"loss": 0.5932, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 8.82, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4124181866645813, |
|
"eval_runtime": 499.6303, |
|
"eval_samples_per_second": 49.725, |
|
"eval_steps_per_second": 24.862, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 9.07, |
|
"learning_rate": 3.03030303030303e-05, |
|
"loss": 0.6007, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 9.07, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.42121654748916626, |
|
"eval_runtime": 499.864, |
|
"eval_samples_per_second": 49.702, |
|
"eval_steps_per_second": 24.851, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"learning_rate": 2.1885521885521884e-05, |
|
"loss": 0.6041, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4257338345050812, |
|
"eval_runtime": 499.3339, |
|
"eval_samples_per_second": 49.754, |
|
"eval_steps_per_second": 24.877, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 9.58, |
|
"learning_rate": 1.3468013468013465e-05, |
|
"loss": 0.5859, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 9.58, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4176446497440338, |
|
"eval_runtime": 499.7293, |
|
"eval_samples_per_second": 49.715, |
|
"eval_steps_per_second": 24.857, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 9.83, |
|
"learning_rate": 5.05050505050505e-06, |
|
"loss": 0.5842, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 9.83, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.41514307260513306, |
|
"eval_runtime": 499.5922, |
|
"eval_samples_per_second": 49.729, |
|
"eval_steps_per_second": 24.864, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 9.98, |
|
"step": 3960, |
|
"total_flos": 1.506420070651024e+19, |
|
"train_loss": 0.5747933341999246, |
|
"train_runtime": 22880.3496, |
|
"train_samples_per_second": 11.092, |
|
"train_steps_per_second": 0.173 |
|
} |
|
], |
|
"logging_steps": 100, |
|
"max_steps": 3960, |
|
"num_train_epochs": 10, |
|
"save_steps": 100, |
|
"total_flos": 1.506420070651024e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|