swinv2-tiny-patch4-window8-256-OT / trainer_state.json
Augusto777's picture
End of training
39ca2be verified
{
"best_metric": 0.8225806451612904,
"best_model_checkpoint": "swinv2-tiny-patch4-window8-256-OT\\checkpoint-176",
"epoch": 36.36363636363637,
"eval_steps": 500,
"global_step": 200,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.91,
"eval_accuracy": 0.08064516129032258,
"eval_loss": 8.843916893005371,
"eval_runtime": 2.8151,
"eval_samples_per_second": 22.024,
"eval_steps_per_second": 1.421,
"step": 5
},
{
"epoch": 1.82,
"learning_rate": 7.5e-05,
"loss": 8.7922,
"step": 10
},
{
"epoch": 2.0,
"eval_accuracy": 0.08064516129032258,
"eval_loss": 8.001582145690918,
"eval_runtime": 2.1045,
"eval_samples_per_second": 29.461,
"eval_steps_per_second": 1.901,
"step": 11
},
{
"epoch": 2.91,
"eval_accuracy": 0.08064516129032258,
"eval_loss": 6.000851154327393,
"eval_runtime": 2.0735,
"eval_samples_per_second": 29.901,
"eval_steps_per_second": 1.929,
"step": 16
},
{
"epoch": 3.64,
"learning_rate": 0.00015,
"loss": 6.5264,
"step": 20
},
{
"epoch": 4.0,
"eval_accuracy": 0.08064516129032258,
"eval_loss": 2.7431113719940186,
"eval_runtime": 2.1035,
"eval_samples_per_second": 29.475,
"eval_steps_per_second": 1.902,
"step": 22
},
{
"epoch": 4.91,
"eval_accuracy": 0.45161290322580644,
"eval_loss": 1.3018240928649902,
"eval_runtime": 2.0906,
"eval_samples_per_second": 29.656,
"eval_steps_per_second": 1.913,
"step": 27
},
{
"epoch": 5.45,
"learning_rate": 0.00014166666666666665,
"loss": 2.16,
"step": 30
},
{
"epoch": 6.0,
"eval_accuracy": 0.45161290322580644,
"eval_loss": 1.2696114778518677,
"eval_runtime": 2.0785,
"eval_samples_per_second": 29.829,
"eval_steps_per_second": 1.924,
"step": 33
},
{
"epoch": 6.91,
"eval_accuracy": 0.45161290322580644,
"eval_loss": 1.2057440280914307,
"eval_runtime": 2.5671,
"eval_samples_per_second": 24.152,
"eval_steps_per_second": 1.558,
"step": 38
},
{
"epoch": 7.27,
"learning_rate": 0.0001333333333333333,
"loss": 1.2876,
"step": 40
},
{
"epoch": 8.0,
"eval_accuracy": 0.45161290322580644,
"eval_loss": 1.2157402038574219,
"eval_runtime": 2.1295,
"eval_samples_per_second": 29.115,
"eval_steps_per_second": 1.878,
"step": 44
},
{
"epoch": 8.91,
"eval_accuracy": 0.45161290322580644,
"eval_loss": 1.245875597000122,
"eval_runtime": 2.141,
"eval_samples_per_second": 28.958,
"eval_steps_per_second": 1.868,
"step": 49
},
{
"epoch": 9.09,
"learning_rate": 0.000125,
"loss": 1.2456,
"step": 50
},
{
"epoch": 10.0,
"eval_accuracy": 0.45161290322580644,
"eval_loss": 1.210959792137146,
"eval_runtime": 2.181,
"eval_samples_per_second": 28.427,
"eval_steps_per_second": 1.834,
"step": 55
},
{
"epoch": 10.91,
"learning_rate": 0.00011666666666666665,
"loss": 1.1901,
"step": 60
},
{
"epoch": 10.91,
"eval_accuracy": 0.45161290322580644,
"eval_loss": 1.1861207485198975,
"eval_runtime": 2.094,
"eval_samples_per_second": 29.608,
"eval_steps_per_second": 1.91,
"step": 60
},
{
"epoch": 12.0,
"eval_accuracy": 0.46774193548387094,
"eval_loss": 1.0847262144088745,
"eval_runtime": 2.212,
"eval_samples_per_second": 28.028,
"eval_steps_per_second": 1.808,
"step": 66
},
{
"epoch": 12.73,
"learning_rate": 0.00010833333333333333,
"loss": 1.0665,
"step": 70
},
{
"epoch": 12.91,
"eval_accuracy": 0.46774193548387094,
"eval_loss": 1.0943629741668701,
"eval_runtime": 2.08,
"eval_samples_per_second": 29.808,
"eval_steps_per_second": 1.923,
"step": 71
},
{
"epoch": 14.0,
"eval_accuracy": 0.46774193548387094,
"eval_loss": 1.1853879690170288,
"eval_runtime": 2.093,
"eval_samples_per_second": 29.623,
"eval_steps_per_second": 1.911,
"step": 77
},
{
"epoch": 14.55,
"learning_rate": 9.999999999999999e-05,
"loss": 1.033,
"step": 80
},
{
"epoch": 14.91,
"eval_accuracy": 0.5,
"eval_loss": 1.025220274925232,
"eval_runtime": 2.4167,
"eval_samples_per_second": 25.655,
"eval_steps_per_second": 1.655,
"step": 82
},
{
"epoch": 16.0,
"eval_accuracy": 0.5161290322580645,
"eval_loss": 1.216417908668518,
"eval_runtime": 2.2296,
"eval_samples_per_second": 27.808,
"eval_steps_per_second": 1.794,
"step": 88
},
{
"epoch": 16.36,
"learning_rate": 9.166666666666667e-05,
"loss": 1.0323,
"step": 90
},
{
"epoch": 16.91,
"eval_accuracy": 0.5,
"eval_loss": 1.0642980337142944,
"eval_runtime": 2.199,
"eval_samples_per_second": 28.194,
"eval_steps_per_second": 1.819,
"step": 93
},
{
"epoch": 18.0,
"eval_accuracy": 0.6612903225806451,
"eval_loss": 0.9802310466766357,
"eval_runtime": 2.1395,
"eval_samples_per_second": 28.979,
"eval_steps_per_second": 1.87,
"step": 99
},
{
"epoch": 18.18,
"learning_rate": 8.333333333333333e-05,
"loss": 0.9329,
"step": 100
},
{
"epoch": 18.91,
"eval_accuracy": 0.5967741935483871,
"eval_loss": 0.9474769830703735,
"eval_runtime": 2.179,
"eval_samples_per_second": 28.453,
"eval_steps_per_second": 1.836,
"step": 104
},
{
"epoch": 20.0,
"learning_rate": 7.5e-05,
"loss": 0.8619,
"step": 110
},
{
"epoch": 20.0,
"eval_accuracy": 0.6451612903225806,
"eval_loss": 0.9114610552787781,
"eval_runtime": 2.125,
"eval_samples_per_second": 29.176,
"eval_steps_per_second": 1.882,
"step": 110
},
{
"epoch": 20.91,
"eval_accuracy": 0.6451612903225806,
"eval_loss": 0.8893528580665588,
"eval_runtime": 2.2755,
"eval_samples_per_second": 27.246,
"eval_steps_per_second": 1.758,
"step": 115
},
{
"epoch": 21.82,
"learning_rate": 6.666666666666666e-05,
"loss": 0.8019,
"step": 120
},
{
"epoch": 22.0,
"eval_accuracy": 0.6935483870967742,
"eval_loss": 0.8276461958885193,
"eval_runtime": 2.182,
"eval_samples_per_second": 28.414,
"eval_steps_per_second": 1.833,
"step": 121
},
{
"epoch": 22.91,
"eval_accuracy": 0.6774193548387096,
"eval_loss": 0.8156123757362366,
"eval_runtime": 2.1835,
"eval_samples_per_second": 28.394,
"eval_steps_per_second": 1.832,
"step": 126
},
{
"epoch": 23.64,
"learning_rate": 5.8333333333333326e-05,
"loss": 0.7675,
"step": 130
},
{
"epoch": 24.0,
"eval_accuracy": 0.6290322580645161,
"eval_loss": 0.7928251624107361,
"eval_runtime": 2.7367,
"eval_samples_per_second": 22.655,
"eval_steps_per_second": 1.462,
"step": 132
},
{
"epoch": 24.91,
"eval_accuracy": 0.7419354838709677,
"eval_loss": 0.7163397669792175,
"eval_runtime": 2.3511,
"eval_samples_per_second": 26.371,
"eval_steps_per_second": 1.701,
"step": 137
},
{
"epoch": 25.45,
"learning_rate": 4.9999999999999996e-05,
"loss": 0.6762,
"step": 140
},
{
"epoch": 26.0,
"eval_accuracy": 0.6774193548387096,
"eval_loss": 0.7387820482254028,
"eval_runtime": 2.261,
"eval_samples_per_second": 27.421,
"eval_steps_per_second": 1.769,
"step": 143
},
{
"epoch": 26.91,
"eval_accuracy": 0.7580645161290323,
"eval_loss": 0.6518718004226685,
"eval_runtime": 2.2715,
"eval_samples_per_second": 27.294,
"eval_steps_per_second": 1.761,
"step": 148
},
{
"epoch": 27.27,
"learning_rate": 4.1666666666666665e-05,
"loss": 0.6771,
"step": 150
},
{
"epoch": 28.0,
"eval_accuracy": 0.7419354838709677,
"eval_loss": 0.6709696054458618,
"eval_runtime": 2.6851,
"eval_samples_per_second": 23.09,
"eval_steps_per_second": 1.49,
"step": 154
},
{
"epoch": 28.91,
"eval_accuracy": 0.7580645161290323,
"eval_loss": 0.6073653697967529,
"eval_runtime": 2.3635,
"eval_samples_per_second": 26.232,
"eval_steps_per_second": 1.692,
"step": 159
},
{
"epoch": 29.09,
"learning_rate": 3.333333333333333e-05,
"loss": 0.6424,
"step": 160
},
{
"epoch": 30.0,
"eval_accuracy": 0.7258064516129032,
"eval_loss": 0.672946035861969,
"eval_runtime": 2.2598,
"eval_samples_per_second": 27.436,
"eval_steps_per_second": 1.77,
"step": 165
},
{
"epoch": 30.91,
"learning_rate": 2.4999999999999998e-05,
"loss": 0.6139,
"step": 170
},
{
"epoch": 30.91,
"eval_accuracy": 0.7903225806451613,
"eval_loss": 0.5744480490684509,
"eval_runtime": 2.189,
"eval_samples_per_second": 28.323,
"eval_steps_per_second": 1.827,
"step": 170
},
{
"epoch": 32.0,
"eval_accuracy": 0.8225806451612904,
"eval_loss": 0.6192476749420166,
"eval_runtime": 2.142,
"eval_samples_per_second": 28.945,
"eval_steps_per_second": 1.867,
"step": 176
},
{
"epoch": 32.73,
"learning_rate": 1.6666666666666664e-05,
"loss": 0.5713,
"step": 180
},
{
"epoch": 32.91,
"eval_accuracy": 0.7903225806451613,
"eval_loss": 0.6452686190605164,
"eval_runtime": 2.1495,
"eval_samples_per_second": 28.844,
"eval_steps_per_second": 1.861,
"step": 181
},
{
"epoch": 34.0,
"eval_accuracy": 0.7903225806451613,
"eval_loss": 0.6392035484313965,
"eval_runtime": 2.1965,
"eval_samples_per_second": 28.226,
"eval_steps_per_second": 1.821,
"step": 187
},
{
"epoch": 34.55,
"learning_rate": 8.333333333333332e-06,
"loss": 0.5462,
"step": 190
},
{
"epoch": 34.91,
"eval_accuracy": 0.8225806451612904,
"eval_loss": 0.5955818295478821,
"eval_runtime": 2.247,
"eval_samples_per_second": 27.592,
"eval_steps_per_second": 1.78,
"step": 192
},
{
"epoch": 36.0,
"eval_accuracy": 0.8225806451612904,
"eval_loss": 0.5892814993858337,
"eval_runtime": 2.5326,
"eval_samples_per_second": 24.481,
"eval_steps_per_second": 1.579,
"step": 198
},
{
"epoch": 36.36,
"learning_rate": 0.0,
"loss": 0.5393,
"step": 200
},
{
"epoch": 36.36,
"eval_accuracy": 0.8225806451612904,
"eval_loss": 0.5898378491401672,
"eval_runtime": 2.2395,
"eval_samples_per_second": 27.685,
"eval_steps_per_second": 1.786,
"step": 200
},
{
"epoch": 36.36,
"step": 200,
"total_flos": 4.141200256480051e+17,
"train_loss": 1.5982162952423096,
"train_runtime": 635.1405,
"train_samples_per_second": 22.042,
"train_steps_per_second": 0.315
}
],
"logging_steps": 10,
"max_steps": 200,
"num_input_tokens_seen": 0,
"num_train_epochs": 40,
"save_steps": 500,
"total_flos": 4.141200256480051e+17,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}