{ "best_metric": 0.29358136653900146, "best_model_checkpoint": "./drive/Shareddrives/CS198-Drones/training_output/vit-base-patch16-224_rice-leaf-disease-augmented-v2_fft/checkpoint-750", "epoch": 19.0, "eval_steps": 500, "global_step": 2375, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 3.8496286869049072, "learning_rate": 5e-06, "loss": 1.9482, "step": 125 }, { "epoch": 1.0, "eval_accuracy": 0.5684523809523809, "eval_loss": 1.5012105703353882, "eval_runtime": 11.0652, "eval_samples_per_second": 30.365, "eval_steps_per_second": 0.542, "step": 125 }, { "epoch": 2.0, "grad_norm": 3.772235155105591, "learning_rate": 1e-05, "loss": 0.9894, "step": 250 }, { "epoch": 2.0, "eval_accuracy": 0.7976190476190477, "eval_loss": 0.6444453001022339, "eval_runtime": 11.0129, "eval_samples_per_second": 30.51, "eval_steps_per_second": 0.545, "step": 250 }, { "epoch": 3.0, "grad_norm": 1.4745649099349976, "learning_rate": 8.83022221559489e-06, "loss": 0.3321, "step": 375 }, { "epoch": 3.0, "eval_accuracy": 0.8958333333333334, "eval_loss": 0.3858731687068939, "eval_runtime": 10.958, "eval_samples_per_second": 30.663, "eval_steps_per_second": 0.548, "step": 375 }, { "epoch": 4.0, "grad_norm": 1.1253288984298706, "learning_rate": 5.8682408883346535e-06, "loss": 0.1115, "step": 500 }, { "epoch": 4.0, "eval_accuracy": 0.9107142857142857, "eval_loss": 0.3080737888813019, "eval_runtime": 10.9888, "eval_samples_per_second": 30.577, "eval_steps_per_second": 0.546, "step": 500 }, { "epoch": 5.0, "grad_norm": 0.3589422404766083, "learning_rate": 2.5000000000000015e-06, "loss": 0.0387, "step": 625 }, { "epoch": 5.0, "eval_accuracy": 0.9136904761904762, "eval_loss": 0.2979942262172699, "eval_runtime": 11.1535, "eval_samples_per_second": 30.125, "eval_steps_per_second": 0.538, "step": 625 }, { "epoch": 6.0, "grad_norm": 0.2502361536026001, "learning_rate": 3.015368960704584e-07, "loss": 0.0204, "step": 750 }, { "epoch": 6.0, "eval_accuracy": 0.9136904761904762, "eval_loss": 0.29358136653900146, "eval_runtime": 11.1371, "eval_samples_per_second": 30.169, "eval_steps_per_second": 0.539, "step": 750 }, { "epoch": 7.0, "grad_norm": 0.5141955018043518, "learning_rate": 9.698463103929542e-06, "loss": 0.0169, "step": 875 }, { "epoch": 7.0, "eval_accuracy": 0.9196428571428571, "eval_loss": 0.2952845096588135, "eval_runtime": 11.0115, "eval_samples_per_second": 30.513, "eval_steps_per_second": 0.545, "step": 875 }, { "epoch": 8.0, "grad_norm": 0.1391526609659195, "learning_rate": 7.500000000000003e-06, "loss": 0.0078, "step": 1000 }, { "epoch": 8.0, "eval_accuracy": 0.9226190476190477, "eval_loss": 0.3067362606525421, "eval_runtime": 11.2875, "eval_samples_per_second": 29.767, "eval_steps_per_second": 0.532, "step": 1000 }, { "epoch": 9.0, "grad_norm": 0.06930585205554962, "learning_rate": 4.131759111665349e-06, "loss": 0.0034, "step": 1125 }, { "epoch": 9.0, "eval_accuracy": 0.9285714285714286, "eval_loss": 0.3087221682071686, "eval_runtime": 10.9679, "eval_samples_per_second": 30.635, "eval_steps_per_second": 0.547, "step": 1125 }, { "epoch": 10.0, "grad_norm": 0.09097771346569061, "learning_rate": 1.1697777844051105e-06, "loss": 0.0025, "step": 1250 }, { "epoch": 10.0, "eval_accuracy": 0.9196428571428571, "eval_loss": 0.3138602674007416, "eval_runtime": 10.3394, "eval_samples_per_second": 32.497, "eval_steps_per_second": 0.58, "step": 1250 }, { "epoch": 11.0, "grad_norm": 0.06938016414642334, "learning_rate": 1e-05, "loss": 0.0023, "step": 1375 }, { "epoch": 11.0, "eval_accuracy": 0.9196428571428571, "eval_loss": 0.3141930401325226, "eval_runtime": 10.7534, "eval_samples_per_second": 31.246, "eval_steps_per_second": 0.558, "step": 1375 }, { "epoch": 12.0, "grad_norm": 0.04166670888662338, "learning_rate": 8.83022221559489e-06, "loss": 0.0019, "step": 1500 }, { "epoch": 12.0, "eval_accuracy": 0.9196428571428571, "eval_loss": 0.3288079798221588, "eval_runtime": 10.8781, "eval_samples_per_second": 30.888, "eval_steps_per_second": 0.552, "step": 1500 }, { "epoch": 13.0, "grad_norm": 0.04881810024380684, "learning_rate": 5.86824088833465e-06, "loss": 0.0013, "step": 1625 }, { "epoch": 13.0, "eval_accuracy": 0.9196428571428571, "eval_loss": 0.33594179153442383, "eval_runtime": 11.2397, "eval_samples_per_second": 29.894, "eval_steps_per_second": 0.534, "step": 1625 }, { "epoch": 14.0, "grad_norm": 0.02085023745894432, "learning_rate": 2.5000000000000036e-06, "loss": 0.001, "step": 1750 }, { "epoch": 14.0, "eval_accuracy": 0.9226190476190477, "eval_loss": 0.34129947423934937, "eval_runtime": 11.0362, "eval_samples_per_second": 30.445, "eval_steps_per_second": 0.544, "step": 1750 }, { "epoch": 15.0, "grad_norm": 0.028393927961587906, "learning_rate": 3.015368960704584e-07, "loss": 0.0009, "step": 1875 }, { "epoch": 15.0, "eval_accuracy": 0.9226190476190477, "eval_loss": 0.3424765169620514, "eval_runtime": 10.9571, "eval_samples_per_second": 30.665, "eval_steps_per_second": 0.548, "step": 1875 }, { "epoch": 16.0, "grad_norm": 0.018229400739073753, "learning_rate": 9.698463103929542e-06, "loss": 0.0009, "step": 2000 }, { "epoch": 16.0, "eval_accuracy": 0.9226190476190477, "eval_loss": 0.3481498956680298, "eval_runtime": 11.0764, "eval_samples_per_second": 30.335, "eval_steps_per_second": 0.542, "step": 2000 }, { "epoch": 17.0, "grad_norm": 0.018818996846675873, "learning_rate": 7.499999999999999e-06, "loss": 0.0007, "step": 2125 }, { "epoch": 17.0, "eval_accuracy": 0.9226190476190477, "eval_loss": 0.35712891817092896, "eval_runtime": 10.3576, "eval_samples_per_second": 32.44, "eval_steps_per_second": 0.579, "step": 2125 }, { "epoch": 18.0, "grad_norm": 0.021823769435286522, "learning_rate": 4.131759111665352e-06, "loss": 0.0006, "step": 2250 }, { "epoch": 18.0, "eval_accuracy": 0.9196428571428571, "eval_loss": 0.36197924613952637, "eval_runtime": 11.0713, "eval_samples_per_second": 30.349, "eval_steps_per_second": 0.542, "step": 2250 }, { "epoch": 19.0, "grad_norm": 0.01798320934176445, "learning_rate": 0.0, "loss": 0.0005, "step": 2375 }, { "epoch": 19.0, "eval_accuracy": 0.9226190476190477, "eval_loss": 0.36210647225379944, "eval_runtime": 21.033, "eval_samples_per_second": 15.975, "eval_steps_per_second": 0.285, "step": 2375 }, { "epoch": 19.0, "step": 2375, "total_flos": 1.1779415838425088e+19, "train_loss": 2.718197358281989e-05, "train_runtime": 389.5228, "train_samples_per_second": 390.221, "train_steps_per_second": 6.097 } ], "logging_steps": 500, "max_steps": 2375, "num_input_tokens_seen": 0, "num_train_epochs": 19, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1.1779415838425088e+19, "train_batch_size": 64, "trial_name": null, "trial_params": null }