{ "best_metric": 0.6061349693251534, "best_model_checkpoint": "bert-finetuned-sem_eval-georgian/checkpoint-2110", "epoch": 5.0, "eval_steps": 500, "global_step": 2110, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.45023696682464454, "eval_f1": 0.5087014725568942, "eval_loss": 0.4644582271575928, "eval_roc_auc": 0.6718009478672986, "eval_runtime": 12.4119, "eval_samples_per_second": 33.999, "eval_steps_per_second": 4.27, "step": 422 }, { "epoch": 1.1848341232227488, "grad_norm": 5.8598737716674805, "learning_rate": 1.5260663507109007e-05, "loss": 0.4952, "step": 500 }, { "epoch": 2.0, "eval_accuracy": 0.523696682464455, "eval_f1": 0.5441176470588235, "eval_loss": 0.47526419162750244, "eval_roc_auc": 0.6951026856240126, "eval_runtime": 12.3933, "eval_samples_per_second": 34.051, "eval_steps_per_second": 4.277, "step": 844 }, { "epoch": 2.3696682464454977, "grad_norm": 2.699039936065674, "learning_rate": 1.052132701421801e-05, "loss": 0.3968, "step": 1000 }, { "epoch": 3.0, "eval_accuracy": 0.5616113744075829, "eval_f1": 0.6025316455696202, "eval_loss": 0.43833649158477783, "eval_roc_auc": 0.7306477093206951, "eval_runtime": 12.4177, "eval_samples_per_second": 33.984, "eval_steps_per_second": 4.268, "step": 1266 }, { "epoch": 3.5545023696682465, "grad_norm": 6.871908664703369, "learning_rate": 5.7819905213270145e-06, "loss": 0.3198, "step": 1500 }, { "epoch": 4.0, "eval_accuracy": 0.5734597156398105, "eval_f1": 0.6, "eval_loss": 0.49058645963668823, "eval_roc_auc": 0.7306477093206951, "eval_runtime": 12.4414, "eval_samples_per_second": 33.919, "eval_steps_per_second": 4.26, "step": 1688 }, { "epoch": 4.739336492890995, "grad_norm": 3.2302420139312744, "learning_rate": 1.042654028436019e-06, "loss": 0.2409, "step": 2000 }, { "epoch": 5.0, "eval_accuracy": 0.5829383886255924, "eval_f1": 0.6061349693251534, "eval_loss": 0.4966834783554077, "eval_roc_auc": 0.7349921011058452, "eval_runtime": 12.2307, "eval_samples_per_second": 34.503, "eval_steps_per_second": 4.333, "step": 2110 } ], "logging_steps": 500, "max_steps": 2110, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 4440078789120000.0, "train_batch_size": 8, "trial_name": null, "trial_params": null }