{
  "epoch": 3.0,
  "eval_accuracy": 0.8990638351115062,
  "eval_loss": 0.4193418025970459,
  "eval_runtime": 3750.3751,
  "eval_samples": 600753,
  "eval_samples_per_second": 160.185,
  "eval_steps_per_second": 5.006,
  "perplexity": 1.5209601340780117,
  "total_flos": 8.947355434270848e+18,
  "train_loss": 0.5702250743976136,
  "train_runtime": 431071.4094,
  "train_samples": 11319535,
  "train_samples_per_second": 78.777,
  "train_steps_per_second": 2.462
}