{
"epoch": 1.0,
"eval_loss": 2.0893874168395996,
"eval_runtime": 32.9539,
"eval_samples_per_second": 13.716,
"eval_steps_per_second": 1.73,
"perplexity": 8.079963998077499,
"total_flos": 5.34201935659008e+16,
"train_loss": 2.1967257285604673,
"train_runtime": 922.9625,
"train_samples_per_second": 6.37,
"train_steps_per_second": 3.185
}