{
  "epoch": 0.4,
  "eval_loss": 1.0858668088912964,
  "eval_runtime": 2658.3456,
  "eval_samples": 5000,
  "eval_samples_per_second": 9.435,
  "eval_steps_per_second": 4.718,
  "perplexity": 2.9620061996078197,
  "train_loss": 1.1317986328125,
  "train_runtime": 62833.7719,
  "train_samples": 100000,
  "train_samples_per_second": 3.183,
  "train_steps_per_second": 0.398
}