{
    "epoch": 0.9654654119273377,
    "eval_loss": 1.1314566135406494,
    "eval_runtime": 436.9279,
    "eval_samples": 14740,
    "eval_samples_per_second": 33.736,
    "eval_steps_per_second": 8.434,
    "perplexity": 3.100168960957919,
    "total_flos": 5.4436621713408e+18,
    "train_loss": 1.237374488548799,
    "train_runtime": 275308.8222,
    "train_samples": 2916726,
    "train_samples_per_second": 10.229,
    "train_steps_per_second": 0.04
}