{
  "epoch": 1.0,
  "eval_loss": 1.9246433973312378,
  "eval_runtime": 282.1545,
  "eval_samples": 100000,
  "eval_samples_per_second": 354.416,
  "eval_steps_per_second": 44.302,
  "perplexity": 6.852704537407429,
  "train_loss": 1.8196985500431868,
  "train_runtime": 434920.5349,
  "train_samples": 64750662,
  "train_samples_per_second": 148.879,
  "train_steps_per_second": 0.62
}