{ | |
"epoch": 0.9999493031929397, | |
"eval_loss": 1.1348882913589478, | |
"eval_runtime": 428.9305, | |
"eval_samples": 14447, | |
"eval_samples_per_second": 33.681, | |
"eval_steps_per_second": 8.421, | |
"perplexity": 3.110826017347737, | |
"total_flos": 5.643098158163558e+18, | |
"train_loss": 1.1702608942389645, | |
"train_runtime": 336251.1326, | |
"train_samples": 2919315, | |
"train_samples_per_second": 8.682, | |
"train_steps_per_second": 0.034 | |
} |