mega-ar-525m-v0.07-ultraTBfw / all_results.json
pszemraj's picture
End of training
a69dd7f verified
raw
history blame contribute delete
496 Bytes
{
"epoch": 0.9999149532682873,
"eval_accuracy": 0.5874091441969519,
"eval_loss": 1.9824198484420776,
"eval_runtime": 86.7224,
"eval_samples": 400,
"eval_samples_per_second": 4.612,
"eval_steps_per_second": 1.153,
"perplexity": 7.26029054814878,
"total_flos": 6.861219031857234e+18,
"train_loss": 2.0199434388696393,
"train_runtime": 95478.6823,
"train_samples": 1363955,
"train_samples_per_second": 14.285,
"train_steps_per_second": 0.112
}