ModernBERT2gpt2-700m-v0.1 / train_results.json
pszemraj's picture
End of training
0d68fab verified
{
"epoch": 0.9999754305791012,
"num_input_tokens_seen": 524625736,
"total_flos": 1.8734435060870185e+18,
"train_loss": 51.37127453965696,
"train_runtime": 54286.9149,
"train_samples": 651215,
"train_samples_per_second": 11.996,
"train_steps_per_second": 0.187,
"train_tokens_per_second": 9664.096
}