{
  "epoch": 62.0,
  "eval_explained_variance": 0.44826042652130127,
  "eval_kl_divergence": 0.41849657893180847,
  "eval_loss": 0.4693068563938141,
  "eval_mae": 0.11716800183057785,
  "eval_rmse": 0.15763415396213531,
  "eval_runtime": 70.8809,
  "eval_samples_per_second": 33.253,
  "eval_steps_per_second": 2.088,
  "learning_rate": 1.0000000000000002e-07,
  "total_flos": 6.42634409963284e+19,
  "train_loss": 0.466335079458891,
  "train_runtime": 17194.6751,
  "train_samples_per_second": 61.092,
  "train_steps_per_second": 3.821
}