{ "epoch": 62.0, "eval_explained_variance": 0.44826042652130127, "eval_kl_divergence": 0.41849657893180847, "eval_loss": 0.4693068563938141, "eval_mae": 0.11716800183057785, "eval_rmse": 0.15763415396213531, "eval_runtime": 70.8809, "eval_samples_per_second": 33.253, "eval_steps_per_second": 2.088, "learning_rate": 1.0000000000000002e-07, "total_flos": 6.42634409963284e+19, "train_loss": 0.466335079458891, "train_runtime": 17194.6751, "train_samples_per_second": 61.092, "train_steps_per_second": 3.821 }