{ "name": "root", "gauges": { "Huggy.Policy.Entropy.mean": { "value": 1.4131202697753906, "min": 1.413079857826233, "max": 1.423565149307251, "count": 40 }, "Huggy.Policy.Entropy.sum": { "value": 72084.6796875, "min": 51755.68359375, "max": 269279.84375, "count": 40 }, "Huggy.Environment.EpisodeLength.mean": { "value": 105.78924731182796, "min": 104.71789473684211, "max": 376.8731343283582, "count": 40 }, "Huggy.Environment.EpisodeLength.sum": { "value": 49192.0, "min": 49025.0, "max": 50501.0, "count": 40 }, "Huggy.Step.mean": { "value": 1999890.0, "min": 49931.0, "max": 1999890.0, "count": 40 }, "Huggy.Step.sum": { "value": 1999890.0, "min": 49931.0, "max": 1999890.0, "count": 40 }, "Huggy.Policy.ExtrinsicValueEstimate.mean": { "value": 2.2955219745635986, "min": 0.07826226204633713, "max": 2.3292925357818604, "count": 40 }, "Huggy.Policy.ExtrinsicValueEstimate.sum": { "value": 1076.599853515625, "min": 18.156845092773438, "max": 1098.015380859375, "count": 40 }, "Huggy.Environment.CumulativeReward.mean": { "value": 3.7928782554069307, "min": 1.5994393494108627, "max": 3.9371629182725227, "count": 40 }, "Huggy.Environment.CumulativeReward.sum": { "value": 1778.8599017858505, "min": 258.9458881020546, "max": 1797.3172799944878, "count": 40 }, "Huggy.Policy.ExtrinsicReward.mean": { "value": 3.7928782554069307, "min": 1.5994393494108627, "max": 3.9371629182725227, "count": 40 }, "Huggy.Policy.ExtrinsicReward.sum": { "value": 1778.8599017858505, "min": 258.9458881020546, "max": 1797.3172799944878, "count": 40 }, "Huggy.Losses.PolicyLoss.mean": { "value": 0.016255841462407262, "min": 0.01212340142519679, "max": 0.019309578390998974, "count": 40 }, "Huggy.Losses.PolicyLoss.sum": { "value": 0.04876752438722179, "min": 0.02424680285039358, "max": 0.05792873517299692, "count": 40 }, "Huggy.Losses.ValueLoss.mean": { "value": 0.0489630249225431, "min": 0.014743209211155774, "max": 0.0489630249225431, "count": 40 }, "Huggy.Losses.ValueLoss.sum": { "value": 0.1468890747676293, "min": 0.029486418422311547, "max": 0.1468890747676293, "count": 40 }, "Huggy.Policy.LearningRate.mean": { "value": 4.098098633999991e-06, "min": 4.098098633999991e-06, "max": 0.0002953878765373749, "count": 40 }, "Huggy.Policy.LearningRate.sum": { "value": 1.2294295901999973e-05, "min": 1.2294295901999973e-05, "max": 0.0008439181686939499, "count": 40 }, "Huggy.Policy.Epsilon.mean": { "value": 0.101366, "min": 0.101366, "max": 0.198462625, "count": 40 }, "Huggy.Policy.Epsilon.sum": { "value": 0.304098, "min": 0.20796145, "max": 0.58130605, "count": 40 }, "Huggy.Policy.Beta.mean": { "value": 7.816339999999981e-05, "min": 7.816339999999981e-05, "max": 0.0049232849875, "count": 40 }, "Huggy.Policy.Beta.sum": { "value": 0.00023449019999999946, "min": 0.00023449019999999946, "max": 0.014067171895000001, "count": 40 }, "Huggy.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 40 }, "Huggy.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 40 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1736613618", "python_version": "3.10.16 (main, Dec 4 2024, 08:53:38) [GCC 13.2.0]", "command_line_arguments": "/home/hrichter/projects/hf_rl_course/.venv/bin/mlagents-learn /home/hrichter/projects/hf_rl_course/content/ml-agents/config/ppo/Huggy.yaml --env=./trained-envs-executables/linux/Huggy/Huggy --run-id=Huggy-mp --no-graphics --num-envs=32 --force", "mlagents_version": "1.2.0.dev0", "mlagents_envs_version": "1.2.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "2.5.1+cu124", "numpy_version": "1.23.5", "end_time_seconds": "1736614352" }, "total": 734.250364192998, "count": 1, "self": 0.5323062630013737, "children": { "run_training.setup": { "total": 0.2869157899986021, "count": 1, "self": 0.2869157899986021 }, "TrainerController.start_learning": { "total": 733.431142139998, "count": 1, "self": 0.5467636279936414, "children": { "TrainerController._reset_env": { "total": 2.037717203002103, "count": 1, "self": 2.037717203002103 }, "TrainerController.advance": { "total": 730.7628460230044, "count": 7768, "self": 0.15108564022739301, "children": { "env_step": { "total": 416.6019123589358, "count": 7768, "self": 125.41878614153393, "children": { "SubprocessEnvManager._take_step": { "total": 290.2305916363075, "count": 234729, "self": 9.837283263143036, "children": { "TorchPolicy.evaluate": { "total": 280.3933083731645, "count": 228845, "self": 280.3933083731645 } } }, "workers": { "total": 0.9525345810943691, "count": 7768, "self": 0.0, "children": { "worker_root": { "total": 23465.509365453938, "count": 234726, "is_parallel": true, "self": 22624.190179401645, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.022741498014511308, "count": 32, "is_parallel": true, "self": 0.0055951490212464705, "children": { "_process_rank_one_or_two_observation": { "total": 0.017146348993264837, "count": 64, "is_parallel": true, "self": 0.017146348993264837 } } }, "UnityEnvironment.step": { "total": 0.5873354549985379, "count": 32, "is_parallel": true, "self": 0.006916628997714724, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0036634670104831457, "count": 32, "is_parallel": true, "self": 0.0036634670104831457 }, "communicator.exchange": { "total": 0.5584091749951767, "count": 32, "is_parallel": true, "self": 0.5584091749951767 }, "steps_from_proto": { "total": 0.0183461839951633, "count": 32, "is_parallel": true, "self": 0.0049502399742777925, "children": { "_process_rank_one_or_two_observation": { "total": 0.013395944020885509, "count": 64, "is_parallel": true, "self": 0.013395944020885509 } } } } } } }, "UnityEnvironment.step": { "total": 841.3191860522929, "count": 234694, "is_parallel": true, "self": 26.958348805062997, "children": { "UnityEnvironment._generate_step_input": { "total": 48.180654894236795, "count": 234694, "is_parallel": true, "self": 48.180654894236795 }, "communicator.exchange": { "total": 706.8437248906266, "count": 234694, "is_parallel": true, "self": 706.8437248906266 }, "steps_from_proto": { "total": 59.336457462366525, "count": 234694, "is_parallel": true, "self": 21.40152212467001, "children": { "_process_rank_one_or_two_observation": { "total": 37.934935337696515, "count": 469388, "is_parallel": true, "self": 37.934935337696515 } } } } } } } } } } }, "trainer_advance": { "total": 314.0098480238412, "count": 7768, "self": 1.118876133728918, "children": { "process_trajectory": { "total": 107.88227381509569, "count": 7768, "self": 107.009227194103, "children": { "RLTrainer._checkpoint": { "total": 0.8730466209926817, "count": 10, "self": 0.8730466209926817 } } }, "_update_policy": { "total": 205.00869807501658, "count": 96, "self": 169.6087109192158, "children": { "TorchPPOOptimizer.update": { "total": 35.39998715580077, "count": 2880, "self": 35.39998715580077 } } } } } } }, "trainer_threads": { "total": 8.899987733457237e-07, "count": 1, "self": 8.899987733457237e-07 }, "TrainerController._save_models": { "total": 0.08381439599907026, "count": 1, "self": 0.0035746590001508594, "children": { "RLTrainer._checkpoint": { "total": 0.0802397369989194, "count": 1, "self": 0.0802397369989194 } } } } } } }