|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Huggy.Policy.Entropy.mean": { |
|
"value": 1.4131202697753906, |
|
"min": 1.413079857826233, |
|
"max": 1.423565149307251, |
|
"count": 40 |
|
}, |
|
"Huggy.Policy.Entropy.sum": { |
|
"value": 72084.6796875, |
|
"min": 51755.68359375, |
|
"max": 269279.84375, |
|
"count": 40 |
|
}, |
|
"Huggy.Environment.EpisodeLength.mean": { |
|
"value": 105.78924731182796, |
|
"min": 104.71789473684211, |
|
"max": 376.8731343283582, |
|
"count": 40 |
|
}, |
|
"Huggy.Environment.EpisodeLength.sum": { |
|
"value": 49192.0, |
|
"min": 49025.0, |
|
"max": 50501.0, |
|
"count": 40 |
|
}, |
|
"Huggy.Step.mean": { |
|
"value": 1999890.0, |
|
"min": 49931.0, |
|
"max": 1999890.0, |
|
"count": 40 |
|
}, |
|
"Huggy.Step.sum": { |
|
"value": 1999890.0, |
|
"min": 49931.0, |
|
"max": 1999890.0, |
|
"count": 40 |
|
}, |
|
"Huggy.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 2.2955219745635986, |
|
"min": 0.07826226204633713, |
|
"max": 2.3292925357818604, |
|
"count": 40 |
|
}, |
|
"Huggy.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 1076.599853515625, |
|
"min": 18.156845092773438, |
|
"max": 1098.015380859375, |
|
"count": 40 |
|
}, |
|
"Huggy.Environment.CumulativeReward.mean": { |
|
"value": 3.7928782554069307, |
|
"min": 1.5994393494108627, |
|
"max": 3.9371629182725227, |
|
"count": 40 |
|
}, |
|
"Huggy.Environment.CumulativeReward.sum": { |
|
"value": 1778.8599017858505, |
|
"min": 258.9458881020546, |
|
"max": 1797.3172799944878, |
|
"count": 40 |
|
}, |
|
"Huggy.Policy.ExtrinsicReward.mean": { |
|
"value": 3.7928782554069307, |
|
"min": 1.5994393494108627, |
|
"max": 3.9371629182725227, |
|
"count": 40 |
|
}, |
|
"Huggy.Policy.ExtrinsicReward.sum": { |
|
"value": 1778.8599017858505, |
|
"min": 258.9458881020546, |
|
"max": 1797.3172799944878, |
|
"count": 40 |
|
}, |
|
"Huggy.Losses.PolicyLoss.mean": { |
|
"value": 0.016255841462407262, |
|
"min": 0.01212340142519679, |
|
"max": 0.019309578390998974, |
|
"count": 40 |
|
}, |
|
"Huggy.Losses.PolicyLoss.sum": { |
|
"value": 0.04876752438722179, |
|
"min": 0.02424680285039358, |
|
"max": 0.05792873517299692, |
|
"count": 40 |
|
}, |
|
"Huggy.Losses.ValueLoss.mean": { |
|
"value": 0.0489630249225431, |
|
"min": 0.014743209211155774, |
|
"max": 0.0489630249225431, |
|
"count": 40 |
|
}, |
|
"Huggy.Losses.ValueLoss.sum": { |
|
"value": 0.1468890747676293, |
|
"min": 0.029486418422311547, |
|
"max": 0.1468890747676293, |
|
"count": 40 |
|
}, |
|
"Huggy.Policy.LearningRate.mean": { |
|
"value": 4.098098633999991e-06, |
|
"min": 4.098098633999991e-06, |
|
"max": 0.0002953878765373749, |
|
"count": 40 |
|
}, |
|
"Huggy.Policy.LearningRate.sum": { |
|
"value": 1.2294295901999973e-05, |
|
"min": 1.2294295901999973e-05, |
|
"max": 0.0008439181686939499, |
|
"count": 40 |
|
}, |
|
"Huggy.Policy.Epsilon.mean": { |
|
"value": 0.101366, |
|
"min": 0.101366, |
|
"max": 0.198462625, |
|
"count": 40 |
|
}, |
|
"Huggy.Policy.Epsilon.sum": { |
|
"value": 0.304098, |
|
"min": 0.20796145, |
|
"max": 0.58130605, |
|
"count": 40 |
|
}, |
|
"Huggy.Policy.Beta.mean": { |
|
"value": 7.816339999999981e-05, |
|
"min": 7.816339999999981e-05, |
|
"max": 0.0049232849875, |
|
"count": 40 |
|
}, |
|
"Huggy.Policy.Beta.sum": { |
|
"value": 0.00023449019999999946, |
|
"min": 0.00023449019999999946, |
|
"max": 0.014067171895000001, |
|
"count": 40 |
|
}, |
|
"Huggy.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 40 |
|
}, |
|
"Huggy.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 40 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1736613618", |
|
"python_version": "3.10.16 (main, Dec 4 2024, 08:53:38) [GCC 13.2.0]", |
|
"command_line_arguments": "/home/hrichter/projects/hf_rl_course/.venv/bin/mlagents-learn /home/hrichter/projects/hf_rl_course/content/ml-agents/config/ppo/Huggy.yaml --env=./trained-envs-executables/linux/Huggy/Huggy --run-id=Huggy-mp --no-graphics --num-envs=32 --force", |
|
"mlagents_version": "1.2.0.dev0", |
|
"mlagents_envs_version": "1.2.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.5.1+cu124", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1736614352" |
|
}, |
|
"total": 734.250364192998, |
|
"count": 1, |
|
"self": 0.5323062630013737, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.2869157899986021, |
|
"count": 1, |
|
"self": 0.2869157899986021 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 733.431142139998, |
|
"count": 1, |
|
"self": 0.5467636279936414, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 2.037717203002103, |
|
"count": 1, |
|
"self": 2.037717203002103 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 730.7628460230044, |
|
"count": 7768, |
|
"self": 0.15108564022739301, |
|
"children": { |
|
"env_step": { |
|
"total": 416.6019123589358, |
|
"count": 7768, |
|
"self": 125.41878614153393, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 290.2305916363075, |
|
"count": 234729, |
|
"self": 9.837283263143036, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 280.3933083731645, |
|
"count": 228845, |
|
"self": 280.3933083731645 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.9525345810943691, |
|
"count": 7768, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 23465.509365453938, |
|
"count": 234726, |
|
"is_parallel": true, |
|
"self": 22624.190179401645, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.022741498014511308, |
|
"count": 32, |
|
"is_parallel": true, |
|
"self": 0.0055951490212464705, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.017146348993264837, |
|
"count": 64, |
|
"is_parallel": true, |
|
"self": 0.017146348993264837 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.5873354549985379, |
|
"count": 32, |
|
"is_parallel": true, |
|
"self": 0.006916628997714724, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0036634670104831457, |
|
"count": 32, |
|
"is_parallel": true, |
|
"self": 0.0036634670104831457 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.5584091749951767, |
|
"count": 32, |
|
"is_parallel": true, |
|
"self": 0.5584091749951767 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0183461839951633, |
|
"count": 32, |
|
"is_parallel": true, |
|
"self": 0.0049502399742777925, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.013395944020885509, |
|
"count": 64, |
|
"is_parallel": true, |
|
"self": 0.013395944020885509 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 841.3191860522929, |
|
"count": 234694, |
|
"is_parallel": true, |
|
"self": 26.958348805062997, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 48.180654894236795, |
|
"count": 234694, |
|
"is_parallel": true, |
|
"self": 48.180654894236795 |
|
}, |
|
"communicator.exchange": { |
|
"total": 706.8437248906266, |
|
"count": 234694, |
|
"is_parallel": true, |
|
"self": 706.8437248906266 |
|
}, |
|
"steps_from_proto": { |
|
"total": 59.336457462366525, |
|
"count": 234694, |
|
"is_parallel": true, |
|
"self": 21.40152212467001, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 37.934935337696515, |
|
"count": 469388, |
|
"is_parallel": true, |
|
"self": 37.934935337696515 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 314.0098480238412, |
|
"count": 7768, |
|
"self": 1.118876133728918, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 107.88227381509569, |
|
"count": 7768, |
|
"self": 107.009227194103, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.8730466209926817, |
|
"count": 10, |
|
"self": 0.8730466209926817 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 205.00869807501658, |
|
"count": 96, |
|
"self": 169.6087109192158, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 35.39998715580077, |
|
"count": 2880, |
|
"self": 35.39998715580077 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 8.899987733457237e-07, |
|
"count": 1, |
|
"self": 8.899987733457237e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.08381439599907026, |
|
"count": 1, |
|
"self": 0.0035746590001508594, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.0802397369989194, |
|
"count": 1, |
|
"self": 0.0802397369989194 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |