|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.5548450350761414, |
|
"min": 0.5548450350761414, |
|
"max": 0.9097636938095093, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 16538.8203125, |
|
"min": 9048.5341796875, |
|
"max": 27394.8046875, |
|
"count": 17 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989877.0, |
|
"min": 509969.0, |
|
"max": 989877.0, |
|
"count": 17 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989877.0, |
|
"min": 509969.0, |
|
"max": 989877.0, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.4498426616191864, |
|
"min": 0.018395353108644485, |
|
"max": 0.47865211963653564, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 121.00767517089844, |
|
"min": 1.471628189086914, |
|
"max": 130.67202758789062, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": -0.15813587605953217, |
|
"min": -0.15813587605953217, |
|
"max": 0.18717536330223083, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": -42.538551330566406, |
|
"min": -42.538551330566406, |
|
"max": 50.537349700927734, |
|
"count": 17 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06940189483256767, |
|
"min": 0.06384416604364038, |
|
"max": 0.07085341716899786, |
|
"count": 17 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9716265276559474, |
|
"min": 0.21131838193590136, |
|
"max": 1.0338376412298256, |
|
"count": 17 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.02051455678502818, |
|
"min": 0.004671117367647003, |
|
"max": 0.02051455678502818, |
|
"count": 17 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.28720379499039456, |
|
"min": 0.021576496421403135, |
|
"max": 0.28720379499039456, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.646754593971431e-06, |
|
"min": 7.646754593971431e-06, |
|
"max": 0.0001481200506266667, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00010705456431560002, |
|
"min": 0.00010705456431560002, |
|
"max": 0.0019958326347227, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10254888571428573, |
|
"min": 0.10254888571428573, |
|
"max": 0.14937333333333333, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4356844000000002, |
|
"min": 0.44811999999999996, |
|
"max": 2.0773133, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.0002646336828571429, |
|
"min": 0.0002646336828571429, |
|
"max": 0.004942395999999999, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.003704871560000001, |
|
"min": 0.003704871560000001, |
|
"max": 0.06660120227, |
|
"count": 17 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.011130442842841148, |
|
"min": 0.011130442842841148, |
|
"max": 0.018592344596982002, |
|
"count": 17 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.15582619607448578, |
|
"min": 0.055777035653591156, |
|
"max": 0.25444158911705017, |
|
"count": 17 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 381.958904109589, |
|
"min": 381.958904109589, |
|
"max": 835.3428571428572, |
|
"count": 17 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 27883.0, |
|
"min": 2341.0, |
|
"max": 31805.0, |
|
"count": 17 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.5632301107661364, |
|
"min": -0.04676927492404596, |
|
"max": 1.5632301107661364, |
|
"count": 17 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 114.11579808592796, |
|
"min": -1.8240017220377922, |
|
"max": 114.88739801198244, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.5632301107661364, |
|
"min": -0.04676927492404596, |
|
"max": 1.5632301107661364, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 114.11579808592796, |
|
"min": -1.8240017220377922, |
|
"max": 114.88739801198244, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.04380278093405451, |
|
"min": 0.04380278093405451, |
|
"max": 0.15401908088750085, |
|
"count": 17 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 3.197603008185979, |
|
"min": 0.4970928718103096, |
|
"max": 6.006744154612534, |
|
"count": 17 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 17 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 17 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1666820411", |
|
"python_version": "3.7.15 (default, Oct 12 2022, 19:14:55) \n[GCC 7.5.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./trained-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume", |
|
"mlagents_version": "0.29.0.dev0", |
|
"mlagents_envs_version": "0.29.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.6", |
|
"end_time_seconds": "1666821515" |
|
}, |
|
"total": 1104.50703153, |
|
"count": 1, |
|
"self": 0.44053384599965284, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.043343765000372514, |
|
"count": 1, |
|
"self": 0.043343765000372514 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 1104.023153919, |
|
"count": 1, |
|
"self": 0.8265517110116889, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 6.503371287999926, |
|
"count": 1, |
|
"self": 6.503371287999926 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 1096.5990557029882, |
|
"count": 32026, |
|
"self": 0.8887431339071554, |
|
"children": { |
|
"env_step": { |
|
"total": 734.722037918054, |
|
"count": 32026, |
|
"self": 676.3580663430766, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 57.92033342601144, |
|
"count": 32026, |
|
"self": 2.486959676054994, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 55.433373749956445, |
|
"count": 31318, |
|
"self": 18.669532147922382, |
|
"children": { |
|
"TorchPolicy.sample_actions": { |
|
"total": 36.76384160203406, |
|
"count": 31318, |
|
"self": 36.76384160203406 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.4436381489658743, |
|
"count": 32026, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 1101.6087957520535, |
|
"count": 32026, |
|
"is_parallel": true, |
|
"self": 481.4929296781247, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0019209470001442241, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0007091149991538259, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0012118320009903982, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0012118320009903982 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.060161157000038656, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005135700002938393, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0004762000003211142, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004762000003211142 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.05752015199959715, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.05752015199959715 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0016512349998265563, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.000425104999976611, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0012261299998499453, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0012261299998499453 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 620.1158660739288, |
|
"count": 32025, |
|
"is_parallel": true, |
|
"self": 14.729850475844614, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 12.183287286025916, |
|
"count": 32025, |
|
"is_parallel": true, |
|
"self": 12.183287286025916 |
|
}, |
|
"communicator.exchange": { |
|
"total": 545.050911685014, |
|
"count": 32025, |
|
"is_parallel": true, |
|
"self": 545.050911685014 |
|
}, |
|
"steps_from_proto": { |
|
"total": 48.151816627044354, |
|
"count": 32025, |
|
"is_parallel": true, |
|
"self": 12.507719423942035, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 35.64409720310232, |
|
"count": 256200, |
|
"is_parallel": true, |
|
"self": 35.64409720310232 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 360.98827465102704, |
|
"count": 32026, |
|
"self": 1.5785568430037529, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 82.8166930020293, |
|
"count": 32026, |
|
"self": 82.70609321602933, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.11059978599996612, |
|
"count": 1, |
|
"self": 0.11059978599996612 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 276.593024805994, |
|
"count": 234, |
|
"self": 109.23629919799805, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 167.35672560799594, |
|
"count": 11340, |
|
"self": 167.35672560799594 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.244000031874748e-06, |
|
"count": 1, |
|
"self": 1.244000031874748e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.09417397300012453, |
|
"count": 1, |
|
"self": 0.002133608999884018, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.09204036400024052, |
|
"count": 1, |
|
"self": 0.09204036400024052 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |