|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.6524809002876282, |
|
"min": 0.6524809002876282, |
|
"max": 1.4705501794815063, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 19250.796875, |
|
"min": 19250.796875, |
|
"max": 44610.609375, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989941.0, |
|
"min": 29952.0, |
|
"max": 989941.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989941.0, |
|
"min": 29952.0, |
|
"max": 989941.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.36446237564086914, |
|
"min": -0.09325811266899109, |
|
"max": 0.4770409166812897, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 96.94699096679688, |
|
"min": -22.381946563720703, |
|
"max": 129.755126953125, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": -0.16427282989025116, |
|
"min": -0.17130430042743683, |
|
"max": 0.30304327607154846, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": -43.696571350097656, |
|
"min": -46.59476852416992, |
|
"max": 71.82125854492188, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06792325928964761, |
|
"min": 0.06559769146506288, |
|
"max": 0.07268592918913264, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9509256300550665, |
|
"min": 0.4991692476435872, |
|
"max": 1.0654710608279998, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.012431059297588682, |
|
"min": 0.0004807890688668602, |
|
"max": 0.0199622696269899, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.17403483016624155, |
|
"min": 0.006250257895269183, |
|
"max": 0.27947177477785856, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.5667617634928576e-06, |
|
"min": 7.5667617634928576e-06, |
|
"max": 0.00029515063018788575, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00010593466468890001, |
|
"min": 0.00010593466468890001, |
|
"max": 0.0035072564309145994, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10252222142857145, |
|
"min": 0.10252222142857145, |
|
"max": 0.19838354285714285, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4353111000000003, |
|
"min": 1.3886848, |
|
"max": 2.5690854, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.00026196992071428587, |
|
"min": 0.00026196992071428587, |
|
"max": 0.00983851593142857, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.003667578890000002, |
|
"min": 0.003667578890000002, |
|
"max": 0.11693163146000002, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.00930571649223566, |
|
"min": 0.009168436750769615, |
|
"max": 0.3567742705345154, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.1302800327539444, |
|
"min": 0.12835811078548431, |
|
"max": 2.497419834136963, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 496.08474576271186, |
|
"min": 378.0759493670886, |
|
"max": 999.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 29269.0, |
|
"min": 15984.0, |
|
"max": 32282.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.232637262066542, |
|
"min": -1.0000000521540642, |
|
"max": 1.5459594690724263, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 72.72559846192598, |
|
"min": -30.312001638114452, |
|
"max": 122.13079805672169, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.232637262066542, |
|
"min": -1.0000000521540642, |
|
"max": 1.5459594690724263, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 72.72559846192598, |
|
"min": -30.312001638114452, |
|
"max": 122.13079805672169, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.04779064674936709, |
|
"min": 0.03630968288568591, |
|
"max": 6.943391263484955, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.819648158212658, |
|
"min": 2.819648158212658, |
|
"max": 111.09426021575928, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1729237814", |
|
"python_version": "3.10.0 (default, Mar 3 2022, 09:58:08) [GCC 7.5.0]", |
|
"command_line_arguments": "/cpfs/user/taishan/miniconda3/envs/ml-agents/bin/mlagents-learn ./ml-agents/config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --force", |
|
"mlagents_version": "1.2.0.dev0", |
|
"mlagents_envs_version": "1.2.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.4.1+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1729240461" |
|
}, |
|
"total": 2647.1359304729995, |
|
"count": 1, |
|
"self": 0.4285606839985121, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.13243761200283188, |
|
"count": 1, |
|
"self": 0.13243761200283188 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 2646.574932176998, |
|
"count": 1, |
|
"self": 1.0098255497578066, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 3.1970746160077397, |
|
"count": 1, |
|
"self": 3.1970746160077397 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2642.229406590239, |
|
"count": 63543, |
|
"self": 0.9336012892308645, |
|
"children": { |
|
"env_step": { |
|
"total": 2231.576490821055, |
|
"count": 63543, |
|
"self": 2129.4908955313294, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 101.45009034496616, |
|
"count": 63544, |
|
"self": 3.7880231003218796, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 97.66206724464428, |
|
"count": 62621, |
|
"self": 97.66206724464428 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.6355049447593046, |
|
"count": 63543, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 3351.990387798811, |
|
"count": 63543, |
|
"is_parallel": true, |
|
"self": 1298.1987625510228, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.13243761200283188, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.015098709991434589, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.00161097600357607, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.000494004983920604, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.001116971019655466, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.001116971019655466 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.11572792600782122, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00012103002518415451, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0006946339999558404, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006946339999558404 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.1140279339888366, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.1140279339888366 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0008843279938446358, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00019012900884263217, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0006941989850020036, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0006941989850020036 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 2053.659187635785, |
|
"count": 63541, |
|
"is_parallel": true, |
|
"self": 7.234220153011847, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 34.52307016259874, |
|
"count": 63541, |
|
"is_parallel": true, |
|
"self": 34.52307016259874 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1959.9089433813351, |
|
"count": 63541, |
|
"is_parallel": true, |
|
"self": 1959.9089433813351 |
|
}, |
|
"steps_from_proto": { |
|
"total": 51.99295393883949, |
|
"count": 63541, |
|
"is_parallel": true, |
|
"self": 10.524916169350035, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 41.468037769489456, |
|
"count": 508328, |
|
"is_parallel": true, |
|
"self": 41.468037769489456 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 3.1970746160077397, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 3.1970746160077397 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 704.0082399569801, |
|
"count": 17445, |
|
"is_parallel": true, |
|
"self": 0.2507582859834656, |
|
"children": { |
|
"env_step": { |
|
"total": 591.1661858067528, |
|
"count": 17445, |
|
"is_parallel": true, |
|
"self": 561.950506352805, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 28.991436835975037, |
|
"count": 17446, |
|
"is_parallel": true, |
|
"self": 1.0435211764706764, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 27.94791565950436, |
|
"count": 17357, |
|
"is_parallel": true, |
|
"self": 27.94791565950436 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.17297721598879434, |
|
"count": 17445, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 707.1044786637358, |
|
"count": 17445, |
|
"is_parallel": true, |
|
"self": 163.69765298755374, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.00161097600357607, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.000494004983920604, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.001116971019655466, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.001116971019655466 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.11572792600782122, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00012103002518415451, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0006946339999558404, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006946339999558404 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.1140279339888366, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.1140279339888366 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0008843279938446358, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00019012900884263217, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0006941989850020036, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0006941989850020036 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 543.406825676182, |
|
"count": 17444, |
|
"is_parallel": true, |
|
"self": 1.8957679864397505, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 9.49863564989937, |
|
"count": 17444, |
|
"is_parallel": true, |
|
"self": 9.49863564989937 |
|
}, |
|
"communicator.exchange": { |
|
"total": 517.8208545059751, |
|
"count": 17444, |
|
"is_parallel": true, |
|
"self": 517.8208545059751 |
|
}, |
|
"steps_from_proto": { |
|
"total": 14.191567533867783, |
|
"count": 17444, |
|
"is_parallel": true, |
|
"self": 2.828539321257267, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 11.363028212610516, |
|
"count": 139552, |
|
"is_parallel": true, |
|
"self": 11.363028212610516 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0015358179953182116, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004476649919524789, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0010881530033657327, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0010881530033657327 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.04972958398866467, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00012414799130056053, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0006500849995063618, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006500849995063618 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.048106713002198376, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.048106713002198376 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0008486379956593737, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00018992897821590304, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0006587090174434707, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0006587090174434707 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 112.59129586424388, |
|
"count": 17445, |
|
"is_parallel": true, |
|
"self": 0.40781646892719436, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 21.065620380381006, |
|
"count": 17445, |
|
"is_parallel": true, |
|
"self": 21.065620380381006 |
|
}, |
|
"_update_policy": { |
|
"total": 91.11785901493568, |
|
"count": 110, |
|
"is_parallel": true, |
|
"self": 50.792928515482345, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 40.32493049945333, |
|
"count": 6330, |
|
"is_parallel": true, |
|
"self": 40.32493049945333 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 409.719314479953, |
|
"count": 63543, |
|
"self": 1.7765321361948736, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 80.34752689780726, |
|
"count": 63543, |
|
"self": 80.0011609288049, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.34636596900236327, |
|
"count": 2, |
|
"self": 0.34636596900236327 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 327.5952554459509, |
|
"count": 442, |
|
"self": 183.68929388972174, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 143.90596155622916, |
|
"count": 22815, |
|
"self": 143.90596155622916 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 9.469949873164296e-07, |
|
"count": 1, |
|
"self": 9.469949873164296e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.13862447399878874, |
|
"count": 1, |
|
"self": 0.017148501006886363, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.12147597299190238, |
|
"count": 1, |
|
"self": 0.12147597299190238 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |