{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.3569423258304596, "min": 0.3569423258304596, "max": 1.4746330976486206, "count": 33 }, "Pyramids.Policy.Entropy.sum": { "value": 10622.603515625, "min": 10622.603515625, "max": 44734.46875, "count": 33 }, "Pyramids.Step.mean": { "value": 989934.0, "min": 29952.0, "max": 989934.0, "count": 33 }, "Pyramids.Step.sum": { "value": 989934.0, "min": 29952.0, "max": 989934.0, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.40554696321487427, "min": -0.14670321345329285, "max": 0.4706757664680481, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 106.65885162353516, "min": -34.76866149902344, "max": 126.61177825927734, "count": 33 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": -0.0045495848171412945, "min": -0.0045495848171412945, "max": 0.25074440240859985, "count": 33 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": -1.1965408325195312, "min": -1.1965408325195312, "max": 59.426422119140625, "count": 33 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.06814846335392861, "min": 0.06275959842515841, "max": 0.07399084628480797, "count": 33 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 1.0222269503089292, "min": 0.4851005819934586, "max": 1.0940490033330312, "count": 33 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.01363182086449039, "min": 0.0010118964599019062, "max": 0.015477508004031346, "count": 33 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.20447731296735586, "min": 0.007545239252673733, "max": 0.21668511205643884, "count": 33 }, "Pyramids.Policy.LearningRate.mean": { "value": 7.515897494733334e-06, "min": 7.515897494733334e-06, "max": 0.00029515063018788575, "count": 33 }, "Pyramids.Policy.LearningRate.sum": { "value": 0.00011273846242100001, "min": 0.00011273846242100001, "max": 0.0036335314888228994, "count": 33 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10250526666666668, "min": 0.10250526666666668, "max": 0.19838354285714285, "count": 33 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.5375790000000003, "min": 1.3691136000000002, "max": 2.6111771000000004, "count": 33 }, "Pyramids.Policy.Beta.mean": { "value": 0.0002602761400000001, "min": 0.0002602761400000001, "max": 0.00983851593142857, "count": 33 }, "Pyramids.Policy.Beta.sum": { "value": 0.0039041421000000015, "min": 0.0039041421000000015, "max": 0.12113659229, "count": 33 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.009283142164349556, "min": 0.009283142164349556, "max": 0.2695707380771637, "count": 33 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.1392471343278885, "min": 0.13411398231983185, "max": 1.8869950771331787, "count": 33 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 410.875, "min": 382.1392405063291, "max": 999.0, "count": 33 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 29583.0, "min": 15984.0, "max": 32371.0, "count": 33 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.4223972018808126, "min": -1.0000000521540642, "max": 1.4405923827162272, "count": 33 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 102.41259853541851, "min": -32.000001668930054, "max": 113.80679823458195, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.4223972018808126, "min": -1.0000000521540642, "max": 1.4405923827162272, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 102.41259853541851, "min": -32.000001668930054, "max": 113.80679823458195, "count": 33 }, "Pyramids.Policy.RndReward.mean": { "value": 0.039131969059477946, "min": 0.039131969059477946, "max": 5.096554284915328, "count": 33 }, "Pyramids.Policy.RndReward.sum": { "value": 2.8175017722824123, "min": 2.8175017722824123, "max": 81.54486855864525, "count": 33 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1673444558", "python_version": "3.8.16 (default, Dec 7 2022, 01:12:13) \n[GCC 7.5.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", "mlagents_version": "0.29.0.dev0", "mlagents_envs_version": "0.29.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1+cu102", "numpy_version": "1.21.6", "end_time_seconds": "1673446600" }, "total": 2042.3718711020001, "count": 1, "self": 0.4746067269998093, "children": { "run_training.setup": { "total": 0.10942183099996328, "count": 1, "self": 0.10942183099996328 }, "TrainerController.start_learning": { "total": 2041.7878425440003, "count": 1, "self": 1.13619342614993, "children": { "TrainerController._reset_env": { "total": 6.510633092999797, "count": 1, "self": 6.510633092999797 }, "TrainerController.advance": { "total": 2034.0497634288513, "count": 63678, "self": 1.1913426247469943, "children": { "env_step": { "total": 1370.4626225610673, "count": 63678, "self": 1270.7756676140934, "children": { "SubprocessEnvManager._take_step": { "total": 98.94974638800068, "count": 63678, "self": 4.0518581009309855, "children": { "TorchPolicy.evaluate": { "total": 94.89788828706969, "count": 62561, "self": 32.316950265092146, "children": { "TorchPolicy.sample_actions": { "total": 62.580938021977545, "count": 62561, "self": 62.580938021977545 } } } } }, "workers": { "total": 0.7372085589731796, "count": 63678, "self": 0.0, "children": { "worker_root": { "total": 2038.2262380288726, "count": 63678, "is_parallel": true, "self": 862.7297736628807, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.001760930999807897, "count": 1, "is_parallel": true, "self": 0.0005919409995840397, "children": { "_process_rank_one_or_two_observation": { "total": 0.0011689900002238574, "count": 8, "is_parallel": true, "self": 0.0011689900002238574 } } }, "UnityEnvironment.step": { "total": 0.04399581900042904, "count": 1, "is_parallel": true, "self": 0.000491171000248869, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0004309040000407549, "count": 1, "is_parallel": true, "self": 0.0004309040000407549 }, "communicator.exchange": { "total": 0.04150152500005788, "count": 1, "is_parallel": true, "self": 0.04150152500005788 }, "steps_from_proto": { "total": 0.0015722190000815317, "count": 1, "is_parallel": true, "self": 0.000427639999998064, "children": { "_process_rank_one_or_two_observation": { "total": 0.0011445790000834677, "count": 8, "is_parallel": true, "self": 0.0011445790000834677 } } } } } } }, "UnityEnvironment.step": { "total": 1175.4964643659919, "count": 63677, "is_parallel": true, "self": 28.05835989913703, "children": { "UnityEnvironment._generate_step_input": { "total": 22.545035458977054, "count": 63677, "is_parallel": true, "self": 22.545035458977054 }, "communicator.exchange": { "total": 1032.9946892349335, "count": 63677, "is_parallel": true, "self": 1032.9946892349335 }, "steps_from_proto": { "total": 91.89837977294428, "count": 63677, "is_parallel": true, "self": 20.982000310051717, "children": { "_process_rank_one_or_two_observation": { "total": 70.91637946289256, "count": 509416, "is_parallel": true, "self": 70.91637946289256 } } } } } } } } } } }, "trainer_advance": { "total": 662.395798243037, "count": 63678, "self": 2.180197372996645, "children": { "process_trajectory": { "total": 141.78992880504302, "count": 63678, "self": 141.52560823304339, "children": { "RLTrainer._checkpoint": { "total": 0.2643205719996331, "count": 2, "self": 0.2643205719996331 } } }, "_update_policy": { "total": 518.4256720649973, "count": 450, "self": 200.06690263508563, "children": { "TorchPPOOptimizer.update": { "total": 318.3587694299117, "count": 22794, "self": 318.3587694299117 } } } } } } }, "trainer_threads": { "total": 1.032999534800183e-06, "count": 1, "self": 1.032999534800183e-06 }, "TrainerController._save_models": { "total": 0.09125156299978698, "count": 1, "self": 0.0015541779994237004, "children": { "RLTrainer._checkpoint": { "total": 0.08969738500036328, "count": 1, "self": 0.08969738500036328 } } } } } } }