|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.20312833786010742, |
|
"min": 0.1852981597185135, |
|
"max": 1.4716616868972778, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 6048.349609375, |
|
"min": 5579.6982421875, |
|
"max": 44644.328125, |
|
"count": 64 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 1919935.0, |
|
"min": 29952.0, |
|
"max": 1919935.0, |
|
"count": 64 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 1919935.0, |
|
"min": 29952.0, |
|
"max": 1919935.0, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.7642052173614502, |
|
"min": -0.12216313183307648, |
|
"max": 0.801848292350769, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 224.67633056640625, |
|
"min": -29.319150924682617, |
|
"max": 240.5544891357422, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.03788827359676361, |
|
"min": -0.009359977208077908, |
|
"max": 0.23613667488098145, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 11.139152526855469, |
|
"min": -2.7331132888793945, |
|
"max": 55.964393615722656, |
|
"count": 64 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06845925557094493, |
|
"min": 0.06387119473348482, |
|
"max": 0.07363246895416761, |
|
"count": 64 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9584295779932289, |
|
"min": 0.49938676214439726, |
|
"max": 1.0991964447603095, |
|
"count": 64 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.013329540630885667, |
|
"min": 0.00010155148852295709, |
|
"max": 0.01622062214231673, |
|
"count": 64 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.18661356883239935, |
|
"min": 0.001320169350798442, |
|
"max": 0.2270887099924342, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 0.0001095209992073071, |
|
"min": 0.0001095209992073071, |
|
"max": 0.00029838354339596195, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.0015332939889022995, |
|
"min": 0.0015332939889022995, |
|
"max": 0.003968969577010166, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.1365069785714286, |
|
"min": 0.1365069785714286, |
|
"max": 0.19946118095238097, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.9110977000000005, |
|
"min": 1.3962282666666668, |
|
"max": 2.722989833333333, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.0036570471592857153, |
|
"min": 0.0036570471592857153, |
|
"max": 0.009946171977142856, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.05119866023000001, |
|
"min": 0.05119866023000001, |
|
"max": 0.13230668435, |
|
"count": 64 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.0062941014766693115, |
|
"min": 0.0062941014766693115, |
|
"max": 0.39106887578964233, |
|
"count": 64 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.08811742067337036, |
|
"min": 0.08811742067337036, |
|
"max": 2.7374820709228516, |
|
"count": 64 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 256.6578947368421, |
|
"min": 235.2153846153846, |
|
"max": 999.0, |
|
"count": 64 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 29259.0, |
|
"min": 15984.0, |
|
"max": 33331.0, |
|
"count": 64 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.7257912161580302, |
|
"min": -1.0000000521540642, |
|
"max": 1.7647845991528952, |
|
"count": 64 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 196.74019864201546, |
|
"min": -30.992401592433453, |
|
"max": 229.42199788987637, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.7257912161580302, |
|
"min": -1.0000000521540642, |
|
"max": 1.7647845991528952, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 196.74019864201546, |
|
"min": -30.992401592433453, |
|
"max": 229.42199788987637, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.01690496996480649, |
|
"min": 0.01690496996480649, |
|
"max": 8.611706785857677, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 1.9271665759879397, |
|
"min": 1.9271665759879397, |
|
"max": 137.78730857372284, |
|
"count": 64 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 64 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 64 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1722662330", |
|
"python_version": "3.10.12 (main, Jul 29 2024, 16:56:48) [GCC 11.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.3.1+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1722666872" |
|
}, |
|
"total": 4541.322192753, |
|
"count": 1, |
|
"self": 0.3473138570006995, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.05186400799993862, |
|
"count": 1, |
|
"self": 0.05186400799993862 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 4540.923014888, |
|
"count": 1, |
|
"self": 3.041778984093071, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 1.8350260879997222, |
|
"count": 1, |
|
"self": 1.8350260879997222 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 4535.915879362908, |
|
"count": 124609, |
|
"self": 3.0144043176414925, |
|
"children": { |
|
"env_step": { |
|
"total": 3286.7031434862683, |
|
"count": 124609, |
|
"self": 3025.5543719656307, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 259.4163059708044, |
|
"count": 124609, |
|
"self": 9.415928384680228, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 250.00037758612416, |
|
"count": 120799, |
|
"self": 250.00037758612416 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 1.7324655498332504, |
|
"count": 124608, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 4530.698063024101, |
|
"count": 124608, |
|
"is_parallel": true, |
|
"self": 1747.2683188711562, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0021797890003654175, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.000736717999643588, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0014430710007218295, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0014430710007218295 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.049098313999820675, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006490259993370273, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0004746209997392725, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004746209997392725 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.04627934800009825, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.04627934800009825 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0016953190006461227, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00035778900200966746, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0013375299986364553, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0013375299986364553 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 2783.429744152945, |
|
"count": 124607, |
|
"is_parallel": true, |
|
"self": 64.93267705257131, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 45.90360956096629, |
|
"count": 124607, |
|
"is_parallel": true, |
|
"self": 45.90360956096629 |
|
}, |
|
"communicator.exchange": { |
|
"total": 2479.240100841118, |
|
"count": 124607, |
|
"is_parallel": true, |
|
"self": 2479.240100841118 |
|
}, |
|
"steps_from_proto": { |
|
"total": 193.35335669828964, |
|
"count": 124607, |
|
"is_parallel": true, |
|
"self": 40.13082598911933, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 153.22253070917031, |
|
"count": 996856, |
|
"is_parallel": true, |
|
"self": 153.22253070917031 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 1246.1983315589978, |
|
"count": 124608, |
|
"self": 5.429093567839118, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 261.6591720881688, |
|
"count": 124608, |
|
"self": 261.3742739461686, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.2848981420002019, |
|
"count": 3, |
|
"self": 0.2848981420002019 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 979.1100659029898, |
|
"count": 888, |
|
"self": 581.2051412269293, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 397.90492467606055, |
|
"count": 44085, |
|
"self": 397.90492467606055 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.3829994713887572e-06, |
|
"count": 1, |
|
"self": 1.3829994713887572e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.13032906999978877, |
|
"count": 1, |
|
"self": 0.0019873940000252333, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.12834167599976354, |
|
"count": 1, |
|
"self": 0.12834167599976354 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |