|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 3.2957401275634766, |
|
"min": 3.295724630355835, |
|
"max": 3.295741081237793, |
|
"count": 13 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 15503.1611328125, |
|
"min": 3796.68798828125, |
|
"max": 48091.3984375, |
|
"count": 13 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 182.0, |
|
"min": 35.0, |
|
"max": 455.0, |
|
"count": 13 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 728.0, |
|
"min": 140.0, |
|
"max": 1820.0, |
|
"count": 13 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1200.7550203109818, |
|
"min": 1199.2507195558546, |
|
"max": 1200.7550203109818, |
|
"count": 9 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 2401.5100406219635, |
|
"min": 2398.5014391117093, |
|
"max": 4800.022959467346, |
|
"count": 9 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 4947.0, |
|
"min": 56.0, |
|
"max": 4947.0, |
|
"count": 39 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 4947.0, |
|
"min": 56.0, |
|
"max": 4947.0, |
|
"count": 39 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": 0.02621970698237419, |
|
"min": 0.026093436405062675, |
|
"max": 0.026227079331874847, |
|
"count": 39 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": 0.02621970698237419, |
|
"min": 0.026093436405062675, |
|
"max": 0.07862967997789383, |
|
"count": 39 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.026209291070699692, |
|
"min": 0.02613411471247673, |
|
"max": 0.026260271668434143, |
|
"count": 39 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 0.026209291070699692, |
|
"min": 0.02613411471247673, |
|
"max": 0.07878081500530243, |
|
"count": 39 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 39 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 39 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": 0.0, |
|
"min": -1.0, |
|
"max": 0.9646000266075134, |
|
"count": 39 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": 0.0, |
|
"min": -3.0, |
|
"max": 0.9646000266075134, |
|
"count": 39 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": -1.0, |
|
"max": 0.9646000266075134, |
|
"count": 39 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": -3.0, |
|
"max": 0.9646000266075134, |
|
"count": 39 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 39 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 39 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1737362686", |
|
"python_version": "3.10.12 | packaged by conda-forge | (main, Jun 23 2023, 22:40:32) [GCC 12.3.0]", |
|
"command_line_arguments": "/usr/local/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./ml-agents/training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force", |
|
"mlagents_version": "1.2.0.dev0", |
|
"mlagents_envs_version": "1.2.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.5.1+cu124", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1737362756" |
|
}, |
|
"total": 70.4294646999997, |
|
"count": 1, |
|
"self": 0.7932846680000694, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.02756584600001588, |
|
"count": 1, |
|
"self": 0.02756584600001588 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 69.60861418599961, |
|
"count": 1, |
|
"self": 0.04943464000007225, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 4.2544019809997735, |
|
"count": 11, |
|
"self": 4.2544019809997735 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 65.02888599699963, |
|
"count": 2188, |
|
"self": 0.055819227999563736, |
|
"children": { |
|
"env_step": { |
|
"total": 63.02995204199806, |
|
"count": 2188, |
|
"self": 45.36964371300746, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 17.62963284298621, |
|
"count": 2188, |
|
"self": 0.35130317598850525, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 17.278329666997706, |
|
"count": 4370, |
|
"self": 17.278329666997706 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.030675486004383856, |
|
"count": 2188, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 69.08412094700316, |
|
"count": 2188, |
|
"is_parallel": true, |
|
"self": 30.670649410988972, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.008255239999925834, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.004782023001098423, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.003473216998827411, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.003473216998827411 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.040953847999844584, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0011449739995441632, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.000888929999746324, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.000888929999746324 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.03531846200030486, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.03531846200030486 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0036014820002492343, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0006345290003082482, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.002966952999940986, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.002966952999940986 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 38.39007652801274, |
|
"count": 2187, |
|
"is_parallel": true, |
|
"self": 2.334880060005162, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 1.707200902011209, |
|
"count": 2187, |
|
"is_parallel": true, |
|
"self": 1.707200902011209 |
|
}, |
|
"communicator.exchange": { |
|
"total": 26.698371974996007, |
|
"count": 2187, |
|
"is_parallel": true, |
|
"self": 26.698371974996007 |
|
}, |
|
"steps_from_proto": { |
|
"total": 7.649623591000363, |
|
"count": 4374, |
|
"is_parallel": true, |
|
"self": 1.2880389300335082, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 6.361584660966855, |
|
"count": 17496, |
|
"is_parallel": true, |
|
"self": 6.361584660966855 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.023395008001443784, |
|
"count": 18, |
|
"is_parallel": true, |
|
"self": 0.004519783002251643, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.01887522499919214, |
|
"count": 72, |
|
"is_parallel": true, |
|
"self": 0.01887522499919214 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 1.943114727002012, |
|
"count": 2188, |
|
"self": 0.18521795199012558, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 1.7578967750118863, |
|
"count": 2188, |
|
"self": 1.7578967750118863 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.2840000636060722e-06, |
|
"count": 1, |
|
"self": 1.2840000636060722e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.2758902840000701, |
|
"count": 1, |
|
"self": 0.004644124000151351, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.27124615999991875, |
|
"count": 1, |
|
"self": 0.27124615999991875 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |