{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 0.6666061878204346, "min": 0.6463891267776489, "max": 3.2958338260650635, "count": 10000 }, "SoccerTwos.Policy.Entropy.sum": { "value": 12350.8798828125, "min": 632.800048828125, "max": 376832.4375, "count": 10000 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 76.29230769230769, "min": 35.094202898550726, "max": 999.0, "count": 10000 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 19836.0, "min": 3692.0, "max": 30668.0, "count": 10000 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1831.6678677537593, "min": 1187.3317604562183, "max": 1852.5110702140453, "count": 9955 }, "SoccerTwos.Self-play.ELO.sum": { "value": 238116.8228079887, "min": 2375.1556434615, "max": 466622.93640783173, "count": 9955 }, "SoccerTwos.Step.mean": { "value": 99999989.0, "min": 9975.0, "max": 99999989.0, "count": 10000 }, "SoccerTwos.Step.sum": { "value": 99999989.0, "min": 9975.0, "max": 99999989.0, "count": 10000 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": 0.01400040090084076, "min": -0.13026683032512665, "max": 0.1905166059732437, "count": 10000 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": 1.834052562713623, "min": -24.271142959594727, "max": 32.21083068847656, "count": 10000 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": 0.014650966972112656, "min": -0.13573074340820312, "max": 0.18502849340438843, "count": 10000 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": 1.9192767143249512, "min": -24.160072326660156, "max": 31.156681060791016, "count": 10000 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 10000 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 10000 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": 0.07949313225636956, "min": -0.564457142991679, "max": 0.596973911575649, "count": 10000 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": 10.413600325584412, "min": -68.68439996242523, "max": 68.3793997168541, "count": 10000 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": 0.07949313225636956, "min": -0.564457142991679, "max": 0.596973911575649, "count": 10000 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": 10.413600325584412, "min": -68.68439996242523, "max": 68.3793997168541, "count": 10000 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 10000 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 10000 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.015226859835416285, "min": 0.013034687134980535, "max": 0.022104917299455136, "count": 1994 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.015226859835416285, "min": 0.013034687134980535, "max": 0.022104917299455136, "count": 1994 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.1041516460892227, "min": 0.00041215566246440477, "max": 0.122376452303595, "count": 1994 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.1041516460892227, "min": 0.00041215566246440477, "max": 0.122376452303595, "count": 1994 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.10435032565146685, "min": 0.0004121556636770644, "max": 0.12528275191369984, "count": 1994 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.10435032565146685, "min": 0.0004121556636770644, "max": 0.12528275191369984, "count": 1994 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 2.241999286004973e-09, "min": 2.241999286004973e-09, "max": 0.000299829744056752, "count": 1994 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 2.241999286004973e-09, "min": 2.241999286004973e-09, "max": 0.000299829744056752, "count": 1994 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.100000714, "min": 0.100000714, "max": 0.19994324800000005, "count": 1994 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.100000714, "min": 0.100000714, "max": 0.19994324800000005, "count": 1994 }, "SoccerTwos.Policy.Beta.mean": { "value": 1.0035628600000084e-05, "min": 1.0035628600000084e-05, "max": 0.0049971680752000005, "count": 1994 }, "SoccerTwos.Policy.Beta.sum": { "value": 1.0035628600000084e-05, "min": 1.0035628600000084e-05, "max": 0.0049971680752000005, "count": 1994 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1677049487", "python_version": "3.9.16 (main, Jan 11 2023, 16:05:54) \n[GCC 11.2.0]", "command_line_arguments": "/home/zhihdeng/anaconda3/envs/HuggingFaceDRL/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --no-graphics", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu102", "numpy_version": "1.21.2", "end_time_seconds": "1677133391" }, "total": 83904.80731506646, "count": 1, "self": 0.5806480310857296, "children": { "run_training.setup": { "total": 0.08121960237622261, "count": 1, "self": 0.08121960237622261 }, "TrainerController.start_learning": { "total": 83904.145447433, "count": 1, "self": 94.22289557754993, "children": { "TrainerController._reset_env": { "total": 54.67632833123207, "count": 500, "self": 54.67632833123207 }, "TrainerController.advance": { "total": 83754.96005585045, "count": 4527425, "self": 92.62372266501188, "children": { "env_step": { "total": 42756.356216367334, "count": 4527425, "self": 13836.03085809201, "children": { "SubprocessEnvManager._take_step": { "total": 28856.72142047435, "count": 7029668, "self": 857.1122543402016, "children": { "TorchPolicy.evaluate": { "total": 27999.60916613415, "count": 12771564, "self": 27999.60916613415 } } }, "workers": { "total": 63.603937800973654, "count": 4527425, "self": 0.0, "children": { "worker_root": { "total": 335850.2568864301, "count": 7028693, "is_parallel": true, "self": 257239.22801594436, "children": { "run_training.setup": { "total": 0.32487840950489044, "count": 4, "is_parallel": true, "self": 0.21821270883083344, "children": { "steps_from_proto": { "total": 0.010150227695703506, "count": 8, "is_parallel": true, "self": 0.0028362199664115906, "children": { "_process_rank_one_or_two_observation": { "total": 0.007314007729291916, "count": 32, "is_parallel": true, "self": 0.007314007729291916 } } }, "UnityEnvironment.step": { "total": 0.0965154729783535, "count": 4, "is_parallel": true, "self": 0.0024172402918338776, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0016319416463375092, "count": 4, "is_parallel": true, "self": 0.0016319416463375092 }, "communicator.exchange": { "total": 0.08511260151863098, "count": 4, "is_parallel": true, "self": 0.08511260151863098 }, "steps_from_proto": { "total": 0.007353689521551132, "count": 8, "is_parallel": true, "self": 0.0015354901552200317, "children": { "_process_rank_one_or_two_observation": { "total": 0.0058181993663311005, "count": 32, "is_parallel": true, "self": 0.0058181993663311005 } } } } } } }, "UnityEnvironment.step": { "total": 78606.48418792337, "count": 7028685, "is_parallel": true, "self": 5973.933590978384, "children": { "UnityEnvironment._generate_step_input": { "total": 2846.3787834383547, "count": 7028685, "is_parallel": true, "self": 2846.3787834383547 }, "communicator.exchange": { "total": 56477.49033830315, "count": 7028685, "is_parallel": true, "self": 56477.49033830315 }, "steps_from_proto": { "total": 13308.681475203484, "count": 14057370, "is_parallel": true, "self": 2520.244860779494, "children": { "_process_rank_one_or_two_observation": { "total": 10788.43661442399, "count": 56229480, "is_parallel": true, "self": 10788.43661442399 } } } } }, "TrainerController.start_learning": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "TrainerController._reset_env": { "total": 87.11462037265301, "count": 4, "is_parallel": true, "self": 87.11462037265301 }, "TrainerController.advance": { "total": 525.4730990827084, "count": 24940, "is_parallel": true, "self": 0.5285775065422058, "children": { "env_step": { "total": 321.84629322588444, "count": 24940, "is_parallel": true, "self": 105.12262518703938, "children": { "SubprocessEnvManager._take_step": { "total": 216.17542307078838, "count": 47828, "is_parallel": true, "self": 6.077347084879875, "children": { "TorchPolicy.evaluate": { "total": 210.0980759859085, "count": 95328, "is_parallel": true, "self": 210.0980759859085 } } }, "workers": { "total": 0.39629462361335754, "count": 24940, "is_parallel": true, "self": 0.0, "children": { "worker_root": { "total": 2352.3570114970207, "count": 47812, "is_parallel": true, "self": 1840.0889991819859, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.040600910782814026, "count": 32, "is_parallel": true, "self": 0.011344879865646362, "children": { "_process_rank_one_or_two_observation": { "total": 0.029256030917167664, "count": 128, "is_parallel": true, "self": 0.029256030917167664 } } }, "UnityEnvironment.step": { "total": 0.386061891913414, "count": 16, "is_parallel": true, "self": 0.00966896116733551, "children": { "UnityEnvironment._generate_step_input": { "total": 0.006527766585350037, "count": 16, "is_parallel": true, "self": 0.006527766585350037 }, "communicator.exchange": { "total": 0.3404504060745239, "count": 16, "is_parallel": true, "self": 0.3404504060745239 }, "steps_from_proto": { "total": 0.02941475808620453, "count": 32, "is_parallel": true, "self": 0.006141960620880127, "children": { "_process_rank_one_or_two_observation": { "total": 0.023272797465324402, "count": 128, "is_parallel": true, "self": 0.023272797465324402 } } } } } } }, "UnityEnvironment.step": { "total": 512.2680123150349, "count": 47796, "is_parallel": true, "self": 27.34689722955227, "children": { "UnityEnvironment._generate_step_input": { "total": 18.028440296649933, "count": 47796, "is_parallel": true, "self": 18.028440296649933 }, "communicator.exchange": { "total": 384.59400632977486, "count": 47796, "is_parallel": true, "self": 384.59400632977486 }, "steps_from_proto": { "total": 82.29866845905781, "count": 95592, "is_parallel": true, "self": 16.143723011016846, "children": { "_process_rank_one_or_two_observation": { "total": 66.15494544804096, "count": 382368, "is_parallel": true, "self": 66.15494544804096 } } } } } } } } }, "steps_from_proto": { "total": 0.023402098566293716, "count": 8, "is_parallel": true, "self": 0.004221200942993164, "children": { "_process_rank_one_or_two_observation": { "total": 0.019180897623300552, "count": 32, "is_parallel": true, "self": 0.019180897623300552 } } }, "UnityEnvironment.step": { "total": 0.1285482458770275, "count": 4, "is_parallel": true, "self": 0.013892177492380142, "children": { "UnityEnvironment._generate_step_input": { "total": 0.005419403314590454, "count": 4, "is_parallel": true, "self": 0.005419403314590454 }, "communicator.exchange": { "total": 0.09192324057221413, "count": 4, "is_parallel": true, "self": 0.09192324057221413 }, "steps_from_proto": { "total": 0.01731342449784279, "count": 8, "is_parallel": true, "self": 0.002764381468296051, "children": { "_process_rank_one_or_two_observation": { "total": 0.014549043029546738, "count": 32, "is_parallel": true, "self": 0.014549043029546738 } } } } } } }, "trainer_advance": { "total": 203.09822835028172, "count": 24940, "is_parallel": true, "self": 7.581616789102554, "children": { "process_trajectory": { "total": 52.86894811689854, "count": 24940, "is_parallel": true, "self": 52.86894811689854 }, "_update_policy": { "total": 142.64766344428062, "count": 12, "is_parallel": true, "self": 93.26212346553802, "children": { "TorchPOCAOptimizer.update": { "total": 49.3855399787426, "count": 912, "is_parallel": true, "self": 49.3855399787426 } } } } } } } } }, "steps_from_proto": { "total": 4.219804152846336, "count": 3992, "is_parallel": true, "self": 0.7932459115982056, "children": { "_process_rank_one_or_two_observation": { "total": 3.426558241248131, "count": 15968, "is_parallel": true, "self": 3.426558241248131 } } } } } } } } }, "trainer_advance": { "total": 40905.9801168181, "count": 4527425, "self": 1099.933923009783, "children": { "process_trajectory": { "total": 18540.67933832854, "count": 4527425, "self": 18395.13620839268, "children": { "RLTrainer._checkpoint": { "total": 145.54312993586063, "count": 200, "self": 145.54312993586063 } } }, "_update_policy": { "total": 21265.366855479777, "count": 1994, "self": 14209.924621451646, "children": { "TorchPOCAOptimizer.update": { "total": 7055.442234028131, "count": 143631, "self": 7055.442234028131 } } } } } } }, "trainer_threads": { "total": 8.903443813323975e-07, "count": 1, "self": 8.903443813323975e-07 }, "TrainerController._save_models": { "total": 0.2861667834222317, "count": 1, "self": 0.03692487254738808, "children": { "RLTrainer._checkpoint": { "total": 0.2492419108748436, "count": 1, "self": 0.2492419108748436 } } } } } } }