{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 1.5933685302734375, "min": 1.555415391921997, "max": 3.2957260608673096, "count": 1190 }, "SoccerTwos.Policy.Entropy.sum": { "value": 31867.37109375, "min": 7245.72607421875, "max": 160250.546875, "count": 1190 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 50.56701030927835, "min": 39.86290322580645, "max": 999.0, "count": 1190 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 19620.0, "min": 1324.0, "max": 29924.0, "count": 1190 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1552.4123372657316, "min": 1171.0870379635965, "max": 1593.7937115535658, "count": 1172 }, "SoccerTwos.Self-play.ELO.sum": { "value": 301167.99342955195, "min": 2342.549064692899, "max": 379277.177015662, "count": 1172 }, "SoccerTwos.Step.mean": { "value": 11899988.0, "min": 9908.0, "max": 11899988.0, "count": 1190 }, "SoccerTwos.Step.sum": { "value": 11899988.0, "min": 9908.0, "max": 11899988.0, "count": 1190 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": -0.05609159916639328, "min": -0.10269837826490402, "max": 0.1604011207818985, "count": 1190 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": -10.881770133972168, "min": -20.803024291992188, "max": 26.55428695678711, "count": 1190 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": -0.05540889501571655, "min": -0.10428468883037567, "max": 0.16165974736213684, "count": 1190 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": -10.7493257522583, "min": -20.830650329589844, "max": 25.814809799194336, "count": 1190 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 1190 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 1190 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": -0.22509896847390637, "min": -0.7, "max": 0.43244597521321526, "count": 1190 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": -43.669199883937836, "min": -67.99799966812134, "max": 49.72719997167587, "count": 1190 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": -0.22509896847390637, "min": -0.7, "max": 0.43244597521321526, "count": 1190 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": -43.669199883937836, "min": -67.99799966812134, "max": 49.72719997167587, "count": 1190 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 1190 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 1190 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.018065108659599597, "min": 0.009599036445918804, "max": 0.024713016274229935, "count": 572 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.018065108659599597, "min": 0.009599036445918804, "max": 0.024713016274229935, "count": 572 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.10961750323573748, "min": 5.087670245605598e-05, "max": 0.1267578721046448, "count": 572 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.10961750323573748, "min": 5.087670245605598e-05, "max": 0.1267578721046448, "count": 572 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.11107018887996674, "min": 4.992426869042295e-05, "max": 0.12836463153362274, "count": 572 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.11107018887996674, "min": 4.992426869042295e-05, "max": 0.12836463153362274, "count": 572 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 572 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 572 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.20000000000000007, "min": 0.19999999999999996, "max": 0.20000000000000007, "count": 572 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.20000000000000007, "min": 0.19999999999999996, "max": 0.20000000000000007, "count": 572 }, "SoccerTwos.Policy.Beta.mean": { "value": 0.005000000000000001, "min": 0.005, "max": 0.005000000000000001, "count": 572 }, "SoccerTwos.Policy.Beta.sum": { "value": 0.005000000000000001, "min": 0.005, "max": 0.005000000000000001, "count": 572 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1681368361", "python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]", "command_line_arguments": "/home/agarcia/anaconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --force", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu102", "numpy_version": "1.21.2", "end_time_seconds": "1681391743" }, "total": 23381.772990735, "count": 1, "self": 0.25354983799843467, "children": { "run_training.setup": { "total": 0.007767745000364812, "count": 1, "self": 0.007767745000364812 }, "TrainerController.start_learning": { "total": 23381.511673152003, "count": 1, "self": 20.547621270012314, "children": { "TrainerController._reset_env": { "total": 4.133485494004617, "count": 60, "self": 4.133485494004617 }, "TrainerController.advance": { "total": 23356.09298498699, "count": 816806, "self": 20.105895319626143, "children": { "env_step": { "total": 17012.01835669991, "count": 816806, "self": 13377.597879131725, "children": { "SubprocessEnvManager._take_step": { "total": 3621.965414975484, "count": 816806, "self": 107.18239118388192, "children": { "TorchPolicy.evaluate": { "total": 3514.783023791602, "count": 1503958, "self": 3514.783023791602 } } }, "workers": { "total": 12.455062592702689, "count": 816805, "self": 0.0, "children": { "worker_root": { "total": 23353.504601857137, "count": 816805, "is_parallel": true, "self": 12172.06109010599, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.002013325000007171, "count": 2, "is_parallel": true, "self": 0.0005329470000106085, "children": { "_process_rank_one_or_two_observation": { "total": 0.0014803779999965627, "count": 8, "is_parallel": true, "self": 0.0014803779999965627 } } }, "UnityEnvironment.step": { "total": 0.023350181999830966, "count": 1, "is_parallel": true, "self": 0.00044781700080420705, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0003764809998756391, "count": 1, "is_parallel": true, "self": 0.0003764809998756391 }, "communicator.exchange": { "total": 0.021061302999896725, "count": 1, "is_parallel": true, "self": 0.021061302999896725 }, "steps_from_proto": { "total": 0.0014645809992543946, "count": 2, "is_parallel": true, "self": 0.00030255999945438816, "children": { "_process_rank_one_or_two_observation": { "total": 0.0011620209998000064, "count": 8, "is_parallel": true, "self": 0.0011620209998000064 } } } } } } }, "UnityEnvironment.step": { "total": 11181.315135833142, "count": 816804, "is_parallel": true, "self": 555.8757341502806, "children": { "UnityEnvironment._generate_step_input": { "total": 354.9397385261914, "count": 816804, "is_parallel": true, "self": 354.9397385261914 }, "communicator.exchange": { "total": 8646.955241935066, "count": 816804, "is_parallel": true, "self": 8646.955241935066 }, "steps_from_proto": { "total": 1623.5444212216044, "count": 1633608, "is_parallel": true, "self": 324.40628953083296, "children": { "_process_rank_one_or_two_observation": { "total": 1299.1381316907714, "count": 6534432, "is_parallel": true, "self": 1299.1381316907714 } } } } }, "steps_from_proto": { "total": 0.12837591800553128, "count": 118, "is_parallel": true, "self": 0.02598310997518638, "children": { "_process_rank_one_or_two_observation": { "total": 0.1023928080303449, "count": 472, "is_parallel": true, "self": 0.1023928080303449 } } } } } } } } }, "trainer_advance": { "total": 6323.968732967453, "count": 816805, "self": 130.42697614090685, "children": { "process_trajectory": { "total": 2013.9432173255736, "count": 816805, "self": 2009.0746457905789, "children": { "RLTrainer._checkpoint": { "total": 4.868571534994771, "count": 23, "self": 4.868571534994771 } } }, "_update_policy": { "total": 4179.598539500973, "count": 572, "self": 1904.0242409148877, "children": { "TorchPOCAOptimizer.update": { "total": 2275.574298586085, "count": 17172, "self": 2275.574298586085 } } } } } } }, "trainer_threads": { "total": 6.318998202914372e-06, "count": 1, "self": 6.318998202914372e-06 }, "TrainerController._save_models": { "total": 0.737575081999239, "count": 1, "self": 0.0052373040016391315, "children": { "RLTrainer._checkpoint": { "total": 0.7323377779975999, "count": 1, "self": 0.7323377779975999 } } } } } } }