|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 2.034095048904419, |
|
"min": 2.034095048904419, |
|
"max": 3.2957186698913574, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 43415.7265625, |
|
"min": 21021.2265625, |
|
"max": 136054.640625, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 57.92857142857143, |
|
"min": 43.642857142857146, |
|
"max": 999.0, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19464.0, |
|
"min": 13476.0, |
|
"max": 28232.0, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1444.277444267153, |
|
"min": 1188.5688610622024, |
|
"max": 1467.9057905021382, |
|
"count": 459 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 242638.6106368817, |
|
"min": 2378.6217784244172, |
|
"max": 318196.4601373692, |
|
"count": 459 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 5059920.0, |
|
"min": 9138.0, |
|
"max": 5059920.0, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 5059920.0, |
|
"min": 9138.0, |
|
"max": 5059920.0, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": 0.008102988824248314, |
|
"min": -0.102271169424057, |
|
"max": 0.15609072148799896, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": 1.3694051504135132, |
|
"min": -15.033862113952637, |
|
"max": 27.724905014038086, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.0010254208464175463, |
|
"min": -0.10244327783584595, |
|
"max": 0.15248753130435944, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 0.17329612374305725, |
|
"min": -15.059162139892578, |
|
"max": 26.837806701660156, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": 0.04445562172218187, |
|
"min": -0.6912857123783657, |
|
"max": 0.34533906215801835, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": 7.513000071048737, |
|
"min": -55.49279975891113, |
|
"max": 59.57000023126602, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": 0.04445562172218187, |
|
"min": -0.6912857123783657, |
|
"max": 0.34533906215801835, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": 7.513000071048737, |
|
"min": -55.49279975891113, |
|
"max": 59.57000023126602, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 506 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.015287019886697333, |
|
"min": 0.011718268912348624, |
|
"max": 0.02362056450607876, |
|
"count": 241 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.015287019886697333, |
|
"min": 0.011718268912348624, |
|
"max": 0.02362056450607876, |
|
"count": 241 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.08906070366501809, |
|
"min": 1.4289946382935645e-06, |
|
"max": 0.10702010343472163, |
|
"count": 241 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.08906070366501809, |
|
"min": 1.4289946382935645e-06, |
|
"max": 0.10702010343472163, |
|
"count": 241 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.09028938934206962, |
|
"min": 1.5878587040181932e-06, |
|
"max": 0.11088861897587776, |
|
"count": 241 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.09028938934206962, |
|
"min": 1.5878587040181932e-06, |
|
"max": 0.11088861897587776, |
|
"count": 241 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 241 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 241 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 241 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 241 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 241 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 241 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1710034452", |
|
"python_version": "3.10.12 (main, Mar 9 2024, 16:10:11) [Clang 14.0.3 (clang-1403.0.22.14.1)]", |
|
"command_line_arguments": "/Users/rushideshmukh/.pyenv/versions/3.10.12/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.app --run-id=SoccerTwos --no-graphics --force", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.2.1", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1710053756" |
|
}, |
|
"total": 19304.27785824999, |
|
"count": 1, |
|
"self": 0.33178508398123085, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.016164916014531627, |
|
"count": 1, |
|
"self": 0.016164916014531627 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 19303.929908249993, |
|
"count": 1, |
|
"self": 2.9813993361894973, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 5.200544664054178, |
|
"count": 26, |
|
"self": 5.200544664054178 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 19295.492771041783, |
|
"count": 339291, |
|
"self": 2.7193128646176774, |
|
"children": { |
|
"env_step": { |
|
"total": 15219.818307881098, |
|
"count": 339291, |
|
"self": 14713.968574603234, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 503.8066189119709, |
|
"count": 339291, |
|
"self": 14.768715203303145, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 489.0379037086677, |
|
"count": 644640, |
|
"self": 489.0379037086677 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 2.043114365893416, |
|
"count": 339290, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 19295.864006676624, |
|
"count": 339290, |
|
"is_parallel": true, |
|
"self": 5003.252988209628, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.042950455099344254, |
|
"count": 52, |
|
"is_parallel": true, |
|
"self": 0.005378327245125547, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.037572127854218706, |
|
"count": 208, |
|
"is_parallel": true, |
|
"self": 0.037572127854218706 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 14292.568068011897, |
|
"count": 339290, |
|
"is_parallel": true, |
|
"self": 35.37599831694388, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 256.56465872059925, |
|
"count": 339290, |
|
"is_parallel": true, |
|
"self": 256.56465872059925 |
|
}, |
|
"communicator.exchange": { |
|
"total": 13514.89062661829, |
|
"count": 339290, |
|
"is_parallel": true, |
|
"self": 13514.89062661829 |
|
}, |
|
"steps_from_proto": { |
|
"total": 485.73678435606416, |
|
"count": 678580, |
|
"is_parallel": true, |
|
"self": 55.636882274993695, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 430.09990208107047, |
|
"count": 2714320, |
|
"is_parallel": true, |
|
"self": 430.09990208107047 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 4072.9551502960676, |
|
"count": 339290, |
|
"self": 33.577861527737696, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 621.0739785193873, |
|
"count": 339290, |
|
"self": 619.0081556433288, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 2.065822876058519, |
|
"count": 10, |
|
"self": 2.065822876058519 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 3418.3033102489426, |
|
"count": 241, |
|
"self": 385.8818468901736, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 3032.421463358769, |
|
"count": 7230, |
|
"self": 3032.421463358769 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.2499804142862558e-06, |
|
"count": 1, |
|
"self": 1.2499804142862558e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.25519195798551664, |
|
"count": 1, |
|
"self": 0.0014662499888800085, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.25372570799663663, |
|
"count": 1, |
|
"self": 0.25372570799663663 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |