|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 1.5817396640777588, |
|
"min": 1.455094575881958, |
|
"max": 3.295758008956909, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 29357.087890625, |
|
"min": 20119.16796875, |
|
"max": 114796.1875, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 52.795698924731184, |
|
"min": 41.78632478632478, |
|
"max": 999.0, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19640.0, |
|
"min": 14576.0, |
|
"max": 25692.0, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1617.6406867369267, |
|
"min": 1199.9802019082556, |
|
"max": 1639.294376297447, |
|
"count": 1110 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 300881.16773306835, |
|
"min": 2407.8869932951948, |
|
"max": 375980.1001040295, |
|
"count": 1110 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 11169994.0, |
|
"min": 9864.0, |
|
"max": 11169994.0, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 11169994.0, |
|
"min": 9864.0, |
|
"max": 11169994.0, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": -0.0189067330211401, |
|
"min": -0.10604812204837799, |
|
"max": 0.17163971066474915, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": -3.4977455139160156, |
|
"min": -20.073341369628906, |
|
"max": 32.61154556274414, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.014979016967117786, |
|
"min": -0.10466466844081879, |
|
"max": 0.1675061136484146, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -2.7711181640625, |
|
"min": -19.67367935180664, |
|
"max": 31.826160430908203, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": -0.040820540286399226, |
|
"min": -0.4907428537096296, |
|
"max": 0.5533685423015209, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": -7.551799952983856, |
|
"min": -68.55279970169067, |
|
"max": 51.44579952955246, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": -0.040820540286399226, |
|
"min": -0.4907428537096296, |
|
"max": 0.5533685423015209, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": -7.551799952983856, |
|
"min": -68.55279970169067, |
|
"max": 51.44579952955246, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 1117 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.015818389842752367, |
|
"min": 0.01056509285311525, |
|
"max": 0.023983135318849234, |
|
"count": 540 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.015818389842752367, |
|
"min": 0.01056509285311525, |
|
"max": 0.023983135318849234, |
|
"count": 540 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.1106756404042244, |
|
"min": 0.00010585838147865918, |
|
"max": 0.12311240409811337, |
|
"count": 540 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.1106756404042244, |
|
"min": 0.00010585838147865918, |
|
"max": 0.12311240409811337, |
|
"count": 540 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.11272074555357298, |
|
"min": 0.00010605515211257929, |
|
"max": 0.12526631702979404, |
|
"count": 540 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.11272074555357298, |
|
"min": 0.00010605515211257929, |
|
"max": 0.12526631702979404, |
|
"count": 540 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 540 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 540 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 540 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 540 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 540 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 540 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1675767301", |
|
"python_version": "3.8.15 | packaged by conda-forge | (default, Nov 22 2022, 08:49:35) \n[GCC 10.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ml-agents/config/poca/SoccerTwos.yaml --env=ml-agents/training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --force", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1675797412" |
|
}, |
|
"total": 30110.425812047004, |
|
"count": 1, |
|
"self": 0.024434594000922516, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.017229047999990144, |
|
"count": 1, |
|
"self": 0.017229047999990144 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 30110.384148405003, |
|
"count": 1, |
|
"self": 24.077285353967454, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 6.759301012999913, |
|
"count": 56, |
|
"self": 6.759301012999913 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 30078.937422030034, |
|
"count": 768718, |
|
"self": 25.25196177511316, |
|
"children": { |
|
"env_step": { |
|
"total": 22809.44976557272, |
|
"count": 768718, |
|
"self": 17891.032676758594, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 4903.552269231004, |
|
"count": 768718, |
|
"self": 142.58574983506878, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 4760.966519395935, |
|
"count": 1405796, |
|
"self": 4760.966519395935 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 14.864819583121061, |
|
"count": 768717, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 30046.03928236312, |
|
"count": 768717, |
|
"is_parallel": true, |
|
"self": 15095.742846892175, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0046049020002101315, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0013496899991878308, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0032552120010223007, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0032552120010223007 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.039663079000092694, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.001042876999690634, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0009266420001949882, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0009266420001949882 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.034336171000177274, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.034336171000177274 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.003357389000029798, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0006177839991323708, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.002739605000897427, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.002739605000897427 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 14950.139402001958, |
|
"count": 768716, |
|
"is_parallel": true, |
|
"self": 810.3926871098065, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 581.4884008703025, |
|
"count": 768716, |
|
"is_parallel": true, |
|
"self": 581.4884008703025 |
|
}, |
|
"communicator.exchange": { |
|
"total": 10917.931029128304, |
|
"count": 768716, |
|
"is_parallel": true, |
|
"self": 10917.931029128304 |
|
}, |
|
"steps_from_proto": { |
|
"total": 2640.3272848935453, |
|
"count": 1537432, |
|
"is_parallel": true, |
|
"self": 493.16249945778736, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 2147.164785435758, |
|
"count": 6149728, |
|
"is_parallel": true, |
|
"self": 2147.164785435758 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.15703346898544623, |
|
"count": 110, |
|
"is_parallel": true, |
|
"self": 0.030603315996813762, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.12643015298863247, |
|
"count": 440, |
|
"is_parallel": true, |
|
"self": 0.12643015298863247 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 7244.235694682202, |
|
"count": 768717, |
|
"self": 172.02504888342446, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 3104.2678107138054, |
|
"count": 768717, |
|
"self": 3097.6380572478156, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 6.629753465989779, |
|
"count": 22, |
|
"self": 6.629753465989779 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 3967.9428350849716, |
|
"count": 540, |
|
"self": 2525.3373333656814, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 1442.6055017192903, |
|
"count": 16200, |
|
"self": 1442.6055017192903 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.4360048226080835e-06, |
|
"count": 1, |
|
"self": 1.4360048226080835e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.6101385719957761, |
|
"count": 1, |
|
"self": 0.0024646999954711646, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.607673872000305, |
|
"count": 1, |
|
"self": 0.607673872000305 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |