|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 0.5361879467964172, |
|
"min": 0.5062462091445923, |
|
"max": 3.2957143783569336, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 10792.390625, |
|
"min": 631.1412353515625, |
|
"max": 390950.0625, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 64.55263157894737, |
|
"min": 34.75, |
|
"max": 999.0, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19624.0, |
|
"min": 9744.0, |
|
"max": 27944.0, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1655.243002041564, |
|
"min": 1187.9343140936849, |
|
"max": 1763.0418844163403, |
|
"count": 9914 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 251596.93631031775, |
|
"min": 2375.8686281873697, |
|
"max": 451934.74502955977, |
|
"count": 9914 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 99999944.0, |
|
"min": 9718.0, |
|
"max": 99999944.0, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 99999944.0, |
|
"min": 9718.0, |
|
"max": 99999944.0, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": -0.03534884750843048, |
|
"min": -0.1369738131761551, |
|
"max": 0.2670484185218811, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": -5.408373832702637, |
|
"min": -25.899005889892578, |
|
"max": 37.65174865722656, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.0353168249130249, |
|
"min": -0.1389307826757431, |
|
"max": 0.26651522517204285, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -5.4034743309021, |
|
"min": -25.871084213256836, |
|
"max": 37.80921173095703, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": -0.20054117565840676, |
|
"min": -0.5881272716955706, |
|
"max": 0.6285795958674684, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": -30.682799875736237, |
|
"min": -80.2020001411438, |
|
"max": 82.94919991493225, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": -0.20054117565840676, |
|
"min": -0.5881272716955706, |
|
"max": 0.6285795958674684, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": -30.682799875736237, |
|
"min": -80.2020001411438, |
|
"max": 82.94919991493225, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 10000 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.02380004380441581, |
|
"min": 0.00802251725399401, |
|
"max": 0.026490185890967646, |
|
"count": 4848 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.02380004380441581, |
|
"min": 0.00802251725399401, |
|
"max": 0.026490185890967646, |
|
"count": 4848 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.10786419784029325, |
|
"min": 2.5130218242945073e-06, |
|
"max": 0.1378081552684307, |
|
"count": 4848 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.10786419784029325, |
|
"min": 2.5130218242945073e-06, |
|
"max": 0.1378081552684307, |
|
"count": 4848 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.10805333033204079, |
|
"min": 2.2917931763307325e-06, |
|
"max": 0.14002898931503296, |
|
"count": 4848 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.10805333033204079, |
|
"min": 2.2917931763307325e-06, |
|
"max": 0.14002898931503296, |
|
"count": 4848 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 3.98439867519971e-08, |
|
"min": 3.98439867519971e-08, |
|
"max": 0.000299931636022788, |
|
"count": 4848 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 3.98439867519971e-08, |
|
"min": 3.98439867519971e-08, |
|
"max": 0.000299931636022788, |
|
"count": 4848 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.10001324799999996, |
|
"min": 0.10001324799999996, |
|
"max": 0.19997721200000002, |
|
"count": 4848 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.10001324799999996, |
|
"min": 0.10001324799999996, |
|
"max": 0.19997721200000002, |
|
"count": 4848 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 1.0661075199999953e-05, |
|
"min": 1.0661075199999953e-05, |
|
"max": 0.0049988628788, |
|
"count": 4848 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 1.0661075199999953e-05, |
|
"min": 1.0661075199999953e-05, |
|
"max": 0.0049988628788, |
|
"count": 4848 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1676882850", |
|
"python_version": "3.9.16 (main, Jan 11 2023, 16:05:54) \n[GCC 11.2.0]", |
|
"command_line_arguments": "/home/zhihdeng/anaconda3/envs/HuggingFaceDRL/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --no-graphics --run-id=SoccerTwosMLP", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1676971223" |
|
}, |
|
"total": 88373.85427070409, |
|
"count": 1, |
|
"self": 0.5767905004322529, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0484183095395565, |
|
"count": 1, |
|
"self": 0.0484183095395565 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 88373.22906189412, |
|
"count": 1, |
|
"self": 88.28237944841385, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 71.24583523720503, |
|
"count": 500, |
|
"self": 71.24583523720503 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 88213.365519315, |
|
"count": 3946472, |
|
"self": 86.39167696610093, |
|
"children": { |
|
"env_step": { |
|
"total": 43111.556869752705, |
|
"count": 3946472, |
|
"self": 13688.833719231188, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 29358.235021069646, |
|
"count": 7046286, |
|
"self": 1046.72575295344, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 28311.509268116206, |
|
"count": 12770724, |
|
"self": 28311.509268116206 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 64.48812945187092, |
|
"count": 3946472, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 354218.49521360174, |
|
"count": 7045365, |
|
"is_parallel": true, |
|
"self": 277056.83259246126, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.193673238158226, |
|
"count": 4, |
|
"is_parallel": true, |
|
"self": 0.08062634989619255, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.011169001460075378, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.003017112612724304, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.008151888847351074, |
|
"count": 32, |
|
"is_parallel": true, |
|
"self": 0.008151888847351074 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.10187788680195808, |
|
"count": 4, |
|
"is_parallel": true, |
|
"self": 0.0025879032909870148, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.001802206039428711, |
|
"count": 4, |
|
"is_parallel": true, |
|
"self": 0.001802206039428711 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.08945160359144211, |
|
"count": 4, |
|
"is_parallel": true, |
|
"self": 0.08945160359144211 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.00803617388010025, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0016578957438468933, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.006378278136253357, |
|
"count": 32, |
|
"is_parallel": true, |
|
"self": 0.006378278136253357 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 77157.02932818234, |
|
"count": 7045357, |
|
"is_parallel": true, |
|
"self": 5271.69396962598, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 2848.0237276628613, |
|
"count": 7045357, |
|
"is_parallel": true, |
|
"self": 2848.0237276628613 |
|
}, |
|
"communicator.exchange": { |
|
"total": 55228.5793344304, |
|
"count": 7045357, |
|
"is_parallel": true, |
|
"self": 55228.5793344304 |
|
}, |
|
"steps_from_proto": { |
|
"total": 13808.732296463102, |
|
"count": 14090714, |
|
"is_parallel": true, |
|
"self": 2671.1489330865443, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 11137.583363376558, |
|
"count": 56362856, |
|
"is_parallel": true, |
|
"self": 11137.583363376558 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 4.439619719982147, |
|
"count": 3992, |
|
"is_parallel": true, |
|
"self": 0.8451655693352222, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 3.594454150646925, |
|
"count": 15968, |
|
"is_parallel": true, |
|
"self": 3.594454150646925 |
|
} |
|
} |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 147.0211791843176, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 147.0211791843176 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 884.1772038340569, |
|
"count": 39316, |
|
"is_parallel": true, |
|
"self": 0.8210047781467438, |
|
"children": { |
|
"env_step": { |
|
"total": 511.9983355551958, |
|
"count": 39316, |
|
"is_parallel": true, |
|
"self": 163.43248023465276, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 347.6746134161949, |
|
"count": 76720, |
|
"is_parallel": true, |
|
"self": 11.412553071975708, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 336.2620603442192, |
|
"count": 152664, |
|
"is_parallel": true, |
|
"self": 336.2620603442192 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.743629664182663, |
|
"count": 39316, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 4125.666426867247, |
|
"count": 76696, |
|
"is_parallel": true, |
|
"self": 3296.758002460003, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.044676005840301514, |
|
"count": 32, |
|
"is_parallel": true, |
|
"self": 0.012068450450897217, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0326075553894043, |
|
"count": 128, |
|
"is_parallel": true, |
|
"self": 0.0326075553894043 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.40751154720783234, |
|
"count": 16, |
|
"is_parallel": true, |
|
"self": 0.010351613163948059, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.007208824157714844, |
|
"count": 16, |
|
"is_parallel": true, |
|
"self": 0.007208824157714844 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.35780641436576843, |
|
"count": 16, |
|
"is_parallel": true, |
|
"self": 0.35780641436576843 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.032144695520401, |
|
"count": 32, |
|
"is_parallel": true, |
|
"self": 0.006631582975387573, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.025513112545013428, |
|
"count": 128, |
|
"is_parallel": true, |
|
"self": 0.025513112545013428 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 828.8764188885689, |
|
"count": 76680, |
|
"is_parallel": true, |
|
"self": 46.903960809111595, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 30.588029012084007, |
|
"count": 76680, |
|
"is_parallel": true, |
|
"self": 30.588029012084007 |
|
}, |
|
"communicator.exchange": { |
|
"total": 609.1386138498783, |
|
"count": 76680, |
|
"is_parallel": true, |
|
"self": 609.1386138498783 |
|
}, |
|
"steps_from_proto": { |
|
"total": 142.24581521749496, |
|
"count": 153360, |
|
"is_parallel": true, |
|
"self": 28.042156845331192, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 114.20365837216377, |
|
"count": 613440, |
|
"is_parallel": true, |
|
"self": 114.20365837216377 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.032005518674850464, |
|
"count": 32, |
|
"is_parallel": true, |
|
"self": 0.0062446147203445435, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.02576090395450592, |
|
"count": 128, |
|
"is_parallel": true, |
|
"self": 0.02576090395450592 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.019269373267889023, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.003829497843980789, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.015439875423908234, |
|
"count": 32, |
|
"is_parallel": true, |
|
"self": 0.015439875423908234 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.128342866897583, |
|
"count": 4, |
|
"is_parallel": true, |
|
"self": 0.007858805358409882, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.004416607320308685, |
|
"count": 4, |
|
"is_parallel": true, |
|
"self": 0.004416607320308685 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.10227135568857193, |
|
"count": 4, |
|
"is_parallel": true, |
|
"self": 0.10227135568857193 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.013796098530292511, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0021491684019565582, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.011646930128335953, |
|
"count": 32, |
|
"is_parallel": true, |
|
"self": 0.011646930128335953 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 371.3578635007143, |
|
"count": 39316, |
|
"is_parallel": true, |
|
"self": 13.995508208870888, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 101.5431860089302, |
|
"count": 39316, |
|
"is_parallel": true, |
|
"self": 101.5431860089302 |
|
}, |
|
"_update_policy": { |
|
"total": 255.8191692829132, |
|
"count": 44, |
|
"is_parallel": true, |
|
"self": 165.65164488554, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 90.1675243973732, |
|
"count": 1392, |
|
"is_parallel": true, |
|
"self": 90.1675243973732 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 45015.4169725962, |
|
"count": 3946472, |
|
"self": 1186.358848668635, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 19193.84821567312, |
|
"count": 3946472, |
|
"self": 19120.074692908674, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 73.77352276444435, |
|
"count": 200, |
|
"self": 73.77352276444435 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 24635.209908254445, |
|
"count": 4848, |
|
"self": 16051.347006946802, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 8583.862901307642, |
|
"count": 145476, |
|
"self": 8583.862901307642 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.1771917343139648e-06, |
|
"count": 1, |
|
"self": 1.1771917343139648e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.3353267163038254, |
|
"count": 1, |
|
"self": 0.009651627391576767, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.3256750889122486, |
|
"count": 1, |
|
"self": 0.3256750889122486 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |