poca-SoccerTwos / run_logs /timers.json
ucheokechukwu's picture
First Commit
b4985f6 verified
raw
history blame
No virus
19.8 kB
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.6669374704360962,
"min": 1.6359543800354004,
"max": 1.6686762571334839,
"count": 7
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 33285.40625,
"min": 28373.9921875,
"max": 35656.47265625,
"count": 7
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 69.27777777777777,
"min": 56.20238095238095,
"max": 69.27777777777777,
"count": 7
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19952.0,
"min": 16200.0,
"max": 20212.0,
"count": 7
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1539.4471772250445,
"min": 1527.7409143925404,
"max": 1545.935715339572,
"count": 7
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 221680.3935204064,
"min": 210247.2572861818,
"max": 258303.83899147165,
"count": 7
},
"SoccerTwos.Step.mean": {
"value": 7759836.0,
"min": 7699856.0,
"max": 7759836.0,
"count": 7
},
"SoccerTwos.Step.sum": {
"value": 7759836.0,
"min": 7699856.0,
"max": 7759836.0,
"count": 7
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.02039300464093685,
"min": -0.06732017546892166,
"max": 0.006477044429630041,
"count": 7
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -2.9161996841430664,
"min": -10.462895393371582,
"max": 0.8679239749908447,
"count": 7
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.018799273297190666,
"min": -0.06896685063838959,
"max": 0.014638231135904789,
"count": 7
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -2.68829607963562,
"min": -10.482961654663086,
"max": 1.9615229368209839,
"count": 7
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 7
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 7
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.017475523315109574,
"min": -0.14296273452154598,
"max": 0.18005912183965528,
"count": 7
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 2.498999834060669,
"min": -23.017000257968903,
"max": 28.629400372505188,
"count": 7
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.017475523315109574,
"min": -0.14296273452154598,
"max": 0.18005912183965528,
"count": 7
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 2.498999834060669,
"min": -23.017000257968903,
"max": 28.629400372505188,
"count": 7
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 7
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 7
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.016602384811267256,
"min": 0.014415907952934504,
"max": 0.016602384811267256,
"count": 3
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.016602384811267256,
"min": 0.014415907952934504,
"max": 0.016602384811267256,
"count": 3
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.09950689375400543,
"min": 0.09836041977008184,
"max": 0.10183645983537039,
"count": 3
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.09950689375400543,
"min": 0.09836041977008184,
"max": 0.10183645983537039,
"count": 3
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.1016091840962569,
"min": 0.10012397617101669,
"max": 0.10352428729335467,
"count": 3
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.1016091840962569,
"min": 0.10012397617101669,
"max": 0.10352428729335467,
"count": 3
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0005000000000000001,
"min": 0.0005000000000000001,
"max": 0.0005000000000000001,
"count": 3
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0005000000000000001,
"min": 0.0005000000000000001,
"max": 0.0005000000000000001,
"count": 3
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 3
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 3
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 3
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 3
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1706602397",
"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.1.2+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1706602573"
},
"total": 176.3850563119995,
"count": 1,
"self": 0.6095307819996378,
"children": {
"run_training.setup": {
"total": 0.06312701000206289,
"count": 1,
"self": 0.06312701000206289
},
"TrainerController.start_learning": {
"total": 175.7123985199978,
"count": 1,
"self": 0.1427209370849596,
"children": {
"TrainerController._reset_env": {
"total": 3.9993831899955694,
"count": 2,
"self": 3.9993831899955694
},
"TrainerController.advance": {
"total": 171.57022046191923,
"count": 4856,
"self": 0.14406386593691423,
"children": {
"env_step": {
"total": 134.875863562007,
"count": 4856,
"self": 104.80080308114339,
"children": {
"SubprocessEnvManager._take_step": {
"total": 29.993070571970748,
"count": 4856,
"self": 0.7589429501349514,
"children": {
"TorchPolicy.evaluate": {
"total": 29.234127621835796,
"count": 8830,
"self": 29.234127621835796
}
}
},
"workers": {
"total": 0.08198990889286506,
"count": 4855,
"self": 0.0,
"children": {
"worker_root": {
"total": 175.3619194520361,
"count": 4855,
"is_parallel": true,
"self": 87.06817251295797,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.002859461001207819,
"count": 2,
"is_parallel": true,
"self": 0.0007165480019466486,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0021429129992611706,
"count": 8,
"is_parallel": true,
"self": 0.0021429129992611706
}
}
},
"UnityEnvironment.step": {
"total": 0.042817464000108885,
"count": 1,
"is_parallel": true,
"self": 0.0012375180012895726,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0009868800007097889,
"count": 1,
"is_parallel": true,
"self": 0.0009868800007097889
},
"communicator.exchange": {
"total": 0.03684870999859413,
"count": 1,
"is_parallel": true,
"self": 0.03684870999859413
},
"steps_from_proto": {
"total": 0.003744355999515392,
"count": 2,
"is_parallel": true,
"self": 0.0006717589967593085,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0030725970027560834,
"count": 8,
"is_parallel": true,
"self": 0.0030725970027560834
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 0.0020243369981471915,
"count": 2,
"is_parallel": true,
"self": 0.00053981399469194,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0014845230034552515,
"count": 8,
"is_parallel": true,
"self": 0.0014845230034552515
}
}
},
"UnityEnvironment.step": {
"total": 88.29172260207997,
"count": 4854,
"is_parallel": true,
"self": 5.486264983432193,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 3.4638925718209066,
"count": 4854,
"is_parallel": true,
"self": 3.4638925718209066
},
"communicator.exchange": {
"total": 62.658482434926555,
"count": 4854,
"is_parallel": true,
"self": 62.658482434926555
},
"steps_from_proto": {
"total": 16.683082611900318,
"count": 9708,
"is_parallel": true,
"self": 2.7760117232974153,
"children": {
"_process_rank_one_or_two_observation": {
"total": 13.907070888602902,
"count": 38832,
"is_parallel": true,
"self": 13.907070888602902
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 36.55029303397532,
"count": 4855,
"self": 1.0077057810412953,
"children": {
"process_trajectory": {
"total": 18.079415830929065,
"count": 4855,
"self": 18.079415830929065
},
"_update_policy": {
"total": 17.46317142200496,
"count": 3,
"self": 10.25110586601295,
"children": {
"TorchPOCAOptimizer.update": {
"total": 7.212065555992012,
"count": 90,
"self": 7.212065555992012
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.2669988791458309e-06,
"count": 1,
"self": 1.2669988791458309e-06
},
"TrainerController._save_models": {
"total": 7.266399916261435e-05,
"count": 1,
"self": 5.557499753194861e-05,
"children": {
"RLTrainer._checkpoint": {
"total": 1.7089001630665734e-05,
"count": 1,
"self": 1.7089001630665734e-05
}
}
}
}
}
}
}