|
{
|
|
"name": "root",
|
|
"gauges": {
|
|
"SoccerTwos.Policy.Entropy.mean": {
|
|
"value": 0.8469312191009521,
|
|
"min": 0.8232175707817078,
|
|
"max": 3.295804023742676,
|
|
"count": 1695
|
|
},
|
|
"SoccerTwos.Policy.Entropy.sum": {
|
|
"value": 9187.509765625,
|
|
"min": 2003.845703125,
|
|
"max": 105465.6875,
|
|
"count": 1695
|
|
},
|
|
"SoccerTwos.Environment.EpisodeLength.mean": {
|
|
"value": 64.5,
|
|
"min": 40.152542372881356,
|
|
"max": 999.0,
|
|
"count": 1695
|
|
},
|
|
"SoccerTwos.Environment.EpisodeLength.sum": {
|
|
"value": 10320.0,
|
|
"min": 2732.0,
|
|
"max": 28832.0,
|
|
"count": 1695
|
|
},
|
|
"SoccerTwos.Self-play.ELO.mean": {
|
|
"value": 1763.6273213154295,
|
|
"min": 1189.8904352353843,
|
|
"max": 1771.968606144515,
|
|
"count": 1664
|
|
},
|
|
"SoccerTwos.Self-play.ELO.sum": {
|
|
"value": 141090.18570523435,
|
|
"min": 2381.0377987029947,
|
|
"max": 202012.20693031192,
|
|
"count": 1664
|
|
},
|
|
"SoccerTwos.Step.mean": {
|
|
"value": 8479958.0,
|
|
"min": 4432.0,
|
|
"max": 8479958.0,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.Step.sum": {
|
|
"value": 8479958.0,
|
|
"min": 4432.0,
|
|
"max": 8479958.0,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
|
|
"value": -0.040951985865831375,
|
|
"min": -0.19922977685928345,
|
|
"max": 0.2191123515367508,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
|
|
"value": -3.2761588096618652,
|
|
"min": -13.849787712097168,
|
|
"max": 17.74810028076172,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
|
|
"value": -0.04459637776017189,
|
|
"min": -0.19301573932170868,
|
|
"max": 0.2158556580543518,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
|
|
"value": -3.5677101612091064,
|
|
"min": -14.456816673278809,
|
|
"max": 17.48430824279785,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.Environment.CumulativeReward.mean": {
|
|
"value": 0.0,
|
|
"min": 0.0,
|
|
"max": 0.0,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.Environment.CumulativeReward.sum": {
|
|
"value": 0.0,
|
|
"min": 0.0,
|
|
"max": 0.0,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.Policy.ExtrinsicReward.mean": {
|
|
"value": -0.22534499913454056,
|
|
"min": -1.0,
|
|
"max": 0.7153999871677823,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.Policy.ExtrinsicReward.sum": {
|
|
"value": -18.027599930763245,
|
|
"min": -41.74519991874695,
|
|
"max": 40.31680017709732,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
|
|
"value": -0.22534499913454056,
|
|
"min": -1.0,
|
|
"max": 0.7153999871677823,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
|
|
"value": -18.027599930763245,
|
|
"min": -41.74519991874695,
|
|
"max": 40.31680017709732,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.IsTraining.mean": {
|
|
"value": 1.0,
|
|
"min": 1.0,
|
|
"max": 1.0,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.IsTraining.sum": {
|
|
"value": 1.0,
|
|
"min": 1.0,
|
|
"max": 1.0,
|
|
"count": 1696
|
|
},
|
|
"SoccerTwos.Losses.PolicyLoss.mean": {
|
|
"value": 0.012244973257184029,
|
|
"min": 0.010488120992304175,
|
|
"max": 0.016860684389248492,
|
|
"count": 205
|
|
},
|
|
"SoccerTwos.Losses.PolicyLoss.sum": {
|
|
"value": 0.012244973257184029,
|
|
"min": 0.010488120992304175,
|
|
"max": 0.016860684389248492,
|
|
"count": 205
|
|
},
|
|
"SoccerTwos.Losses.ValueLoss.mean": {
|
|
"value": 0.11452542960643769,
|
|
"min": 0.0012547600199468434,
|
|
"max": 0.12134995341300964,
|
|
"count": 205
|
|
},
|
|
"SoccerTwos.Losses.ValueLoss.sum": {
|
|
"value": 0.11452542960643769,
|
|
"min": 0.0012547600199468434,
|
|
"max": 0.12134995341300964,
|
|
"count": 205
|
|
},
|
|
"SoccerTwos.Losses.BaselineLoss.mean": {
|
|
"value": 0.1195459270477295,
|
|
"min": 0.001435923029202968,
|
|
"max": 0.12682862743735313,
|
|
"count": 205
|
|
},
|
|
"SoccerTwos.Losses.BaselineLoss.sum": {
|
|
"value": 0.1195459270477295,
|
|
"min": 0.001435923029202968,
|
|
"max": 0.12682862743735313,
|
|
"count": 205
|
|
},
|
|
"SoccerTwos.Policy.LearningRate.mean": {
|
|
"value": 8.311875688126e-05,
|
|
"min": 8.311875688126e-05,
|
|
"max": 9.9915052084948e-05,
|
|
"count": 205
|
|
},
|
|
"SoccerTwos.Policy.LearningRate.sum": {
|
|
"value": 8.311875688126e-05,
|
|
"min": 8.311875688126e-05,
|
|
"max": 9.9915052084948e-05,
|
|
"count": 205
|
|
},
|
|
"SoccerTwos.Policy.Epsilon.mean": {
|
|
"value": 0.162339055,
|
|
"min": 0.162339055,
|
|
"max": 0.17493628899999997,
|
|
"count": 205
|
|
},
|
|
"SoccerTwos.Policy.Epsilon.sum": {
|
|
"value": 0.162339055,
|
|
"min": 0.162339055,
|
|
"max": 0.17493628899999997,
|
|
"count": 205
|
|
},
|
|
"SoccerTwos.Policy.Beta.mean": {
|
|
"value": 0.0008328755259999999,
|
|
"min": 0.0008328755259999999,
|
|
"max": 0.0009991590148,
|
|
"count": 205
|
|
},
|
|
"SoccerTwos.Policy.Beta.sum": {
|
|
"value": 0.0008328755259999999,
|
|
"min": 0.0008328755259999999,
|
|
"max": 0.0009991590148,
|
|
"count": 205
|
|
}
|
|
},
|
|
"metadata": {
|
|
"timer_format_version": "0.1.0",
|
|
"start_time_seconds": "1734530482",
|
|
"python_version": "3.10.12 | packaged by Anaconda, Inc. | (main, Jul 5 2023, 19:01:18) [MSC v.1916 64 bit (AMD64)]",
|
|
"command_line_arguments": "\\\\?\\C:\\Users\\Edu\\miniconda3\\envs\\rl\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics",
|
|
"mlagents_version": "1.2.0.dev0",
|
|
"mlagents_envs_version": "1.2.0.dev0",
|
|
"communication_protocol_version": "1.5.0",
|
|
"pytorch_version": "2.5.1+cpu",
|
|
"numpy_version": "1.23.5",
|
|
"end_time_seconds": "1734592781"
|
|
},
|
|
"total": 62297.521005999995,
|
|
"count": 1,
|
|
"self": 0.010206600010860711,
|
|
"children": {
|
|
"run_training.setup": {
|
|
"total": 0.09557769999082666,
|
|
"count": 1,
|
|
"self": 0.09557769999082666
|
|
},
|
|
"TrainerController.start_learning": {
|
|
"total": 62297.415221699994,
|
|
"count": 1,
|
|
"self": 14.6314888002089,
|
|
"children": {
|
|
"TrainerController._reset_env": {
|
|
"total": 15.382453300029738,
|
|
"count": 85,
|
|
"self": 15.382453300029738
|
|
},
|
|
"TrainerController.advance": {
|
|
"total": 62267.04685259974,
|
|
"count": 585681,
|
|
"self": 14.093730005988618,
|
|
"children": {
|
|
"env_step": {
|
|
"total": 10437.005436695807,
|
|
"count": 585681,
|
|
"self": 7298.554581102231,
|
|
"children": {
|
|
"SubprocessEnvManager._take_step": {
|
|
"total": 3129.628976492575,
|
|
"count": 585681,
|
|
"self": 85.2579285860993,
|
|
"children": {
|
|
"TorchPolicy.evaluate": {
|
|
"total": 3044.3710479064757,
|
|
"count": 1075560,
|
|
"self": 3044.3710479064757
|
|
}
|
|
}
|
|
},
|
|
"workers": {
|
|
"total": 8.821879101000377,
|
|
"count": 585681,
|
|
"self": 0.0,
|
|
"children": {
|
|
"worker_root": {
|
|
"total": 62246.82085750632,
|
|
"count": 585681,
|
|
"is_parallel": true,
|
|
"self": 56644.32421551256,
|
|
"children": {
|
|
"steps_from_proto": {
|
|
"total": 0.145146500057308,
|
|
"count": 170,
|
|
"is_parallel": true,
|
|
"self": 0.02975290002359543,
|
|
"children": {
|
|
"_process_rank_one_or_two_observation": {
|
|
"total": 0.11539360003371257,
|
|
"count": 680,
|
|
"is_parallel": true,
|
|
"self": 0.11539360003371257
|
|
}
|
|
}
|
|
},
|
|
"UnityEnvironment.step": {
|
|
"total": 5602.351495493698,
|
|
"count": 585681,
|
|
"is_parallel": true,
|
|
"self": 316.47514569666237,
|
|
"children": {
|
|
"UnityEnvironment._generate_step_input": {
|
|
"total": 278.7953514022229,
|
|
"count": 585681,
|
|
"is_parallel": true,
|
|
"self": 278.7953514022229
|
|
},
|
|
"communicator.exchange": {
|
|
"total": 3961.8991054948565,
|
|
"count": 585681,
|
|
"is_parallel": true,
|
|
"self": 3961.8991054948565
|
|
},
|
|
"steps_from_proto": {
|
|
"total": 1045.1818928999564,
|
|
"count": 1171362,
|
|
"is_parallel": true,
|
|
"self": 209.20651879774232,
|
|
"children": {
|
|
"_process_rank_one_or_two_observation": {
|
|
"total": 835.9753741022141,
|
|
"count": 4685448,
|
|
"is_parallel": true,
|
|
"self": 835.9753741022141
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"trainer_advance": {
|
|
"total": 51815.94768589795,
|
|
"count": 585681,
|
|
"self": 99.25371239797096,
|
|
"children": {
|
|
"process_trajectory": {
|
|
"total": 4604.251587100065,
|
|
"count": 585681,
|
|
"self": 4599.446594900117,
|
|
"children": {
|
|
"RLTrainer._checkpoint": {
|
|
"total": 4.804992199948174,
|
|
"count": 16,
|
|
"self": 4.804992199948174
|
|
}
|
|
}
|
|
},
|
|
"_update_policy": {
|
|
"total": 47112.44238639991,
|
|
"count": 206,
|
|
"self": 1881.7498688001651,
|
|
"children": {
|
|
"TorchPOCAOptimizer.update": {
|
|
"total": 45230.692517599746,
|
|
"count": 10253,
|
|
"self": 45230.692517599746
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"trainer_threads": {
|
|
"total": 1.300009898841381e-06,
|
|
"count": 1,
|
|
"self": 1.300009898841381e-06
|
|
},
|
|
"TrainerController._save_models": {
|
|
"total": 0.3544257000030484,
|
|
"count": 1,
|
|
"self": 0.006995100004132837,
|
|
"children": {
|
|
"RLTrainer._checkpoint": {
|
|
"total": 0.34743059999891557,
|
|
"count": 1,
|
|
"self": 0.34743059999891557
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
} |