|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 2.2541470527648926, |
|
"min": 2.2264187335968018, |
|
"max": 3.2958130836486816, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 44505.87890625, |
|
"min": 2003.854248046875, |
|
"max": 225908.15625, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 51.822916666666664, |
|
"min": 42.243478260869566, |
|
"max": 999.0, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19900.0, |
|
"min": 11988.0, |
|
"max": 32504.0, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1525.3226441654676, |
|
"min": 1199.384981924398, |
|
"max": 1541.9464998647475, |
|
"count": 586 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 292861.9476797698, |
|
"min": 2398.769963848796, |
|
"max": 349523.70447069826, |
|
"count": 586 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 5999964.0, |
|
"min": 9476.0, |
|
"max": 5999964.0, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 5999964.0, |
|
"min": 9476.0, |
|
"max": 5999964.0, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": 0.006578030996024609, |
|
"min": -0.07075738161802292, |
|
"max": 0.14711181819438934, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": 1.256403923034668, |
|
"min": -15.849653244018555, |
|
"max": 21.771282196044922, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.00042870157631114125, |
|
"min": -0.08137570321559906, |
|
"max": 0.15133030712604523, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -0.08188199996948242, |
|
"min": -18.22815704345703, |
|
"max": 22.004295349121094, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": -0.08447329723398099, |
|
"min": -0.5101333335042, |
|
"max": 0.5614355537626479, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": -16.13439977169037, |
|
"min": -39.12819993495941, |
|
"max": 55.46360003948212, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": -0.08447329723398099, |
|
"min": -0.5101333335042, |
|
"max": 0.5614355537626479, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": -16.13439977169037, |
|
"min": -39.12819993495941, |
|
"max": 55.46360003948212, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 600 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.0166406735116147, |
|
"min": 0.014553197751067476, |
|
"max": 0.02096656994221525, |
|
"count": 96 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.0166406735116147, |
|
"min": 0.014553197751067476, |
|
"max": 0.02096656994221525, |
|
"count": 96 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.09528738483786584, |
|
"min": 0.0014326320227054466, |
|
"max": 0.10267178962628047, |
|
"count": 96 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.09528738483786584, |
|
"min": 0.0014326320227054466, |
|
"max": 0.10267178962628047, |
|
"count": 96 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.10004813447594643, |
|
"min": 0.001436497309542675, |
|
"max": 0.10778420658575164, |
|
"count": 96 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.10004813447594643, |
|
"min": 0.001436497309542675, |
|
"max": 0.10778420658575164, |
|
"count": 96 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 96 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 96 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.19999999999999996, |
|
"min": 0.19999999999999996, |
|
"max": 0.19999999999999996, |
|
"count": 96 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.19999999999999996, |
|
"min": 0.19999999999999996, |
|
"max": 0.19999999999999996, |
|
"count": 96 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.004999999999999999, |
|
"min": 0.004999999999999999, |
|
"max": 0.004999999999999999, |
|
"count": 96 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.004999999999999999, |
|
"min": 0.004999999999999999, |
|
"max": 0.004999999999999999, |
|
"count": 96 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1677412416", |
|
"python_version": "3.9.16 (main, Jan 11 2023, 16:05:54) \n[GCC 11.2.0]", |
|
"command_line_arguments": "/home/fbeghell/anaconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --num-envs=3 --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos_v2 --no-graphics", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1677416509" |
|
}, |
|
"total": 4093.656747773988, |
|
"count": 1, |
|
"self": 0.2196339899674058, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.021348519949242473, |
|
"count": 1, |
|
"self": 0.021348519949242473 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 4093.4157652640715, |
|
"count": 1, |
|
"self": 7.478107919450849, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 4.246652701403946, |
|
"count": 18, |
|
"self": 4.246652701403946 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 4081.3988734942395, |
|
"count": 376605, |
|
"self": 7.324552450329065, |
|
"children": { |
|
"env_step": { |
|
"total": 2150.052749511553, |
|
"count": 376605, |
|
"self": 731.7759145805612, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 1414.3715546100866, |
|
"count": 407059, |
|
"self": 43.13556841947138, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 1371.2359861906152, |
|
"count": 769044, |
|
"self": 1371.2359861906152 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 3.905280320905149, |
|
"count": 376605, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 12267.75443618535, |
|
"count": 407036, |
|
"is_parallel": true, |
|
"self": 9066.076087541878, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.005463488167151809, |
|
"count": 6, |
|
"is_parallel": true, |
|
"self": 0.0015623001381754875, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0039011880289763212, |
|
"count": 24, |
|
"is_parallel": true, |
|
"self": 0.0039011880289763212 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.053212333004921675, |
|
"count": 3, |
|
"is_parallel": true, |
|
"self": 0.001589423744007945, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0010393550619482994, |
|
"count": 3, |
|
"is_parallel": true, |
|
"self": 0.0010393550619482994 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.045753989135846496, |
|
"count": 3, |
|
"is_parallel": true, |
|
"self": 0.045753989135846496 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.004829565063118935, |
|
"count": 6, |
|
"is_parallel": true, |
|
"self": 0.0010161756072193384, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.003813389455899596, |
|
"count": 24, |
|
"is_parallel": true, |
|
"self": 0.003813389455899596 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 3201.6111709214747, |
|
"count": 407033, |
|
"is_parallel": true, |
|
"self": 188.8647192621138, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 123.01010983204469, |
|
"count": 407033, |
|
"is_parallel": true, |
|
"self": 123.01010983204469 |
|
}, |
|
"communicator.exchange": { |
|
"total": 2299.7066926585976, |
|
"count": 407033, |
|
"is_parallel": true, |
|
"self": 2299.7066926585976 |
|
}, |
|
"steps_from_proto": { |
|
"total": 590.0296491687186, |
|
"count": 814066, |
|
"is_parallel": true, |
|
"self": 118.64347190852277, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 471.38617726019584, |
|
"count": 3256264, |
|
"is_parallel": true, |
|
"self": 471.38617726019584 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.06717772199772298, |
|
"count": 102, |
|
"is_parallel": true, |
|
"self": 0.013331872411072254, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.05384584958665073, |
|
"count": 408, |
|
"is_parallel": true, |
|
"self": 0.05384584958665073 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 1924.0215715323575, |
|
"count": 376605, |
|
"self": 56.068650795845315, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 612.8880028438289, |
|
"count": 376605, |
|
"self": 609.3015440409072, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 3.5864588029216975, |
|
"count": 12, |
|
"self": 3.5864588029216975 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 1255.0649178926833, |
|
"count": 96, |
|
"self": 667.3783815919887, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 587.6865363006946, |
|
"count": 8640, |
|
"self": 587.6865363006946 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 5.818437784910202e-07, |
|
"count": 1, |
|
"self": 5.818437784910202e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.29213056713342667, |
|
"count": 1, |
|
"self": 0.0031741161365062, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.28895645099692047, |
|
"count": 1, |
|
"self": 0.28895645099692047 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |