{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.2989126741886139, "min": 0.2989126741886139, "max": 1.4436542987823486, "count": 33 }, "Pyramids.Policy.Entropy.sum": { "value": 9072.59765625, "min": 9072.59765625, "max": 43794.6953125, "count": 33 }, "Pyramids.Step.mean": { "value": 989984.0, "min": 29908.0, "max": 989984.0, "count": 33 }, "Pyramids.Step.sum": { "value": 989984.0, "min": 29908.0, "max": 989984.0, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.5364909172058105, "min": -0.09286700934171677, "max": 0.5414549708366394, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 149.14447021484375, "min": -22.292495727539062, "max": 149.14447021484375, "count": 33 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.02987596206367016, "min": 0.010084972716867924, "max": 0.35073304176330566, "count": 33 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 8.305517196655273, "min": 2.682602643966675, "max": 83.12373352050781, "count": 33 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.06786293758722466, "min": 0.06556648364700167, "max": 0.07418343837036649, "count": 33 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.9500811262211452, "min": 0.48269940523300914, "max": 1.1127515755554973, "count": 33 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.013875093594140795, "min": 0.00021738470543989483, "max": 0.014047219173724963, "count": 33 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.19425131031797113, "min": 0.0028260011707186327, "max": 0.19666106843214948, "count": 33 }, "Pyramids.Policy.LearningRate.mean": { "value": 7.618318889164287e-06, "min": 7.618318889164287e-06, "max": 0.0002952348015884, "count": 33 }, "Pyramids.Policy.LearningRate.sum": { "value": 0.00010665646444830001, "min": 0.00010665646444830001, "max": 0.0036334417888527993, "count": 33 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10253940714285714, "min": 0.10253940714285714, "max": 0.1984116, "count": 33 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.4355517, "min": 1.3888812, "max": 2.6111471999999996, "count": 33 }, "Pyramids.Policy.Beta.mean": { "value": 0.00026368677357142866, "min": 0.00026368677357142866, "max": 0.00984131884, "count": 33 }, "Pyramids.Policy.Beta.sum": { "value": 0.003691614830000001, "min": 0.003691614830000001, "max": 0.12113360528000001, "count": 33 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.037940140813589096, "min": 0.03662216663360596, "max": 0.46993550658226013, "count": 33 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.5311619639396667, "min": 0.5164991617202759, "max": 3.289548635482788, "count": 33 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 339.83516483516485, "min": 339.83516483516485, "max": 999.0, "count": 33 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 30925.0, "min": 16707.0, "max": 32235.0, "count": 33 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.5252222056190172, "min": -0.9998500528745353, "max": 1.6110124825499952, "count": 33 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 137.26999850571156, "min": -31.99520169198513, "max": 137.26999850571156, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.5252222056190172, "min": -0.9998500528745353, "max": 1.6110124825499952, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 137.26999850571156, "min": -31.99520169198513, "max": 137.26999850571156, "count": 33 }, "Pyramids.Policy.RndReward.mean": { "value": 0.13117907410293508, "min": 0.13117907410293508, "max": 8.846885418190675, "count": 33 }, "Pyramids.Policy.RndReward.sum": { "value": 11.806116669264156, "min": 10.511265887238551, "max": 150.39705210924149, "count": 33 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1692931909", "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu102", "numpy_version": "1.21.2", "end_time_seconds": "1692934229" }, "total": 2319.4423249520005, "count": 1, "self": 0.8995214400001714, "children": { "run_training.setup": { "total": 0.06624013300006482, "count": 1, "self": 0.06624013300006482 }, "TrainerController.start_learning": { "total": 2318.4765633790003, "count": 1, "self": 1.318920739027817, "children": { "TrainerController._reset_env": { "total": 4.628697011000213, "count": 1, "self": 4.628697011000213 }, "TrainerController.advance": { "total": 2312.3785713739717, "count": 63858, "self": 1.3165784119637465, "children": { "env_step": { "total": 1641.5370895119706, "count": 63858, "self": 1533.2071723269419, "children": { "SubprocessEnvManager._take_step": { "total": 107.5227801869737, "count": 63858, "self": 4.622046196979227, "children": { "TorchPolicy.evaluate": { "total": 102.90073398999448, "count": 62581, "self": 102.90073398999448 } } }, "workers": { "total": 0.8071369980550571, "count": 63858, "self": 0.0, "children": { "worker_root": { "total": 2313.4918685579737, "count": 63858, "is_parallel": true, "self": 893.2963652889159, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0026867279998441518, "count": 1, "is_parallel": true, "self": 0.0007060650000312307, "children": { "_process_rank_one_or_two_observation": { "total": 0.001980662999812921, "count": 8, "is_parallel": true, "self": 0.001980662999812921 } } }, "UnityEnvironment.step": { "total": 0.04964788500001305, "count": 1, "is_parallel": true, "self": 0.0005966800001715455, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0004931650000798982, "count": 1, "is_parallel": true, "self": 0.0004931650000798982 }, "communicator.exchange": { "total": 0.04659035299982861, "count": 1, "is_parallel": true, "self": 0.04659035299982861 }, "steps_from_proto": { "total": 0.001967686999932994, "count": 1, "is_parallel": true, "self": 0.00037835300031474617, "children": { "_process_rank_one_or_two_observation": { "total": 0.0015893339996182476, "count": 8, "is_parallel": true, "self": 0.0015893339996182476 } } } } } } }, "UnityEnvironment.step": { "total": 1420.1955032690578, "count": 63857, "is_parallel": true, "self": 33.96063004308894, "children": { "UnityEnvironment._generate_step_input": { "total": 23.049314843939783, "count": 63857, "is_parallel": true, "self": 23.049314843939783 }, "communicator.exchange": { "total": 1257.6007783799848, "count": 63857, "is_parallel": true, "self": 1257.6007783799848 }, "steps_from_proto": { "total": 105.58478000204423, "count": 63857, "is_parallel": true, "self": 20.71381203996293, "children": { "_process_rank_one_or_two_observation": { "total": 84.8709679620813, "count": 510856, "is_parallel": true, "self": 84.8709679620813 } } } } } } } } } } }, "trainer_advance": { "total": 669.5249034500375, "count": 63858, "self": 2.5453854340298676, "children": { "process_trajectory": { "total": 111.69608916600646, "count": 63858, "self": 111.3661821020064, "children": { "RLTrainer._checkpoint": { "total": 0.32990706400005365, "count": 2, "self": 0.32990706400005365 } } }, "_update_policy": { "total": 555.2834288500012, "count": 456, "self": 360.9778594669906, "children": { "TorchPPOOptimizer.update": { "total": 194.3055693830106, "count": 22788, "self": 194.3055693830106 } } } } } } }, "trainer_threads": { "total": 1.3389999367063865e-06, "count": 1, "self": 1.3389999367063865e-06 }, "TrainerController._save_models": { "total": 0.1503729160003786, "count": 1, "self": 0.0018418620002194075, "children": { "RLTrainer._checkpoint": { "total": 0.1485310540001592, "count": 1, "self": 0.1485310540001592 } } } } } } }