| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 1.0121504068374634, | |
| "min": 0.9460815787315369, | |
| "max": 1.503366231918335, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 20032.48046875, | |
| "min": 19012.455078125, | |
| "max": 30211.6484375, | |
| "count": 25 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 499940.0, | |
| "min": 19968.0, | |
| "max": 499940.0, | |
| "count": 25 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 499940.0, | |
| "min": 19968.0, | |
| "max": 499940.0, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": -0.026038452982902527, | |
| "min": -0.11006768047809601, | |
| "max": 0.02244146727025509, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": -4.218229293823242, | |
| "min": -17.500761032104492, | |
| "max": 3.6355175971984863, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.01763242855668068, | |
| "min": 0.01425930019468069, | |
| "max": 0.3973273038864136, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 2.8564534187316895, | |
| "min": 2.2957472801208496, | |
| "max": 63.17504119873047, | |
| "count": 25 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.06658720749889172, | |
| "min": 0.06285811453503008, | |
| "max": 0.07633348781014686, | |
| "count": 25 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.6658720749889171, | |
| "min": 0.2727794712516426, | |
| "max": 0.7160643609806877, | |
| "count": 25 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.003296598828339091, | |
| "min": 0.00021042404057236845, | |
| "max": 0.015986815926257333, | |
| "count": 25 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.03296598828339091, | |
| "min": 0.0017292712748508332, | |
| "max": 0.06394726370502933, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 5.765018078360002e-06, | |
| "min": 5.765018078360002e-06, | |
| "max": 0.00029391360202879994, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 5.765018078360002e-05, | |
| "min": 5.765018078360002e-05, | |
| "max": 0.0020648809117064, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10192164000000001, | |
| "min": 0.10192164000000001, | |
| "max": 0.1979712, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.0192164000000001, | |
| "min": 0.7918848, | |
| "max": 1.5669624, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.00020197183600000014, | |
| "min": 0.00020197183600000014, | |
| "max": 0.009797322879999997, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.0020197183600000014, | |
| "min": 0.0020197183600000014, | |
| "max": 0.06884053064, | |
| "count": 25 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.016766127198934555, | |
| "min": 0.016766127198934555, | |
| "max": 0.5906252861022949, | |
| "count": 25 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.16766127943992615, | |
| "min": 0.156918466091156, | |
| "max": 2.3625011444091797, | |
| "count": 25 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 902.0, | |
| "min": 835.1304347826087, | |
| "max": 999.0, | |
| "count": 25 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 19844.0, | |
| "min": 15631.0, | |
| "max": 30619.0, | |
| "count": 25 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": -0.44795459136366844, | |
| "min": -1.0000000521540642, | |
| "max": -0.1398783096152803, | |
| "count": 25 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": -9.855001010000706, | |
| "min": -28.64680152386427, | |
| "max": -3.2172011211514473, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": -0.44795459136366844, | |
| "min": -1.0000000521540642, | |
| "max": -0.1398783096152803, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": -9.855001010000706, | |
| "min": -28.64680152386427, | |
| "max": -3.2172011211514473, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.15901358330368318, | |
| "min": 0.14874269537951634, | |
| "max": 9.738041854463518, | |
| "count": 25 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 3.49829883268103, | |
| "min": 3.421081993728876, | |
| "max": 155.80866967141628, | |
| "count": 25 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 25 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 25 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1749532101", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids_Training --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.7.1+cu126", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1749533204" | |
| }, | |
| "total": 1103.651244273, | |
| "count": 1, | |
| "self": 0.4777003239996702, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.021289202999923873, | |
| "count": 1, | |
| "self": 0.021289202999923873 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 1103.1522547460004, | |
| "count": 1, | |
| "self": 0.6987394619704901, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.8920449060001374, | |
| "count": 1, | |
| "self": 2.8920449060001374 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 1099.4652133230297, | |
| "count": 31560, | |
| "self": 0.7282170380190109, | |
| "children": { | |
| "env_step": { | |
| "total": 753.6990319060619, | |
| "count": 31560, | |
| "self": 673.6376814861242, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 79.64410036299614, | |
| "count": 31560, | |
| "self": 2.4693943649881476, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 77.174705998008, | |
| "count": 31306, | |
| "self": 77.174705998008 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.41725005694161155, | |
| "count": 31560, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 1100.3690120639862, | |
| "count": 31560, | |
| "is_parallel": true, | |
| "self": 486.0401613490021, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0020381109998197644, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0007387539990304504, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.001299357000789314, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.001299357000789314 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.1065906100002394, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005650740004057297, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0004772229999616684, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004772229999616684 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.10394590599980802, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.10394590599980802 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0016024070000639767, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00036290200068833656, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012395049993756402, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012395049993756402 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 614.3288507149841, | |
| "count": 31559, | |
| "is_parallel": true, | |
| "self": 16.558972978113616, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 12.415291498007264, | |
| "count": 31559, | |
| "is_parallel": true, | |
| "self": 12.415291498007264 | |
| }, | |
| "communicator.exchange": { | |
| "total": 533.5693294359462, | |
| "count": 31559, | |
| "is_parallel": true, | |
| "self": 533.5693294359462 | |
| }, | |
| "steps_from_proto": { | |
| "total": 51.78525680291705, | |
| "count": 31559, | |
| "is_parallel": true, | |
| "self": 10.327377288923799, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 41.45787951399325, | |
| "count": 252472, | |
| "is_parallel": true, | |
| "self": 41.45787951399325 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 345.0379643789488, | |
| "count": 31560, | |
| "self": 1.1553330019182795, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 66.97376207703155, | |
| "count": 31560, | |
| "self": 66.8499179780315, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.12384409900005267, | |
| "count": 1, | |
| "self": 0.12384409900005267 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 276.90886929999897, | |
| "count": 217, | |
| "self": 155.22698258899072, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 121.68188671100825, | |
| "count": 11439, | |
| "self": 121.68188671100825 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.0869998732232489e-06, | |
| "count": 1, | |
| "self": 1.0869998732232489e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.09625596800015046, | |
| "count": 1, | |
| "self": 0.0011127219995614723, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.09514324600058899, | |
| "count": 1, | |
| "self": 0.09514324600058899 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |