|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.40288931131362915, |
|
"min": 0.4010867774486542, |
|
"max": 1.5102291107177734, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 12170.48046875, |
|
"min": 12077.525390625, |
|
"max": 45814.30859375, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989919.0, |
|
"min": 29914.0, |
|
"max": 989919.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989919.0, |
|
"min": 29914.0, |
|
"max": 989919.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.5135869979858398, |
|
"min": -0.09541986882686615, |
|
"max": 0.5539620518684387, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 140.72283935546875, |
|
"min": -22.900768280029297, |
|
"max": 152.33956909179688, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.02740642800927162, |
|
"min": -0.0381057932972908, |
|
"max": 0.17480121552944183, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 7.509361267089844, |
|
"min": -10.136140823364258, |
|
"max": 41.952293395996094, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.07054058476351202, |
|
"min": 0.0653048978440763, |
|
"max": 0.07520934263621235, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 1.0581087714526802, |
|
"min": 0.5086942826629879, |
|
"max": 1.091625958341562, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.01841895796759572, |
|
"min": 0.0001937613274648397, |
|
"max": 0.01841895796759572, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.27628436951393576, |
|
"min": 0.002263156109023451, |
|
"max": 0.27628436951393576, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.560657479813333e-06, |
|
"min": 7.560657479813333e-06, |
|
"max": 0.00029515063018788575, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00011340986219719999, |
|
"min": 0.00011340986219719999, |
|
"max": 0.0032594468135177996, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10252018666666667, |
|
"min": 0.10252018666666667, |
|
"max": 0.19838354285714285, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.5378028, |
|
"min": 1.3886848, |
|
"max": 2.5273411000000006, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.000261766648, |
|
"min": 0.000261766648, |
|
"max": 0.00983851593142857, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.00392649972, |
|
"min": 0.00392649972, |
|
"max": 0.10866957178, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.007845134474337101, |
|
"min": 0.007650338113307953, |
|
"max": 0.3309972584247589, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.11767701059579849, |
|
"min": 0.10710473358631134, |
|
"max": 2.3169808387756348, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 367.7654320987654, |
|
"min": 342.9887640449438, |
|
"max": 999.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 29789.0, |
|
"min": 16841.0, |
|
"max": 33538.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.5087407146706993, |
|
"min": -0.9999806972280625, |
|
"max": 1.5446112194422925, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 122.20799788832664, |
|
"min": -31.997201651334763, |
|
"max": 137.47039853036404, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.5087407146706993, |
|
"min": -0.9999806972280625, |
|
"max": 1.5446112194422925, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 122.20799788832664, |
|
"min": -31.997201651334763, |
|
"max": 137.47039853036404, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.029903462017961076, |
|
"min": 0.02750641659452852, |
|
"max": 6.427782424232539, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.422180423454847, |
|
"min": 2.4076854368977365, |
|
"max": 109.27230121195316, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1675182810", |
|
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "0.29.0.dev0", |
|
"mlagents_envs_version": "0.29.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.6", |
|
"end_time_seconds": "1675184808" |
|
}, |
|
"total": 1998.0449856110001, |
|
"count": 1, |
|
"self": 0.3833817839997664, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.09547951300010027, |
|
"count": 1, |
|
"self": 0.09547951300010027 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 1997.5661243140003, |
|
"count": 1, |
|
"self": 1.1407022610576405, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 5.827710047999972, |
|
"count": 1, |
|
"self": 5.827710047999972 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 1990.5181007799426, |
|
"count": 63743, |
|
"self": 1.184563573983496, |
|
"children": { |
|
"env_step": { |
|
"total": 1355.7159409269464, |
|
"count": 63743, |
|
"self": 1256.4522739329961, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 98.54657221294042, |
|
"count": 63743, |
|
"self": 3.9640127118661894, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 94.58255950107423, |
|
"count": 62560, |
|
"self": 31.60515122910192, |
|
"children": { |
|
"TorchPolicy.sample_actions": { |
|
"total": 62.97740827197231, |
|
"count": 62560, |
|
"self": 62.97740827197231 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.7170947810097914, |
|
"count": 63743, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 1994.8710345049644, |
|
"count": 63743, |
|
"is_parallel": true, |
|
"self": 828.0359216209806, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0016320730001098127, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005900010003188072, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0010420719997910055, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0010420719997910055 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.044336030999829745, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005731079997985944, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0004249969999818859, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004249969999818859 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.041850004000025365, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.041850004000025365 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0014879220000239002, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0003870070006541937, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0011009149993697065, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0011009149993697065 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1166.8351128839838, |
|
"count": 63742, |
|
"is_parallel": true, |
|
"self": 26.386677122058927, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 20.82206777092165, |
|
"count": 63742, |
|
"is_parallel": true, |
|
"self": 20.82206777092165 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1033.9213887280575, |
|
"count": 63742, |
|
"is_parallel": true, |
|
"self": 1033.9213887280575 |
|
}, |
|
"steps_from_proto": { |
|
"total": 85.7049792629457, |
|
"count": 63742, |
|
"is_parallel": true, |
|
"self": 19.814140387758698, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 65.890838875187, |
|
"count": 509936, |
|
"is_parallel": true, |
|
"self": 65.890838875187 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 633.6175962790128, |
|
"count": 63743, |
|
"self": 2.187064913012364, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 136.55067967999935, |
|
"count": 63743, |
|
"self": 136.36776741699964, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.1829122629997073, |
|
"count": 2, |
|
"self": 0.1829122629997073 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 494.8798516860011, |
|
"count": 448, |
|
"self": 185.0999364590309, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 309.77991522697016, |
|
"count": 22851, |
|
"self": 309.77991522697016 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 9.189998309011571e-07, |
|
"count": 1, |
|
"self": 9.189998309011571e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.07961030600017693, |
|
"count": 1, |
|
"self": 0.0012944330001118942, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.07831587300006504, |
|
"count": 1, |
|
"self": 0.07831587300006504 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |