| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.7579878568649292, | |
| "min": 0.6082875728607178, | |
| "max": 1.448693037033081, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 22800.275390625, | |
| "min": 17791.1953125, | |
| "max": 43947.55078125, | |
| "count": 16 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 479894.0, | |
| "min": 29952.0, | |
| "max": 479894.0, | |
| "count": 16 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 479894.0, | |
| "min": 29952.0, | |
| "max": 479894.0, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": -0.07348731905221939, | |
| "min": -0.1460859626531601, | |
| "max": -0.02258189395070076, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": -17.6369571685791, | |
| "min": -34.622371673583984, | |
| "max": -5.442236423492432, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.02711433544754982, | |
| "min": 0.02525223232805729, | |
| "max": 0.3571232855319977, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 6.507440567016602, | |
| "min": 6.085787773132324, | |
| "max": 84.63822174072266, | |
| "count": 16 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.07035029758043791, | |
| "min": 0.0661739269676664, | |
| "max": 0.07172009596808034, | |
| "count": 16 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9849041661261309, | |
| "min": 0.48547021068676766, | |
| "max": 0.9946436752322311, | |
| "count": 16 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.000834662312260333, | |
| "min": 0.00031523870841881376, | |
| "max": 0.0065712490545257, | |
| "count": 16 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.011685272371644661, | |
| "min": 0.003782864501025765, | |
| "max": 0.053147435931653796, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 2.0766264506514284e-05, | |
| "min": 2.0766264506514284e-05, | |
| "max": 0.00029030126037577137, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.00029072770309119996, | |
| "min": 0.00029072770309119996, | |
| "max": 0.0026353767215412, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.10692205714285717, | |
| "min": 0.10692205714285717, | |
| "max": 0.19676708571428575, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 1.4969088000000004, | |
| "min": 1.3773696000000002, | |
| "max": 2.0784588000000004, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.0007015135085714285, | |
| "min": 0.0007015135085714285, | |
| "max": 0.00967703186285714, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.009821189119999999, | |
| "min": 0.009821189119999999, | |
| "max": 0.08787803412000002, | |
| "count": 16 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.02401557005941868, | |
| "min": 0.02401557005941868, | |
| "max": 0.4124005138874054, | |
| "count": 16 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.3362179696559906, | |
| "min": 0.3362179696559906, | |
| "max": 2.88680362701416, | |
| "count": 16 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 983.4375, | |
| "min": 833.5, | |
| "max": 999.0, | |
| "count": 16 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 31470.0, | |
| "min": 15984.0, | |
| "max": 33307.0, | |
| "count": 16 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": -0.8590250513516366, | |
| "min": -1.0000000521540642, | |
| "max": -0.2507500406354666, | |
| "count": 16 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": -27.488801643252373, | |
| "min": -31.99920167028904, | |
| "max": -6.018000975251198, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": -0.8590250513516366, | |
| "min": -1.0000000521540642, | |
| "max": -0.2507500406354666, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": -27.488801643252373, | |
| "min": -31.99920167028904, | |
| "max": -6.018000975251198, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.24201162983081304, | |
| "min": 0.24201162983081304, | |
| "max": 7.885494565591216, | |
| "count": 16 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 7.744372154586017, | |
| "min": 7.744372154586017, | |
| "max": 126.16791304945946, | |
| "count": 16 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 16 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 16 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1681293732", | |
| "python_version": "3.9.16 (main, Dec 7 2022, 01:11:51) \n[GCC 9.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "0.31.0.dev0", | |
| "mlagents_envs_version": "0.31.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "1.11.0+cu102", | |
| "numpy_version": "1.21.2", | |
| "end_time_seconds": "1681294706" | |
| }, | |
| "total": 974.007467129, | |
| "count": 1, | |
| "self": 0.5477050630001941, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.11668722399997478, | |
| "count": 1, | |
| "self": 0.11668722399997478 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 973.3430748419999, | |
| "count": 1, | |
| "self": 0.6759002000075043, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 4.063474004999989, | |
| "count": 1, | |
| "self": 4.063474004999989 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 968.5083623919924, | |
| "count": 31511, | |
| "self": 0.6883046399979094, | |
| "children": { | |
| "env_step": { | |
| "total": 663.3104763319949, | |
| "count": 31511, | |
| "self": 610.5543238240207, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 52.34823230698407, | |
| "count": 31511, | |
| "self": 2.3505269959886164, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 49.99770531099546, | |
| "count": 31304, | |
| "self": 49.99770531099546 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.40792020099007686, | |
| "count": 31511, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 971.0200774940174, | |
| "count": 31511, | |
| "is_parallel": true, | |
| "self": 414.67753474100573, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.004816813999980241, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0035615759999814145, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012552379999988261, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012552379999988261 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.07777846400000499, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0025735670000130995, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0004756429999588363, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004756429999588363 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.0730688180000243, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0730688180000243 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0016604360000087581, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0003779680000661756, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0012824679999425825, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0012824679999425825 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 556.3425427530117, | |
| "count": 31510, | |
| "is_parallel": true, | |
| "self": 16.367329631991083, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 11.473071650002282, | |
| "count": 31510, | |
| "is_parallel": true, | |
| "self": 11.473071650002282 | |
| }, | |
| "communicator.exchange": { | |
| "total": 481.73043130901266, | |
| "count": 31510, | |
| "is_parallel": true, | |
| "self": 481.73043130901266 | |
| }, | |
| "steps_from_proto": { | |
| "total": 46.77171016200566, | |
| "count": 31510, | |
| "is_parallel": true, | |
| "self": 9.849368285999674, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 36.92234187600599, | |
| "count": 252080, | |
| "is_parallel": true, | |
| "self": 36.92234187600599 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 304.5095814199995, | |
| "count": 31511, | |
| "self": 1.0428892009993547, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 51.15358043199831, | |
| "count": 31511, | |
| "self": 51.039550797998345, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.11402963399996224, | |
| "count": 1, | |
| "self": 0.11402963399996224 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 252.31311178700184, | |
| "count": 200, | |
| "self": 161.73627050800786, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 90.57684127899398, | |
| "count": 11445, | |
| "self": 90.57684127899398 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 9.259999842470279e-07, | |
| "count": 1, | |
| "self": 9.259999842470279e-07 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.0953373190000093, | |
| "count": 1, | |
| "self": 0.001378044999910344, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.09395927400009896, | |
| "count": 1, | |
| "self": 0.09395927400009896 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |