ppo-Pyramids-1 / run_logs /timers.json
greg-szopinski's picture
First Push
0997fac
raw
history blame
18.7 kB
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.4934672713279724,
"min": 0.4934672713279724,
"max": 1.4450116157531738,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 14732.958984375,
"min": 14732.958984375,
"max": 43835.87109375,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989906.0,
"min": 29874.0,
"max": 989906.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989906.0,
"min": 29874.0,
"max": 989906.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.27884921431541443,
"min": -0.17593970894813538,
"max": 0.28898894786834717,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 71.94309997558594,
"min": -41.69771194458008,
"max": 75.42611694335938,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.056208305060863495,
"min": -0.030473720282316208,
"max": 0.2238595336675644,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 14.501742362976074,
"min": -7.9231672286987305,
"max": 53.054710388183594,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.07014219388042368,
"min": 0.0658704014723688,
"max": 0.07354745060162741,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 1.0521329082063553,
"min": 0.5776908353363143,
"max": 1.0521329082063553,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.014194753618438779,
"min": 0.0001860607926464386,
"max": 0.014194753618438779,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.21292130427658168,
"min": 0.0026048510970501405,
"max": 0.21292130427658168,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.4775575075133285e-06,
"min": 7.4775575075133285e-06,
"max": 0.000294848776717075,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.00011216336261269993,
"min": 0.00011216336261269993,
"max": 0.003507914630695199,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10249248666666669,
"min": 0.10249248666666669,
"max": 0.198282925,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.5373873000000002,
"min": 1.4780293000000002,
"max": 2.5693048000000003,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.0002589994179999999,
"min": 0.0002589994179999999,
"max": 0.0098284642075,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.003884991269999998,
"min": 0.003884991269999998,
"max": 0.11695354952,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.010413600131869316,
"min": 0.010413600131869316,
"max": 0.2825762927532196,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.1562040001153946,
"min": 0.1539803445339203,
"max": 2.260610342025757,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 538.4561403508771,
"min": 538.4561403508771,
"max": 999.0,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 30692.0,
"min": 16417.0,
"max": 33253.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.0754561109239595,
"min": -0.999987552408129,
"max": 1.1025499586875622,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 61.30099832266569,
"min": -31.999601677060127,
"max": 61.30099832266569,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.0754561109239595,
"min": -0.999987552408129,
"max": 1.1025499586875622,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 61.30099832266569,
"min": -31.999601677060127,
"max": 61.30099832266569,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.058395058635556905,
"min": 0.058395058635556905,
"max": 5.646892654106898,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 3.3285183422267437,
"min": 3.279166377404181,
"max": 95.99717511981726,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1690883048",
"python_version": "3.10.6 (main, May 29 2023, 11:10:38) [GCC 11.3.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1690885344"
},
"total": 2296.321596244,
"count": 1,
"self": 0.5306272090001585,
"children": {
"run_training.setup": {
"total": 0.04446796100000938,
"count": 1,
"self": 0.04446796100000938
},
"TrainerController.start_learning": {
"total": 2295.7465010739998,
"count": 1,
"self": 1.46235737793495,
"children": {
"TrainerController._reset_env": {
"total": 4.248992591999922,
"count": 1,
"self": 4.248992591999922
},
"TrainerController.advance": {
"total": 2289.932577652064,
"count": 63405,
"self": 1.4369880831704904,
"children": {
"env_step": {
"total": 1589.1509158689992,
"count": 63405,
"self": 1474.3315427470602,
"children": {
"SubprocessEnvManager._take_step": {
"total": 113.94385847899184,
"count": 63405,
"self": 4.8541462100729404,
"children": {
"TorchPolicy.evaluate": {
"total": 109.0897122689189,
"count": 62577,
"self": 109.0897122689189
}
}
},
"workers": {
"total": 0.8755146429471097,
"count": 63405,
"self": 0.0,
"children": {
"worker_root": {
"total": 2290.266117599915,
"count": 63405,
"is_parallel": true,
"self": 936.3116937949021,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.00179847300023539,
"count": 1,
"is_parallel": true,
"self": 0.0005892199997106218,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0012092530005247681,
"count": 8,
"is_parallel": true,
"self": 0.0012092530005247681
}
}
},
"UnityEnvironment.step": {
"total": 0.05288322300020809,
"count": 1,
"is_parallel": true,
"self": 0.0005624289997285814,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0005639020000671735,
"count": 1,
"is_parallel": true,
"self": 0.0005639020000671735
},
"communicator.exchange": {
"total": 0.04986806000033539,
"count": 1,
"is_parallel": true,
"self": 0.04986806000033539
},
"steps_from_proto": {
"total": 0.0018888320000769454,
"count": 1,
"is_parallel": true,
"self": 0.000369254999441182,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0015195770006357634,
"count": 8,
"is_parallel": true,
"self": 0.0015195770006357634
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1353.954423805013,
"count": 63404,
"is_parallel": true,
"self": 36.29273797097221,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 24.630590313025095,
"count": 63404,
"is_parallel": true,
"self": 24.630590313025095
},
"communicator.exchange": {
"total": 1186.0272770850838,
"count": 63404,
"is_parallel": true,
"self": 1186.0272770850838
},
"steps_from_proto": {
"total": 107.00381843593186,
"count": 63404,
"is_parallel": true,
"self": 21.555862068659735,
"children": {
"_process_rank_one_or_two_observation": {
"total": 85.44795636727213,
"count": 507232,
"is_parallel": true,
"self": 85.44795636727213
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 699.3446736998944,
"count": 63405,
"self": 2.6815816988696497,
"children": {
"process_trajectory": {
"total": 112.92814549203467,
"count": 63405,
"self": 112.71062610503486,
"children": {
"RLTrainer._checkpoint": {
"total": 0.2175193869998111,
"count": 2,
"self": 0.2175193869998111
}
}
},
"_update_policy": {
"total": 583.7349465089901,
"count": 449,
"self": 382.42100187805863,
"children": {
"TorchPPOOptimizer.update": {
"total": 201.31394463093147,
"count": 22764,
"self": 201.31394463093147
}
}
}
}
}
}
},
"trainer_threads": {
"total": 9.380000847158954e-07,
"count": 1,
"self": 9.380000847158954e-07
},
"TrainerController._save_models": {
"total": 0.10257251400071254,
"count": 1,
"self": 0.001436692000424955,
"children": {
"RLTrainer._checkpoint": {
"total": 0.10113582200028759,
"count": 1,
"self": 0.10113582200028759
}
}
}
}
}
}
}