ppo-Pyramids / run_logs /timers.json
Simple-Chop's picture
First Push
c37b883 verified
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.4849931299686432,
"min": 0.4849931299686432,
"max": 1.4617489576339722,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 14534.2744140625,
"min": 14534.2744140625,
"max": 44343.6171875,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989944.0,
"min": 29952.0,
"max": 989944.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989944.0,
"min": 29952.0,
"max": 989944.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.44973358511924744,
"min": -0.10290933400392532,
"max": 0.570103645324707,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 123.22700500488281,
"min": -24.801149368286133,
"max": 157.34860229492188,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": -0.05136988312005997,
"min": -0.05136988312005997,
"max": 0.3580794930458069,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": -14.075347900390625,
"min": -14.075347900390625,
"max": 84.86483764648438,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.0680983506345434,
"min": 0.06509623204004125,
"max": 0.0729792808483992,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9533769088836077,
"min": 0.5073702113385762,
"max": 1.0666662966250442,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.01531557868327668,
"min": 0.00031360778427866494,
"max": 0.016716500662109217,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.21441810156587351,
"min": 0.0028224700585079846,
"max": 0.24823321242001842,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.247347584250002e-06,
"min": 7.247347584250002e-06,
"max": 0.00029515063018788575,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.00010146286617950002,
"min": 0.00010146286617950002,
"max": 0.0031368077543975,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10241575000000003,
"min": 0.10241575000000003,
"max": 0.19838354285714285,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4338205000000004,
"min": 1.3886848,
"max": 2.4013283999999997,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.0002513334250000001,
"min": 0.0002513334250000001,
"max": 0.00983851593142857,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0035186679500000015,
"min": 0.0035186679500000015,
"max": 0.10458568974999999,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.0048655057325959206,
"min": 0.004860612563788891,
"max": 0.4736633598804474,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.06811708211898804,
"min": 0.06811708211898804,
"max": 3.315643548965454,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 368.71604938271605,
"min": 350.54545454545456,
"max": 999.0,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 29866.0,
"min": 15984.0,
"max": 35167.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.483088873234796,
"min": -1.0000000521540642,
"max": 1.6379761695861816,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 120.13019873201847,
"min": -30.999201610684395,
"max": 137.58999824523926,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.483088873234796,
"min": -1.0000000521540642,
"max": 1.6379761695861816,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 120.13019873201847,
"min": -30.999201610684395,
"max": 137.58999824523926,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.018742875021416694,
"min": 0.01831325851283812,
"max": 10.621151620522141,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 1.5181728767347522,
"min": 1.4725718807749217,
"max": 169.93842592835426,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1741648031",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.6.0+cu124",
"numpy_version": "1.23.5",
"end_time_seconds": "1741650320"
},
"total": 2288.4332473330005,
"count": 1,
"self": 0.47578670400116607,
"children": {
"run_training.setup": {
"total": 0.020574058999955014,
"count": 1,
"self": 0.020574058999955014
},
"TrainerController.start_learning": {
"total": 2287.9368865699994,
"count": 1,
"self": 1.4758147910238222,
"children": {
"TrainerController._reset_env": {
"total": 2.099275698999918,
"count": 1,
"self": 2.099275698999918
},
"TrainerController.advance": {
"total": 2284.273111573976,
"count": 63723,
"self": 1.6630028159202084,
"children": {
"env_step": {
"total": 1599.7098786010465,
"count": 63723,
"self": 1437.0821860721494,
"children": {
"SubprocessEnvManager._take_step": {
"total": 161.77856773892654,
"count": 63723,
"self": 4.987737537873272,
"children": {
"TorchPolicy.evaluate": {
"total": 156.79083020105327,
"count": 62550,
"self": 156.79083020105327
}
}
},
"workers": {
"total": 0.8491247899705741,
"count": 63723,
"self": 0.0,
"children": {
"worker_root": {
"total": 2282.369480734049,
"count": 63723,
"is_parallel": true,
"self": 963.1068658810123,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0021109549998072907,
"count": 1,
"is_parallel": true,
"self": 0.000699127999268967,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0014118270005383238,
"count": 8,
"is_parallel": true,
"self": 0.0014118270005383238
}
}
},
"UnityEnvironment.step": {
"total": 0.051930184999946505,
"count": 1,
"is_parallel": true,
"self": 0.0006210209999153449,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0004708159999609052,
"count": 1,
"is_parallel": true,
"self": 0.0004708159999609052
},
"communicator.exchange": {
"total": 0.04891846300006364,
"count": 1,
"is_parallel": true,
"self": 0.04891846300006364
},
"steps_from_proto": {
"total": 0.0019198850000066159,
"count": 1,
"is_parallel": true,
"self": 0.0004255870003362361,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0014942979996703798,
"count": 8,
"is_parallel": true,
"self": 0.0014942979996703798
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1319.2626148530367,
"count": 63722,
"is_parallel": true,
"self": 32.1315479059931,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 23.022852285060708,
"count": 63722,
"is_parallel": true,
"self": 23.022852285060708
},
"communicator.exchange": {
"total": 1166.3759513868672,
"count": 63722,
"is_parallel": true,
"self": 1166.3759513868672
},
"steps_from_proto": {
"total": 97.73226327511566,
"count": 63722,
"is_parallel": true,
"self": 20.348952180821016,
"children": {
"_process_rank_one_or_two_observation": {
"total": 77.38331109429464,
"count": 509776,
"is_parallel": true,
"self": 77.38331109429464
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 682.9002301570094,
"count": 63723,
"self": 2.770866145983291,
"children": {
"process_trajectory": {
"total": 129.33958363203647,
"count": 63723,
"self": 129.13331545803567,
"children": {
"RLTrainer._checkpoint": {
"total": 0.20626817400079744,
"count": 2,
"self": 0.20626817400079744
}
}
},
"_update_policy": {
"total": 550.7897803789897,
"count": 442,
"self": 301.2279141460226,
"children": {
"TorchPPOOptimizer.update": {
"total": 249.56186623296708,
"count": 22848,
"self": 249.56186623296708
}
}
}
}
}
}
},
"trainer_threads": {
"total": 8.139995770761743e-07,
"count": 1,
"self": 8.139995770761743e-07
},
"TrainerController._save_models": {
"total": 0.08868369199990411,
"count": 1,
"self": 0.001496696999311098,
"children": {
"RLTrainer._checkpoint": {
"total": 0.08718699500059301,
"count": 1,
"self": 0.08718699500059301
}
}
}
}
}
}
}