First Push

c37b883 verified 5 months ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.4849931299686432,
	"min": 0.4849931299686432,
	"max": 1.4617489576339722,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 14534.2744140625,
	"min": 14534.2744140625,
	"max": 44343.6171875,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989944.0,
	"min": 29952.0,
	"max": 989944.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989944.0,
	"min": 29952.0,
	"max": 989944.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.44973358511924744,
	"min": -0.10290933400392532,
	"max": 0.570103645324707,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 123.22700500488281,
	"min": -24.801149368286133,
	"max": 157.34860229492188,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": -0.05136988312005997,
	"min": -0.05136988312005997,
	"max": 0.3580794930458069,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": -14.075347900390625,
	"min": -14.075347900390625,
	"max": 84.86483764648438,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.0680983506345434,
	"min": 0.06509623204004125,
	"max": 0.0729792808483992,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9533769088836077,
	"min": 0.5073702113385762,
	"max": 1.0666662966250442,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.01531557868327668,
	"min": 0.00031360778427866494,
	"max": 0.016716500662109217,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.21441810156587351,
	"min": 0.0028224700585079846,
	"max": 0.24823321242001842,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.247347584250002e-06,
	"min": 7.247347584250002e-06,
	"max": 0.00029515063018788575,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010146286617950002,
	"min": 0.00010146286617950002,
	"max": 0.0031368077543975,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10241575000000003,
	"min": 0.10241575000000003,
	"max": 0.19838354285714285,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4338205000000004,
	"min": 1.3886848,
	"max": 2.4013283999999997,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0002513334250000001,
	"min": 0.0002513334250000001,
	"max": 0.00983851593142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0035186679500000015,
	"min": 0.0035186679500000015,
	"max": 0.10458568974999999,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.0048655057325959206,
	"min": 0.004860612563788891,
	"max": 0.4736633598804474,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.06811708211898804,
	"min": 0.06811708211898804,
	"max": 3.315643548965454,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 368.71604938271605,
	"min": 350.54545454545456,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 29866.0,
	"min": 15984.0,
	"max": 35167.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.483088873234796,
	"min": -1.0000000521540642,
	"max": 1.6379761695861816,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 120.13019873201847,
	"min": -30.999201610684395,
	"max": 137.58999824523926,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.483088873234796,
	"min": -1.0000000521540642,
	"max": 1.6379761695861816,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 120.13019873201847,
	"min": -30.999201610684395,
	"max": 137.58999824523926,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.018742875021416694,
	"min": 0.01831325851283812,
	"max": 10.621151620522141,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 1.5181728767347522,
	"min": 1.4725718807749217,
	"max": 169.93842592835426,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1741648031",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.6.0+cu124",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1741650320"
	},
	"total": 2288.4332473330005,
	"count": 1,
	"self": 0.47578670400116607,
	"children": {
	"run_training.setup": {
	"total": 0.020574058999955014,
	"count": 1,
	"self": 0.020574058999955014
	},
	"TrainerController.start_learning": {
	"total": 2287.9368865699994,
	"count": 1,
	"self": 1.4758147910238222,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.099275698999918,
	"count": 1,
	"self": 2.099275698999918
	},
	"TrainerController.advance": {
	"total": 2284.273111573976,
	"count": 63723,
	"self": 1.6630028159202084,
	"children": {
	"env_step": {
	"total": 1599.7098786010465,
	"count": 63723,
	"self": 1437.0821860721494,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 161.77856773892654,
	"count": 63723,
	"self": 4.987737537873272,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 156.79083020105327,
	"count": 62550,
	"self": 156.79083020105327
	}
	}
	},
	"workers": {
	"total": 0.8491247899705741,
	"count": 63723,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2282.369480734049,
	"count": 63723,
	"is_parallel": true,
	"self": 963.1068658810123,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0021109549998072907,
	"count": 1,
	"is_parallel": true,
	"self": 0.000699127999268967,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014118270005383238,
	"count": 8,
	"is_parallel": true,
	"self": 0.0014118270005383238
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.051930184999946505,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006210209999153449,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0004708159999609052,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004708159999609052
	},
	"communicator.exchange": {
	"total": 0.04891846300006364,
	"count": 1,
	"is_parallel": true,
	"self": 0.04891846300006364
	},
	"steps_from_proto": {
	"total": 0.0019198850000066159,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004255870003362361,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014942979996703798,
	"count": 8,
	"is_parallel": true,
	"self": 0.0014942979996703798
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1319.2626148530367,
	"count": 63722,
	"is_parallel": true,
	"self": 32.1315479059931,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 23.022852285060708,
	"count": 63722,
	"is_parallel": true,
	"self": 23.022852285060708
	},
	"communicator.exchange": {
	"total": 1166.3759513868672,
	"count": 63722,
	"is_parallel": true,
	"self": 1166.3759513868672
	},
	"steps_from_proto": {
	"total": 97.73226327511566,
	"count": 63722,
	"is_parallel": true,
	"self": 20.348952180821016,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 77.38331109429464,
	"count": 509776,
	"is_parallel": true,
	"self": 77.38331109429464
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 682.9002301570094,
	"count": 63723,
	"self": 2.770866145983291,
	"children": {
	"process_trajectory": {
	"total": 129.33958363203647,
	"count": 63723,
	"self": 129.13331545803567,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.20626817400079744,
	"count": 2,
	"self": 0.20626817400079744
	}
	}
	},
	"_update_policy": {
	"total": 550.7897803789897,
	"count": 442,
	"self": 301.2279141460226,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 249.56186623296708,
	"count": 22848,
	"self": 249.56186623296708
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.139995770761743e-07,
	"count": 1,
	"self": 8.139995770761743e-07
	},
	"TrainerController._save_models": {
	"total": 0.08868369199990411,
	"count": 1,
	"self": 0.001496696999311098,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.08718699500059301,
	"count": 1,
	"self": 0.08718699500059301
	}
	}
	}
	}
	}
	}
	}