{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.2916024625301361,
"min": 0.29125112295150757,
"max": 1.415248155593872,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 8827.3896484375,
"min": 8746.53125,
"max": 42932.96875,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989916.0,
"min": 29956.0,
"max": 989916.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989916.0,
"min": 29956.0,
"max": 989916.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.5374546647071838,
"min": -0.112742580473423,
"max": 0.5798947811126709,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 149.94985961914062,
"min": -27.396446228027344,
"max": 164.1102294921875,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.027990568429231644,
"min": -0.018696676939725876,
"max": 0.546489417552948,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 7.80936861038208,
"min": -5.291159629821777,
"max": 130.06448364257812,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06590100508365854,
"min": 0.06518899585654847,
"max": 0.07228057705645621,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9226140711712195,
"min": 0.48423678529764597,
"max": 1.0717440580437871,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.014334958537485964,
"min": 0.0006781006875537126,
"max": 0.01931471981436192,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.2006894195248035,
"min": 0.009493409625751976,
"max": 0.2271763084084823,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.552490339678574e-06,
"min": 7.552490339678574e-06,
"max": 0.0002952382301586857,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.00010573486475550004,
"min": 0.00010573486475550004,
"max": 0.003374662075112699,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10251746428571429,
"min": 0.10251746428571429,
"max": 0.19841274285714286,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4352445,
"min": 1.3888892,
"max": 2.4441998,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.00026149468214285726,
"min": 0.00026149468214285726,
"max": 0.009841433011428572,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.003660925550000002,
"min": 0.003660925550000002,
"max": 0.11250624127,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.014703771099448204,
"min": 0.014703771099448204,
"max": 0.6592143177986145,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.20585279166698456,
"min": 0.20585279166698456,
"max": 4.614500045776367,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 359.95180722891564,
"min": 323.93548387096774,
"max": 999.0,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 29876.0,
"min": 16627.0,
"max": 33226.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.543631308409105,
"min": -0.9999750521965325,
"max": 1.654556972525453,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 128.1213985979557,
"min": -31.99920167028904,
"max": 153.87379844486713,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.543631308409105,
"min": -0.9999750521965325,
"max": 1.654556972525453,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 128.1213985979557,
"min": -31.99920167028904,
"max": 153.87379844486713,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.052627474275426044,
"min": 0.05192310863765337,
"max": 13.408304013311863,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 4.368080364860361,
"min": 4.368080364860361,
"max": 227.94116822630167,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1675370621",
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.29.0.dev0",
"mlagents_envs_version": "0.29.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.8.1+cu102",
"numpy_version": "1.21.6",
"end_time_seconds": "1675372936"
},
"total": 2314.935416526,
"count": 1,
"self": 0.424498188000598,
"children": {
"run_training.setup": {
"total": 0.0995371310000337,
"count": 1,
"self": 0.0995371310000337
},
"TrainerController.start_learning": {
"total": 2314.4113812069995,
"count": 1,
"self": 1.4329393200418963,
"children": {
"TrainerController._reset_env": {
"total": 6.065273781000087,
"count": 1,
"self": 6.065273781000087
},
"TrainerController.advance": {
"total": 2306.8241047359575,
"count": 63875,
"self": 1.5366646640513864,
"children": {
"env_step": {
"total": 1563.27048306198,
"count": 63875,
"self": 1443.6524094129186,
"children": {
"SubprocessEnvManager._take_step": {
"total": 118.70890929300504,
"count": 63875,
"self": 4.7884965320454285,
"children": {
"TorchPolicy.evaluate": {
"total": 113.92041276095961,
"count": 62563,
"self": 37.60675069903573,
"children": {
"TorchPolicy.sample_actions": {
"total": 76.31366206192388,
"count": 62563,
"self": 76.31366206192388
}
}
}
}
},
"workers": {
"total": 0.909164356056408,
"count": 63875,
"self": 0.0,
"children": {
"worker_root": {
"total": 2309.067326014983,
"count": 63875,
"is_parallel": true,
"self": 983.1047408640052,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0017364709997309546,
"count": 1,
"is_parallel": true,
"self": 0.0006073059989830654,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0011291650007478893,
"count": 8,
"is_parallel": true,
"self": 0.0011291650007478893
}
}
},
"UnityEnvironment.step": {
"total": 0.04667686200036769,
"count": 1,
"is_parallel": true,
"self": 0.0005168470001990499,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00046899800008759485,
"count": 1,
"is_parallel": true,
"self": 0.00046899800008759485
},
"communicator.exchange": {
"total": 0.044000779000270995,
"count": 1,
"is_parallel": true,
"self": 0.044000779000270995
},
"steps_from_proto": {
"total": 0.0016902379998100514,
"count": 1,
"is_parallel": true,
"self": 0.0004548000001705077,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0012354379996395437,
"count": 8,
"is_parallel": true,
"self": 0.0012354379996395437
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1325.9625851509777,
"count": 63874,
"is_parallel": true,
"self": 27.962366246931197,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 23.755823151074765,
"count": 63874,
"is_parallel": true,
"self": 23.755823151074765
},
"communicator.exchange": {
"total": 1168.9903366930162,
"count": 63874,
"is_parallel": true,
"self": 1168.9903366930162
},
"steps_from_proto": {
"total": 105.25405905995558,
"count": 63874,
"is_parallel": true,
"self": 23.855910272091478,
"children": {
"_process_rank_one_or_two_observation": {
"total": 81.3981487878641,
"count": 510992,
"is_parallel": true,
"self": 81.3981487878641
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 742.016957009926,
"count": 63875,
"self": 2.7526073689764416,
"children": {
"process_trajectory": {
"total": 170.82747540094806,
"count": 63875,
"self": 170.63323539894736,
"children": {
"RLTrainer._checkpoint": {
"total": 0.19424000200069713,
"count": 2,
"self": 0.19424000200069713
}
}
},
"_update_policy": {
"total": 568.4368742400015,
"count": 449,
"self": 220.59458261598866,
"children": {
"TorchPPOOptimizer.update": {
"total": 347.8422916240129,
"count": 22839,
"self": 347.8422916240129
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.1180000001331791e-06,
"count": 1,
"self": 1.1180000001331791e-06
},
"TrainerController._save_models": {
"total": 0.08906225200007611,
"count": 1,
"self": 0.0014762419996259268,
"children": {
"RLTrainer._checkpoint": {
"total": 0.08758601000045019,
"count": 1,
"self": 0.08758601000045019
}
}
}
}
}
}
}