|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.14011944830417633, |
|
"min": 0.13738703727722168, |
|
"max": 1.3381617069244385, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 4158.7451171875, |
|
"min": 4115.0166015625, |
|
"max": 40594.47265625, |
|
"count": 100 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 2999916.0, |
|
"min": 29952.0, |
|
"max": 2999916.0, |
|
"count": 100 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 2999916.0, |
|
"min": 29952.0, |
|
"max": 2999916.0, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.8453541398048401, |
|
"min": -0.10252268612384796, |
|
"max": 0.8742783665657043, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 257.8330078125, |
|
"min": -24.810489654541016, |
|
"max": 269.2777404785156, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.0007943588425405324, |
|
"min": -0.008582175709307194, |
|
"max": 0.4010782837867737, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 0.24227944016456604, |
|
"min": -2.566070556640625, |
|
"max": 96.2587890625, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06782120283889058, |
|
"min": 0.06333402807401044, |
|
"max": 0.07829906407741591, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9494968397444681, |
|
"min": 0.49095129747018645, |
|
"max": 1.0748830527585347, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.015354181094173696, |
|
"min": 0.0010574577767504271, |
|
"max": 0.01621668449803895, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.21495853531843176, |
|
"min": 0.00931974074083182, |
|
"max": 0.2292830414177539, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 1.5075280689523765e-06, |
|
"min": 1.5075280689523765e-06, |
|
"max": 0.00029838354339596195, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 2.110539296533327e-05, |
|
"min": 2.110539296533327e-05, |
|
"max": 0.003969281176906299, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10050247619047618, |
|
"min": 0.10050247619047618, |
|
"max": 0.19946118095238097, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4070346666666667, |
|
"min": 1.3897045333333333, |
|
"max": 2.7974415000000006, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 6.019737142857127e-05, |
|
"min": 6.019737142857127e-05, |
|
"max": 0.009946171977142856, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.0008427631999999977, |
|
"min": 0.0008427631999999977, |
|
"max": 0.13231706062999998, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.00840148888528347, |
|
"min": 0.008221963420510292, |
|
"max": 0.5902184844017029, |
|
"count": 100 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.11762084811925888, |
|
"min": 0.11510748416185379, |
|
"max": 4.131529331207275, |
|
"count": 100 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 205.91666666666666, |
|
"min": 201.9794520547945, |
|
"max": 999.0, |
|
"count": 100 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 29652.0, |
|
"min": 15984.0, |
|
"max": 32548.0, |
|
"count": 100 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.7940833220879238, |
|
"min": -1.0000000521540642, |
|
"max": 1.7944999812170863, |
|
"count": 100 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 258.347998380661, |
|
"min": -32.000001668930054, |
|
"max": 265.5713979303837, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.7940833220879238, |
|
"min": -1.0000000521540642, |
|
"max": 1.7944999812170863, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 258.347998380661, |
|
"min": -32.000001668930054, |
|
"max": 265.5713979303837, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.01803157640663105, |
|
"min": 0.01797448639857989, |
|
"max": 11.956338007003069, |
|
"count": 100 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.596547002554871, |
|
"min": 2.462504636605445, |
|
"max": 191.3014081120491, |
|
"count": 100 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 100 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 100 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1687986314", |
|
"python_version": "3.10.12 (main, Jun 7 2023, 12:45:35) [GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1687993697" |
|
}, |
|
"total": 7382.744843643, |
|
"count": 1, |
|
"self": 1.1112634849996539, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.03709086100002423, |
|
"count": 1, |
|
"self": 0.03709086100002423 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 7381.5964892970005, |
|
"count": 1, |
|
"self": 4.173439872898598, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 5.4050869460002104, |
|
"count": 1, |
|
"self": 5.4050869460002104 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 7371.847438255104, |
|
"count": 195431, |
|
"self": 4.281450493071134, |
|
"children": { |
|
"env_step": { |
|
"total": 5458.084999138928, |
|
"count": 195431, |
|
"self": 5134.7961792055285, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 320.8708623448524, |
|
"count": 195431, |
|
"self": 14.046385025705604, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 306.8244773191468, |
|
"count": 187558, |
|
"self": 306.8244773191468 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 2.4179575885470967, |
|
"count": 195431, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 7365.242647006996, |
|
"count": 195431, |
|
"is_parallel": true, |
|
"self": 2573.2459145027797, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0025555209999765793, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.000681953999446705, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0018735670005298743, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0018735670005298743 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.0456330380000054, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005740570002217282, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00047580000000380096, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00047580000000380096 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.04272288599986496, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.04272288599986496 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0018602949999149132, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0003475409998827672, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.001512754000032146, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.001512754000032146 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 4791.996732504216, |
|
"count": 195430, |
|
"is_parallel": true, |
|
"self": 98.74312471642497, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 66.10156270104926, |
|
"count": 195430, |
|
"is_parallel": true, |
|
"self": 66.10156270104926 |
|
}, |
|
"communicator.exchange": { |
|
"total": 4323.890692395792, |
|
"count": 195430, |
|
"is_parallel": true, |
|
"self": 4323.890692395792 |
|
}, |
|
"steps_from_proto": { |
|
"total": 303.2613526909497, |
|
"count": 195430, |
|
"is_parallel": true, |
|
"self": 60.26883022258244, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 242.99252246836727, |
|
"count": 1563440, |
|
"is_parallel": true, |
|
"self": 242.99252246836727 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 1909.4809886231046, |
|
"count": 195431, |
|
"self": 8.259708224072938, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 333.3622472870238, |
|
"count": 195431, |
|
"self": 332.6244581370229, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.7377891500009355, |
|
"count": 6, |
|
"self": 0.7377891500009355 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 1567.8590331120079, |
|
"count": 1395, |
|
"self": 1008.2151922029614, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 559.6438409090465, |
|
"count": 68379, |
|
"self": 559.6438409090465 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.0999992809956893e-06, |
|
"count": 1, |
|
"self": 1.0999992809956893e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.17052312299892947, |
|
"count": 1, |
|
"self": 0.002094905999911134, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.16842821699901833, |
|
"count": 1, |
|
"self": 0.16842821699901833 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |