|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.09885845333337784, |
|
"min": 0.09885845333337784, |
|
"max": 1.391262173652649, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 2961.00830078125, |
|
"min": 2961.00830078125, |
|
"max": 42205.328125, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 989942.0, |
|
"min": 29952.0, |
|
"max": 989942.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 989942.0, |
|
"min": 29952.0, |
|
"max": 989942.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.09300978481769562, |
|
"min": -0.11049512028694153, |
|
"max": -0.04772590473294258, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -22.41535758972168, |
|
"min": -26.518829345703125, |
|
"max": -11.50194263458252, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.7057044506072998, |
|
"min": 0.3943696916103363, |
|
"max": 0.7211557030677795, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 170.07476806640625, |
|
"min": 93.46561431884766, |
|
"max": 173.07736206054688, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.06966624491625004, |
|
"min": 0.06390519778727853, |
|
"max": 0.07276667683861657, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9753274288275006, |
|
"min": 0.5053176592062656, |
|
"max": 1.0435171967746653, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.002272243285023804, |
|
"min": 0.0012730152614169057, |
|
"max": 0.01410997276765144, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.031811405990333254, |
|
"min": 0.013503947598538854, |
|
"max": 0.09876980937356009, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 7.468597510499998e-06, |
|
"min": 7.468597510499998e-06, |
|
"max": 0.00029515063018788575, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.00010456036514699997, |
|
"min": 0.00010456036514699997, |
|
"max": 0.0033823124725626, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10248950000000001, |
|
"min": 0.10248950000000001, |
|
"max": 0.19838354285714285, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4348530000000002, |
|
"min": 1.3691136000000002, |
|
"max": 2.5274373999999997, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.0002587010499999999, |
|
"min": 0.0002587010499999999, |
|
"max": 0.00983851593142857, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.0036218146999999986, |
|
"min": 0.0036218146999999986, |
|
"max": 0.11277099626, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.6952353119850159, |
|
"min": 0.46431103348731995, |
|
"max": 0.701970636844635, |
|
"count": 33 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 9.733294486999512, |
|
"min": 3.286691665649414, |
|
"max": 10.338406562805176, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 971.9677419354839, |
|
"min": 942.2083333333334, |
|
"max": 999.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 30131.0, |
|
"min": 15984.0, |
|
"max": 32978.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": -0.9081290818510517, |
|
"min": -1.0000000521540642, |
|
"max": -0.5925652637429859, |
|
"count": 33 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": -28.152001537382603, |
|
"min": -32.000001668930054, |
|
"max": -13.629001066088676, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": -0.9081290818510517, |
|
"min": -1.0000000521540642, |
|
"max": -0.5925652637429859, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": -28.152001537382603, |
|
"min": -32.000001668930054, |
|
"max": -13.629001066088676, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 6.750458623372739, |
|
"min": 4.564700076938607, |
|
"max": 12.862612821161747, |
|
"count": 33 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 209.26421732455492, |
|
"min": 113.24149153381586, |
|
"max": 219.23677159659564, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 33 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1678110199", |
|
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "0.29.0.dev0", |
|
"mlagents_envs_version": "0.29.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.22.4", |
|
"end_time_seconds": "1678112313" |
|
}, |
|
"total": 2113.926096401, |
|
"count": 1, |
|
"self": 0.44358649200012223, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.11608384800001659, |
|
"count": 1, |
|
"self": 0.11608384800001659 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 2113.366426061, |
|
"count": 1, |
|
"self": 1.235741714987853, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 10.123026120999953, |
|
"count": 1, |
|
"self": 10.123026120999953 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2101.921326625012, |
|
"count": 62964, |
|
"self": 1.4148093849767065, |
|
"children": { |
|
"env_step": { |
|
"total": 1353.883590047055, |
|
"count": 62964, |
|
"self": 1242.338978340114, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 110.73815874495813, |
|
"count": 62964, |
|
"self": 4.591770718939301, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 106.14638802601883, |
|
"count": 62566, |
|
"self": 36.07177086400759, |
|
"children": { |
|
"TorchPolicy.sample_actions": { |
|
"total": 70.07461716201124, |
|
"count": 62566, |
|
"self": 70.07461716201124 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.8064529619829273, |
|
"count": 62964, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 2108.7938016910566, |
|
"count": 62964, |
|
"is_parallel": true, |
|
"self": 977.7199052831074, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.005293757000004007, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.003964434999943478, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0013293220000605288, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0013293220000605288 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.04923415500002193, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005325830001083887, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0005033899999489222, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005033899999489222 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.046679495000034876, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.046679495000034876 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0015186869999297414, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00037817099973835866, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0011405160001913828, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0011405160001913828 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1131.0738964079492, |
|
"count": 62963, |
|
"is_parallel": true, |
|
"self": 31.47343672595889, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 22.78740865404643, |
|
"count": 62963, |
|
"is_parallel": true, |
|
"self": 22.78740865404643 |
|
}, |
|
"communicator.exchange": { |
|
"total": 986.0875945519707, |
|
"count": 62963, |
|
"is_parallel": true, |
|
"self": 986.0875945519707 |
|
}, |
|
"steps_from_proto": { |
|
"total": 90.72545647597315, |
|
"count": 62963, |
|
"is_parallel": true, |
|
"self": 21.305764869089444, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 69.4196916068837, |
|
"count": 503704, |
|
"is_parallel": true, |
|
"self": 69.4196916068837 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 746.6229271929803, |
|
"count": 62964, |
|
"self": 2.268821930978447, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 160.9588118200013, |
|
"count": 62964, |
|
"self": 160.72140422600137, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.23740759399993294, |
|
"count": 2, |
|
"self": 0.23740759399993294 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 583.3952934420006, |
|
"count": 436, |
|
"self": 234.2230539580039, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 349.1722394839967, |
|
"count": 22770, |
|
"self": 349.1722394839967 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 8.359997991647106e-07, |
|
"count": 1, |
|
"self": 8.359997991647106e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.0863307640001949, |
|
"count": 1, |
|
"self": 0.0013738990005549567, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.08495686499963995, |
|
"count": 1, |
|
"self": 0.08495686499963995 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |