pyramids-first

097e0dd almost 2 years ago

19.2 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.09885845333337784,
	"min": 0.09885845333337784,
	"max": 1.391262173652649,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 2961.00830078125,
	"min": 2961.00830078125,
	"max": 42205.328125,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989942.0,
	"min": 29952.0,
	"max": 989942.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989942.0,
	"min": 29952.0,
	"max": 989942.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.09300978481769562,
	"min": -0.11049512028694153,
	"max": -0.04772590473294258,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": -22.41535758972168,
	"min": -26.518829345703125,
	"max": -11.50194263458252,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.7057044506072998,
	"min": 0.3943696916103363,
	"max": 0.7211557030677795,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 170.07476806640625,
	"min": 93.46561431884766,
	"max": 173.07736206054688,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06966624491625004,
	"min": 0.06390519778727853,
	"max": 0.07276667683861657,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9753274288275006,
	"min": 0.5053176592062656,
	"max": 1.0435171967746653,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.002272243285023804,
	"min": 0.0012730152614169057,
	"max": 0.01410997276765144,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.031811405990333254,
	"min": 0.013503947598538854,
	"max": 0.09876980937356009,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.468597510499998e-06,
	"min": 7.468597510499998e-06,
	"max": 0.00029515063018788575,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010456036514699997,
	"min": 0.00010456036514699997,
	"max": 0.0033823124725626,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10248950000000001,
	"min": 0.10248950000000001,
	"max": 0.19838354285714285,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4348530000000002,
	"min": 1.3691136000000002,
	"max": 2.5274373999999997,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0002587010499999999,
	"min": 0.0002587010499999999,
	"max": 0.00983851593142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0036218146999999986,
	"min": 0.0036218146999999986,
	"max": 0.11277099626,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.6952353119850159,
	"min": 0.46431103348731995,
	"max": 0.701970636844635,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 9.733294486999512,
	"min": 3.286691665649414,
	"max": 10.338406562805176,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 971.9677419354839,
	"min": 942.2083333333334,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 30131.0,
	"min": 15984.0,
	"max": 32978.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": -0.9081290818510517,
	"min": -1.0000000521540642,
	"max": -0.5925652637429859,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": -28.152001537382603,
	"min": -32.000001668930054,
	"max": -13.629001066088676,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": -0.9081290818510517,
	"min": -1.0000000521540642,
	"max": -0.5925652637429859,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": -28.152001537382603,
	"min": -32.000001668930054,
	"max": -13.629001066088676,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 6.750458623372739,
	"min": 4.564700076938607,
	"max": 12.862612821161747,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 209.26421732455492,
	"min": 113.24149153381586,
	"max": 219.23677159659564,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1678110199",
	"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "0.29.0.dev0",
	"mlagents_envs_version": "0.29.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.8.1+cu102",
	"numpy_version": "1.22.4",
	"end_time_seconds": "1678112313"
	},
	"total": 2113.926096401,
	"count": 1,
	"self": 0.44358649200012223,
	"children": {
	"run_training.setup": {
	"total": 0.11608384800001659,
	"count": 1,
	"self": 0.11608384800001659
	},
	"TrainerController.start_learning": {
	"total": 2113.366426061,
	"count": 1,
	"self": 1.235741714987853,
	"children": {
	"TrainerController._reset_env": {
	"total": 10.123026120999953,
	"count": 1,
	"self": 10.123026120999953
	},
	"TrainerController.advance": {
	"total": 2101.921326625012,
	"count": 62964,
	"self": 1.4148093849767065,
	"children": {
	"env_step": {
	"total": 1353.883590047055,
	"count": 62964,
	"self": 1242.338978340114,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 110.73815874495813,
	"count": 62964,
	"self": 4.591770718939301,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 106.14638802601883,
	"count": 62566,
	"self": 36.07177086400759,
	"children": {
	"TorchPolicy.sample_actions": {
	"total": 70.07461716201124,
	"count": 62566,
	"self": 70.07461716201124
	}
	}
	}
	}
	},
	"workers": {
	"total": 0.8064529619829273,
	"count": 62964,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2108.7938016910566,
	"count": 62964,
	"is_parallel": true,
	"self": 977.7199052831074,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.005293757000004007,
	"count": 1,
	"is_parallel": true,
	"self": 0.003964434999943478,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0013293220000605288,
	"count": 8,
	"is_parallel": true,
	"self": 0.0013293220000605288
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.04923415500002193,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005325830001083887,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005033899999489222,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005033899999489222
	},
	"communicator.exchange": {
	"total": 0.046679495000034876,
	"count": 1,
	"is_parallel": true,
	"self": 0.046679495000034876
	},
	"steps_from_proto": {
	"total": 0.0015186869999297414,
	"count": 1,
	"is_parallel": true,
	"self": 0.00037817099973835866,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0011405160001913828,
	"count": 8,
	"is_parallel": true,
	"self": 0.0011405160001913828
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1131.0738964079492,
	"count": 62963,
	"is_parallel": true,
	"self": 31.47343672595889,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 22.78740865404643,
	"count": 62963,
	"is_parallel": true,
	"self": 22.78740865404643
	},
	"communicator.exchange": {
	"total": 986.0875945519707,
	"count": 62963,
	"is_parallel": true,
	"self": 986.0875945519707
	},
	"steps_from_proto": {
	"total": 90.72545647597315,
	"count": 62963,
	"is_parallel": true,
	"self": 21.305764869089444,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 69.4196916068837,
	"count": 503704,
	"is_parallel": true,
	"self": 69.4196916068837
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 746.6229271929803,
	"count": 62964,
	"self": 2.268821930978447,
	"children": {
	"process_trajectory": {
	"total": 160.9588118200013,
	"count": 62964,
	"self": 160.72140422600137,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.23740759399993294,
	"count": 2,
	"self": 0.23740759399993294
	}
	}
	},
	"_update_policy": {
	"total": 583.3952934420006,
	"count": 436,
	"self": 234.2230539580039,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 349.1722394839967,
	"count": 22770,
	"self": 349.1722394839967
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.359997991647106e-07,
	"count": 1,
	"self": 8.359997991647106e-07
	},
	"TrainerController._save_models": {
	"total": 0.0863307640001949,
	"count": 1,
	"self": 0.0013738990005549567,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.08495686499963995,
	"count": 1,
	"self": 0.08495686499963995
	}
	}
	}
	}
	}
	}
	}