First Push

158ba34 almost 2 years ago

20.1 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.7886731624603271,
	"min": 1.7538719177246094,
	"max": 3.2957756519317627,
	"count": 609
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 35029.375,
	"min": 10724.03515625,
	"max": 122329.875,
	"count": 609
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 43.990990990990994,
	"min": 39.483870967741936,
	"max": 999.0,
	"count": 609
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19532.0,
	"min": 2108.0,
	"max": 29424.0,
	"count": 609
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1473.0525575233607,
	"min": 1188.2391535706788,
	"max": 1502.293441927133,
	"count": 569
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 327017.6677701861,
	"min": 2376.4783071413576,
	"max": 362074.8879020111,
	"count": 569
	},
	"SoccerTwos.Step.mean": {
	"value": 6089982.0,
	"min": 9728.0,
	"max": 6089982.0,
	"count": 609
	},
	"SoccerTwos.Step.sum": {
	"value": 6089982.0,
	"min": 9728.0,
	"max": 6089982.0,
	"count": 609
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.050350673496723175,
	"min": -0.1030958890914917,
	"max": 0.18944373726844788,
	"count": 609
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -11.177849769592285,
	"min": -18.28963851928711,
	"max": 29.809932708740234,
	"count": 609
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.04108668491244316,
	"min": -0.10463780909776688,
	"max": 0.19806651771068573,
	"count": 609
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -9.121244430541992,
	"min": -18.162994384765625,
	"max": 29.94745635986328,
	"count": 609
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 609
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 609
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.08414774757247788,
	"min": -0.625,
	"max": 0.6562424284039121,
	"count": 609
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -18.680799961090088,
	"min": -64.89040005207062,
	"max": 53.10900020599365,
	"count": 609
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.08414774757247788,
	"min": -0.625,
	"max": 0.6562424284039121,
	"count": 609
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -18.680799961090088,
	"min": -64.89040005207062,
	"max": 53.10900020599365,
	"count": 609
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 609
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 609
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.018445094802882523,
	"min": 0.01035703014737616,
	"max": 0.023746898758690804,
	"count": 290
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.018445094802882523,
	"min": 0.01035703014737616,
	"max": 0.023746898758690804,
	"count": 290
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.11060444861650467,
	"min": 1.732775888285687e-06,
	"max": 0.12241433983047803,
	"count": 290
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.11060444861650467,
	"min": 1.732775888285687e-06,
	"max": 0.12241433983047803,
	"count": 290
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.1136261910200119,
	"min": 2.1583403925736397e-06,
	"max": 0.12581025809049606,
	"count": 290
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.1136261910200119,
	"min": 2.1583403925736397e-06,
	"max": 0.12581025809049606,
	"count": 290
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 290
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 290
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.19999999999999996,
	"max": 0.20000000000000007,
	"count": 290
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.19999999999999996,
	"max": 0.20000000000000007,
	"count": 290
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 290
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 290
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1677532344",
	"python_version": "3.9.16 (main, Jan 11 2023, 16:05:54) \n[GCC 11.2.0]",
	"command_line_arguments": "/home/isaac/anaconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1677538255"
	},
	"total": 5910.890998768999,
	"count": 1,
	"self": 0.06460388699997566,
	"children": {
	"run_training.setup": {
	"total": 0.026874823000071046,
	"count": 1,
	"self": 0.026874823000071046
	},
	"TrainerController.start_learning": {
	"total": 5910.799520058999,
	"count": 1,
	"self": 4.6631930575777005,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.187994563994835,
	"count": 31,
	"self": 4.187994563994835
	},
	"TrainerController.advance": {
	"total": 5901.793086253429,
	"count": 413789,
	"self": 4.565254165081569,
	"children": {
	"env_step": {
	"total": 4317.52626907742,
	"count": 413789,
	"self": 3338.7907093795748,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 975.8863963008871,
	"count": 413789,
	"self": 28.583583583496875,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 947.3028127173902,
	"count": 772554,
	"self": 947.3028127173902
	}
	}
	},
	"workers": {
	"total": 2.8491633969579198,
	"count": 413789,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 5902.745093290739,
	"count": 413789,
	"is_parallel": true,
	"self": 3176.306758978216,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.002331797000806546,
	"count": 2,
	"is_parallel": true,
	"self": 0.0006164599999465281,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0017153370008600177,
	"count": 8,
	"is_parallel": true,
	"self": 0.0017153370008600177
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.019064633999732905,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005129329992996645,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0003821440004685428,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003821440004685428
	},
	"communicator.exchange": {
	"total": 0.01688135099993815,
	"count": 1,
	"is_parallel": true,
	"self": 0.01688135099993815
	},
	"steps_from_proto": {
	"total": 0.0012882060000265483,
	"count": 2,
	"is_parallel": true,
	"self": 0.0002719959984460729,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0010162100015804754,
	"count": 8,
	"is_parallel": true,
	"self": 0.0010162100015804754
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 2726.406486123524,
	"count": 413788,
	"is_parallel": true,
	"self": 165.69570598195514,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 112.6196814200166,
	"count": 413788,
	"is_parallel": true,
	"self": 112.6196814200166
	},
	"communicator.exchange": {
	"total": 2030.0720541379924,
	"count": 413788,
	"is_parallel": true,
	"self": 2030.0720541379924
	},
	"steps_from_proto": {
	"total": 418.01904458355966,
	"count": 827576,
	"is_parallel": true,
	"self": 79.1009894443232,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 338.91805513923646,
	"count": 3310304,
	"is_parallel": true,
	"self": 338.91805513923646
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.031848188998992555,
	"count": 60,
	"is_parallel": true,
	"self": 0.006230923997463833,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.025617265001528722,
	"count": 240,
	"is_parallel": true,
	"self": 0.025617265001528722
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1579.7015630109272,
	"count": 413789,
	"self": 36.488547004430075,
	"children": {
	"process_trajectory": {
	"total": 520.3228761164983,
	"count": 413789,
	"self": 518.6864089684987,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 1.6364671479996105,
	"count": 12,
	"self": 1.6364671479996105
	}
	}
	},
	"_update_policy": {
	"total": 1022.8901398899989,
	"count": 291,
	"self": 577.2819298669856,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 445.60821002301327,
	"count": 8722,
	"self": 445.60821002301327
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.979986887425184e-07,
	"count": 1,
	"self": 8.979986887425184e-07
	},
	"TrainerController._save_models": {
	"total": 0.1552452859996265,
	"count": 1,
	"self": 0.0008733739996387158,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.1543719119999878,
	"count": 1,
	"self": 0.1543719119999878
	}
	}
	}
	}
	}
	}
	}