poca-SoccerTwos/run_logs/timers.json
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.9973961114883423,
"min": 1.9672212600708008,
"max": 3.295731544494629,
"count": 500
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 41737.58984375,
"min": 20642.34375,
"max": 168492.96875,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 51.25,
"min": 39.56910569105691,
"max": 999.0,
"count": 500
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19680.0,
"min": 16220.0,
"max": 23488.0,
"count": 500
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1428.967954442669,
"min": 1191.9478556453585,
"max": 1446.3898811364495,
"count": 459
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 274361.84725299245,
"min": 2384.257118072176,
"max": 344398.37367817503,
"count": 459
},
"SoccerTwos.Step.mean": {
"value": 4999972.0,
"min": 9762.0,
"max": 4999972.0,
"count": 500
},
"SoccerTwos.Step.sum": {
"value": 4999972.0,
"min": 9762.0,
"max": 4999972.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.023390689864754677,
"min": -0.11991755664348602,
"max": 0.13205336034297943,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -4.4910125732421875,
"min": -26.9814510345459,
"max": 26.146564483642578,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.02350303716957569,
"min": -0.12512031197547913,
"max": 0.13728852570056915,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -4.512583255767822,
"min": -28.152069091796875,
"max": 27.183128356933594,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.07863125080863635,
"min": -0.7142857142857143,
"max": 0.38127500005066395,
"count": 500
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -15.097200155258179,
"min": -72.37800002098083,
"max": 41.1385999917984,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.07863125080863635,
"min": -0.7142857142857143,
"max": 0.38127500005066395,
"count": 500
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -15.097200155258179,
"min": -72.37800002098083,
"max": 41.1385999917984,
"count": 500
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 500
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.015707269603929794,
"min": 0.010822808059553305,
"max": 0.024873007297477063,
"count": 238
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.015707269603929794,
"min": 0.010822808059553305,
"max": 0.024873007297477063,
"count": 238
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.0981605698664983,
"min": 6.071955779892354e-06,
"max": 0.12207058742642403,
"count": 238
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.0981605698664983,
"min": 6.071955779892354e-06,
"max": 0.12207058742642403,
"count": 238
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.09878558243314425,
"min": 5.733635695529907e-06,
"max": 0.12399258886774381,
"count": 238
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.09878558243314425,
"min": 5.733635695529907e-06,
"max": 0.12399258886774381,
"count": 238
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 238
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 238
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 238
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 238
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 238
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 238
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1729574893",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/home/byeung/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos --run-id=SoccerTwos --no-graphics --force",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.5.0+cu124",
"numpy_version": "1.23.5",
"end_time_seconds": "1729590393"
},
"total": 15499.309189803898,
"count": 1,
"self": 10.00968683604151,
"children": {
"run_training.setup": {
"total": 0.024166137911379337,
"count": 1,
"self": 0.024166137911379337
},
"TrainerController.start_learning": {
"total": 15489.275336829945,
"count": 1,
"self": 5.296790755353868,
"children": {
"TrainerController._reset_env": {
"total": 4.974303150549531,
"count": 50,
"self": 4.974303150549531
},
"TrainerController.advance": {
"total": 15478.814608255401,
"count": 343372,
"self": 5.434555969201028,
"children": {
"env_step": {
"total": 10587.658404042013,
"count": 343372,
"self": 9214.894986375235,
"children": {
"SubprocessEnvManager._take_step": {
"total": 1369.6727111088112,
"count": 343372,
"self": 44.204565349034965,
"children": {
"TorchPolicy.evaluate": {
"total": 1325.4681457597762,
"count": 646164,
"self": 1325.4681457597762
}
}
},
"workers": {
"total": 3.0907065579667687,
"count": 343372,
"self": 0.0,
"children": {
"worker_root": {
"total": 15471.547301323153,
"count": 343372,
"is_parallel": true,
"self": 7206.153205802664,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.005706407129764557,
"count": 2,
"is_parallel": true,
"self": 0.001284855417907238,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.004421551711857319,
"count": 8,
"is_parallel": true,
"self": 0.004421551711857319
}
}
},
"UnityEnvironment.step": {
"total": 0.04190370161086321,
"count": 1,
"is_parallel": true,
"self": 0.0006120866164565086,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0010803602635860443,
"count": 1,
"is_parallel": true,
"self": 0.0010803602635860443
},
"communicator.exchange": {
"total": 0.03848050720989704,
"count": 1,
"is_parallel": true,
"self": 0.03848050720989704
},
"steps_from_proto": {
"total": 0.0017307475209236145,
"count": 2,
"is_parallel": true,
"self": 0.0003641154617071152,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0013666320592164993,
"count": 8,
"is_parallel": true,
"self": 0.0013666320592164993
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 8265.178941797465,
"count": 343371,
"is_parallel": true,
"self": 466.2095416150987,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 329.6114039067179,
"count": 343371,
"is_parallel": true,
"self": 329.6114039067179
},
"communicator.exchange": {
"total": 6067.122285557911,
"count": 343371,
"is_parallel": true,
"self": 6067.122285557911
},
"steps_from_proto": {
"total": 1402.2357107177377,
"count": 686742,
"is_parallel": true,
"self": 247.52160685602576,
"children": {
"_process_rank_one_or_two_observation": {
"total": 1154.714103861712,
"count": 2746968,
"is_parallel": true,
"self": 1154.714103861712
}
}
}
}
},
"steps_from_proto": {
"total": 0.21515372302383184,
"count": 98,
"is_parallel": true,
"self": 0.03675766568630934,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.1783960573375225,
"count": 392,
"is_parallel": true,
"self": 0.1783960573375225
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 4885.721648244187,
"count": 343372,
"self": 57.28664831724018,
"children": {
"process_trajectory": {
"total": 991.135653346777,
"count": 343372,
"self": 988.8921352447942,
"children": {
"RLTrainer._checkpoint": {
"total": 2.2435181019827724,
"count": 10,
"self": 2.2435181019827724
}
}
},
"_update_policy": {
"total": 3837.29934658017,
"count": 238,
"self": 596.9566940963268,
"children": {
"TorchPOCAOptimizer.update": {
"total": 3240.3426524838433,
"count": 7140,
"self": 3240.3426524838433
}
}
}
}
}
}
},
"trainer_threads": {
"total": 7.245689630508423e-07,
"count": 1,
"self": 7.245689630508423e-07
},
"TrainerController._save_models": {
"total": 0.18963394407182932,
"count": 1,
"self": 0.004723397083580494,
"children": {
"RLTrainer._checkpoint": {
"total": 0.18491054698824883,
"count": 1,
"self": 0.18491054698824883
}
}
}
}
}
}
}
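
Below is a minimal sketch (not part of the original file) of how one might load a local copy of this timers.json and summarize it. The file path "timers.json" and the choice of printed fields are assumptions for illustration; the "gauges" and "metadata" keys are taken from the file above.

```python
import json

# Assumed local copy of the timers.json shown above.
with open("timers.json") as f:
    timers = json.load(f)

# Each gauge records the most recent value plus its min/max and update count.
for name, gauge in timers["gauges"].items():
    print(f"{name}: value={gauge['value']:.4f} "
          f"(min={gauge['min']:.4f}, max={gauge['max']:.4f}, count={gauge['count']})")

# The metadata block carries the run context (versions, CLI, timestamps).
start = int(timers["metadata"]["start_time_seconds"])
end = int(timers["metadata"]["end_time_seconds"])
print(f"wall-clock training time: {end - start} seconds")
```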