{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.8955084085464478,
"min": 1.8422900438308716,
"max": 2.093956708908081,
"count": 200
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 38456.07421875,
"min": 33440.90625,
"max": 47368.375,
"count": 200
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 67.3013698630137,
"min": 49.77906976744186,
"max": 104.18367346938776,
"count": 200
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19652.0,
"min": 17124.0,
"max": 22200.0,
"count": 200
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1551.8239050312495,
"min": 1488.0337250922112,
"max": 1560.0137722228626,
"count": 200
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 226566.29013456244,
"min": 148296.2012005081,
"max": 288932.1385805928,
"count": 200
},
"SoccerTwos.Step.mean": {
"value": 9999976.0,
"min": 8009970.0,
"max": 9999976.0,
"count": 200
},
"SoccerTwos.Step.sum": {
"value": 9999976.0,
"min": 8009970.0,
"max": 9999976.0,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": 0.07242073118686676,
"min": -0.16348804533481598,
"max": 0.13070540130138397,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": 10.573427200317383,
"min": -27.629480361938477,
"max": 19.082988739013672,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.07825343310832977,
"min": -0.16575385630130768,
"max": 0.131241574883461,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": 11.42500114440918,
"min": -28.012401580810547,
"max": 19.161270141601562,
"count": 200
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 200
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.16666301145945508,
"min": -0.40307586234191367,
"max": 0.28878254124096464,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 24.332799673080444,
"min": -58.446000039577484,
"max": 45.171999752521515,
"count": 200
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.16666301145945508,
"min": -0.40307586234191367,
"max": 0.28878254124096464,
"count": 200
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 24.332799673080444,
"min": -58.446000039577484,
"max": 45.171999752521515,
"count": 200
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 200
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 200
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.025021878300079455,
"min": 0.021023620530225648,
"max": 0.03315305429860018,
"count": 193
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.025021878300079455,
"min": 0.021023620530225648,
"max": 0.03315305429860018,
"count": 193
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.07110492245604595,
"min": 0.05825461180259784,
"max": 0.09087043926119805,
"count": 193
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.07110492245604595,
"min": 0.05825461180259784,
"max": 0.09087043926119805,
"count": 193
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.08191935482124488,
"min": 0.06437495543311039,
"max": 0.10171770788729191,
"count": 193
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.08191935482124488,
"min": 0.06437495543311039,
"max": 0.10171770788729191,
"count": 193
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.00010000000000000003,
"min": 0.00010000000000000003,
"max": 0.00010000000000000003,
"count": 193
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.00010000000000000003,
"min": 0.00010000000000000003,
"max": 0.00010000000000000003,
"count": 193
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.30000000000000004,
"min": 0.30000000000000004,
"max": 0.30000000000000004,
"count": 193
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.30000000000000004,
"min": 0.30000000000000004,
"max": 0.30000000000000004,
"count": 193
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.010000000000000002,
"min": 0.010000000000000002,
"max": 0.010000000000000002,
"count": 193
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.010000000000000002,
"min": 0.010000000000000002,
"max": 0.010000000000000002,
"count": 193
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1718883158",
"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn config/poca/SoccerTwos.yaml --env=training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.3.0+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1718888181"
},
"total": 5022.471962849,
"count": 1,
"self": 0.46395551200021146,
"children": {
"run_training.setup": {
"total": 0.05602131899996721,
"count": 1,
"self": 0.05602131899996721
},
"TrainerController.start_learning": {
"total": 5021.951986018,
"count": 1,
"self": 3.1320614599881083,
"children": {
"TrainerController._reset_env": {
"total": 3.3683689129991876,
"count": 11,
"self": 3.3683689129991876
},
"TrainerController.advance": {
"total": 5015.155259341012,
"count": 137247,
"self": 3.408958867018555,
"children": {
"env_step": {
"total": 3409.571973765003,
"count": 137247,
"self": 2592.642890049901,
"children": {
"SubprocessEnvManager._take_step": {
"total": 815.1041082270739,
"count": 137247,
"self": 20.74925583620177,
"children": {
"TorchPolicy.evaluate": {
"total": 794.3548523908721,
"count": 250996,
"self": 794.3548523908721
}
}
},
"workers": {
"total": 1.8249754880282012,
"count": 137247,
"self": 0.0,
"children": {
"worker_root": {
"total": 5013.951839441042,
"count": 137247,
"is_parallel": true,
"self": 2835.7990415421054,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.007442628000035256,
"count": 2,
"is_parallel": true,
"self": 0.004348741000001155,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0030938870000341012,
"count": 8,
"is_parallel": true,
"self": 0.0030938870000341012
}
}
},
"UnityEnvironment.step": {
"total": 0.038657415999978184,
"count": 1,
"is_parallel": true,
"self": 0.0011664620000146897,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0008400569999480467,
"count": 1,
"is_parallel": true,
"self": 0.0008400569999480467
},
"communicator.exchange": {
"total": 0.03322824299999638,
"count": 1,
"is_parallel": true,
"self": 0.03322824299999638
},
"steps_from_proto": {
"total": 0.0034226540000190653,
"count": 2,
"is_parallel": true,
"self": 0.0005984359999047228,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0028242180001143424,
"count": 8,
"is_parallel": true,
"self": 0.0028242180001143424
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 0.02078374899940627,
"count": 20,
"is_parallel": true,
"self": 0.00429572499774622,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.01648802400166005,
"count": 80,
"is_parallel": true,
"self": 0.01648802400166005
}
}
},
"UnityEnvironment.step": {
"total": 2178.132014149937,
"count": 137246,
"is_parallel": true,
"self": 137.4480117038629,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 91.87265370296143,
"count": 137246,
"is_parallel": true,
"self": 91.87265370296143
},
"communicator.exchange": {
"total": 1517.5340509910097,
"count": 137246,
"is_parallel": true,
"self": 1517.5340509910097
},
"steps_from_proto": {
"total": 431.27729775210275,
"count": 274492,
"is_parallel": true,
"self": 71.7870211804086,
"children": {
"_process_rank_one_or_two_observation": {
"total": 359.49027657169415,
"count": 1097968,
"is_parallel": true,
"self": 359.49027657169415
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1602.1743267089912,
"count": 137247,
"self": 24.812080927036504,
"children": {
"process_trajectory": {
"total": 455.18851799195363,
"count": 137247,
"self": 453.81507471995315,
"children": {
"RLTrainer._checkpoint": {
"total": 1.373443272000486,
"count": 4,
"self": 1.373443272000486
}
}
},
"_update_policy": {
"total": 1122.173727790001,
"count": 193,
"self": 609.1868159890051,
"children": {
"TorchPOCAOptimizer.update": {
"total": 512.9869118009959,
"count": 11580,
"self": 512.9869118009959
}
}
}
}
}
}
},
"trainer_threads": {
"total": 8.120005077216774e-07,
"count": 1,
"self": 8.120005077216774e-07
},
"TrainerController._save_models": {
"total": 0.2962954919994445,
"count": 1,
"self": 0.005442683999717701,
"children": {
"RLTrainer._checkpoint": {
"total": 0.2908528079997268,
"count": 1,
"self": 0.2908528079997268
}
}
}
}
}
}
}