ppo-Pyramids / run_logs /timers.json
MalyO2's picture
First Push
f177508 verified
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.1812715381383896,
"min": 0.1697080135345459,
"max": 1.6065279245376587,
"count": 200
},
"Pyramids.Policy.Entropy.sum": {
"value": 1864.9215087890625,
"min": 1685.9420166015625,
"max": 16450.845703125,
"count": 200
},
"Pyramids.Step.mean": {
"value": 1999988.0,
"min": 9984.0,
"max": 1999988.0,
"count": 200
},
"Pyramids.Step.sum": {
"value": 1999988.0,
"min": 9984.0,
"max": 1999988.0,
"count": 200
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.7763552069664001,
"min": -0.08807287365198135,
"max": 0.8628113269805908,
"count": 200
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 77.6355209350586,
"min": -7.045829772949219,
"max": 89.73237609863281,
"count": 200
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.12793628871440887,
"min": 0.1241626963019371,
"max": 3.223942279815674,
"count": 200
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 12.793628692626953,
"min": 11.833174705505371,
"max": 256.96441650390625,
"count": 200
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.07152327620079396,
"min": 0.05934585555951344,
"max": 0.08020872884755215,
"count": 200
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.14304655240158792,
"min": 0.05934585555951344,
"max": 0.1604174576951043,
"count": 200
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.016820931834262358,
"min": 0.0004981905462955183,
"max": 1.2856630093107622,
"count": 200
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.033641863668524716,
"min": 0.0004981905462955183,
"max": 1.2856630093107622,
"count": 200
},
"Pyramids.Policy.LearningRate.mean": {
"value": 8.469997176999891e-07,
"min": 8.469997176999891e-07,
"max": 0.0002987712004096,
"count": 200
},
"Pyramids.Policy.LearningRate.sum": {
"value": 1.6939994353999782e-06,
"min": 1.6939994353999782e-06,
"max": 0.0005687616104127999,
"count": 200
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10028230000000002,
"min": 0.10028230000000002,
"max": 0.19959039999999997,
"count": 200
},
"Pyramids.Policy.Epsilon.sum": {
"value": 0.20056460000000004,
"min": 0.10089415000000002,
"max": 0.3895872,
"count": 200
},
"Pyramids.Policy.Beta.mean": {
"value": 3.820176999999964e-05,
"min": 3.820176999999964e-05,
"max": 0.009959080960000002,
"count": 200
},
"Pyramids.Policy.Beta.sum": {
"value": 7.640353999999929e-05,
"min": 7.640353999999929e-05,
"max": 0.01895976128,
"count": 200
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.01132755633443594,
"min": 0.010952742770314217,
"max": 0.7967495918273926,
"count": 200
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.02265511266887188,
"min": 0.011068697087466717,
"max": 0.7967495918273926,
"count": 200
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 200
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 200
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 226.30434782608697,
"min": 210.06521739130434,
"max": 999.0,
"count": 196
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 10410.0,
"min": 406.0,
"max": 15984.0,
"count": 196
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.7759361599988126,
"min": -1.0000000521540642,
"max": 1.7878297776617902,
"count": 197
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 83.46899951994419,
"min": -16.000000834465027,
"max": 88.86559921503067,
"count": 197
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.7759361599988126,
"min": -1.0000000521540642,
"max": 1.7878297776617902,
"count": 197
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 83.46899951994419,
"min": -16.000000834465027,
"max": 88.86559921503067,
"count": 197
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.2671700805930936,
"min": 0.24556314122552672,
"max": 115.93597248196602,
"count": 197
},
"Pyramids.Policy.RndReward.sum": {
"value": 12.556993787875399,
"min": 3.919705420732498,
"max": 1854.9755597114563,
"count": 197
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1728489636",
"python_version": "3.10.12 (main, Sep 11 2024, 15:47:36) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training_4 --no-graphics",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.4.1+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1728495200"
},
"total": 5563.281154713,
"count": 1,
"self": 0.578380326000115,
"children": {
"run_training.setup": {
"total": 0.06315506800001458,
"count": 1,
"self": 0.06315506800001458
},
"TrainerController.start_learning": {
"total": 5562.639619319,
"count": 1,
"self": 3.658621601048253,
"children": {
"TrainerController._reset_env": {
"total": 2.3372126550002577,
"count": 1,
"self": 2.3372126550002577
},
"TrainerController.advance": {
"total": 5556.585015841953,
"count": 129381,
"self": 3.7074042090926014,
"children": {
"env_step": {
"total": 3966.0238739530296,
"count": 129381,
"self": 3736.5980412040853,
"children": {
"SubprocessEnvManager._take_step": {
"total": 227.22686251303276,
"count": 129381,
"self": 10.69970989295598,
"children": {
"TorchPolicy.evaluate": {
"total": 216.52715262007678,
"count": 125067,
"self": 216.52715262007678
}
}
},
"workers": {
"total": 2.1989702359114744,
"count": 129381,
"self": 0.0,
"children": {
"worker_root": {
"total": 5551.047635885227,
"count": 129381,
"is_parallel": true,
"self": 2103.7738006034288,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0028710380001939484,
"count": 1,
"is_parallel": true,
"self": 0.0008379179998883046,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0020331200003056438,
"count": 8,
"is_parallel": true,
"self": 0.0020331200003056438
}
}
},
"UnityEnvironment.step": {
"total": 0.08737620700048865,
"count": 1,
"is_parallel": true,
"self": 0.0008961279991126503,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0005002860007152776,
"count": 1,
"is_parallel": true,
"self": 0.0005002860007152776
},
"communicator.exchange": {
"total": 0.08327173799989396,
"count": 1,
"is_parallel": true,
"self": 0.08327173799989396
},
"steps_from_proto": {
"total": 0.0027080550007667625,
"count": 1,
"is_parallel": true,
"self": 0.00039993899918044917,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0023081160015863134,
"count": 8,
"is_parallel": true,
"self": 0.0023081160015863134
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 3447.273835281798,
"count": 129380,
"is_parallel": true,
"self": 81.91633728868419,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 53.13809518709877,
"count": 129380,
"is_parallel": true,
"self": 53.13809518709877
},
"communicator.exchange": {
"total": 3082.081615678245,
"count": 129380,
"is_parallel": true,
"self": 3082.081615678245
},
"steps_from_proto": {
"total": 230.13778712777003,
"count": 129380,
"is_parallel": true,
"self": 49.45365916853552,
"children": {
"_process_rank_one_or_two_observation": {
"total": 180.6841279592345,
"count": 1035040,
"is_parallel": true,
"self": 180.6841279592345
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1586.8537376798304,
"count": 129381,
"self": 6.444372039120935,
"children": {
"process_trajectory": {
"total": 284.3386811197315,
"count": 129381,
"self": 284.0804185877314,
"children": {
"RLTrainer._checkpoint": {
"total": 0.25826253200011706,
"count": 4,
"self": 0.25826253200011706
}
}
},
"_update_policy": {
"total": 1296.070684520978,
"count": 242,
"self": 663.0619838800121,
"children": {
"TorchPPOOptimizer.update": {
"total": 633.0087006409658,
"count": 46473,
"self": 633.0087006409658
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.0690000635804608e-06,
"count": 1,
"self": 1.0690000635804608e-06
},
"TrainerController._save_models": {
"total": 0.058768151999174734,
"count": 1,
"self": 0.0011314740004308987,
"children": {
"RLTrainer._checkpoint": {
"total": 0.057636677998743835,
"count": 1,
"self": 0.057636677998743835
}
}
}
}
}
}
}