More training
Browse files- README.md +1 -1
- config.json +1 -1
- ppo-LunarLander-v2.zip +2 -2
- ppo-LunarLander-v2/data +7 -7
- ppo-LunarLander-v2/policy.optimizer.pth +1 -1
- ppo-LunarLander-v2/policy.pth +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: LunarLander-v2
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value:
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
16 |
type: LunarLander-v2
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: 255.23 +/- 18.45
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. 
In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f7e4e423d90>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f7e4e423e20>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f7e4e423eb0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f7e4e423f40>", "_build": "<function ActorCriticPolicy._build at 0x7f7e4e42c040>", "forward": "<function ActorCriticPolicy.forward at 0x7f7e4e42c0d0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f7e4e42c160>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f7e4e42c1f0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f7e4e42c280>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f7e4e42c310>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f7e4e42c3a0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f7e4e42c430>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f7e4e430180>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 16384, "_total_timesteps": 1000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, 
"start_time": 1698854986099566860, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAK3xLj5xfi08vK7MvZmdCTwlAJU93Y4BvQAAAAAAAAAAmm5OvQcwlD/KOWu9GaJDv5TwhL7STA++AAAAAAAAAAA6BFc+/R9JP/nIFz+c5H6/VYiCvltCbb4AAAAAAAAAAA1CAD+dios/zto6PzWLUL9GpIO9phOSPAAAAAAAAAAAKruTPukKyD9eVkc/t6MBvhcdIL4ySdu9AAAAAAAAAACaI3a8e6W2PwwKQb98ZK8+FRd8PAXTBz4AAAAAAAAAAG3N5z4iPqo/uQgdP+0+Fr+3L9+9cW6ZvAAAAAAAAAAAjRl2PgMMRz+rJx8/1HaHv+bvX7/cDLS+AAAAAAAAAADtcBM+kxiwPw6+6z4Z5LS+OxppvgeWSL0AAAAAAAAAAH2urT721lI/fxkHP3D5a78+hZA8/bAZPgAAAAAAAAAANs57vn23Ij+rhDG/Vi+Tv8ePBD9qQr0+AAAAAAAAAABmXaY90K2EPsR3L72sQ7W/GUWPPmsPTrwAAAAAAAAAAGbxXL0eCsM/u+MoviA5mr5k8IM+MgFoPgAAAAAAAAAA3jQdv98hpT9LgG+/iywRv+thqj7qP5Q9AAAAAAAAAADNrJ+8ve2qP16lsL59ViC/pJwoPQ9DQj4AAAAAAAAAADMPGbyHIsE/YpjRvYFfmT4AFeA8YQOEPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -15.384, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": 
"gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwGd9MiKR+0CMAWyUS0qMAXSUR0BKNRNATqSpdX2UKGgGR8B0qowBYFJQaAdLXWgIR0BKNwkxASnMdX2UKGgGR8B6LghJRO1waAdLXmgIR0BKOLjYI0IkdX2UKGgGR8Btcxhz/6wdaAdLdmgIR0BKQUIcBEKFdX2UKGgGR8B3JhxiobXIaAdLXmgIR0BKR9szl90BdX2UKGgGR8Bgt53kgfU4aAdLW2gIR0BKScHnlnyvdX2UKGgGR8BXjnhOxjaxaAdLTWgIR0BKTOb7TDwZdX2UKGgGR8BXhVOO801qaAdLRWgIR0BKTQCjk+5fdX2UKGgGR8BXTO+/QBxQaAdLZGgIR0BKUKf4AS39dX2UKGgGR8Bgp6J40Mw2aAdLeGgIR0BKUUMXrMTwdX2UKGgGR8BdjMIeHSF5aAdLS2gIR0BKVQs5GSZCdX2UKGgGR8B22N6w+t8vaAdLYmgIR0BKVxdyDIzWdX2UKGgGR8BgLjM/yGzsaAdLU2gIR0BKWUXP7el9dX2UKGgGR8BT51h5Pdl/aAdLUGgIR0BKXMmv4dp7dX2UKGgGR8BxGqFAVwglaAdLV2gIR0BKYTcynDR/dX2UKGgGR8BuJEAFPi1iaAdLVmgIR0BKZfzJ6po9dX2UKGgGR8B09z/io86naAdLfWgIR0BKZcQyyleodX2UKGgGR8BYSUfPomojaAdLO2gIR0BKaL56+nIidX2UKGgGR8BS82gam4y5aAdLR2gIR0BKaH2qT8pDdX2UKGgGR8B3lNXwLE1maAdLX2gIR0BKbEBbOeJ6dX2UKGgGR8BRlOqvNeMRaAdLdGgIR0BKc+UyHmA9dX2UKGgGR8BYe1Z1V5ryaAdLOGgIR0BKfmax5cC6dX2UKGgGR8BmoOZG8VYZaAdLX2gIR0BKgEB8x9G7dX2UKGgGR8B58n8UEgW8aAdLVWgIR0BKgu3UhFEzdX2UKGgGR8Be/zI/7iyZaAdLYGgIR0BKhIXCTEBKdX2UKGgGR8AKwFLWZqmCaAdLbGgIR0BKhFCswL3LdX2UKGgGR8BgL3D7655JaAdLaGgIR0BKhUAksz2wdX2UKGgGR8BqWkSsbNr1aAdLYWgIR0BKhbx3FDOUdX2UKGgGR8BQ1ZJXhfjTaAdLQGgIR0BKifOdGy5adX2UKGgGR8Bgo2A9V3lkaAdLY2gIR0BKjCUPhAGCdX2UKGgGR8BfzyjpLVWkaAdLUGgIR0BKj6naWX1KdX2UKGgGR8BsOpPCVKPGaAdLZGgIR0BKkhzmwJPZdX2UKGgGR8Bv15KJ2t+1aAdLS2gIR0BKk49xIatLdX2UKGgGR8Bgs8C5mRNiaAdLcWgIR0BKlXYcvM8pdX2UKGgGR8B0/3/YJ3PiaAdLZ2gIR0BKmvhhpg1FdX2UKGgGR8Bo3ckB0ZFYaAdLamgIR0BKn7noxHoYdX2UKGgGR8B6L4b0e2d/aAdLYWgIR0BKppb2USqVdX2UKGgGR8BioC+UQkHEaAdLTmgIR0BKqMGorFwUdX2UKGgGR8BgTJkbxVhkaAdLSGgIR0BKqk+5e7cxdX2UKGgGR8B5fOaEzwc6aAdLX2gIR0BKr8OskpqidX2UKGgGR8BYWz2exwAEaAdLSGgIR0BKsY3m3fALdX2UKGgGR8BqeuqaPS2IaAdLS2gIR0BKsQTufEn9dX2UKGgGR8B5Ogl2NedDaAdLXGgIR0BKtVFH8TBZdX2UKGgGR8Bh7D5ZbILgaAdLcWgIR0BKvjc2zfJndX2UKGgGR8B1X1jnV5KOaAdLcmgIR0BKv987ZFoddX2UKGgGR8BgplQuVX3haAdLemgIR0BKxITwlSjydX2UKGgGR8BydT15B1LbaAdLZWgIR0BKxQl0HQhPdX2UKGgGR8B2TyZLIxQBaAdLWWgIR0BKxJE6T4cndX2UKGgGR8BsQYv
i97F9aAdLd2gIR0BK0IfCAMDwdX2UKGgGR8BfWAVCXyAhaAdLZWgIR0BK0I4uK4x2dX2UKGgGR8BCVtgrpaA4aAdLSmgIR0BK0X05EMLGdX2UKGgGR8BpycutfXwtaAdLZ2gIR0BK1lVktmL+dX2UKGgGR8B7YjPu5SWJaAdLW2gIR0BK1rWI42jxdX2UKGgGR8BbNDdcjZ+QaAdLh2gIR0BK2nvlU6xPdX2UKGgGR8BkCnezlcQiaAdLSWgIR0BK2+NT987ZdX2UKGgGR8Bk+Q91U2k0aAdLQWgIR0BK4AjQiRnwdX2UKGgGR8BVl2ZqmCRPaAdLO2gIR0BK5Cz1K5CodX2UKGgGR8BwNUry1/lRaAdLb2gIR0BK7JQcghbGdX2UKGgGR8BhYneLvTgEaAdLVmgIR0BK7iHIp6QedX2UKGgGR8B20MDfWMCLaAdLgmgIR0BK7prk8zRAdX2UKGgGR8BN6SAYpDu0aAdLTWgIR0BK7qOT7l7udX2UKGgGR8BVc2P1ct5EaAdLd2gIR0BK8aKtPpIMdX2UKGgGR8Ba0y+lCTllaAdLemgIR0BK8aSTyJ9BdX2UKGgGR8CACK3lS0jUaAdLZ2gIR0BK+s7+1jRVdX2UKGgGR8BwudppN9H+aAdLU2gIR0BK/L8R+SbIdX2UKGgGR8BZ9UFKTSssaAdLaGgIR0BLB49HMEA6dX2UKGgGR8B1USsXBP9DaAdLYWgIR0BLCZyuIRAbdX2UKGgGR8B5FLypaRp2aAdLWGgIR0BLCpD3M6ikdX2UKGgGR8BlCKeCkGiYaAdLVGgIR0BLDLjYI0IkdX2UKGgGR8B0mdJL/S6UaAdLaGgIR0BLDZZ8rqdIdX2UKGgGR8BheJ+YtxuLaAdLQ2gIR0BLELsrupjudX2UKGgGR8BAF7N8ma6SaAdLXGgIR0BLFC+lCTlldX2UKGgGR8BybxFG5MDfaAdLT2gIR0BLF2U0Nz8xdX2UKGgGR8BqssZYPoV3aAdLUGgIR0BLGAMDwH7hdX2UKGgGR8BcxVHJ9y93aAdLTmgIR0BLGfBnBciXdX2UKGgGR8BRy3IU8FINaAdLOmgIR0BLGYyfthNNdX2UKGgGR8BfBYMz/IbPaAdLXmgIR0BLHVT72tdSdX2UKGgGR8BfktFfAsTWaAdLkmgIR0BLHqGUOd5IdX2UKGgGR8Bz0WglF+d9aAdLhmgIR0BLIRgJC0F9dX2UKGgGR8ByO58CxNZeaAdLZWgIR0BLJTN2TxG2dX2UKGgGR8Bfs3vUjLSvaAdLTmgIR0BLL/029+PSdX2UKGgGR8BbzCBGx2SuaAdLUWgIR0BLM6ZH/cWTdX2UKGgGR8Bfu2bXpW3jaAdLb2gIR0BLNrl3hXKbdX2UKGgGR8B00IOoYNy6aAdLSGgIR0BLP2OhkAggdX2UKGgGR8Bs5WzIFNcoaAdLQmgIR0BLQdR77bcodX2UKGgGR8BbfxUFSsKcaAdLUWgIR0BLQvn8sMAndX2UKGgGR8BS02vW6K+BaAdLVGgIR0BLRBBiTdLydX2UKGgGR8BKC8UuctoSaAdLSWgIR0BLRHkT6BRRdX2UKGgGR8BozdIsiB5HaAdLaGgIR0BLR/zSThYOdX2UKGgGR8BvyadlNDc/aAdLdGgIR0BLSEleF+NMdX2UKGgGR8BmSI3FUADJaAdLfmgIR0BLUHY6GQCCdX2UKGgGR8Bt6aDEm6XjaAdLdGgIR0BLUZ9NN8E3dX2UKGgGR8B9pXiS7oStaAdLYWgIR0BLVQBYFJQMdX2UKGgGR8BWvaoqCpWFaAdLOWgIR0BLVbYbsF+vdX2UKGgGR8BvIRCa7VawaAdLdWgIR0BLWAb6xgRcdX2UKGgGR8Bps5RAKOT8aAdLRWgIR0BLWUN8VpK0dX2UKGgGR8B19MpgCwKTaAdLaGgIR0BLXa9CeEqUdX2UKGgGR8BjLccQyylfaAdLTGgIR0BLaP0I1LrYdX2UKGgGR8BjjCC
QLeANaAdLQWgIR0BLa8jZ+QU6dX2UKGgGR8BUBZkK/mDEaAdLUGgIR0BLboZQ53kgdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 4, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. 
]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.120+-x86_64-with-glibc2.35 # 1 SMP Wed Aug 30 11:19:59 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.1.0+cu118", "GPU Enabled": "True", "Numpy": "1.23.5", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
|
|
1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. 
In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f7e4e423d90>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f7e4e423e20>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f7e4e423eb0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f7e4e423f40>", "_build": "<function ActorCriticPolicy._build at 0x7f7e4e42c040>", "forward": "<function ActorCriticPolicy.forward at 0x7f7e4e42c0d0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f7e4e42c160>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f7e4e42c1f0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f7e4e42c280>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f7e4e42c310>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f7e4e42c3a0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f7e4e42c430>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f7e4e430180>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": 
null, "start_time": 1698856094310016398, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAM2C5T3On7I/DVKvPhadq76xT9Q99IU0PgAAAAAAAAAAQF8KPhaH8D75aEC+wyuBvteSmL3rT4C9AAAAAAAAAAAABB09WiauPw9OBT9V3sK+SP08vK/Gjz0AAAAAAAAAAJq9IT3DvTQ7Tk1nvk7HKr7Y72m855sTvgAAAAAAAAAAGrcqPZoUsz/Dl0s+su2OvkGdOz2wCpg9AAAAAAAAAACzPBe+I3EPP5e/jD0SAJm+fg0nvcp2ubgAAAAAAAAAADOvhTv9XVw/+78RvYEYbb7W3x+9tk/PvAAAAAAAAAAAZoiJPYWPuD8NQv0+6ZRcvYvAsrohv7A9AAAAAAAAAACam3K8w/1AuoVYIDNBe5irJXK4ux65zbMAAIA/AACAP+aMRT2u5Yu6HuFkMzSiAbDPldo6xnC/swAAgD8AAIA/M88fvB9TwrtqRbq8nF6KPYBaKL3tpww8AACAPwAAgD96Nz4+TCIMP/3yJ73z/pq+uWtDPa48mr0AAAAAAAAAAJodhT6Sumw/SWi9PFLhpb5SGRw+kPY0vgAAAAAAAAAAmrkxu+FAJT6q69y9yqYQvhTYmb0TMH47AAAAAAAAAACDD1q+16E/P6vUVj6WzZu+qsf8vMVZ7bsAAAAAAAAAAM2f0r1vqys/opQsPsJunL4+raI8ohIBvQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": 
"gAWVNwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHAY3Gff4yqMAWyUTTYBjAF0lEdAoqGHECNjsnV9lChoBkdAbEJk6Lfk3mgHTS4BaAhHQKKhuT101ZV1fZQoaAZHQHCqJ5Z8rqdoB001AWgIR0CiolG7J4jbdX2UKGgGR0BwnHBCUornaAdNSwFoCEdAoqJoPf8/EHV9lChoBkdAcHCFyq+8G2gHTR8BaAhHQKKil8CxNZh1fZQoaAZHQHHWwkHD765oB006AWgIR0CiorWS2Yv4dX2UKGgGR0BueeOS4e90aAdNXAFoCEdAoqMMtAcDKnV9lChoBkdAb9xqXWvr4WgHTR4BaAhHQKKjYqABkqd1fZQoaAZHQEhdLpRoAXFoB0vpaAhHQKKj3l05lvt1fZQoaAZHQG4czpPhybRoB00rAWgIR0CipAona37UdX2UKGgGR0Bt9l/nW8RMaAdNKQFoCEdAoqQk1O0sv3V9lChoBkdAcLmgZjx0+2gHTRABaAhHQKKlkVbA1vV1fZQoaAZHQHGsj4593KVoB009AWgIR0Cipf3FUADJdX2UKGgGR0BxUrfsNUfgaAdNcAFoCEdAoqY99hJAdHV9lChoBkdASjzxG2Cul2gHS9toCEdAoqZj6SDAanV9lChoBkdAcQoTPjXFtWgHTRgBaAhHQKKmdcfvF3p1fZQoaAZHQDPWnbZezD5oB00BAWgIR0CipqUrsjVydX2UKGgGR0BwfuU7jkuIaAdNPQFoCEdAoqbSPU8V6HV9lChoBkdAbGJ2L5ylvmgHTT0BaAhHQKKm5zH0btJ1fZQoaAZHQHJAHT3IuGtoB01XAWgIR0CipvDyOJcgdX2UKGgGR0BwJ7r2QGOdaAdNEgFoCEdAoqcBSLqD9XV9lChoBkdAa8+MCtA9m2gHTTIBaAhHQKKnnrXUYsN1fZQoaAZHQHBUjqKP4mFoB00gAWgIR0CiqBsH8jzJdX2UKGgGR0Bv83ttygf2aAdNNgFoCEdAoqgc3hn8K3V9lChoBkdAcQrUW2w3YWgHTRcBaAhHQKKoeV2zOX51fZQoaAZHQHEIu/xlQMxoB00PAWgIR0CiqJdrXUYsdX2UKGgGR0BwidTho/RmaAdNQwFoCEdAoqlADq4YrXV9lChoBkdAbPLtlZowmGgHTTQBaAhHQKKqpJq7Acl1fZQoaAZHQHJ4Ey+HrQhoB00KAWgIR0Ciq18hLXcydX2UKGgGR0BveIizLOiWaAdNHwFoCEdAoquFU0elsXV9lChoBkdAcBh6PbO/tmgHTU4BaAhHQKKr8fcN6Pd1fZQoaAZHQG/OTMRpUPxoB00nAWgIR0CirBndO6/ZdX2UKGgGR0Bv1XqVyFPBaAdNIQFoCEdAoqwg/u9eyHV9lChoBkdAclighKUVz2gHTT0BaAhHQKKsIgkC3gF1fZQoaAZHQHKCB/EwWWRoB01ZAWgIR0CirLK6nR9gdX2UKGgGR0BtOEIC2c8UaAdNYgFoCEdAoqy40IkZ8HV9lChoBkdAQlsPQOWjXWgHS9ZoCEdAoq0RXCCSR3V9lChoBkdAcPXE2pAD72gHTUkBaAhHQKKtLkHUtqZ1fZQoaAZHQHE2iwGGEf1oB00AAWgIR0CirUOQ6p5vdX2UKGgGR0BHUFgtvn8saAdNAQFoCEdAoq1LxLCemXV9lChoBkdAb28DnvDxb2gHTSQBaAhHQKKtUUA1ejV1fZQoaAZHQHGycCYCyQhoB00vAWgIR0Cirn7MX7+DdX2UKGgGR0BwgQVEd/8VaAdNFgFoCEdAorn+dupCKXV9lChoBkdAcYEqiGnGbWgHTRcBaAhHQKK7upYLb6B1fZQoaAZHQHKu5ydWhh9oB00TAWgIR0CivARG2CumdX2UKGgGR0ByxMV6/qPfaAdNSAFoCEdAorws7dSEUXV9lChoBkdAb+sqaw2VFGgHTTUBaAhHQKK8bPD
YRNB1fZQoaAZHQG21zdcjZ+RoB00iAWgIR0CivGwtapxWdX2UKGgGR0BwmOpAD7qIaAdNJQFoCEdAorx/IZIg/3V9lChoBkdAcAPSGrS3LGgHTQcBaAhHQKK8pzundft1fZQoaAZHQHIy83IdU85oB00hAWgIR0CivNSNOuaGdX2UKGgGR0BySKdRR/EwaAdNHQFoCEdAor0sZvUBn3V9lChoBkdAb8OsvqTr3WgHTTsBaAhHQKK9R3vhIe51fZQoaAZHQHIQ5xm03OxoB01jAWgIR0CivYFKTSssdX2UKGgGR0BvmpRwZOzqaAdNRwFoCEdAor3U3wTdtXV9lChoBkdAcxT+pfhMrWgHTVkBaAhHQKK+AaCL/CJ1fZQoaAZHQHEXtvjwQUZoB01TAWgIR0CivgQe/5+IdX2UKGgGR0BqZmdkJ8fFaAdNGgFoCEdAor4p6MR6GHV9lChoBkdAbuQ34sVclmgHTREBaAhHQKK+ZMrVe8h1fZQoaAZHQHM9Uc81XNloB00JAWgIR0Civ8GlQ/HHdX2UKGgGR0BwneZ1FH8TaAdNJwFoCEdAosCfLV4HHHV9lChoBkdAbOD8uSOinGgHS/FoCEdAosDVxffGdnV9lChoBkdAc2fttQ9A5mgHTQYBaAhHQKLA3ArQPZt1fZQoaAZHQG7RoOQQtjFoB008AWgIR0CiwTzUZvUCdX2UKGgGR0Bu5k01qFh5aAdNKAFoCEdAosFZCIDYAnV9lChoBkdAbR2EA5q/NGgHTTYBaAhHQKLBdGqgh8p1fZQoaAZHQG95qCpWFOBoB009AWgIR0CiwYRsEaESdX2UKGgGR0Bytib7TDwZaAdNQgFoCEdAosGXcafjCHV9lChoBkdAIH4E4ecQRWgHS/1oCEdAosHg8r7O3XV9lChoBkdAcE62WIGhVWgHTRYBaAhHQKLB7UNKAax1fZQoaAZHQHDFh9b5dnloB00GAWgIR0Ciwi5DzAerdX2UKGgGR0BwEfrZ8KG+aAdNOAFoCEdAosIw/cFhX3V9lChoBkdAcP8za9K28mgHTRcBaAhHQKLCjNu+AVh1fZQoaAZHQHGMhBu4wytoB002AWgIR0CiwsoRAbADdX2UKGgGR0BBOW+GoJiRaAdLuGgIR0Ciw30HIIWydX2UKGgGR0BywJOYYzi0aAdNRQFoCEdAosN8G5c1O3V9lChoBkdAUROt7rs0HmgHS5toCEdAosOQakyk9HV9lChoBkdAcKv6a9bosGgHTQYBaAhHQKLD9pr1uix1fZQoaAZHQE9gFsYVIqdoB0vMaAhHQKLFUVRk3CN1fZQoaAZHQHGfl5KODJ5oB0v3aAhHQKLFXOk+HJt1fZQoaAZHQG92BwVCXyBoB00cAWgIR0CixWJ8WsRydX2UKGgGR0BtJv446wMZaAdNLQFoCEdAosYLdWQwK3V9lChoBkdAcMBh3aBZp2gHTUEBaAhHQKLGEtWdVed1fZQoaAZHQG7NK/EfkmxoB00iAWgIR0CixhgaFVT8dX2UKGgGR0BuwhuyeI2waAdNMAFoCEdAosZB0wJw9HV9lChoBkdAcF7RujynUGgHTRsBaAhHQKLGYzfJmul1fZQoaAZHQHJPBJAdGRVoB000AWgIR0CixqwiRnvldX2UKGgGR0BxVrj3mFJyaAdNEAFoCEdAosbf0se4kXV9lChoBkdAcjA79ycTamgHTUIBaAhHQKLHLTZxrBV1fZQoaAZHQHJoPx+az/poB00LAWgIR0Cix8VCXyAhdX2UKGgGR0Buvn6CUX54aAdNMAFoCEdAoshrIBBAwHV9lChoBkdATp0qWkadc2gHS6VoCEdAoshxEKE39HV9lChoBkdAcRq22G7Bf2gHTW4BaAhHQKLIi/fwZwZ1fZQoaAZHQG+wZZ0Syt5oB01AAWgIR0CiyJOtnwocdX2UKGgGR0BxGWza9K28aAdNNQFoCEdAosjhFy7wrnV9lChoBkdAcuKbGFSKnGg
HS+9oCEdAosj9/J/5L3V9lChoBkdAceB2criEQGgHS/RoCEdAosmozzmOl3V9lChoBkdAcafkRSP2f2gHTSIBaAhHQKLJyswL3K11fZQoaAZHQDaj+AEt/WloB0vwaAhHQKLJ5f2K2rp1fZQoaAZHQG9h5N47ihpoB00LAWgIR0CiygadMCcPdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 252, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. 
]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.120+-x86_64-with-glibc2.35 # 1 SMP Wed Aug 30 11:19:59 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.1.0+cu118", "GPU Enabled": "True", "Numpy": "1.23.5", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
ppo-LunarLander-v2.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b724ee9314594546de569a34851aa03f325eaa91bf518df74f0e2f8a9d33339
|
3 |
+
size 148038
|
ppo-LunarLander-v2/data
CHANGED
@@ -21,17 +21,17 @@
|
|
21 |
},
|
22 |
"verbose": 1,
|
23 |
"policy_kwargs": {},
|
24 |
-
"num_timesteps":
|
25 |
-
"_total_timesteps":
|
26 |
"_num_timesteps_at_start": 0,
|
27 |
"seed": null,
|
28 |
"action_noise": null,
|
29 |
-
"start_time":
|
30 |
"learning_rate": 0.0003,
|
31 |
"tensorboard_log": null,
|
32 |
"_last_obs": {
|
33 |
":type:": "<class 'numpy.ndarray'>",
|
34 |
-
":serialized:": "
|
35 |
},
|
36 |
"_last_episode_starts": {
|
37 |
":type:": "<class 'numpy.ndarray'>",
|
@@ -41,17 +41,17 @@
|
|
41 |
"_episode_num": 0,
|
42 |
"use_sde": false,
|
43 |
"sde_sample_freq": -1,
|
44 |
-
"_current_progress_remaining": -
|
45 |
"_stats_window_size": 100,
|
46 |
"ep_info_buffer": {
|
47 |
":type:": "<class 'collections.deque'>",
|
48 |
-
":serialized:": "
|
49 |
},
|
50 |
"ep_success_buffer": {
|
51 |
":type:": "<class 'collections.deque'>",
|
52 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
53 |
},
|
54 |
-
"_n_updates":
|
55 |
"observation_space": {
|
56 |
":type:": "<class 'gymnasium.spaces.box.Box'>",
|
57 |
":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
|
|
|
21 |
},
|
22 |
"verbose": 1,
|
23 |
"policy_kwargs": {},
|
24 |
+
"num_timesteps": 1015808,
|
25 |
+
"_total_timesteps": 1000000,
|
26 |
"_num_timesteps_at_start": 0,
|
27 |
"seed": null,
|
28 |
"action_noise": null,
|
29 |
+
"start_time": 1698856094310016398,
|
30 |
"learning_rate": 0.0003,
|
31 |
"tensorboard_log": null,
|
32 |
"_last_obs": {
|
33 |
":type:": "<class 'numpy.ndarray'>",
|
34 |
+
":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAM2C5T3On7I/DVKvPhadq76xT9Q99IU0PgAAAAAAAAAAQF8KPhaH8D75aEC+wyuBvteSmL3rT4C9AAAAAAAAAAAABB09WiauPw9OBT9V3sK+SP08vK/Gjz0AAAAAAAAAAJq9IT3DvTQ7Tk1nvk7HKr7Y72m855sTvgAAAAAAAAAAGrcqPZoUsz/Dl0s+su2OvkGdOz2wCpg9AAAAAAAAAACzPBe+I3EPP5e/jD0SAJm+fg0nvcp2ubgAAAAAAAAAADOvhTv9XVw/+78RvYEYbb7W3x+9tk/PvAAAAAAAAAAAZoiJPYWPuD8NQv0+6ZRcvYvAsrohv7A9AAAAAAAAAACam3K8w/1AuoVYIDNBe5irJXK4ux65zbMAAIA/AACAP+aMRT2u5Yu6HuFkMzSiAbDPldo6xnC/swAAgD8AAIA/M88fvB9TwrtqRbq8nF6KPYBaKL3tpww8AACAPwAAgD96Nz4+TCIMP/3yJ73z/pq+uWtDPa48mr0AAAAAAAAAAJodhT6Sumw/SWi9PFLhpb5SGRw+kPY0vgAAAAAAAAAAmrkxu+FAJT6q69y9yqYQvhTYmb0TMH47AAAAAAAAAACDD1q+16E/P6vUVj6WzZu+qsf8vMVZ7bsAAAAAAAAAAM2f0r1vqys/opQsPsJunL4+raI8ohIBvQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
|
35 |
},
|
36 |
"_last_episode_starts": {
|
37 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
41 |
"_episode_num": 0,
|
42 |
"use_sde": false,
|
43 |
"sde_sample_freq": -1,
|
44 |
+
"_current_progress_remaining": -0.015808000000000044,
|
45 |
"_stats_window_size": 100,
|
46 |
"ep_info_buffer": {
|
47 |
":type:": "<class 'collections.deque'>",
|
48 |
+
":serialized:": "gAWVNwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHAY3Gff4yqMAWyUTTYBjAF0lEdAoqGHECNjsnV9lChoBkdAbEJk6Lfk3mgHTS4BaAhHQKKhuT101ZV1fZQoaAZHQHCqJ5Z8rqdoB001AWgIR0CiolG7J4jbdX2UKGgGR0BwnHBCUornaAdNSwFoCEdAoqJoPf8/EHV9lChoBkdAcHCFyq+8G2gHTR8BaAhHQKKil8CxNZh1fZQoaAZHQHHWwkHD765oB006AWgIR0CiorWS2Yv4dX2UKGgGR0BueeOS4e90aAdNXAFoCEdAoqMMtAcDKnV9lChoBkdAb9xqXWvr4WgHTR4BaAhHQKKjYqABkqd1fZQoaAZHQEhdLpRoAXFoB0vpaAhHQKKj3l05lvt1fZQoaAZHQG4czpPhybRoB00rAWgIR0CipAona37UdX2UKGgGR0Bt9l/nW8RMaAdNKQFoCEdAoqQk1O0sv3V9lChoBkdAcLmgZjx0+2gHTRABaAhHQKKlkVbA1vV1fZQoaAZHQHGsj4593KVoB009AWgIR0Cipf3FUADJdX2UKGgGR0BxUrfsNUfgaAdNcAFoCEdAoqY99hJAdHV9lChoBkdASjzxG2Cul2gHS9toCEdAoqZj6SDAanV9lChoBkdAcQoTPjXFtWgHTRgBaAhHQKKmdcfvF3p1fZQoaAZHQDPWnbZezD5oB00BAWgIR0CipqUrsjVydX2UKGgGR0BwfuU7jkuIaAdNPQFoCEdAoqbSPU8V6HV9lChoBkdAbGJ2L5ylvmgHTT0BaAhHQKKm5zH0btJ1fZQoaAZHQHJAHT3IuGtoB01XAWgIR0CipvDyOJcgdX2UKGgGR0BwJ7r2QGOdaAdNEgFoCEdAoqcBSLqD9XV9lChoBkdAa8+MCtA9m2gHTTIBaAhHQKKnnrXUYsN1fZQoaAZHQHBUjqKP4mFoB00gAWgIR0CiqBsH8jzJdX2UKGgGR0Bv83ttygf2aAdNNgFoCEdAoqgc3hn8K3V9lChoBkdAcQrUW2w3YWgHTRcBaAhHQKKoeV2zOX51fZQoaAZHQHEIu/xlQMxoB00PAWgIR0CiqJdrXUYsdX2UKGgGR0BwidTho/RmaAdNQwFoCEdAoqlADq4YrXV9lChoBkdAbPLtlZowmGgHTTQBaAhHQKKqpJq7Acl1fZQoaAZHQHJ4Ey+HrQhoB00KAWgIR0Ciq18hLXcydX2UKGgGR0BveIizLOiWaAdNHwFoCEdAoquFU0elsXV9lChoBkdAcBh6PbO/tmgHTU4BaAhHQKKr8fcN6Pd1fZQoaAZHQG/OTMRpUPxoB00nAWgIR0CirBndO6/ZdX2UKGgGR0Bv1XqVyFPBaAdNIQFoCEdAoqwg/u9eyHV9lChoBkdAclighKUVz2gHTT0BaAhHQKKsIgkC3gF1fZQoaAZHQHKCB/EwWWRoB01ZAWgIR0CirLK6nR9gdX2UKGgGR0BtOEIC2c8UaAdNYgFoCEdAoqy40IkZ8HV9lChoBkdAQlsPQOWjXWgHS9ZoCEdAoq0RXCCSR3V9lChoBkdAcPXE2pAD72gHTUkBaAhHQKKtLkHUtqZ1fZQoaAZHQHE2iwGGEf1oB00AAWgIR0CirUOQ6p5vdX2UKGgGR0BHUFgtvn8saAdNAQFoCEdAoq1LxLCemXV9lChoBkdAb28DnvDxb2gHTSQBaAhHQKKtUUA1ejV1fZQoaAZHQHGycCYCyQhoB00vAWgIR0Cirn7MX7+DdX2UKGgGR0BwgQVEd/8VaAdNFgFoCEdAorn+dupCKXV9lChoBkdAcYEqiGnGbWgHTRcBaAhHQKK7upYLb6B1fZQoaAZHQHKu5ydWhh9oB00TAWgIR0CivARG2CumdX2UKGgGR0ByxMV6/qPfaAdNSAFoCEdAorws7dSEUXV9lChoBkdAb+sqaw2VFGg
HTTUBaAhHQKK8bPDYRNB1fZQoaAZHQG21zdcjZ+RoB00iAWgIR0CivGwtapxWdX2UKGgGR0BwmOpAD7qIaAdNJQFoCEdAorx/IZIg/3V9lChoBkdAcAPSGrS3LGgHTQcBaAhHQKK8pzundft1fZQoaAZHQHIy83IdU85oB00hAWgIR0CivNSNOuaGdX2UKGgGR0BySKdRR/EwaAdNHQFoCEdAor0sZvUBn3V9lChoBkdAb8OsvqTr3WgHTTsBaAhHQKK9R3vhIe51fZQoaAZHQHIQ5xm03OxoB01jAWgIR0CivYFKTSssdX2UKGgGR0BvmpRwZOzqaAdNRwFoCEdAor3U3wTdtXV9lChoBkdAcxT+pfhMrWgHTVkBaAhHQKK+AaCL/CJ1fZQoaAZHQHEXtvjwQUZoB01TAWgIR0CivgQe/5+IdX2UKGgGR0BqZmdkJ8fFaAdNGgFoCEdAor4p6MR6GHV9lChoBkdAbuQ34sVclmgHTREBaAhHQKK+ZMrVe8h1fZQoaAZHQHM9Uc81XNloB00JAWgIR0Civ8GlQ/HHdX2UKGgGR0BwneZ1FH8TaAdNJwFoCEdAosCfLV4HHHV9lChoBkdAbOD8uSOinGgHS/FoCEdAosDVxffGdnV9lChoBkdAc2fttQ9A5mgHTQYBaAhHQKLA3ArQPZt1fZQoaAZHQG7RoOQQtjFoB008AWgIR0CiwTzUZvUCdX2UKGgGR0Bu5k01qFh5aAdNKAFoCEdAosFZCIDYAnV9lChoBkdAbR2EA5q/NGgHTTYBaAhHQKLBdGqgh8p1fZQoaAZHQG95qCpWFOBoB009AWgIR0CiwYRsEaESdX2UKGgGR0Bytib7TDwZaAdNQgFoCEdAosGXcafjCHV9lChoBkdAIH4E4ecQRWgHS/1oCEdAosHg8r7O3XV9lChoBkdAcE62WIGhVWgHTRYBaAhHQKLB7UNKAax1fZQoaAZHQHDFh9b5dnloB00GAWgIR0Ciwi5DzAerdX2UKGgGR0BwEfrZ8KG+aAdNOAFoCEdAosIw/cFhX3V9lChoBkdAcP8za9K28mgHTRcBaAhHQKLCjNu+AVh1fZQoaAZHQHGMhBu4wytoB002AWgIR0CiwsoRAbADdX2UKGgGR0BBOW+GoJiRaAdLuGgIR0Ciw30HIIWydX2UKGgGR0BywJOYYzi0aAdNRQFoCEdAosN8G5c1O3V9lChoBkdAUROt7rs0HmgHS5toCEdAosOQakyk9HV9lChoBkdAcKv6a9bosGgHTQYBaAhHQKLD9pr1uix1fZQoaAZHQE9gFsYVIqdoB0vMaAhHQKLFUVRk3CN1fZQoaAZHQHGfl5KODJ5oB0v3aAhHQKLFXOk+HJt1fZQoaAZHQG92BwVCXyBoB00cAWgIR0CixWJ8WsRydX2UKGgGR0BtJv446wMZaAdNLQFoCEdAosYLdWQwK3V9lChoBkdAcMBh3aBZp2gHTUEBaAhHQKLGEtWdVed1fZQoaAZHQG7NK/EfkmxoB00iAWgIR0CixhgaFVT8dX2UKGgGR0BuwhuyeI2waAdNMAFoCEdAosZB0wJw9HV9lChoBkdAcF7RujynUGgHTRsBaAhHQKLGYzfJmul1fZQoaAZHQHJPBJAdGRVoB000AWgIR0CixqwiRnvldX2UKGgGR0BxVrj3mFJyaAdNEAFoCEdAosbf0se4kXV9lChoBkdAcjA79ycTamgHTUIBaAhHQKLHLTZxrBV1fZQoaAZHQHJoPx+az/poB00LAWgIR0Cix8VCXyAhdX2UKGgGR0Buvn6CUX54aAdNMAFoCEdAoshrIBBAwHV9lChoBkdATp0qWkadc2gHS6VoCEdAoshxEKE39HV9lChoBkdAcRq22G7Bf2gHTW4BaAhHQKLIi/fwZwZ1fZQoaAZHQG+wZZ0Syt5oB01AAWgIR0CiyJOtnwocdX2UKGgGR0BxGWza9K28aAdNNQFoCEdAosjhFy7wrnV9lCh
oBkdAcuKbGFSKnGgHS+9oCEdAosj9/J/5L3V9lChoBkdAceB2criEQGgHS/RoCEdAosmozzmOl3V9lChoBkdAcafkRSP2f2gHTSIBaAhHQKLJyswL3K11fZQoaAZHQDaj+AEt/WloB0vwaAhHQKLJ5f2K2rp1fZQoaAZHQG9h5N47ihpoB00LAWgIR0CiygadMCcPdWUu"
|
49 |
},
|
50 |
"ep_success_buffer": {
|
51 |
":type:": "<class 'collections.deque'>",
|
52 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
53 |
},
|
54 |
+
"_n_updates": 252,
|
55 |
"observation_space": {
|
56 |
":type:": "<class 'gymnasium.spaces.box.Box'>",
|
57 |
":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
|
ppo-LunarLander-v2/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 88362
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4f83bef89ca93ead01096f22007f78653e265f82dbc4042a5610422ef65c3fa
|
3 |
size 88362
|
ppo-LunarLander-v2/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 43762
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29ded85c756c09320dfd90738bbe4f8b2badfd7478017c224ec30c3c13245900
|
3 |
size 43762
|
replay.mp4
CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 255.2325068, "std_reward": 18.447433423798184, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-11-01T16:56:35.922089"}
|