Spaces:
Sleeping
Sleeping
train on new frozen lake
Browse files
- DPAgent.py +20 -2
- policies/DPAgent_FrozenLake-v1_i219_g0.9.npy +0 -0
DPAgent.py
CHANGED
@@ -85,10 +85,28 @@ class DP:
|
|
85 |
|
86 |
if __name__ == "__main__":
|
87 |
# env = gym.make('FrozenLake-v1', render_mode='human')
|
88 |
-
dp = DP("FrozenLake-v1")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
89 |
dp.train()
|
90 |
dp.save_policy('dp_policy.npy')
|
91 |
-
env = gym.make('FrozenLake-v1', render_mode='human')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
92 |
|
93 |
state, _ = env.reset()
|
94 |
done = False
|
|
|
85 |
|
86 |
if __name__ == "__main__":
|
87 |
# env = gym.make('FrozenLake-v1', render_mode='human')
|
88 |
+
dp = DP("FrozenLake-v1", is_slippery=False, desc=[
|
89 |
+
"SFFFFFFF",
|
90 |
+
"FFFFFFFH",
|
91 |
+
"FFFHFFFF",
|
92 |
+
"FFFFFHFF",
|
93 |
+
"FFFHFFFF",
|
94 |
+
"FHHFFFHF",
|
95 |
+
"FHFFHFHF",
|
96 |
+
"FFFHFFFG",
|
97 |
+
])
|
98 |
dp.train()
|
99 |
dp.save_policy('dp_policy.npy')
|
100 |
+
env = gym.make('FrozenLake-v1', render_mode='human', is_slippery=False, desc=[
|
101 |
+
"SFFFFFFF",
|
102 |
+
"FFFFFFFH",
|
103 |
+
"FFFHFFFF",
|
104 |
+
"FFFFFHFF",
|
105 |
+
"FFFHFFFF",
|
106 |
+
"FHHFFFHF",
|
107 |
+
"FHFFHFHF",
|
108 |
+
"FFFHFFFG",
|
109 |
+
])
|
110 |
|
111 |
state, _ = env.reset()
|
112 |
done = False
|
policies/DPAgent_FrozenLake-v1_i219_g0.9.npy
CHANGED
Binary files a/policies/DPAgent_FrozenLake-v1_i219_g0.9.npy and b/policies/DPAgent_FrozenLake-v1_i219_g0.9.npy differ
|
|