Spaces:
Sleeping
Sleeping
Andrei Cozma
committed on
Commit
·
9d55737
1
Parent(s):
84b1569
Added Taxi-v3 script
Browse files- run_tests_MC_Taxi-v3.py +34 -0
run_tests_MC_Taxi-v3.py
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import os
|
2 |
+
import multiprocessing
|
3 |
+
import random
|
4 |
+
|
5 |
+
# --- Sweep configuration ----------------------------------------------------
# Weights & Biases project name, forwarded to run.py via --wandb_project.
wandb_project = "cs581"

# Environment id (forwarded via --env) and the per-run training limits
# (forwarded via --n_train_episodes and --max_steps).
env = "Taxi-v3"
n_train_episodes = 10_000
max_steps = 500

# Number of repeated runs launched for every hyperparameter combination.
num_tests = 10

# --- Hyperparameter grid ----------------------------------------------------
# Every visit takes too long due to this environment's reward structure
vals_update_type = ["first_visit"]
vals_epsilon = [0.1, 0.2, 0.3, 0.4, 0.5]
vals_gamma = [1.0, 0.98, 0.96, 0.94]
|
18 |
+
|
19 |
+
|
20 |
+
def run_test(args):
    """Launch one MCAgent training run of ``run.py`` as a child process.

    Args:
        args: Sequence whose first four items are
            ``(gamma, epsilon, update_type, run_suffix)``. Each item is
            converted with ``str`` and passed to ``run.py`` as the value of
            ``--gamma``, ``--epsilon``, ``--update_type`` and
            ``--wandb_run_name_suffix`` respectively.

    Returns:
        None. A non-zero exit status of the child is reported on stderr
        rather than raised, so a single failed run does not abort the
        remaining runs of the sweep.
    """
    # Imported locally so this function does not depend on edits to the
    # file-level import block.
    import subprocess
    import sys

    gamma, epsilon, update_type, run_suffix = args[:4]

    # An argument list (no shell) avoids quoting problems if any value ever
    # contains whitespace or shell metacharacters.
    command = [
        "python3", "run.py",
        "--agent", "MCAgent",
        "--train",
        "--n_train_episodes", str(n_train_episodes),
        "--max_steps", str(max_steps),
        "--env", str(env),
        "--gamma", str(gamma),
        "--epsilon", str(epsilon),
        "--update_type", str(update_type),
        "--wandb_project", str(wandb_project),
        "--wandb_run_name_suffix", str(run_suffix),
        "--no_save",
    ]
    completed = subprocess.run(command, check=False)
    if completed.returncode != 0:
        print(
            f"run_test: run.py exited with status {completed.returncode} "
            f"for args={tuple(args)!r}",
            file=sys.stderr,
        )
|
24 |
+
|
25 |
+
|
26 |
+
def build_test_grid(update_types, gammas, epsilons, n_tests):
    """Return every ``(gamma, epsilon, update_type, run_index)`` job tuple.

    Args:
        update_types: Iterable of update-type names.
        gammas: Iterable of gamma values.
        epsilons: Iterable of epsilon values.
        n_tests: Number of repeated runs per combination; ``run_index``
            ranges over ``range(n_tests)``.

    Returns:
        A list of 4-tuples ordered by update type, then gamma, then epsilon,
        then run index. Empty if any input is empty or ``n_tests`` is 0.
    """
    return [
        (gamma, eps, update_type, run_index)
        for update_type in update_types
        for gamma in gammas
        for eps in epsilons
        for run_index in range(n_tests)
    ]


def main(n_workers=8):
    """Run the full hyperparameter sweep on a pool of worker processes.

    Args:
        n_workers: Size of the ``multiprocessing.Pool`` (default 8).
    """
    tests = build_test_grid(vals_update_type, vals_gamma, vals_epsilon, num_tests)
    # Randomise the execution order of the jobs.
    # NOTE(review): presumably so an interrupted sweep still samples the grid
    # evenly -- confirm intent.
    random.shuffle(tests)

    with multiprocessing.Pool(n_workers) as pool:
        pool.map(run_test, tests)


# Guard the entry point: with the "spawn" start method every worker re-imports
# this module, and an unguarded Pool at module level would be re-executed in
# each child.
if __name__ == "__main__":
    main()
|