Andrei Cozma committed on
Commit
9d55737
·
1 Parent(s): 84b1569

Added Taxi-v3 script

Browse files
Files changed (1) hide show
  1. run_tests_MC_Taxi-v3.py +34 -0
run_tests_MC_Taxi-v3.py ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import multiprocessing
3
+ import random
4
+
5
# Experiment configuration for the Monte Carlo agent sweep on Taxi-v3.
# These module-level names are read by run_test() and by the sweep driver.

# Weights & Biases project name, forwarded as --wandb_project.
wandb_project = "cs581"

# Environment id (--env) and per-run training budget
# (--n_train_episodes / --max_steps).
env = "Taxi-v3"
n_train_episodes = 10000
max_steps = 500

# Number of repeated runs launched for every hyper-parameter combination.
num_tests = 10

# Hyper-parameter grid.
# Only "first_visit" is swept: every-visit takes too long due to this
# environment's reward structure.
vals_update_type = ["first_visit"]
vals_epsilon = [0.1, 0.2, 0.3, 0.4, 0.5]
vals_gamma = [1.0, 0.98, 0.96, 0.94]
18
+
19
+
20
def run_test(args):
    """Launch one MCAgent training run of ``run.py`` as a child process.

    Args:
        args: Sequence whose first four items are
            ``(gamma, epsilon, update_type, run_name_suffix)``. They are
            forwarded to ``run.py`` as ``--gamma``, ``--epsilon``,
            ``--update_type`` and ``--wandb_run_name_suffix``.

    Returns:
        None. A failed launch or a non-zero exit status is reported on
        stderr but never raised, so one bad run does not abort the sweep.
    """
    # Local imports keep this function self-contained with respect to the
    # file's existing import block.
    import subprocess
    import sys

    gamma, epsilon, update_type, run_name_suffix = args[:4]

    # An argument list (no shell) passes every value through verbatim instead
    # of relying on shell word-splitting of an interpolated string.
    cmd = [
        "python3",
        "run.py",
        "--agent",
        "MCAgent",
        "--train",
        "--n_train_episodes",
        str(n_train_episodes),
        "--max_steps",
        str(max_steps),
        "--env",
        str(env),
        "--gamma",
        str(gamma),
        "--epsilon",
        str(epsilon),
        "--update_type",
        str(update_type),
        "--wandb_project",
        str(wandb_project),
        "--wandb_run_name_suffix",
        str(run_name_suffix),
        "--no_save",
    ]

    try:
        completed = subprocess.run(cmd, check=False)
    except OSError as err:
        # e.g. the python3 executable could not be found or started.
        print(f"run_test: could not start {cmd!r}: {err}", file=sys.stderr)
        return

    if completed.returncode != 0:
        print(
            f"run_test: {cmd!r} exited with status {completed.returncode}",
            file=sys.stderr,
        )
24
+
25
+
26
def build_tests(update_types, gammas, epsilons, repeats):
    """Return the full list of run configurations for the sweep.

    Args:
        update_types: Iterable of update-type names.
        gammas: Iterable of discount factors.
        epsilons: Iterable of exploration rates.
        repeats: Number of repeated runs per combination.

    Returns:
        A list of ``(gamma, epsilon, update_type, repeat_index)`` tuples, one
        per combination and repeat, in nested-loop order (update type
        outermost, repeat index innermost).
    """
    return [
        (gamma, eps, update_type, i)
        for update_type in update_types
        for gamma in gammas
        for eps in epsilons
        for i in range(repeats)
    ]


# The guard is required for multiprocessing: under the "spawn" start method
# worker processes re-import this module, and without the guard each worker
# would try to start the whole sweep again.
if __name__ == "__main__":
    tests = build_tests(vals_update_type, vals_gamma, vals_epsilon, num_tests)
    # Shuffle so the configurations are not launched in grid order.
    random.shuffle(tests)

    # Up to 8 runs execute concurrently; each worker calls run_test().
    with multiprocessing.Pool(8) as p:
        p.map(run_test, tests)