Spaces:

acozma
/

CS581-Algos-Demo

Sleeping

Andrei Cozma commited on Apr 19, 2023

Commit

82f7820

1 Parent(s): 45b1b2a

Updates

Files changed (1) hide show

run_tests.py CHANGED Viewed

@@ -3,21 +3,24 @@ import multiprocessing
 import random
 num_tests = 10
 vals_eps = [0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9]
 vals_gamma = [1.0, 0.99, 0.98, 0.97, 0.95]
 def run_test(args):
     os.system(
-        f"python3 MonteCarloAgent.py --train  --gamma {args[0]} --epsilon {args[1]} --wandb_project cs581 --wandb_job_type params --wandb_run_name_suffix {args[2]} --no_save"
     )
 with multiprocessing.Pool(16) as p:
     tests = []
-    for gamma in vals_gamma:
-        for eps in vals_eps:
-            tests.extend((gamma, eps, i) for i in range(num_tests))
     random.shuffle(tests)
     p.map(run_test, tests)

 import random
 num_tests = 10
+update_types = ["first_visit", "every_visit"]
 vals_eps = [0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9]
 vals_gamma = [1.0, 0.99, 0.98, 0.97, 0.95]
 def run_test(args):
     os.system(
+        f"python3 MonteCarloAgent.py --train  --gamma {args[0]} --epsilon {args[1]} --update_type{args[2]} --wandb_project cs581 --wandb_job_type params --wandb_run_name_suffix {args[3]} --no_save"
     )
 with multiprocessing.Pool(16) as p:
     tests = []
+    for update_type in update_types:
+        for gamma in vals_gamma:
+            for eps in vals_eps:
+                tests.extend((gamma, eps, update_type, i) for i in range(num_tests))
     random.shuffle(tests)
     p.map(run_test, tests)