Spaces:
Sleeping
Sleeping
Andrei Cozma
committed on
Commit
·
434e854
1
Parent(s):
99ac186
Updates
Browse files
- Shared.py +1 -1
- run.py +1 -7
- run_tests_MC_CliffWalking-v0.py +1 -1
- run_tests_MC_FrozenLake-v1.py +1 -1
Shared.py
CHANGED
@@ -12,7 +12,7 @@ class Shared:
|
|
12 |
gamma=0.99,
|
13 |
epsilon=0.1,
|
14 |
run_name=None,
|
15 |
-
frozenlake_size=
|
16 |
**kwargs,
|
17 |
):
|
18 |
print("=" * 80)
|
|
|
12 |
gamma=0.99,
|
13 |
epsilon=0.1,
|
14 |
run_name=None,
|
15 |
+
frozenlake_size=16,
|
16 |
**kwargs,
|
17 |
):
|
18 |
print("=" * 80)
|
run.py
CHANGED
@@ -108,12 +108,6 @@ def main():
|
|
108 |
default=None,
|
109 |
help="WandB project name for logging. If not provided, no logging is done. (default: None)",
|
110 |
)
|
111 |
-
parser.add_argument(
|
112 |
-
"--wandb_group",
|
113 |
-
type=str,
|
114 |
-
default="monte-carlo",
|
115 |
-
help="WandB group name for logging. (default: monte-carlo)",
|
116 |
-
)
|
117 |
parser.add_argument(
|
118 |
"--wandb_job_type",
|
119 |
type=str,
|
@@ -144,7 +138,7 @@ def main():
|
|
144 |
wandb.init(
|
145 |
project=args.wandb_project,
|
146 |
name=run_name,
|
147 |
-
group=args.wandb_group,
|
148 |
job_type=args.wandb_job_type,
|
149 |
config=dict(args._get_kwargs()),
|
150 |
)
|
|
|
108 |
default=None,
|
109 |
help="WandB project name for logging. If not provided, no logging is done. (default: None)",
|
110 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
111 |
parser.add_argument(
|
112 |
"--wandb_job_type",
|
113 |
type=str,
|
|
|
138 |
wandb.init(
|
139 |
project=args.wandb_project,
|
140 |
name=run_name,
|
141 |
+
group=args.agent,
|
142 |
job_type=args.wandb_job_type,
|
143 |
config=dict(args._get_kwargs()),
|
144 |
)
|
run_tests_MC_CliffWalking-v0.py
CHANGED
@@ -19,7 +19,7 @@ vals_gamma = [1.0, 0.98, 0.96, 0.94]
|
|
19 |
|
20 |
def run_test(args):
|
21 |
os.system(
|
22 |
-
f"python3 MonteCarloAgent.py --train --n_train_episodes {n_train_episodes} --max_steps {max_steps} --env {env} --gamma {args[0]} --epsilon {args[1]} --update_type {args[2]} --wandb_project {wandb_project} --wandb_run_name_suffix {args[3]} --no_save"
|
23 |
)
|
24 |
|
25 |
|
|
|
19 |
|
20 |
def run_test(args):
|
21 |
os.system(
|
22 |
+
f"python3 MonteCarloAgent.py --agent MCAgent --train --n_train_episodes {n_train_episodes} --max_steps {max_steps} --env {env} --gamma {args[0]} --epsilon {args[1]} --update_type {args[2]} --wandb_project {wandb_project} --wandb_run_name_suffix {args[3]} --no_save"
|
23 |
)
|
24 |
|
25 |
|
run_tests_MC_FrozenLake-v1.py
CHANGED
@@ -17,7 +17,7 @@ vals_gamma = [1.0, 0.98, 0.96, 0.94]
|
|
17 |
|
18 |
def run_test(args):
|
19 |
os.system(
|
20 |
-
f"python3 MonteCarloAgent.py --train --n_train_episodes {n_train_episodes} --max_steps {max_steps} --env {env} --gamma {args[0]} --epsilon {args[1]} --update_type {args[2]} --wandb_project {wandb_project} --wandb_run_name_suffix {args[3]} --no_save"
|
21 |
)
|
22 |
|
23 |
|
|
|
17 |
|
18 |
def run_test(args):
|
19 |
os.system(
|
20 |
+
f"python3 MonteCarloAgent.py --agent MCAgent --train --n_train_episodes {n_train_episodes} --max_steps {max_steps} --env {env} --gamma {args[0]} --epsilon {args[1]} --update_type {args[2]} --wandb_project {wandb_project} --wandb_run_name_suffix {args[3]} --no_save"
|
21 |
)
|
22 |
|
23 |
|