Andrei Cozma committed on
Commit
434e854
·
1 Parent(s): 99ac186
Shared.py CHANGED
@@ -12,7 +12,7 @@ class Shared:
12
  gamma=0.99,
13
  epsilon=0.1,
14
  run_name=None,
15
- frozenlake_size=8,
16
  **kwargs,
17
  ):
18
  print("=" * 80)
 
12
  gamma=0.99,
13
  epsilon=0.1,
14
  run_name=None,
15
+ frozenlake_size=16,
16
  **kwargs,
17
  ):
18
  print("=" * 80)
run.py CHANGED
@@ -108,12 +108,6 @@ def main():
108
  default=None,
109
  help="WandB project name for logging. If not provided, no logging is done. (default: None)",
110
  )
111
- parser.add_argument(
112
- "--wandb_group",
113
- type=str,
114
- default="monte-carlo",
115
- help="WandB group name for logging. (default: monte-carlo)",
116
- )
117
  parser.add_argument(
118
  "--wandb_job_type",
119
  type=str,
@@ -144,7 +138,7 @@ def main():
144
  wandb.init(
145
  project=args.wandb_project,
146
  name=run_name,
147
- group=args.wandb_group,
148
  job_type=args.wandb_job_type,
149
  config=dict(args._get_kwargs()),
150
  )
 
108
  default=None,
109
  help="WandB project name for logging. If not provided, no logging is done. (default: None)",
110
  )
 
 
 
 
 
 
111
  parser.add_argument(
112
  "--wandb_job_type",
113
  type=str,
 
138
  wandb.init(
139
  project=args.wandb_project,
140
  name=run_name,
141
+ group=args.agent,
142
  job_type=args.wandb_job_type,
143
  config=dict(args._get_kwargs()),
144
  )
run_tests_MC_CliffWalking-v0.py CHANGED
@@ -19,7 +19,7 @@ vals_gamma = [1.0, 0.98, 0.96, 0.94]
19
 
20
  def run_test(args):
21
  os.system(
22
- f"python3 MonteCarloAgent.py --train --n_train_episodes {n_train_episodes} --max_steps {max_steps} --env {env} --gamma {args[0]} --epsilon {args[1]} --update_type {args[2]} --wandb_project {wandb_project} --wandb_run_name_suffix {args[3]} --no_save"
23
  )
24
 
25
 
 
19
 
20
  def run_test(args):
21
  os.system(
22
+ f"python3 MonteCarloAgent.py --agent MCAgent --train --n_train_episodes {n_train_episodes} --max_steps {max_steps} --env {env} --gamma {args[0]} --epsilon {args[1]} --update_type {args[2]} --wandb_project {wandb_project} --wandb_run_name_suffix {args[3]} --no_save"
23
  )
24
 
25
 
run_tests_MC_FrozenLake-v1.py CHANGED
@@ -17,7 +17,7 @@ vals_gamma = [1.0, 0.98, 0.96, 0.94]
17
 
18
  def run_test(args):
19
  os.system(
20
- f"python3 MonteCarloAgent.py --train --n_train_episodes {n_train_episodes} --max_steps {max_steps} --env {env} --gamma {args[0]} --epsilon {args[1]} --update_type {args[2]} --wandb_project {wandb_project} --wandb_run_name_suffix {args[3]} --no_save"
21
  )
22
 
23
 
 
17
 
18
  def run_test(args):
19
  os.system(
20
+ f"python3 MonteCarloAgent.py --agent MCAgent --train --n_train_episodes {n_train_episodes} --max_steps {max_steps} --env {env} --gamma {args[0]} --epsilon {args[1]} --update_type {args[2]} --wandb_project {wandb_project} --wandb_run_name_suffix {args[3]} --no_save"
21
  )
22
 
23