File size: 2,287 Bytes
4d455b3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
seed: 4682
env:
  env_id: OpenSubtaskTrain-v0
  num_envs: 189
  max_episode_steps: 100
  make_env: true
  continuous_task: true
  cat_state: true
  cat_pixels: false
  frame_stack: 3
  stationary_base: false
  stationary_torso: false
  stationary_head: true
  task_plan_fp: task_plans/set_table/open/train/kitchen_counter.json
  spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/open/train/spawn_data.pt
  record_video: false
  debug_video: false
  debug_video_gen: false
  save_video_freq: null
  info_on_video: false
  extra_stat_keys: []
  env_kwargs:
    robot_force_mult: 0.001
    robot_force_penalty_min: 0.2
    target_randomization: false
    randomly_slightly_open_articulation: true
eval_env:
  env_id: OpenSubtaskTrain-v0
  num_envs: 63
  max_episode_steps: 200
  make_env: true
  continuous_task: true
  cat_state: true
  cat_pixels: false
  frame_stack: 3
  stationary_base: false
  stationary_torso: false
  stationary_head: true
  task_plan_fp: task_plans/set_table/open/train/kitchen_counter.json
  spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/open/train/spawn_data.pt
  record_video: false
  debug_video: false
  debug_video_gen: false
  save_video_freq: 10
  info_on_video: false
  extra_stat_keys: []
  env_kwargs:
    robot_force_mult: 0.001
    robot_force_penalty_min: 0.2
    target_randomization: false
    randomly_slightly_open_articulation: false
algo:
  name: ppo
  total_timesteps: 50000000
  learning_rate: 0.0003
  anneal_lr: false
  gamma: 0.9
  gae_lambda: 0.9
  num_minibatches: 16
  update_epochs: 8
  norm_adv: true
  clip_coef: 0.2
  clip_vloss: false
  ent_coef: 0.0
  vf_coef: 0.5
  max_grad_norm: 0.5
  target_kl: 0.2
  log_freq: 10000
  save_freq: 100000
  eval_freq: 100000
  finite_horizon_gae: true
  torch_deterministic: true
  save_backup_ckpts: false
  eval_episodes: 189
  num_steps: 100
  num_envs: 189
  num_eval_envs: 63
  batch_size: 18900
  minibatch_size: 1181
  num_iterations: 2646
logger:
  workspace: mshab_exps
  exp_name: rcad-set_table-open-kitchen_counter
  clear_out: true
  tensorboard: true
  wandb: false
model_ckpt: "mshab_checkpoints/rl/set_table/open/kitchen_counter/policy.pt"