arth-shukla committed on
Commit
4d455b3
·
verified ·
1 Parent(s): 420fdd1

bc and rl checkpoints

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. bc/prepare_groceries/pick/all/config.yml +46 -0
  2. bc/prepare_groceries/pick/all/policy.pt +3 -0
  3. bc/prepare_groceries/place/all/config.yml +47 -0
  4. bc/prepare_groceries/place/all/policy.pt +3 -0
  5. bc/set_table/close/fridge/config.yml +47 -0
  6. bc/set_table/close/fridge/policy.pt +3 -0
  7. bc/set_table/close/kitchen_counter/config.yml +47 -0
  8. bc/set_table/close/kitchen_counter/policy.pt +3 -0
  9. bc/set_table/open/fridge/config.yml +47 -0
  10. bc/set_table/open/fridge/policy.pt +3 -0
  11. bc/set_table/open/kitchen_counter/config.yml +47 -0
  12. bc/set_table/open/kitchen_counter/policy.pt +3 -0
  13. bc/set_table/pick/all/config.yml +47 -0
  14. bc/set_table/pick/all/policy.pt +3 -0
  15. bc/set_table/place/all/config.yml +47 -0
  16. bc/set_table/place/all/policy.pt +3 -0
  17. bc/tidy_house/pick/all/config.yml +46 -0
  18. bc/tidy_house/pick/all/policy.pt +3 -0
  19. bc/tidy_house/place/all/config.yml +46 -0
  20. bc/tidy_house/place/all/policy.pt +3 -0
  21. rl/prepare_groceries/pick/002_master_chef_can/config.yml +110 -0
  22. rl/prepare_groceries/pick/002_master_chef_can/policy.pt +3 -0
  23. rl/prepare_groceries/pick/003_cracker_box/config.yml +110 -0
  24. rl/prepare_groceries/pick/003_cracker_box/policy.pt +3 -0
  25. rl/prepare_groceries/pick/004_sugar_box/config.yml +111 -0
  26. rl/prepare_groceries/pick/004_sugar_box/policy.pt +3 -0
  27. rl/prepare_groceries/pick/005_tomato_soup_can/config.yml +115 -0
  28. rl/prepare_groceries/pick/005_tomato_soup_can/policy.pt +3 -0
  29. rl/prepare_groceries/pick/007_tuna_fish_can/config.yml +111 -0
  30. rl/prepare_groceries/pick/007_tuna_fish_can/policy.pt +3 -0
  31. rl/prepare_groceries/pick/008_pudding_box/config.yml +113 -0
  32. rl/prepare_groceries/pick/008_pudding_box/policy.pt +3 -0
  33. rl/prepare_groceries/pick/009_gelatin_box/config.yml +113 -0
  34. rl/prepare_groceries/pick/009_gelatin_box/policy.pt +3 -0
  35. rl/prepare_groceries/pick/010_potted_meat_can/config.yml +110 -0
  36. rl/prepare_groceries/pick/010_potted_meat_can/policy.pt +3 -0
  37. rl/prepare_groceries/pick/024_bowl/config.yml +115 -0
  38. rl/prepare_groceries/pick/024_bowl/policy.pt +3 -0
  39. rl/prepare_groceries/pick/all/config.yml +113 -0
  40. rl/prepare_groceries/pick/all/policy.pt +3 -0
  41. rl/prepare_groceries/place/002_master_chef_can/config.yml +115 -0
  42. rl/prepare_groceries/place/002_master_chef_can/policy.pt +3 -0
  43. rl/prepare_groceries/place/003_cracker_box/config.yml +115 -0
  44. rl/prepare_groceries/place/003_cracker_box/policy.pt +3 -0
  45. rl/prepare_groceries/place/004_sugar_box/config.yml +115 -0
  46. rl/prepare_groceries/place/004_sugar_box/policy.pt +3 -0
  47. rl/prepare_groceries/place/005_tomato_soup_can/config.yml +115 -0
  48. rl/prepare_groceries/place/005_tomato_soup_can/policy.pt +3 -0
  49. rl/prepare_groceries/place/007_tuna_fish_can/config.yml +115 -0
  50. rl/prepare_groceries/place/007_tuna_fish_can/policy.pt +3 -0
bc/prepare_groceries/pick/all/config.yml ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 0
2
+ eval_env:
3
+ env_id: PickSubtaskTrain-v0
4
+ num_envs: 252
5
+ max_episode_steps: 200
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 1
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/pick/train/all.json
15
+ spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: 1
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ algo:
27
+ name: bc
28
+ lr: 0.0003
29
+ batch_size: 512
30
+ epochs: 10
31
+ eval_freq: 1
32
+ log_freq: 1
33
+ save_freq: 1
34
+ save_backup_ckpts: false
35
+ data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/prepare_groceries/pick
36
+ max_cache_size: 300000
37
+ torch_deterministic: true
38
+ eval_episodes: 252
39
+ num_eval_envs: 252
40
+ logger:
41
+ workspace: mshab_exps
42
+ exp_name: rcad-prepare_groceries-pick-all
43
+ clear_out: true
44
+ tensorboard: true
45
+ wandb: false
46
+ model_ckpt: "mshab_checkpoints/bc/prepare_groceries/pick/all/policy.pt"
bc/prepare_groceries/pick/all/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b90849268bcaefe1fa1c1abd79f9e259a48f42617bc152bdeb8943dbd39a45c
3
+ size 238201234
bc/prepare_groceries/place/all/config.yml ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 0
2
+ eval_env:
3
+ env_id: PlaceSubtaskTrain-v0
4
+ num_envs: 252
5
+ max_episode_steps: 200
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 1
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/place/train/all.json
15
+ spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: 1
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ algo:
27
+ name: bc
28
+ lr: 0.0003
29
+ batch_size: 512
30
+ epochs: 10
31
+ eval_freq: 1
32
+ log_freq: 1
33
+ save_freq: 1
34
+ save_backup_ckpts: false
35
+ data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/prepare_groceries/place
36
+ max_cache_size: 300000
37
+ trajs_per_obj: all
38
+ torch_deterministic: true
39
+ eval_episodes: 252
40
+ num_eval_envs: 252
41
+ logger:
42
+ workspace: mshab_exps
43
+ exp_name: rcad-prepare_groceries-place-all
44
+ clear_out: true
45
+ tensorboard: true
46
+ wandb: false
47
+ model_ckpt: "mshab_checkpoints/bc/prepare_groceries/place/all/policy.pt"
bc/prepare_groceries/place/all/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4bc570e9aad369d26c62d69c5e441f7a46fc45ec20221c5c6f3d11708a49f6e
3
+ size 238201234
bc/set_table/close/fridge/config.yml ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 0
2
+ eval_env:
3
+ env_id: CloseSubtaskTrain-v0
4
+ num_envs: 252
5
+ max_episode_steps: 200
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 1
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/set_table/close/train/fridge.json
15
+ spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/close/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: 1
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ algo:
27
+ name: bc
28
+ lr: 0.0003
29
+ batch_size: 512
30
+ epochs: 10
31
+ eval_freq: 1
32
+ log_freq: 1
33
+ save_freq: 1
34
+ save_backup_ckpts: false
35
+ data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/set_table/close/fridge.h5
36
+ max_cache_size: 300000
37
+ trajs_per_obj: 1000
38
+ torch_deterministic: true
39
+ eval_episodes: 252
40
+ num_eval_envs: 252
41
+ logger:
42
+ workspace: mshab_exps
43
+ exp_name: rcad-set_table-close-fridge
44
+ clear_out: true
45
+ tensorboard: true
46
+ wandb: false
47
+ model_ckpt: "mshab_checkpoints/bc/set_table/close/fridge/policy.pt"
bc/set_table/close/fridge/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4e6802c0b767f70b819f74eaf1b063d028e0592cf6ad0cf47739439bf2f1a3f
3
+ size 238200850
bc/set_table/close/kitchen_counter/config.yml ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 0
2
+ eval_env:
3
+ env_id: CloseSubtaskTrain-v0
4
+ num_envs: 252
5
+ max_episode_steps: 200
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 1
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/set_table/close/train/kitchen_counter.json
15
+ spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/close/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: 1
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ algo:
27
+ name: bc
28
+ lr: 0.0003
29
+ batch_size: 512
30
+ epochs: 10
31
+ eval_freq: 1
32
+ log_freq: 1
33
+ save_freq: 1
34
+ save_backup_ckpts: false
35
+ data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/set_table/close/kitchen_counter.h5
36
+ max_cache_size: 300000
37
+ trajs_per_obj: 1000
38
+ torch_deterministic: true
39
+ eval_episodes: 252
40
+ num_eval_envs: 252
41
+ logger:
42
+ workspace: mshab_exps
43
+ exp_name: rcad-set_table-close-kitchen_counter
44
+ clear_out: true
45
+ tensorboard: true
46
+ wandb: false
47
+ model_ckpt: "mshab_checkpoints/bc/set_table/close/kitchen_counter/policy.pt"
bc/set_table/close/kitchen_counter/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cc31e96c04a6e5ffc1f698c9c55e17f2ca136db1865085df71520ec4a59025a
3
+ size 238200850
bc/set_table/open/fridge/config.yml ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 0
2
+ eval_env:
3
+ env_id: OpenSubtaskTrain-v0
4
+ num_envs: 252
5
+ max_episode_steps: 200
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 1
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/set_table/open/train/fridge.json
15
+ spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/open/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: 1
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ algo:
27
+ name: bc
28
+ lr: 0.0003
29
+ batch_size: 512
30
+ epochs: 10
31
+ eval_freq: 1
32
+ log_freq: 1
33
+ save_freq: 1
34
+ save_backup_ckpts: false
35
+ data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/set_table/open/fridge.h5
36
+ max_cache_size: 300000
37
+ trajs_per_obj: 1000
38
+ torch_deterministic: true
39
+ eval_episodes: 252
40
+ num_eval_envs: 252
41
+ logger:
42
+ workspace: mshab_exps
43
+ exp_name: rcad-set_table-open-fridge
44
+ clear_out: true
45
+ tensorboard: true
46
+ wandb: false
47
+ model_ckpt: "mshab_checkpoints/bc/set_table/open/fridge/policy.pt"
bc/set_table/open/fridge/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80f614cdfbef42079f9f4254224484d71d49057801182417628d181646cefe38
3
+ size 238200850
bc/set_table/open/kitchen_counter/config.yml ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 0
2
+ eval_env:
3
+ env_id: OpenSubtaskTrain-v0
4
+ num_envs: 252
5
+ max_episode_steps: 200
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 1
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/set_table/open/train/kitchen_counter.json
15
+ spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/open/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: 1
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ algo:
27
+ name: bc
28
+ lr: 0.0003
29
+ batch_size: 512
30
+ epochs: 10
31
+ eval_freq: 1
32
+ log_freq: 1
33
+ save_freq: 1
34
+ save_backup_ckpts: false
35
+ data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/set_table/open/kitchen_counter.h5
36
+ max_cache_size: 300000
37
+ trajs_per_obj: 1000
38
+ torch_deterministic: true
39
+ eval_episodes: 252
40
+ num_eval_envs: 252
41
+ logger:
42
+ workspace: mshab_exps
43
+ exp_name: rcad-set_table-open-kitchen_counter
44
+ clear_out: true
45
+ tensorboard: true
46
+ wandb: false
47
+ model_ckpt: "mshab_checkpoints/bc/set_table/open/kitchen_counter/policy.pt"
bc/set_table/open/kitchen_counter/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4dc77a7e29552c1d407a38bd608173d12d40da3dd35eec934b537a9024b8c21e
3
+ size 238200850
bc/set_table/pick/all/config.yml ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 0
2
+ eval_env:
3
+ env_id: PickSubtaskTrain-v0
4
+ num_envs: 252
5
+ max_episode_steps: 200
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 1
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/set_table/pick/train/all.json
15
+ spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/pick/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: 1
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ algo:
27
+ name: bc
28
+ lr: 0.0003
29
+ batch_size: 512
30
+ epochs: 10
31
+ eval_freq: 1
32
+ log_freq: 1
33
+ save_freq: 1
34
+ save_backup_ckpts: false
35
+ data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/set_table/pick
36
+ max_cache_size: 300000
37
+ trajs_per_obj: all
38
+ torch_deterministic: true
39
+ eval_episodes: 252
40
+ num_eval_envs: 252
41
+ logger:
42
+ workspace: mshab_exps
43
+ exp_name: rcad-set_table-pick-all
44
+ clear_out: true
45
+ tensorboard: true
46
+ wandb: false
47
+ model_ckpt: "mshab_checkpoints/bc/set_table/pick/all/policy.pt"
bc/set_table/pick/all/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3593b72dfc3c265fb8a294b6f3bb79c86472d4efada6437d50c66daee7cbd58
3
+ size 238200850
bc/set_table/place/all/config.yml ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 0
2
+ eval_env:
3
+ env_id: PlaceSubtaskTrain-v0
4
+ num_envs: 252
5
+ max_episode_steps: 200
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 1
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/set_table/place/train/all.json
15
+ spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/place/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: 1
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ algo:
27
+ name: bc
28
+ lr: 0.0003
29
+ batch_size: 512
30
+ epochs: 10
31
+ eval_freq: 1
32
+ log_freq: 1
33
+ save_freq: 1
34
+ save_backup_ckpts: false
35
+ data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/set_table/place
36
+ max_cache_size: 300000
37
+ trajs_per_obj: all
38
+ torch_deterministic: true
39
+ eval_episodes: 252
40
+ num_eval_envs: 252
41
+ logger:
42
+ workspace: mshab_exps
43
+ exp_name: rcad-set_table-place-all
44
+ clear_out: true
45
+ tensorboard: true
46
+ wandb: false
47
+ model_ckpt: "mshab_checkpoints/bc/set_table/place/all/policy.pt"
bc/set_table/place/all/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39cb5b0a2000c8184a5e4a25cda28e60602734a81e05be972a18f27f911bda2a
3
+ size 238200850
bc/tidy_house/pick/all/config.yml ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 0
2
+ eval_env:
3
+ env_id: PickSubtaskTrain-v0
4
+ num_envs: 252
5
+ max_episode_steps: 200
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 1
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/tidy_house/pick/train/all.json
15
+ spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/tidy_house/pick/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: 1
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ algo:
27
+ name: bc
28
+ lr: 0.0003
29
+ batch_size: 512
30
+ epochs: 25
31
+ eval_freq: 1
32
+ log_freq: 1
33
+ save_freq: 1
34
+ save_backup_ckpts: false
35
+ data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/tidy_house/pick
36
+ max_cache_size: 300000
37
+ torch_deterministic: true
38
+ eval_episodes: 252
39
+ num_eval_envs: 252
40
+ logger:
41
+ workspace: mshab_exps
42
+ exp_name: rcad-tidy_house-pick-all
43
+ clear_out: true
44
+ tensorboard: true
45
+ wandb: false
46
+ model_ckpt: "mshab_checkpoints/bc/tidy_house/pick/all/policy.pt"
bc/tidy_house/pick/all/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:250f92d9a0d6c42f78ba85ac0cab740eee1f80619f6f6fbf39b7ad8aa676d3c8
3
+ size 238201234
bc/tidy_house/place/all/config.yml ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 0
2
+ eval_env:
3
+ env_id: PlaceSubtaskTrain-v0
4
+ num_envs: 252
5
+ max_episode_steps: 200
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 1
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/tidy_house/place/train/all.json
15
+ spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/tidy_house/place/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: 1
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ algo:
27
+ name: bc
28
+ lr: 0.0003
29
+ batch_size: 512
30
+ epochs: 10
31
+ eval_freq: 1
32
+ log_freq: 1
33
+ save_freq: 1
34
+ save_backup_ckpts: false
35
+ data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/tidy_house/place
36
+ max_cache_size: 300000
37
+ torch_deterministic: true
38
+ eval_episodes: 252
39
+ num_eval_envs: 252
40
+ logger:
41
+ workspace: mshab_exps
42
+ exp_name: rcad-tidy_house-place-all
43
+ clear_out: true
44
+ tensorboard: true
45
+ wandb: false
46
+ model_ckpt: "mshab_checkpoints/bc/tidy_house/place/all/policy.pt"
bc/tidy_house/place/all/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e947b7ab786abd6817536bd7af53897f97c89d1214d06ac0c025df5c915b0f2
3
+ size 238200850
rl/prepare_groceries/pick/002_master_chef_can/config.yml ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 2337
2
+ env:
3
+ env_id: PickSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/pick/train/002_master_chef_can.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
16
+ record_video: false
17
+ save_video_freq: null
18
+ info_on_video: false
19
+ extra_stat_keys: []
20
+ env_kwargs:
21
+ robot_force_mult: 0.001
22
+ robot_force_penalty_min: 0.2
23
+ target_randomization: false
24
+ eval_env:
25
+ env_id: PickSubtaskTrain-v0
26
+ num_envs: 189
27
+ max_episode_steps: 200
28
+ make_env: true
29
+ continuous_task: true
30
+ cat_state: true
31
+ cat_pixels: false
32
+ frame_stack: 3
33
+ stationary_base: false
34
+ stationary_torso: false
35
+ stationary_head: true
36
+ task_plan_fp: task_plans/prepare_groceries/pick/train/002_master_chef_can.json
37
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
38
+ record_video: false
39
+ save_video_freq: null
40
+ info_on_video: true
41
+ extra_stat_keys: []
42
+ env_kwargs:
43
+ robot_force_mult: 0.001
44
+ robot_force_penalty_min: 0.2
45
+ target_randomization: false
46
+ algo:
47
+ name: sac
48
+ replay_buffer_capacity: 995400
49
+ total_timesteps: 50000000
50
+ num_steps: 100
51
+ init_steps: 5000
52
+ batch_size: 512
53
+ critic_encoder_tau: 0.005
54
+ cnn_features:
55
+ - 32
56
+ - 64
57
+ - 128
58
+ - 256
59
+ cnn_filters:
60
+ - 3
61
+ - 3
62
+ - 3
63
+ - 3
64
+ cnn_strides:
65
+ - 2
66
+ - 2
67
+ - 2
68
+ - 2
69
+ cnn_padding: valid
70
+ encoder_pixels_feature_dim: 50
71
+ encoder_state_feature_dim: 50
72
+ detach_encoder: false
73
+ critic_hidden_dims:
74
+ - 256
75
+ - 256
76
+ - 256
77
+ critic_lr: 0.0003
78
+ critic_layer_norm: true
79
+ critic_dropout: null
80
+ critic_beta: 0.9
81
+ critic_tau: 0.005
82
+ critic_target_update_freq: 2
83
+ actor_hidden_dims:
84
+ - 256
85
+ - 256
86
+ - 256
87
+ actor_lr: 0.0003
88
+ actor_beta: 0.9
89
+ actor_log_std_min: -20
90
+ actor_log_std_max: 2
91
+ actor_update_freq: 2
92
+ gamma: 0.9
93
+ init_temperature: 0.1
94
+ alpha_lr: 0.0003
95
+ alpha_beta: 0.9
96
+ log_freq: 10000
97
+ save_freq: 100000000
98
+ eval_freq: 100000
99
+ torch_deterministic: true
100
+ eval_episodes: 189
101
+ num_envs: 63
102
+ num_eval_envs: 189
103
+ num_iterations: 793651
104
+ logger:
105
+ workspace: mshab_exps
106
+ exp_name: rcad-prepare_groceries-pick-002_master_chef_can
107
+ clear_out: true
108
+ tensorboard: true
109
+ wandb: false
110
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/002_master_chef_can/policy.pt"
rl/prepare_groceries/pick/002_master_chef_can/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb338580bfb74b7d50796705f8f5f5caccfe6d5e3a22a57485b5ccab9690ef98
3
+ size 55487432
rl/prepare_groceries/pick/003_cracker_box/config.yml ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 2337
2
+ env:
3
+ env_id: PickSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/pick/train/003_cracker_box.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
16
+ record_video: false
17
+ save_video_freq: null
18
+ info_on_video: false
19
+ extra_stat_keys: []
20
+ env_kwargs:
21
+ robot_force_mult: 0.001
22
+ robot_force_penalty_min: 0.2
23
+ target_randomization: false
24
+ eval_env:
25
+ env_id: PickSubtaskTrain-v0
26
+ num_envs: 189
27
+ max_episode_steps: 200
28
+ make_env: true
29
+ continuous_task: true
30
+ cat_state: true
31
+ cat_pixels: false
32
+ frame_stack: 3
33
+ stationary_base: false
34
+ stationary_torso: false
35
+ stationary_head: true
36
+ task_plan_fp: task_plans/prepare_groceries/pick/train/003_cracker_box.json
37
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
38
+ record_video: false
39
+ save_video_freq: null
40
+ info_on_video: true
41
+ extra_stat_keys: []
42
+ env_kwargs:
43
+ robot_force_mult: 0.001
44
+ robot_force_penalty_min: 0.2
45
+ target_randomization: false
46
+ algo:
47
+ name: sac
48
+ replay_buffer_capacity: 995400
49
+ total_timesteps: 50000000
50
+ num_steps: 100
51
+ init_steps: 5000
52
+ batch_size: 512
53
+ critic_encoder_tau: 0.005
54
+ cnn_features:
55
+ - 32
56
+ - 64
57
+ - 128
58
+ - 256
59
+ cnn_filters:
60
+ - 3
61
+ - 3
62
+ - 3
63
+ - 3
64
+ cnn_strides:
65
+ - 2
66
+ - 2
67
+ - 2
68
+ - 2
69
+ cnn_padding: valid
70
+ encoder_pixels_feature_dim: 50
71
+ encoder_state_feature_dim: 50
72
+ detach_encoder: false
73
+ critic_hidden_dims:
74
+ - 256
75
+ - 256
76
+ - 256
77
+ critic_lr: 0.0003
78
+ critic_layer_norm: true
79
+ critic_dropout: null
80
+ critic_beta: 0.9
81
+ critic_tau: 0.005
82
+ critic_target_update_freq: 2
83
+ actor_hidden_dims:
84
+ - 256
85
+ - 256
86
+ - 256
87
+ actor_lr: 0.0003
88
+ actor_beta: 0.9
89
+ actor_log_std_min: -20
90
+ actor_log_std_max: 2
91
+ actor_update_freq: 2
92
+ gamma: 0.9
93
+ init_temperature: 0.1
94
+ alpha_lr: 0.0003
95
+ alpha_beta: 0.9
96
+ log_freq: 10000
97
+ save_freq: 100000000
98
+ eval_freq: 100000
99
+ torch_deterministic: true
100
+ eval_episodes: 189
101
+ num_envs: 63
102
+ num_eval_envs: 189
103
+ num_iterations: 793651
104
+ logger:
105
+ workspace: mshab_exps
106
+ exp_name: rcad-prepare_groceries-pick-003_cracker_box
107
+ clear_out: true
108
+ tensorboard: true
109
+ wandb: false
110
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/003_cracker_box/policy.pt"
rl/prepare_groceries/pick/003_cracker_box/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d11038630d4ed9ccc9de2c8bc1522b8e104b8180c2c87cdf82e7cc10094c88c
3
+ size 55487432
rl/prepare_groceries/pick/004_sugar_box/config.yml ADDED
@@ -0,0 +1,111 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 2337
2
+ env:
3
+ env_id: PickSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/pick/train/004_sugar_box.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
16
+ record_video: false
17
+ save_video_freq: null
18
+ info_on_video: false
19
+ extra_stat_keys: []
20
+ env_kwargs:
21
+ robot_force_mult: 0.001
22
+ robot_force_penalty_min: 0.2
23
+ target_randomization: false
24
+ eval_env:
25
+ env_id: PickSubtaskTrain-v0
26
+ num_envs: 189
27
+ max_episode_steps: 200
28
+ make_env: true
29
+ continuous_task: true
30
+ cat_state: true
31
+ cat_pixels: false
32
+ frame_stack: 3
33
+ stationary_base: false
34
+ stationary_torso: false
35
+ stationary_head: true
36
+ task_plan_fp: task_plans/prepare_groceries/pick/train/004_sugar_box.json
37
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
38
+ record_video: false
39
+ save_video_freq: null
40
+ info_on_video: true
41
+ extra_stat_keys: []
42
+ env_kwargs:
43
+ robot_force_mult: 0.001
44
+ robot_force_penalty_min: 0.2
45
+ target_randomization: false
46
+ algo:
47
+ name: sac
48
+ replay_buffer_capacity: 995400
49
+ total_timesteps: 50000000
50
+ num_steps: 100
51
+ init_steps: 5000
52
+ batch_size: 512
53
+ critic_encoder_tau: 0.005
54
+ cnn_features:
55
+ - 32
56
+ - 64
57
+ - 128
58
+ - 256
59
+ cnn_filters:
60
+ - 3
61
+ - 3
62
+ - 3
63
+ - 3
64
+ cnn_strides:
65
+ - 2
66
+ - 2
67
+ - 2
68
+ - 2
69
+ cnn_padding: valid
70
+ encoder_pixels_feature_dim: 50
71
+ encoder_state_feature_dim: 50
72
+ detach_encoder: false
73
+ critic_hidden_dims:
74
+ - 256
75
+ - 256
76
+ - 256
77
+ critic_lr: 0.0003
78
+ critic_layer_norm: true
79
+ critic_dropout: null
80
+ critic_beta: 0.9
81
+ critic_tau: 0.005
82
+ critic_target_update_freq: 2
83
+ actor_hidden_dims:
84
+ - 256
85
+ - 256
86
+ - 256
87
+ actor_lr: 0.0003
88
+ actor_beta: 0.9
89
+ actor_log_std_min: -20
90
+ actor_log_std_max: 2
91
+ actor_update_freq: 2
92
+ gamma: 0.9
93
+ init_temperature: 0.1
94
+ alpha_lr: 0.0003
95
+ alpha_beta: 0.9
96
+ log_freq: 10000
97
+ save_freq: 100000000
98
+ eval_freq: 100000
99
+ torch_deterministic: true
100
+ save_backup_ckpts: false
101
+ eval_episodes: 189
102
+ num_envs: 63
103
+ num_eval_envs: 189
104
+ num_iterations: 793651
105
+ logger:
106
+ workspace: mshab_exps
107
+ exp_name: rcad-prepare_groceries-pick-004_sugar_box
108
+ clear_out: true
109
+ tensorboard: true
110
+ wandb: false
111
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/004_sugar_box/policy.pt"
rl/prepare_groceries/pick/004_sugar_box/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc935696ffe962efbe8e418312082245a90f43abd4a9aecaed1a130132478576
3
+ size 55487432
rl/prepare_groceries/pick/005_tomato_soup_can/config.yml ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 4682
2
+ env:
3
+ env_id: PickSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/pick/train/005_tomato_soup_can.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: null
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ eval_env:
27
+ env_id: PickSubtaskTrain-v0
28
+ num_envs: 189
29
+ max_episode_steps: 200
30
+ make_env: true
31
+ continuous_task: true
32
+ cat_state: true
33
+ cat_pixels: false
34
+ frame_stack: 3
35
+ stationary_base: false
36
+ stationary_torso: false
37
+ stationary_head: true
38
+ task_plan_fp: task_plans/prepare_groceries/pick/train/005_tomato_soup_can.json
39
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
40
+ record_video: false
41
+ debug_video: false
42
+ debug_video_gen: false
43
+ save_video_freq: null
44
+ info_on_video: true
45
+ extra_stat_keys: []
46
+ env_kwargs:
47
+ robot_force_mult: 0.001
48
+ robot_force_penalty_min: 0.2
49
+ target_randomization: false
50
+ algo:
51
+ name: sac
52
+ replay_buffer_capacity: 995400
53
+ total_timesteps: 50000000
54
+ num_steps: 100
55
+ init_steps: 5000
56
+ batch_size: 512
57
+ critic_encoder_tau: 0.005
58
+ cnn_features:
59
+ - 32
60
+ - 64
61
+ - 128
62
+ - 256
63
+ cnn_filters:
64
+ - 3
65
+ - 3
66
+ - 3
67
+ - 3
68
+ cnn_strides:
69
+ - 2
70
+ - 2
71
+ - 2
72
+ - 2
73
+ cnn_padding: valid
74
+ encoder_pixels_feature_dim: 50
75
+ encoder_state_feature_dim: 50
76
+ detach_encoder: false
77
+ critic_hidden_dims:
78
+ - 256
79
+ - 256
80
+ - 256
81
+ critic_lr: 0.0003
82
+ critic_layer_norm: true
83
+ critic_dropout: null
84
+ critic_beta: 0.9
85
+ critic_tau: 0.005
86
+ critic_target_update_freq: 2
87
+ actor_hidden_dims:
88
+ - 256
89
+ - 256
90
+ - 256
91
+ actor_lr: 0.0003
92
+ actor_beta: 0.9
93
+ actor_log_std_min: -20
94
+ actor_log_std_max: 2
95
+ actor_update_freq: 2
96
+ gamma: 0.9
97
+ init_temperature: 0.1
98
+ alpha_lr: 0.0003
99
+ alpha_beta: 0.9
100
+ log_freq: 10000
101
+ save_freq: 100000
102
+ eval_freq: 100000
103
+ torch_deterministic: true
104
+ save_backup_ckpts: false
105
+ eval_episodes: 189
106
+ num_envs: 63
107
+ num_eval_envs: 189
108
+ num_iterations: 793651
109
+ logger:
110
+ workspace: mshab_exps
111
+ exp_name: rcad-prepare_groceries-pick-005_tomato_soup_can
112
+ clear_out: true
113
+ tensorboard: true
114
+ wandb: false
115
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/005_tomato_soup_can/policy.pt"
rl/prepare_groceries/pick/005_tomato_soup_can/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77288352508ea9e9aab0499c0a8a1bfd680cba704c98d36d8bbfbc84be8f7c4c
3
+ size 55487706
rl/prepare_groceries/pick/007_tuna_fish_can/config.yml ADDED
@@ -0,0 +1,111 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 2337
2
+ env:
3
+ env_id: PickSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/pick/train/007_tuna_fish_can.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
16
+ record_video: false
17
+ save_video_freq: null
18
+ info_on_video: false
19
+ extra_stat_keys: []
20
+ env_kwargs:
21
+ robot_force_mult: 0.001
22
+ robot_force_penalty_min: 0.2
23
+ target_randomization: false
24
+ eval_env:
25
+ env_id: PickSubtaskTrain-v0
26
+ num_envs: 189
27
+ max_episode_steps: 200
28
+ make_env: true
29
+ continuous_task: true
30
+ cat_state: true
31
+ cat_pixels: false
32
+ frame_stack: 3
33
+ stationary_base: false
34
+ stationary_torso: false
35
+ stationary_head: true
36
+ task_plan_fp: task_plans/prepare_groceries/pick/train/007_tuna_fish_can.json
37
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
38
+ record_video: false
39
+ save_video_freq: null
40
+ info_on_video: true
41
+ extra_stat_keys: []
42
+ env_kwargs:
43
+ robot_force_mult: 0.001
44
+ robot_force_penalty_min: 0.2
45
+ target_randomization: false
46
+ algo:
47
+ name: sac
48
+ replay_buffer_capacity: 995400
49
+ total_timesteps: 50000000
50
+ num_steps: 100
51
+ init_steps: 5000
52
+ batch_size: 512
53
+ critic_encoder_tau: 0.005
54
+ cnn_features:
55
+ - 32
56
+ - 64
57
+ - 128
58
+ - 256
59
+ cnn_filters:
60
+ - 3
61
+ - 3
62
+ - 3
63
+ - 3
64
+ cnn_strides:
65
+ - 2
66
+ - 2
67
+ - 2
68
+ - 2
69
+ cnn_padding: valid
70
+ encoder_pixels_feature_dim: 50
71
+ encoder_state_feature_dim: 50
72
+ detach_encoder: false
73
+ critic_hidden_dims:
74
+ - 256
75
+ - 256
76
+ - 256
77
+ critic_lr: 0.0003
78
+ critic_layer_norm: true
79
+ critic_dropout: null
80
+ critic_beta: 0.9
81
+ critic_tau: 0.005
82
+ critic_target_update_freq: 2
83
+ actor_hidden_dims:
84
+ - 256
85
+ - 256
86
+ - 256
87
+ actor_lr: 0.0003
88
+ actor_beta: 0.9
89
+ actor_log_std_min: -20
90
+ actor_log_std_max: 2
91
+ actor_update_freq: 2
92
+ gamma: 0.9
93
+ init_temperature: 0.1
94
+ alpha_lr: 0.0003
95
+ alpha_beta: 0.9
96
+ log_freq: 10000
97
+ save_freq: 100000000
98
+ eval_freq: 100000
99
+ torch_deterministic: true
100
+ save_backup_ckpts: false
101
+ eval_episodes: 189
102
+ num_envs: 63
103
+ num_eval_envs: 189
104
+ num_iterations: 793651
105
+ logger:
106
+ workspace: mshab_exps
107
+ exp_name: rcad-prepare_groceries-pick-007_tuna_fish_can
108
+ clear_out: true
109
+ tensorboard: true
110
+ wandb: false
111
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/007_tuna_fish_can/policy.pt"
rl/prepare_groceries/pick/007_tuna_fish_can/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:caf45664947dc617cc252782f7883395cc1b50472c313864220444ffe9eb2701
3
+ size 55487432
rl/prepare_groceries/pick/008_pudding_box/config.yml ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 5227
2
+ env:
3
+ env_id: PickSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/pick/train/008_pudding_box.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ save_video_freq: null
19
+ info_on_video: false
20
+ extra_stat_keys: []
21
+ env_kwargs:
22
+ robot_force_mult: 0.001
23
+ robot_force_penalty_min: 0.2
24
+ target_randomization: false
25
+ eval_env:
26
+ env_id: PickSubtaskTrain-v0
27
+ num_envs: 189
28
+ max_episode_steps: 200
29
+ make_env: true
30
+ continuous_task: true
31
+ cat_state: true
32
+ cat_pixels: false
33
+ frame_stack: 3
34
+ stationary_base: false
35
+ stationary_torso: false
36
+ stationary_head: true
37
+ task_plan_fp: task_plans/prepare_groceries/pick/train/008_pudding_box.json
38
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
39
+ record_video: false
40
+ debug_video: false
41
+ save_video_freq: null
42
+ info_on_video: true
43
+ extra_stat_keys: []
44
+ env_kwargs:
45
+ robot_force_mult: 0.001
46
+ robot_force_penalty_min: 0.2
47
+ target_randomization: false
48
+ algo:
49
+ name: sac
50
+ replay_buffer_capacity: 995400
51
+ total_timesteps: 50000000
52
+ num_steps: 100
53
+ init_steps: 5000
54
+ batch_size: 512
55
+ critic_encoder_tau: 0.005
56
+ cnn_features:
57
+ - 32
58
+ - 64
59
+ - 128
60
+ - 256
61
+ cnn_filters:
62
+ - 3
63
+ - 3
64
+ - 3
65
+ - 3
66
+ cnn_strides:
67
+ - 2
68
+ - 2
69
+ - 2
70
+ - 2
71
+ cnn_padding: valid
72
+ encoder_pixels_feature_dim: 50
73
+ encoder_state_feature_dim: 50
74
+ detach_encoder: false
75
+ critic_hidden_dims:
76
+ - 256
77
+ - 256
78
+ - 256
79
+ critic_lr: 0.0003
80
+ critic_layer_norm: true
81
+ critic_dropout: null
82
+ critic_beta: 0.9
83
+ critic_tau: 0.005
84
+ critic_target_update_freq: 2
85
+ actor_hidden_dims:
86
+ - 256
87
+ - 256
88
+ - 256
89
+ actor_lr: 0.0003
90
+ actor_beta: 0.9
91
+ actor_log_std_min: -20
92
+ actor_log_std_max: 2
93
+ actor_update_freq: 2
94
+ gamma: 0.9
95
+ init_temperature: 0.1
96
+ alpha_lr: 0.0003
97
+ alpha_beta: 0.9
98
+ log_freq: 10000
99
+ save_freq: 100000000
100
+ eval_freq: 100000
101
+ torch_deterministic: true
102
+ save_backup_ckpts: false
103
+ eval_episodes: 189
104
+ num_envs: 63
105
+ num_eval_envs: 189
106
+ num_iterations: 793651
107
+ logger:
108
+ workspace: mshab_exps
109
+ exp_name: rcad-prepare_groceries-pick-008_pudding_box
110
+ clear_out: true
111
+ tensorboard: true
112
+ wandb: false
113
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/008_pudding_box/policy.pt"
rl/prepare_groceries/pick/008_pudding_box/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:092289867d462c7818abc0d452207edb305cf12c4be251b26eba6396377ffdc3
3
+ size 55487432
rl/prepare_groceries/pick/009_gelatin_box/config.yml ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 4682
2
+ env:
3
+ env_id: PickSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/pick/train/009_gelatin_box.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ save_video_freq: null
19
+ info_on_video: false
20
+ extra_stat_keys: []
21
+ env_kwargs:
22
+ robot_force_mult: 0.001
23
+ robot_force_penalty_min: 0.2
24
+ target_randomization: false
25
+ eval_env:
26
+ env_id: PickSubtaskTrain-v0
27
+ num_envs: 189
28
+ max_episode_steps: 200
29
+ make_env: true
30
+ continuous_task: true
31
+ cat_state: true
32
+ cat_pixels: false
33
+ frame_stack: 3
34
+ stationary_base: false
35
+ stationary_torso: false
36
+ stationary_head: true
37
+ task_plan_fp: task_plans/prepare_groceries/pick/train/009_gelatin_box.json
38
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
39
+ record_video: false
40
+ debug_video: false
41
+ save_video_freq: null
42
+ info_on_video: true
43
+ extra_stat_keys: []
44
+ env_kwargs:
45
+ robot_force_mult: 0.001
46
+ robot_force_penalty_min: 0.2
47
+ target_randomization: false
48
+ algo:
49
+ name: sac
50
+ replay_buffer_capacity: 995400
51
+ total_timesteps: 50000000
52
+ num_steps: 100
53
+ init_steps: 5000
54
+ batch_size: 512
55
+ critic_encoder_tau: 0.005
56
+ cnn_features:
57
+ - 32
58
+ - 64
59
+ - 128
60
+ - 256
61
+ cnn_filters:
62
+ - 3
63
+ - 3
64
+ - 3
65
+ - 3
66
+ cnn_strides:
67
+ - 2
68
+ - 2
69
+ - 2
70
+ - 2
71
+ cnn_padding: valid
72
+ encoder_pixels_feature_dim: 50
73
+ encoder_state_feature_dim: 50
74
+ detach_encoder: false
75
+ critic_hidden_dims:
76
+ - 256
77
+ - 256
78
+ - 256
79
+ critic_lr: 0.0003
80
+ critic_layer_norm: true
81
+ critic_dropout: null
82
+ critic_beta: 0.9
83
+ critic_tau: 0.005
84
+ critic_target_update_freq: 2
85
+ actor_hidden_dims:
86
+ - 256
87
+ - 256
88
+ - 256
89
+ actor_lr: 0.0003
90
+ actor_beta: 0.9
91
+ actor_log_std_min: -20
92
+ actor_log_std_max: 2
93
+ actor_update_freq: 2
94
+ gamma: 0.9
95
+ init_temperature: 0.1
96
+ alpha_lr: 0.0003
97
+ alpha_beta: 0.9
98
+ log_freq: 10000
99
+ save_freq: 100000000
100
+ eval_freq: 100000
101
+ torch_deterministic: true
102
+ save_backup_ckpts: false
103
+ eval_episodes: 189
104
+ num_envs: 63
105
+ num_eval_envs: 189
106
+ num_iterations: 793651
107
+ logger:
108
+ workspace: mshab_exps
109
+ exp_name: rcad-prepare_groceries-pick-009_gelatin_box
110
+ clear_out: true
111
+ tensorboard: true
112
+ wandb: false
113
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/009_gelatin_box/policy.pt"
rl/prepare_groceries/pick/009_gelatin_box/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:832117171b3829047b6f2f661abd769bb17ef6c47fb580572478d82f8f034ee3
3
+ size 55487432
rl/prepare_groceries/pick/010_potted_meat_can/config.yml ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 2337
2
+ env:
3
+ env_id: PickSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/pick/train/010_potted_meat_can.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
16
+ record_video: false
17
+ save_video_freq: null
18
+ info_on_video: false
19
+ extra_stat_keys: []
20
+ env_kwargs:
21
+ robot_force_mult: 0.001
22
+ robot_force_penalty_min: 0.2
23
+ target_randomization: false
24
+ eval_env:
25
+ env_id: PickSubtaskTrain-v0
26
+ num_envs: 189
27
+ max_episode_steps: 200
28
+ make_env: true
29
+ continuous_task: true
30
+ cat_state: true
31
+ cat_pixels: false
32
+ frame_stack: 3
33
+ stationary_base: false
34
+ stationary_torso: false
35
+ stationary_head: true
36
+ task_plan_fp: task_plans/prepare_groceries/pick/train/010_potted_meat_can.json
37
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
38
+ record_video: false
39
+ save_video_freq: null
40
+ info_on_video: true
41
+ extra_stat_keys: []
42
+ env_kwargs:
43
+ robot_force_mult: 0.001
44
+ robot_force_penalty_min: 0.2
45
+ target_randomization: false
46
+ algo:
47
+ name: sac
48
+ replay_buffer_capacity: 995400
49
+ total_timesteps: 50000000
50
+ num_steps: 100
51
+ init_steps: 5000
52
+ batch_size: 512
53
+ critic_encoder_tau: 0.005
54
+ cnn_features:
55
+ - 32
56
+ - 64
57
+ - 128
58
+ - 256
59
+ cnn_filters:
60
+ - 3
61
+ - 3
62
+ - 3
63
+ - 3
64
+ cnn_strides:
65
+ - 2
66
+ - 2
67
+ - 2
68
+ - 2
69
+ cnn_padding: valid
70
+ encoder_pixels_feature_dim: 50
71
+ encoder_state_feature_dim: 50
72
+ detach_encoder: false
73
+ critic_hidden_dims:
74
+ - 256
75
+ - 256
76
+ - 256
77
+ critic_lr: 0.0003
78
+ critic_layer_norm: true
79
+ critic_dropout: null
80
+ critic_beta: 0.9
81
+ critic_tau: 0.005
82
+ critic_target_update_freq: 2
83
+ actor_hidden_dims:
84
+ - 256
85
+ - 256
86
+ - 256
87
+ actor_lr: 0.0003
88
+ actor_beta: 0.9
89
+ actor_log_std_min: -20
90
+ actor_log_std_max: 2
91
+ actor_update_freq: 2
92
+ gamma: 0.9
93
+ init_temperature: 0.1
94
+ alpha_lr: 0.0003
95
+ alpha_beta: 0.9
96
+ log_freq: 10000
97
+ save_freq: 100000000
98
+ eval_freq: 100000
99
+ torch_deterministic: true
100
+ eval_episodes: 189
101
+ num_envs: 63
102
+ num_eval_envs: 189
103
+ num_iterations: 793651
104
+ logger:
105
+ workspace: mshab_exps
106
+ exp_name: rcad-prepare_groceries-pick-010_potted_meat_can
107
+ clear_out: true
108
+ tensorboard: true
109
+ wandb: false
110
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/010_potted_meat_can/policy.pt"
rl/prepare_groceries/pick/010_potted_meat_can/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a04f8e0243b9ba59f50e2ae07d9269f34334d95da45e88897f1cd10d6dab5824
3
+ size 55487432
rl/prepare_groceries/pick/024_bowl/config.yml ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 4682
2
+ env:
3
+ env_id: PickSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/pick/train/024_bowl.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: null
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ eval_env:
27
+ env_id: PickSubtaskTrain-v0
28
+ num_envs: 189
29
+ max_episode_steps: 200
30
+ make_env: true
31
+ continuous_task: true
32
+ cat_state: true
33
+ cat_pixels: false
34
+ frame_stack: 3
35
+ stationary_base: false
36
+ stationary_torso: false
37
+ stationary_head: true
38
+ task_plan_fp: task_plans/prepare_groceries/pick/train/024_bowl.json
39
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
40
+ record_video: false
41
+ debug_video: false
42
+ debug_video_gen: false
43
+ save_video_freq: null
44
+ info_on_video: true
45
+ extra_stat_keys: []
46
+ env_kwargs:
47
+ robot_force_mult: 0.001
48
+ robot_force_penalty_min: 0.2
49
+ target_randomization: false
50
+ algo:
51
+ name: sac
52
+ replay_buffer_capacity: 995400
53
+ total_timesteps: 50000000
54
+ num_steps: 100
55
+ init_steps: 5000
56
+ batch_size: 512
57
+ critic_encoder_tau: 0.005
58
+ cnn_features:
59
+ - 32
60
+ - 64
61
+ - 128
62
+ - 256
63
+ cnn_filters:
64
+ - 3
65
+ - 3
66
+ - 3
67
+ - 3
68
+ cnn_strides:
69
+ - 2
70
+ - 2
71
+ - 2
72
+ - 2
73
+ cnn_padding: valid
74
+ encoder_pixels_feature_dim: 50
75
+ encoder_state_feature_dim: 50
76
+ detach_encoder: false
77
+ critic_hidden_dims:
78
+ - 256
79
+ - 256
80
+ - 256
81
+ critic_lr: 0.0003
82
+ critic_layer_norm: true
83
+ critic_dropout: null
84
+ critic_beta: 0.9
85
+ critic_tau: 0.005
86
+ critic_target_update_freq: 2
87
+ actor_hidden_dims:
88
+ - 256
89
+ - 256
90
+ - 256
91
+ actor_lr: 0.0003
92
+ actor_beta: 0.9
93
+ actor_log_std_min: -20
94
+ actor_log_std_max: 2
95
+ actor_update_freq: 2
96
+ gamma: 0.9
97
+ init_temperature: 0.1
98
+ alpha_lr: 0.0003
99
+ alpha_beta: 0.9
100
+ log_freq: 10000
101
+ save_freq: 100000
102
+ eval_freq: 100000
103
+ torch_deterministic: true
104
+ save_backup_ckpts: false
105
+ eval_episodes: 189
106
+ num_envs: 63
107
+ num_eval_envs: 189
108
+ num_iterations: 793651
109
+ logger:
110
+ workspace: mshab_exps
111
+ exp_name: rcad-prepare_groceries-pick-024_bowl
112
+ clear_out: true
113
+ tensorboard: true
114
+ wandb: false
115
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/024_bowl/policy.pt"
rl/prepare_groceries/pick/024_bowl/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:814686bd77abb5defd041b3ebf8edbdce26701255125843601ab03430e0d8180
3
+ size 55487706
rl/prepare_groceries/pick/all/config.yml ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 4682
2
+ env:
3
+ env_id: PickSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/pick/train/all.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ save_video_freq: null
19
+ info_on_video: false
20
+ extra_stat_keys: []
21
+ env_kwargs:
22
+ robot_force_mult: 0.001
23
+ robot_force_penalty_min: 0.2
24
+ target_randomization: false
25
+ eval_env:
26
+ env_id: PickSubtaskTrain-v0
27
+ num_envs: 189
28
+ max_episode_steps: 200
29
+ make_env: true
30
+ continuous_task: true
31
+ cat_state: true
32
+ cat_pixels: false
33
+ frame_stack: 3
34
+ stationary_base: false
35
+ stationary_torso: false
36
+ stationary_head: true
37
+ task_plan_fp: task_plans/prepare_groceries/pick/train/all.json
38
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
39
+ record_video: false
40
+ debug_video: false
41
+ save_video_freq: null
42
+ info_on_video: true
43
+ extra_stat_keys: []
44
+ env_kwargs:
45
+ robot_force_mult: 0.001
46
+ robot_force_penalty_min: 0.2
47
+ target_randomization: false
48
+ algo:
49
+ name: sac
50
+ replay_buffer_capacity: 995400
51
+ total_timesteps: 50000000
52
+ num_steps: 100
53
+ init_steps: 5000
54
+ batch_size: 512
55
+ critic_encoder_tau: 0.005
56
+ cnn_features:
57
+ - 32
58
+ - 64
59
+ - 128
60
+ - 256
61
+ cnn_filters:
62
+ - 3
63
+ - 3
64
+ - 3
65
+ - 3
66
+ cnn_strides:
67
+ - 2
68
+ - 2
69
+ - 2
70
+ - 2
71
+ cnn_padding: valid
72
+ encoder_pixels_feature_dim: 50
73
+ encoder_state_feature_dim: 50
74
+ detach_encoder: false
75
+ critic_hidden_dims:
76
+ - 256
77
+ - 256
78
+ - 256
79
+ critic_lr: 0.0003
80
+ critic_layer_norm: true
81
+ critic_dropout: null
82
+ critic_beta: 0.9
83
+ critic_tau: 0.005
84
+ critic_target_update_freq: 2
85
+ actor_hidden_dims:
86
+ - 256
87
+ - 256
88
+ - 256
89
+ actor_lr: 0.0003
90
+ actor_beta: 0.9
91
+ actor_log_std_min: -20
92
+ actor_log_std_max: 2
93
+ actor_update_freq: 2
94
+ gamma: 0.9
95
+ init_temperature: 0.1
96
+ alpha_lr: 0.0003
97
+ alpha_beta: 0.9
98
+ log_freq: 10000
99
+ save_freq: 100000000
100
+ eval_freq: 100000
101
+ torch_deterministic: true
102
+ save_backup_ckpts: false
103
+ eval_episodes: 189
104
+ num_envs: 63
105
+ num_eval_envs: 189
106
+ num_iterations: 793651
107
+ logger:
108
+ workspace: mshab_exps
109
+ exp_name: rcad-prepare_groceries-pick-all
110
+ clear_out: true
111
+ tensorboard: true
112
+ wandb: false
113
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/all/policy.pt"
rl/prepare_groceries/pick/all/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29ae12a7bbac520ae4b0c46abfa955da294b6a09e5467abe6ecfbf9d672de52b
3
+ size 55487432
rl/prepare_groceries/place/002_master_chef_can/config.yml ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 2337
2
+ env:
3
+ env_id: PlaceSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/place/train/002_master_chef_can.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: null
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ eval_env:
27
+ env_id: PlaceSubtaskTrain-v0
28
+ num_envs: 189
29
+ max_episode_steps: 200
30
+ make_env: true
31
+ continuous_task: true
32
+ cat_state: true
33
+ cat_pixels: false
34
+ frame_stack: 3
35
+ stationary_base: false
36
+ stationary_torso: false
37
+ stationary_head: true
38
+ task_plan_fp: task_plans/prepare_groceries/place/train/002_master_chef_can.json
39
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
40
+ record_video: false
41
+ debug_video: false
42
+ debug_video_gen: false
43
+ save_video_freq: null
44
+ info_on_video: true
45
+ extra_stat_keys: []
46
+ env_kwargs:
47
+ robot_force_mult: 0.001
48
+ robot_force_penalty_min: 0.2
49
+ target_randomization: false
50
+ algo:
51
+ name: sac
52
+ replay_buffer_capacity: 995400
53
+ total_timesteps: 50000000
54
+ num_steps: 100
55
+ init_steps: 5000
56
+ batch_size: 512
57
+ critic_encoder_tau: 0.005
58
+ cnn_features:
59
+ - 32
60
+ - 64
61
+ - 128
62
+ - 256
63
+ cnn_filters:
64
+ - 3
65
+ - 3
66
+ - 3
67
+ - 3
68
+ cnn_strides:
69
+ - 2
70
+ - 2
71
+ - 2
72
+ - 2
73
+ cnn_padding: valid
74
+ encoder_pixels_feature_dim: 50
75
+ encoder_state_feature_dim: 50
76
+ detach_encoder: false
77
+ critic_hidden_dims:
78
+ - 256
79
+ - 256
80
+ - 256
81
+ critic_lr: 0.0003
82
+ critic_layer_norm: true
83
+ critic_dropout: null
84
+ critic_beta: 0.9
85
+ critic_tau: 0.005
86
+ critic_target_update_freq: 2
87
+ actor_hidden_dims:
88
+ - 256
89
+ - 256
90
+ - 256
91
+ actor_lr: 0.0003
92
+ actor_beta: 0.9
93
+ actor_log_std_min: -20
94
+ actor_log_std_max: 2
95
+ actor_update_freq: 2
96
+ gamma: 0.9
97
+ init_temperature: 0.1
98
+ alpha_lr: 0.0003
99
+ alpha_beta: 0.9
100
+ log_freq: 10000
101
+ save_freq: 100000
102
+ eval_freq: 100000
103
+ torch_deterministic: true
104
+ save_backup_ckpts: false
105
+ eval_episodes: 189
106
+ num_envs: 63
107
+ num_eval_envs: 189
108
+ num_iterations: 793651
109
+ logger:
110
+ workspace: mshab_exps
111
+ exp_name: rcad-prepare_groceries-place-002_master_chef_can
112
+ clear_out: true
113
+ tensorboard: true
114
+ wandb: false
115
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/place/002_master_chef_can/policy.pt"
rl/prepare_groceries/place/002_master_chef_can/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab001cd4b88ee6cf115c6c65a67c40b9953b347610540b17b3d524e3b82f7bde
3
+ size 55487706
rl/prepare_groceries/place/003_cracker_box/config.yml ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 2337
2
+ env:
3
+ env_id: PlaceSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/place/train/003_cracker_box.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: null
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ eval_env:
27
+ env_id: PlaceSubtaskTrain-v0
28
+ num_envs: 189
29
+ max_episode_steps: 200
30
+ make_env: true
31
+ continuous_task: true
32
+ cat_state: true
33
+ cat_pixels: false
34
+ frame_stack: 3
35
+ stationary_base: false
36
+ stationary_torso: false
37
+ stationary_head: true
38
+ task_plan_fp: task_plans/prepare_groceries/place/train/003_cracker_box.json
39
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
40
+ record_video: false
41
+ debug_video: false
42
+ debug_video_gen: false
43
+ save_video_freq: null
44
+ info_on_video: true
45
+ extra_stat_keys: []
46
+ env_kwargs:
47
+ robot_force_mult: 0.001
48
+ robot_force_penalty_min: 0.2
49
+ target_randomization: false
50
+ algo:
51
+ name: sac
52
+ replay_buffer_capacity: 995400
53
+ total_timesteps: 50000000
54
+ num_steps: 100
55
+ init_steps: 5000
56
+ batch_size: 512
57
+ critic_encoder_tau: 0.005
58
+ cnn_features:
59
+ - 32
60
+ - 64
61
+ - 128
62
+ - 256
63
+ cnn_filters:
64
+ - 3
65
+ - 3
66
+ - 3
67
+ - 3
68
+ cnn_strides:
69
+ - 2
70
+ - 2
71
+ - 2
72
+ - 2
73
+ cnn_padding: valid
74
+ encoder_pixels_feature_dim: 50
75
+ encoder_state_feature_dim: 50
76
+ detach_encoder: false
77
+ critic_hidden_dims:
78
+ - 256
79
+ - 256
80
+ - 256
81
+ critic_lr: 0.0003
82
+ critic_layer_norm: true
83
+ critic_dropout: null
84
+ critic_beta: 0.9
85
+ critic_tau: 0.005
86
+ critic_target_update_freq: 2
87
+ actor_hidden_dims:
88
+ - 256
89
+ - 256
90
+ - 256
91
+ actor_lr: 0.0003
92
+ actor_beta: 0.9
93
+ actor_log_std_min: -20
94
+ actor_log_std_max: 2
95
+ actor_update_freq: 2
96
+ gamma: 0.9
97
+ init_temperature: 0.1
98
+ alpha_lr: 0.0003
99
+ alpha_beta: 0.9
100
+ log_freq: 10000
101
+ save_freq: 100000
102
+ eval_freq: 100000
103
+ torch_deterministic: true
104
+ save_backup_ckpts: false
105
+ eval_episodes: 189
106
+ num_envs: 63
107
+ num_eval_envs: 189
108
+ num_iterations: 793651
109
+ logger:
110
+ workspace: mshab_exps
111
+ exp_name: rcad-prepare_groceries-place-003_cracker_box
112
+ clear_out: true
113
+ tensorboard: true
114
+ wandb: false
115
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/place/003_cracker_box/policy.pt"
rl/prepare_groceries/place/003_cracker_box/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc5a60777bb9cbbc3287de2b66e908913ffde5ed2c289096bd06702cbcf6f09a
3
+ size 55487706
rl/prepare_groceries/place/004_sugar_box/config.yml ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 4682
2
+ env:
3
+ env_id: PlaceSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/place/train/004_sugar_box.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: null
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ eval_env:
27
+ env_id: PlaceSubtaskTrain-v0
28
+ num_envs: 189
29
+ max_episode_steps: 200
30
+ make_env: true
31
+ continuous_task: true
32
+ cat_state: true
33
+ cat_pixels: false
34
+ frame_stack: 3
35
+ stationary_base: false
36
+ stationary_torso: false
37
+ stationary_head: true
38
+ task_plan_fp: task_plans/prepare_groceries/place/train/004_sugar_box.json
39
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
40
+ record_video: false
41
+ debug_video: false
42
+ debug_video_gen: false
43
+ save_video_freq: null
44
+ info_on_video: true
45
+ extra_stat_keys: []
46
+ env_kwargs:
47
+ robot_force_mult: 0.001
48
+ robot_force_penalty_min: 0.2
49
+ target_randomization: false
50
+ algo:
51
+ name: sac
52
+ replay_buffer_capacity: 995400
53
+ total_timesteps: 25000000
54
+ num_steps: 100
55
+ init_steps: 5000
56
+ batch_size: 512
57
+ critic_encoder_tau: 0.005
58
+ cnn_features:
59
+ - 32
60
+ - 64
61
+ - 128
62
+ - 256
63
+ cnn_filters:
64
+ - 3
65
+ - 3
66
+ - 3
67
+ - 3
68
+ cnn_strides:
69
+ - 2
70
+ - 2
71
+ - 2
72
+ - 2
73
+ cnn_padding: valid
74
+ encoder_pixels_feature_dim: 50
75
+ encoder_state_feature_dim: 50
76
+ detach_encoder: false
77
+ critic_hidden_dims:
78
+ - 256
79
+ - 256
80
+ - 256
81
+ critic_lr: 0.0003
82
+ critic_layer_norm: true
83
+ critic_dropout: null
84
+ critic_beta: 0.9
85
+ critic_tau: 0.005
86
+ critic_target_update_freq: 2
87
+ actor_hidden_dims:
88
+ - 256
89
+ - 256
90
+ - 256
91
+ actor_lr: 0.0003
92
+ actor_beta: 0.9
93
+ actor_log_std_min: -20
94
+ actor_log_std_max: 2
95
+ actor_update_freq: 2
96
+ gamma: 0.9
97
+ init_temperature: 0.1
98
+ alpha_lr: 0.0003
99
+ alpha_beta: 0.9
100
+ log_freq: 10000
101
+ save_freq: 100000
102
+ eval_freq: 100000
103
+ torch_deterministic: true
104
+ save_backup_ckpts: false
105
+ eval_episodes: 189
106
+ num_envs: 63
107
+ num_eval_envs: 189
108
+ num_iterations: 396826
109
+ logger:
110
+ workspace: mshab_exps
111
+ exp_name: rcad-prepare_groceries-place-004_sugar_box
112
+ clear_out: true
113
+ tensorboard: true
114
+ wandb: false
115
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/place/004_sugar_box/policy.pt"
rl/prepare_groceries/place/004_sugar_box/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b9cace25d850c05712488fd4cbeb409c08c2f73cd0fcfa253e411b434a7a1c2
3
+ size 55487706
rl/prepare_groceries/place/005_tomato_soup_can/config.yml ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 2337
2
+ env:
3
+ env_id: PlaceSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/place/train/005_tomato_soup_can.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: null
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ eval_env:
27
+ env_id: PlaceSubtaskTrain-v0
28
+ num_envs: 189
29
+ max_episode_steps: 200
30
+ make_env: true
31
+ continuous_task: true
32
+ cat_state: true
33
+ cat_pixels: false
34
+ frame_stack: 3
35
+ stationary_base: false
36
+ stationary_torso: false
37
+ stationary_head: true
38
+ task_plan_fp: task_plans/prepare_groceries/place/train/005_tomato_soup_can.json
39
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
40
+ record_video: false
41
+ debug_video: false
42
+ debug_video_gen: false
43
+ save_video_freq: null
44
+ info_on_video: true
45
+ extra_stat_keys: []
46
+ env_kwargs:
47
+ robot_force_mult: 0.001
48
+ robot_force_penalty_min: 0.2
49
+ target_randomization: false
50
+ algo:
51
+ name: sac
52
+ replay_buffer_capacity: 995400
53
+ total_timesteps: 50000000
54
+ num_steps: 100
55
+ init_steps: 5000
56
+ batch_size: 512
57
+ critic_encoder_tau: 0.005
58
+ cnn_features:
59
+ - 32
60
+ - 64
61
+ - 128
62
+ - 256
63
+ cnn_filters:
64
+ - 3
65
+ - 3
66
+ - 3
67
+ - 3
68
+ cnn_strides:
69
+ - 2
70
+ - 2
71
+ - 2
72
+ - 2
73
+ cnn_padding: valid
74
+ encoder_pixels_feature_dim: 50
75
+ encoder_state_feature_dim: 50
76
+ detach_encoder: false
77
+ critic_hidden_dims:
78
+ - 256
79
+ - 256
80
+ - 256
81
+ critic_lr: 0.0003
82
+ critic_layer_norm: true
83
+ critic_dropout: null
84
+ critic_beta: 0.9
85
+ critic_tau: 0.005
86
+ critic_target_update_freq: 2
87
+ actor_hidden_dims:
88
+ - 256
89
+ - 256
90
+ - 256
91
+ actor_lr: 0.0003
92
+ actor_beta: 0.9
93
+ actor_log_std_min: -20
94
+ actor_log_std_max: 2
95
+ actor_update_freq: 2
96
+ gamma: 0.9
97
+ init_temperature: 0.1
98
+ alpha_lr: 0.0003
99
+ alpha_beta: 0.9
100
+ log_freq: 10000
101
+ save_freq: 100000
102
+ eval_freq: 100000
103
+ torch_deterministic: true
104
+ save_backup_ckpts: false
105
+ eval_episodes: 189
106
+ num_envs: 63
107
+ num_eval_envs: 189
108
+ num_iterations: 793651
109
+ logger:
110
+ workspace: mshab_exps
111
+ exp_name: rcad-prepare_groceries-place-005_tomato_soup_can
112
+ clear_out: true
113
+ tensorboard: true
114
+ wandb: false
115
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/place/005_tomato_soup_can/policy.pt"
rl/prepare_groceries/place/005_tomato_soup_can/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbe87309a420c505231a349b10c2d27e25e5cf481f3b485f301e7267244cebfe
3
+ size 55487706
rl/prepare_groceries/place/007_tuna_fish_can/config.yml ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 2337
2
+ env:
3
+ env_id: PlaceSubtaskTrain-v0
4
+ num_envs: 63
5
+ max_episode_steps: 100
6
+ make_env: true
7
+ continuous_task: true
8
+ cat_state: true
9
+ cat_pixels: false
10
+ frame_stack: 3
11
+ stationary_base: false
12
+ stationary_torso: false
13
+ stationary_head: true
14
+ task_plan_fp: task_plans/prepare_groceries/place/train/007_tuna_fish_can.json
15
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
16
+ record_video: false
17
+ debug_video: false
18
+ debug_video_gen: false
19
+ save_video_freq: null
20
+ info_on_video: false
21
+ extra_stat_keys: []
22
+ env_kwargs:
23
+ robot_force_mult: 0.001
24
+ robot_force_penalty_min: 0.2
25
+ target_randomization: false
26
+ eval_env:
27
+ env_id: PlaceSubtaskTrain-v0
28
+ num_envs: 189
29
+ max_episode_steps: 200
30
+ make_env: true
31
+ continuous_task: true
32
+ cat_state: true
33
+ cat_pixels: false
34
+ frame_stack: 3
35
+ stationary_base: false
36
+ stationary_torso: false
37
+ stationary_head: true
38
+ task_plan_fp: task_plans/prepare_groceries/place/train/007_tuna_fish_can.json
39
+ spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
40
+ record_video: false
41
+ debug_video: false
42
+ debug_video_gen: false
43
+ save_video_freq: null
44
+ info_on_video: true
45
+ extra_stat_keys: []
46
+ env_kwargs:
47
+ robot_force_mult: 0.001
48
+ robot_force_penalty_min: 0.2
49
+ target_randomization: false
50
+ algo:
51
+ name: sac
52
+ replay_buffer_capacity: 995400
53
+ total_timesteps: 50000000
54
+ num_steps: 100
55
+ init_steps: 5000
56
+ batch_size: 512
57
+ critic_encoder_tau: 0.005
58
+ cnn_features:
59
+ - 32
60
+ - 64
61
+ - 128
62
+ - 256
63
+ cnn_filters:
64
+ - 3
65
+ - 3
66
+ - 3
67
+ - 3
68
+ cnn_strides:
69
+ - 2
70
+ - 2
71
+ - 2
72
+ - 2
73
+ cnn_padding: valid
74
+ encoder_pixels_feature_dim: 50
75
+ encoder_state_feature_dim: 50
76
+ detach_encoder: false
77
+ critic_hidden_dims:
78
+ - 256
79
+ - 256
80
+ - 256
81
+ critic_lr: 0.0003
82
+ critic_layer_norm: true
83
+ critic_dropout: null
84
+ critic_beta: 0.9
85
+ critic_tau: 0.005
86
+ critic_target_update_freq: 2
87
+ actor_hidden_dims:
88
+ - 256
89
+ - 256
90
+ - 256
91
+ actor_lr: 0.0003
92
+ actor_beta: 0.9
93
+ actor_log_std_min: -20
94
+ actor_log_std_max: 2
95
+ actor_update_freq: 2
96
+ gamma: 0.9
97
+ init_temperature: 0.1
98
+ alpha_lr: 0.0003
99
+ alpha_beta: 0.9
100
+ log_freq: 10000
101
+ save_freq: 100000
102
+ eval_freq: 100000
103
+ torch_deterministic: true
104
+ save_backup_ckpts: false
105
+ eval_episodes: 189
106
+ num_envs: 63
107
+ num_eval_envs: 189
108
+ num_iterations: 793651
109
+ logger:
110
+ workspace: mshab_exps
111
+ exp_name: rcad-prepare_groceries-place-007_tuna_fish_can
112
+ clear_out: true
113
+ tensorboard: true
114
+ wandb: false
115
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/place/007_tuna_fish_can/policy.pt"
rl/prepare_groceries/place/007_tuna_fish_can/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a142a4f53b76fa20c185c2b44bb5396f40755d83005b5f2b1a4b3dab25da5d1c
3
+ size 55487706