bc and rl checkpoints
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- bc/prepare_groceries/pick/all/config.yml +46 -0
- bc/prepare_groceries/pick/all/policy.pt +3 -0
- bc/prepare_groceries/place/all/config.yml +47 -0
- bc/prepare_groceries/place/all/policy.pt +3 -0
- bc/set_table/close/fridge/config.yml +47 -0
- bc/set_table/close/fridge/policy.pt +3 -0
- bc/set_table/close/kitchen_counter/config.yml +47 -0
- bc/set_table/close/kitchen_counter/policy.pt +3 -0
- bc/set_table/open/fridge/config.yml +47 -0
- bc/set_table/open/fridge/policy.pt +3 -0
- bc/set_table/open/kitchen_counter/config.yml +47 -0
- bc/set_table/open/kitchen_counter/policy.pt +3 -0
- bc/set_table/pick/all/config.yml +47 -0
- bc/set_table/pick/all/policy.pt +3 -0
- bc/set_table/place/all/config.yml +47 -0
- bc/set_table/place/all/policy.pt +3 -0
- bc/tidy_house/pick/all/config.yml +46 -0
- bc/tidy_house/pick/all/policy.pt +3 -0
- bc/tidy_house/place/all/config.yml +46 -0
- bc/tidy_house/place/all/policy.pt +3 -0
- rl/prepare_groceries/pick/002_master_chef_can/config.yml +110 -0
- rl/prepare_groceries/pick/002_master_chef_can/policy.pt +3 -0
- rl/prepare_groceries/pick/003_cracker_box/config.yml +110 -0
- rl/prepare_groceries/pick/003_cracker_box/policy.pt +3 -0
- rl/prepare_groceries/pick/004_sugar_box/config.yml +111 -0
- rl/prepare_groceries/pick/004_sugar_box/policy.pt +3 -0
- rl/prepare_groceries/pick/005_tomato_soup_can/config.yml +115 -0
- rl/prepare_groceries/pick/005_tomato_soup_can/policy.pt +3 -0
- rl/prepare_groceries/pick/007_tuna_fish_can/config.yml +111 -0
- rl/prepare_groceries/pick/007_tuna_fish_can/policy.pt +3 -0
- rl/prepare_groceries/pick/008_pudding_box/config.yml +113 -0
- rl/prepare_groceries/pick/008_pudding_box/policy.pt +3 -0
- rl/prepare_groceries/pick/009_gelatin_box/config.yml +113 -0
- rl/prepare_groceries/pick/009_gelatin_box/policy.pt +3 -0
- rl/prepare_groceries/pick/010_potted_meat_can/config.yml +110 -0
- rl/prepare_groceries/pick/010_potted_meat_can/policy.pt +3 -0
- rl/prepare_groceries/pick/024_bowl/config.yml +115 -0
- rl/prepare_groceries/pick/024_bowl/policy.pt +3 -0
- rl/prepare_groceries/pick/all/config.yml +113 -0
- rl/prepare_groceries/pick/all/policy.pt +3 -0
- rl/prepare_groceries/place/002_master_chef_can/config.yml +115 -0
- rl/prepare_groceries/place/002_master_chef_can/policy.pt +3 -0
- rl/prepare_groceries/place/003_cracker_box/config.yml +115 -0
- rl/prepare_groceries/place/003_cracker_box/policy.pt +3 -0
- rl/prepare_groceries/place/004_sugar_box/config.yml +115 -0
- rl/prepare_groceries/place/004_sugar_box/policy.pt +3 -0
- rl/prepare_groceries/place/005_tomato_soup_can/config.yml +115 -0
- rl/prepare_groceries/place/005_tomato_soup_can/policy.pt +3 -0
- rl/prepare_groceries/place/007_tuna_fish_can/config.yml +115 -0
- rl/prepare_groceries/place/007_tuna_fish_can/policy.pt +3 -0
bc/prepare_groceries/pick/all/config.yml
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 0
|
2 |
+
eval_env:
|
3 |
+
env_id: PickSubtaskTrain-v0
|
4 |
+
num_envs: 252
|
5 |
+
max_episode_steps: 200
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 1
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/all.json
|
15 |
+
spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: 1
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
algo:
|
27 |
+
name: bc
|
28 |
+
lr: 0.0003
|
29 |
+
batch_size: 512
|
30 |
+
epochs: 10
|
31 |
+
eval_freq: 1
|
32 |
+
log_freq: 1
|
33 |
+
save_freq: 1
|
34 |
+
save_backup_ckpts: false
|
35 |
+
data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/prepare_groceries/pick
|
36 |
+
max_cache_size: 300000
|
37 |
+
torch_deterministic: true
|
38 |
+
eval_episodes: 252
|
39 |
+
num_eval_envs: 252
|
40 |
+
logger:
|
41 |
+
workspace: mshab_exps
|
42 |
+
exp_name: rcad-prepare_groceries-pick-all
|
43 |
+
clear_out: true
|
44 |
+
tensorboard: true
|
45 |
+
wandb: false
|
46 |
+
model_ckpt: "mshab_checkpoints/bc/prepare_groceries/pick/all/policy.pt"
|
bc/prepare_groceries/pick/all/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b90849268bcaefe1fa1c1abd79f9e259a48f42617bc152bdeb8943dbd39a45c
|
3 |
+
size 238201234
|
bc/prepare_groceries/place/all/config.yml
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 0
|
2 |
+
eval_env:
|
3 |
+
env_id: PlaceSubtaskTrain-v0
|
4 |
+
num_envs: 252
|
5 |
+
max_episode_steps: 200
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 1
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/place/train/all.json
|
15 |
+
spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: 1
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
algo:
|
27 |
+
name: bc
|
28 |
+
lr: 0.0003
|
29 |
+
batch_size: 512
|
30 |
+
epochs: 10
|
31 |
+
eval_freq: 1
|
32 |
+
log_freq: 1
|
33 |
+
save_freq: 1
|
34 |
+
save_backup_ckpts: false
|
35 |
+
data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/prepare_groceries/place
|
36 |
+
max_cache_size: 300000
|
37 |
+
trajs_per_obj: all
|
38 |
+
torch_deterministic: true
|
39 |
+
eval_episodes: 252
|
40 |
+
num_eval_envs: 252
|
41 |
+
logger:
|
42 |
+
workspace: mshab_exps
|
43 |
+
exp_name: rcad-prepare_groceries-place-all
|
44 |
+
clear_out: true
|
45 |
+
tensorboard: true
|
46 |
+
wandb: false
|
47 |
+
model_ckpt: "mshab_checkpoints/bc/prepare_groceries/place/all/policy.pt"
|
bc/prepare_groceries/place/all/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4bc570e9aad369d26c62d69c5e441f7a46fc45ec20221c5c6f3d11708a49f6e
|
3 |
+
size 238201234
|
bc/set_table/close/fridge/config.yml
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 0
|
2 |
+
eval_env:
|
3 |
+
env_id: CloseSubtaskTrain-v0
|
4 |
+
num_envs: 252
|
5 |
+
max_episode_steps: 200
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 1
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/set_table/close/train/fridge.json
|
15 |
+
spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/close/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: 1
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
algo:
|
27 |
+
name: bc
|
28 |
+
lr: 0.0003
|
29 |
+
batch_size: 512
|
30 |
+
epochs: 10
|
31 |
+
eval_freq: 1
|
32 |
+
log_freq: 1
|
33 |
+
save_freq: 1
|
34 |
+
save_backup_ckpts: false
|
35 |
+
data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/set_table/close/fridge.h5
|
36 |
+
max_cache_size: 300000
|
37 |
+
trajs_per_obj: 1000
|
38 |
+
torch_deterministic: true
|
39 |
+
eval_episodes: 252
|
40 |
+
num_eval_envs: 252
|
41 |
+
logger:
|
42 |
+
workspace: mshab_exps
|
43 |
+
exp_name: rcad-set_table-close-fridge
|
44 |
+
clear_out: true
|
45 |
+
tensorboard: true
|
46 |
+
wandb: false
|
47 |
+
model_ckpt: "mshab_checkpoints/bc/set_table/close/fridge/policy.pt"
|
bc/set_table/close/fridge/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4e6802c0b767f70b819f74eaf1b063d028e0592cf6ad0cf47739439bf2f1a3f
|
3 |
+
size 238200850
|
bc/set_table/close/kitchen_counter/config.yml
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 0
|
2 |
+
eval_env:
|
3 |
+
env_id: CloseSubtaskTrain-v0
|
4 |
+
num_envs: 252
|
5 |
+
max_episode_steps: 200
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 1
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/set_table/close/train/kitchen_counter.json
|
15 |
+
spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/close/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: 1
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
algo:
|
27 |
+
name: bc
|
28 |
+
lr: 0.0003
|
29 |
+
batch_size: 512
|
30 |
+
epochs: 10
|
31 |
+
eval_freq: 1
|
32 |
+
log_freq: 1
|
33 |
+
save_freq: 1
|
34 |
+
save_backup_ckpts: false
|
35 |
+
data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/set_table/close/kitchen_counter.h5
|
36 |
+
max_cache_size: 300000
|
37 |
+
trajs_per_obj: 1000
|
38 |
+
torch_deterministic: true
|
39 |
+
eval_episodes: 252
|
40 |
+
num_eval_envs: 252
|
41 |
+
logger:
|
42 |
+
workspace: mshab_exps
|
43 |
+
exp_name: rcad-set_table-close-kitchen_counter
|
44 |
+
clear_out: true
|
45 |
+
tensorboard: true
|
46 |
+
wandb: false
|
47 |
+
model_ckpt: "mshab_checkpoints/bc/set_table/close/kitchen_counter/policy.pt"
|
bc/set_table/close/kitchen_counter/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cc31e96c04a6e5ffc1f698c9c55e17f2ca136db1865085df71520ec4a59025a
|
3 |
+
size 238200850
|
bc/set_table/open/fridge/config.yml
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 0
|
2 |
+
eval_env:
|
3 |
+
env_id: OpenSubtaskTrain-v0
|
4 |
+
num_envs: 252
|
5 |
+
max_episode_steps: 200
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 1
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/set_table/open/train/fridge.json
|
15 |
+
spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/open/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: 1
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
algo:
|
27 |
+
name: bc
|
28 |
+
lr: 0.0003
|
29 |
+
batch_size: 512
|
30 |
+
epochs: 10
|
31 |
+
eval_freq: 1
|
32 |
+
log_freq: 1
|
33 |
+
save_freq: 1
|
34 |
+
save_backup_ckpts: false
|
35 |
+
data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/set_table/open/fridge.h5
|
36 |
+
max_cache_size: 300000
|
37 |
+
trajs_per_obj: 1000
|
38 |
+
torch_deterministic: true
|
39 |
+
eval_episodes: 252
|
40 |
+
num_eval_envs: 252
|
41 |
+
logger:
|
42 |
+
workspace: mshab_exps
|
43 |
+
exp_name: rcad-set_table-open-fridge
|
44 |
+
clear_out: true
|
45 |
+
tensorboard: true
|
46 |
+
wandb: false
|
47 |
+
model_ckpt: "mshab_checkpoints/bc/set_table/open/fridge/policy.pt"
|
bc/set_table/open/fridge/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80f614cdfbef42079f9f4254224484d71d49057801182417628d181646cefe38
|
3 |
+
size 238200850
|
bc/set_table/open/kitchen_counter/config.yml
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 0
|
2 |
+
eval_env:
|
3 |
+
env_id: OpenSubtaskTrain-v0
|
4 |
+
num_envs: 252
|
5 |
+
max_episode_steps: 200
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 1
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/set_table/open/train/kitchen_counter.json
|
15 |
+
spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/open/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: 1
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
algo:
|
27 |
+
name: bc
|
28 |
+
lr: 0.0003
|
29 |
+
batch_size: 512
|
30 |
+
epochs: 10
|
31 |
+
eval_freq: 1
|
32 |
+
log_freq: 1
|
33 |
+
save_freq: 1
|
34 |
+
save_backup_ckpts: false
|
35 |
+
data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/set_table/open/kitchen_counter.h5
|
36 |
+
max_cache_size: 300000
|
37 |
+
trajs_per_obj: 1000
|
38 |
+
torch_deterministic: true
|
39 |
+
eval_episodes: 252
|
40 |
+
num_eval_envs: 252
|
41 |
+
logger:
|
42 |
+
workspace: mshab_exps
|
43 |
+
exp_name: rcad-set_table-open-kitchen_counter
|
44 |
+
clear_out: true
|
45 |
+
tensorboard: true
|
46 |
+
wandb: false
|
47 |
+
model_ckpt: "mshab_checkpoints/bc/set_table/open/kitchen_counter/policy.pt"
|
bc/set_table/open/kitchen_counter/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4dc77a7e29552c1d407a38bd608173d12d40da3dd35eec934b537a9024b8c21e
|
3 |
+
size 238200850
|
bc/set_table/pick/all/config.yml
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 0
|
2 |
+
eval_env:
|
3 |
+
env_id: PickSubtaskTrain-v0
|
4 |
+
num_envs: 252
|
5 |
+
max_episode_steps: 200
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 1
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/set_table/pick/train/all.json
|
15 |
+
spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/pick/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: 1
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
algo:
|
27 |
+
name: bc
|
28 |
+
lr: 0.0003
|
29 |
+
batch_size: 512
|
30 |
+
epochs: 10
|
31 |
+
eval_freq: 1
|
32 |
+
log_freq: 1
|
33 |
+
save_freq: 1
|
34 |
+
save_backup_ckpts: false
|
35 |
+
data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/set_table/pick
|
36 |
+
max_cache_size: 300000
|
37 |
+
trajs_per_obj: all
|
38 |
+
torch_deterministic: true
|
39 |
+
eval_episodes: 252
|
40 |
+
num_eval_envs: 252
|
41 |
+
logger:
|
42 |
+
workspace: mshab_exps
|
43 |
+
exp_name: rcad-set_table-pick-all
|
44 |
+
clear_out: true
|
45 |
+
tensorboard: true
|
46 |
+
wandb: false
|
47 |
+
model_ckpt: "mshab_checkpoints/bc/set_table/pick/all/policy.pt"
|
bc/set_table/pick/all/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3593b72dfc3c265fb8a294b6f3bb79c86472d4efada6437d50c66daee7cbd58
|
3 |
+
size 238200850
|
bc/set_table/place/all/config.yml
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 0
|
2 |
+
eval_env:
|
3 |
+
env_id: PlaceSubtaskTrain-v0
|
4 |
+
num_envs: 252
|
5 |
+
max_episode_steps: 200
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 1
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/set_table/place/train/all.json
|
15 |
+
spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/set_table/place/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: 1
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
algo:
|
27 |
+
name: bc
|
28 |
+
lr: 0.0003
|
29 |
+
batch_size: 512
|
30 |
+
epochs: 10
|
31 |
+
eval_freq: 1
|
32 |
+
log_freq: 1
|
33 |
+
save_freq: 1
|
34 |
+
save_backup_ckpts: false
|
35 |
+
data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/set_table/place
|
36 |
+
max_cache_size: 300000
|
37 |
+
trajs_per_obj: all
|
38 |
+
torch_deterministic: true
|
39 |
+
eval_episodes: 252
|
40 |
+
num_eval_envs: 252
|
41 |
+
logger:
|
42 |
+
workspace: mshab_exps
|
43 |
+
exp_name: rcad-set_table-place-all
|
44 |
+
clear_out: true
|
45 |
+
tensorboard: true
|
46 |
+
wandb: false
|
47 |
+
model_ckpt: "mshab_checkpoints/bc/set_table/place/all/policy.pt"
|
bc/set_table/place/all/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39cb5b0a2000c8184a5e4a25cda28e60602734a81e05be972a18f27f911bda2a
|
3 |
+
size 238200850
|
bc/tidy_house/pick/all/config.yml
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 0
|
2 |
+
eval_env:
|
3 |
+
env_id: PickSubtaskTrain-v0
|
4 |
+
num_envs: 252
|
5 |
+
max_episode_steps: 200
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 1
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/tidy_house/pick/train/all.json
|
15 |
+
spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/tidy_house/pick/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: 1
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
algo:
|
27 |
+
name: bc
|
28 |
+
lr: 0.0003
|
29 |
+
batch_size: 512
|
30 |
+
epochs: 25
|
31 |
+
eval_freq: 1
|
32 |
+
log_freq: 1
|
33 |
+
save_freq: 1
|
34 |
+
save_backup_ckpts: false
|
35 |
+
data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/tidy_house/pick
|
36 |
+
max_cache_size: 300000
|
37 |
+
torch_deterministic: true
|
38 |
+
eval_episodes: 252
|
39 |
+
num_eval_envs: 252
|
40 |
+
logger:
|
41 |
+
workspace: mshab_exps
|
42 |
+
exp_name: rcad-tidy_house-pick-all
|
43 |
+
clear_out: true
|
44 |
+
tensorboard: true
|
45 |
+
wandb: false
|
46 |
+
model_ckpt: "mshab_checkpoints/bc/tidy_house/pick/all/policy.pt"
|
bc/tidy_house/pick/all/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:250f92d9a0d6c42f78ba85ac0cab740eee1f80619f6f6fbf39b7ad8aa676d3c8
|
3 |
+
size 238201234
|
bc/tidy_house/place/all/config.yml
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 0
|
2 |
+
eval_env:
|
3 |
+
env_id: PlaceSubtaskTrain-v0
|
4 |
+
num_envs: 252
|
5 |
+
max_episode_steps: 200
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 1
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/tidy_house/place/train/all.json
|
15 |
+
spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/tidy_house/place/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: 1
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
algo:
|
27 |
+
name: bc
|
28 |
+
lr: 0.0003
|
29 |
+
batch_size: 512
|
30 |
+
epochs: 10
|
31 |
+
eval_freq: 1
|
32 |
+
log_freq: 1
|
33 |
+
save_freq: 1
|
34 |
+
save_backup_ckpts: false
|
35 |
+
data_dir_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange-dataset/tidy_house/place
|
36 |
+
max_cache_size: 300000
|
37 |
+
torch_deterministic: true
|
38 |
+
eval_episodes: 252
|
39 |
+
num_eval_envs: 252
|
40 |
+
logger:
|
41 |
+
workspace: mshab_exps
|
42 |
+
exp_name: rcad-tidy_house-place-all
|
43 |
+
clear_out: true
|
44 |
+
tensorboard: true
|
45 |
+
wandb: false
|
46 |
+
model_ckpt: "mshab_checkpoints/bc/tidy_house/place/all/policy.pt"
|
bc/tidy_house/place/all/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e947b7ab786abd6817536bd7af53897f97c89d1214d06ac0c025df5c915b0f2
|
3 |
+
size 238200850
|
rl/prepare_groceries/pick/002_master_chef_can/config.yml
ADDED
@@ -0,0 +1,110 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 2337
|
2 |
+
env:
|
3 |
+
env_id: PickSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/002_master_chef_can.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
save_video_freq: null
|
18 |
+
info_on_video: false
|
19 |
+
extra_stat_keys: []
|
20 |
+
env_kwargs:
|
21 |
+
robot_force_mult: 0.001
|
22 |
+
robot_force_penalty_min: 0.2
|
23 |
+
target_randomization: false
|
24 |
+
eval_env:
|
25 |
+
env_id: PickSubtaskTrain-v0
|
26 |
+
num_envs: 189
|
27 |
+
max_episode_steps: 200
|
28 |
+
make_env: true
|
29 |
+
continuous_task: true
|
30 |
+
cat_state: true
|
31 |
+
cat_pixels: false
|
32 |
+
frame_stack: 3
|
33 |
+
stationary_base: false
|
34 |
+
stationary_torso: false
|
35 |
+
stationary_head: true
|
36 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/002_master_chef_can.json
|
37 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
38 |
+
record_video: false
|
39 |
+
save_video_freq: null
|
40 |
+
info_on_video: true
|
41 |
+
extra_stat_keys: []
|
42 |
+
env_kwargs:
|
43 |
+
robot_force_mult: 0.001
|
44 |
+
robot_force_penalty_min: 0.2
|
45 |
+
target_randomization: false
|
46 |
+
algo:
|
47 |
+
name: sac
|
48 |
+
replay_buffer_capacity: 995400
|
49 |
+
total_timesteps: 50000000
|
50 |
+
num_steps: 100
|
51 |
+
init_steps: 5000
|
52 |
+
batch_size: 512
|
53 |
+
critic_encoder_tau: 0.005
|
54 |
+
cnn_features:
|
55 |
+
- 32
|
56 |
+
- 64
|
57 |
+
- 128
|
58 |
+
- 256
|
59 |
+
cnn_filters:
|
60 |
+
- 3
|
61 |
+
- 3
|
62 |
+
- 3
|
63 |
+
- 3
|
64 |
+
cnn_strides:
|
65 |
+
- 2
|
66 |
+
- 2
|
67 |
+
- 2
|
68 |
+
- 2
|
69 |
+
cnn_padding: valid
|
70 |
+
encoder_pixels_feature_dim: 50
|
71 |
+
encoder_state_feature_dim: 50
|
72 |
+
detach_encoder: false
|
73 |
+
critic_hidden_dims:
|
74 |
+
- 256
|
75 |
+
- 256
|
76 |
+
- 256
|
77 |
+
critic_lr: 0.0003
|
78 |
+
critic_layer_norm: true
|
79 |
+
critic_dropout: null
|
80 |
+
critic_beta: 0.9
|
81 |
+
critic_tau: 0.005
|
82 |
+
critic_target_update_freq: 2
|
83 |
+
actor_hidden_dims:
|
84 |
+
- 256
|
85 |
+
- 256
|
86 |
+
- 256
|
87 |
+
actor_lr: 0.0003
|
88 |
+
actor_beta: 0.9
|
89 |
+
actor_log_std_min: -20
|
90 |
+
actor_log_std_max: 2
|
91 |
+
actor_update_freq: 2
|
92 |
+
gamma: 0.9
|
93 |
+
init_temperature: 0.1
|
94 |
+
alpha_lr: 0.0003
|
95 |
+
alpha_beta: 0.9
|
96 |
+
log_freq: 10000
|
97 |
+
save_freq: 100000000
|
98 |
+
eval_freq: 100000
|
99 |
+
torch_deterministic: true
|
100 |
+
eval_episodes: 189
|
101 |
+
num_envs: 63
|
102 |
+
num_eval_envs: 189
|
103 |
+
num_iterations: 793651
|
104 |
+
logger:
|
105 |
+
workspace: mshab_exps
|
106 |
+
exp_name: rcad-prepare_groceries-pick-002_master_chef_can
|
107 |
+
clear_out: true
|
108 |
+
tensorboard: true
|
109 |
+
wandb: false
|
110 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/002_master_chef_can/policy.pt"
|
rl/prepare_groceries/pick/002_master_chef_can/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb338580bfb74b7d50796705f8f5f5caccfe6d5e3a22a57485b5ccab9690ef98
|
3 |
+
size 55487432
|
rl/prepare_groceries/pick/003_cracker_box/config.yml
ADDED
@@ -0,0 +1,110 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 2337
|
2 |
+
env:
|
3 |
+
env_id: PickSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/003_cracker_box.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
save_video_freq: null
|
18 |
+
info_on_video: false
|
19 |
+
extra_stat_keys: []
|
20 |
+
env_kwargs:
|
21 |
+
robot_force_mult: 0.001
|
22 |
+
robot_force_penalty_min: 0.2
|
23 |
+
target_randomization: false
|
24 |
+
eval_env:
|
25 |
+
env_id: PickSubtaskTrain-v0
|
26 |
+
num_envs: 189
|
27 |
+
max_episode_steps: 200
|
28 |
+
make_env: true
|
29 |
+
continuous_task: true
|
30 |
+
cat_state: true
|
31 |
+
cat_pixels: false
|
32 |
+
frame_stack: 3
|
33 |
+
stationary_base: false
|
34 |
+
stationary_torso: false
|
35 |
+
stationary_head: true
|
36 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/003_cracker_box.json
|
37 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
38 |
+
record_video: false
|
39 |
+
save_video_freq: null
|
40 |
+
info_on_video: true
|
41 |
+
extra_stat_keys: []
|
42 |
+
env_kwargs:
|
43 |
+
robot_force_mult: 0.001
|
44 |
+
robot_force_penalty_min: 0.2
|
45 |
+
target_randomization: false
|
46 |
+
algo:
|
47 |
+
name: sac
|
48 |
+
replay_buffer_capacity: 995400
|
49 |
+
total_timesteps: 50000000
|
50 |
+
num_steps: 100
|
51 |
+
init_steps: 5000
|
52 |
+
batch_size: 512
|
53 |
+
critic_encoder_tau: 0.005
|
54 |
+
cnn_features:
|
55 |
+
- 32
|
56 |
+
- 64
|
57 |
+
- 128
|
58 |
+
- 256
|
59 |
+
cnn_filters:
|
60 |
+
- 3
|
61 |
+
- 3
|
62 |
+
- 3
|
63 |
+
- 3
|
64 |
+
cnn_strides:
|
65 |
+
- 2
|
66 |
+
- 2
|
67 |
+
- 2
|
68 |
+
- 2
|
69 |
+
cnn_padding: valid
|
70 |
+
encoder_pixels_feature_dim: 50
|
71 |
+
encoder_state_feature_dim: 50
|
72 |
+
detach_encoder: false
|
73 |
+
critic_hidden_dims:
|
74 |
+
- 256
|
75 |
+
- 256
|
76 |
+
- 256
|
77 |
+
critic_lr: 0.0003
|
78 |
+
critic_layer_norm: true
|
79 |
+
critic_dropout: null
|
80 |
+
critic_beta: 0.9
|
81 |
+
critic_tau: 0.005
|
82 |
+
critic_target_update_freq: 2
|
83 |
+
actor_hidden_dims:
|
84 |
+
- 256
|
85 |
+
- 256
|
86 |
+
- 256
|
87 |
+
actor_lr: 0.0003
|
88 |
+
actor_beta: 0.9
|
89 |
+
actor_log_std_min: -20
|
90 |
+
actor_log_std_max: 2
|
91 |
+
actor_update_freq: 2
|
92 |
+
gamma: 0.9
|
93 |
+
init_temperature: 0.1
|
94 |
+
alpha_lr: 0.0003
|
95 |
+
alpha_beta: 0.9
|
96 |
+
log_freq: 10000
|
97 |
+
save_freq: 100000000
|
98 |
+
eval_freq: 100000
|
99 |
+
torch_deterministic: true
|
100 |
+
eval_episodes: 189
|
101 |
+
num_envs: 63
|
102 |
+
num_eval_envs: 189
|
103 |
+
num_iterations: 793651
|
104 |
+
logger:
|
105 |
+
workspace: mshab_exps
|
106 |
+
exp_name: rcad-prepare_groceries-pick-003_cracker_box
|
107 |
+
clear_out: true
|
108 |
+
tensorboard: true
|
109 |
+
wandb: false
|
110 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/003_cracker_box/policy.pt"
|
rl/prepare_groceries/pick/003_cracker_box/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d11038630d4ed9ccc9de2c8bc1522b8e104b8180c2c87cdf82e7cc10094c88c
|
3 |
+
size 55487432
|
rl/prepare_groceries/pick/004_sugar_box/config.yml
ADDED
@@ -0,0 +1,111 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 2337
|
2 |
+
env:
|
3 |
+
env_id: PickSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/004_sugar_box.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
save_video_freq: null
|
18 |
+
info_on_video: false
|
19 |
+
extra_stat_keys: []
|
20 |
+
env_kwargs:
|
21 |
+
robot_force_mult: 0.001
|
22 |
+
robot_force_penalty_min: 0.2
|
23 |
+
target_randomization: false
|
24 |
+
eval_env:
|
25 |
+
env_id: PickSubtaskTrain-v0
|
26 |
+
num_envs: 189
|
27 |
+
max_episode_steps: 200
|
28 |
+
make_env: true
|
29 |
+
continuous_task: true
|
30 |
+
cat_state: true
|
31 |
+
cat_pixels: false
|
32 |
+
frame_stack: 3
|
33 |
+
stationary_base: false
|
34 |
+
stationary_torso: false
|
35 |
+
stationary_head: true
|
36 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/004_sugar_box.json
|
37 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
38 |
+
record_video: false
|
39 |
+
save_video_freq: null
|
40 |
+
info_on_video: true
|
41 |
+
extra_stat_keys: []
|
42 |
+
env_kwargs:
|
43 |
+
robot_force_mult: 0.001
|
44 |
+
robot_force_penalty_min: 0.2
|
45 |
+
target_randomization: false
|
46 |
+
algo:
|
47 |
+
name: sac
|
48 |
+
replay_buffer_capacity: 995400
|
49 |
+
total_timesteps: 50000000
|
50 |
+
num_steps: 100
|
51 |
+
init_steps: 5000
|
52 |
+
batch_size: 512
|
53 |
+
critic_encoder_tau: 0.005
|
54 |
+
cnn_features:
|
55 |
+
- 32
|
56 |
+
- 64
|
57 |
+
- 128
|
58 |
+
- 256
|
59 |
+
cnn_filters:
|
60 |
+
- 3
|
61 |
+
- 3
|
62 |
+
- 3
|
63 |
+
- 3
|
64 |
+
cnn_strides:
|
65 |
+
- 2
|
66 |
+
- 2
|
67 |
+
- 2
|
68 |
+
- 2
|
69 |
+
cnn_padding: valid
|
70 |
+
encoder_pixels_feature_dim: 50
|
71 |
+
encoder_state_feature_dim: 50
|
72 |
+
detach_encoder: false
|
73 |
+
critic_hidden_dims:
|
74 |
+
- 256
|
75 |
+
- 256
|
76 |
+
- 256
|
77 |
+
critic_lr: 0.0003
|
78 |
+
critic_layer_norm: true
|
79 |
+
critic_dropout: null
|
80 |
+
critic_beta: 0.9
|
81 |
+
critic_tau: 0.005
|
82 |
+
critic_target_update_freq: 2
|
83 |
+
actor_hidden_dims:
|
84 |
+
- 256
|
85 |
+
- 256
|
86 |
+
- 256
|
87 |
+
actor_lr: 0.0003
|
88 |
+
actor_beta: 0.9
|
89 |
+
actor_log_std_min: -20
|
90 |
+
actor_log_std_max: 2
|
91 |
+
actor_update_freq: 2
|
92 |
+
gamma: 0.9
|
93 |
+
init_temperature: 0.1
|
94 |
+
alpha_lr: 0.0003
|
95 |
+
alpha_beta: 0.9
|
96 |
+
log_freq: 10000
|
97 |
+
save_freq: 100000000
|
98 |
+
eval_freq: 100000
|
99 |
+
torch_deterministic: true
|
100 |
+
save_backup_ckpts: false
|
101 |
+
eval_episodes: 189
|
102 |
+
num_envs: 63
|
103 |
+
num_eval_envs: 189
|
104 |
+
num_iterations: 793651
|
105 |
+
logger:
|
106 |
+
workspace: mshab_exps
|
107 |
+
exp_name: rcad-prepare_groceries-pick-004_sugar_box
|
108 |
+
clear_out: true
|
109 |
+
tensorboard: true
|
110 |
+
wandb: false
|
111 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/004_sugar_box/policy.pt"
|
rl/prepare_groceries/pick/004_sugar_box/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc935696ffe962efbe8e418312082245a90f43abd4a9aecaed1a130132478576
|
3 |
+
size 55487432
|
rl/prepare_groceries/pick/005_tomato_soup_can/config.yml
ADDED
@@ -0,0 +1,115 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 4682
|
2 |
+
env:
|
3 |
+
env_id: PickSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/005_tomato_soup_can.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: null
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
eval_env:
|
27 |
+
env_id: PickSubtaskTrain-v0
|
28 |
+
num_envs: 189
|
29 |
+
max_episode_steps: 200
|
30 |
+
make_env: true
|
31 |
+
continuous_task: true
|
32 |
+
cat_state: true
|
33 |
+
cat_pixels: false
|
34 |
+
frame_stack: 3
|
35 |
+
stationary_base: false
|
36 |
+
stationary_torso: false
|
37 |
+
stationary_head: true
|
38 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/005_tomato_soup_can.json
|
39 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
40 |
+
record_video: false
|
41 |
+
debug_video: false
|
42 |
+
debug_video_gen: false
|
43 |
+
save_video_freq: null
|
44 |
+
info_on_video: true
|
45 |
+
extra_stat_keys: []
|
46 |
+
env_kwargs:
|
47 |
+
robot_force_mult: 0.001
|
48 |
+
robot_force_penalty_min: 0.2
|
49 |
+
target_randomization: false
|
50 |
+
algo:
|
51 |
+
name: sac
|
52 |
+
replay_buffer_capacity: 995400
|
53 |
+
total_timesteps: 50000000
|
54 |
+
num_steps: 100
|
55 |
+
init_steps: 5000
|
56 |
+
batch_size: 512
|
57 |
+
critic_encoder_tau: 0.005
|
58 |
+
cnn_features:
|
59 |
+
- 32
|
60 |
+
- 64
|
61 |
+
- 128
|
62 |
+
- 256
|
63 |
+
cnn_filters:
|
64 |
+
- 3
|
65 |
+
- 3
|
66 |
+
- 3
|
67 |
+
- 3
|
68 |
+
cnn_strides:
|
69 |
+
- 2
|
70 |
+
- 2
|
71 |
+
- 2
|
72 |
+
- 2
|
73 |
+
cnn_padding: valid
|
74 |
+
encoder_pixels_feature_dim: 50
|
75 |
+
encoder_state_feature_dim: 50
|
76 |
+
detach_encoder: false
|
77 |
+
critic_hidden_dims:
|
78 |
+
- 256
|
79 |
+
- 256
|
80 |
+
- 256
|
81 |
+
critic_lr: 0.0003
|
82 |
+
critic_layer_norm: true
|
83 |
+
critic_dropout: null
|
84 |
+
critic_beta: 0.9
|
85 |
+
critic_tau: 0.005
|
86 |
+
critic_target_update_freq: 2
|
87 |
+
actor_hidden_dims:
|
88 |
+
- 256
|
89 |
+
- 256
|
90 |
+
- 256
|
91 |
+
actor_lr: 0.0003
|
92 |
+
actor_beta: 0.9
|
93 |
+
actor_log_std_min: -20
|
94 |
+
actor_log_std_max: 2
|
95 |
+
actor_update_freq: 2
|
96 |
+
gamma: 0.9
|
97 |
+
init_temperature: 0.1
|
98 |
+
alpha_lr: 0.0003
|
99 |
+
alpha_beta: 0.9
|
100 |
+
log_freq: 10000
|
101 |
+
save_freq: 100000
|
102 |
+
eval_freq: 100000
|
103 |
+
torch_deterministic: true
|
104 |
+
save_backup_ckpts: false
|
105 |
+
eval_episodes: 189
|
106 |
+
num_envs: 63
|
107 |
+
num_eval_envs: 189
|
108 |
+
num_iterations: 793651
|
109 |
+
logger:
|
110 |
+
workspace: mshab_exps
|
111 |
+
exp_name: rcad-prepare_groceries-pick-005_tomato_soup_can
|
112 |
+
clear_out: true
|
113 |
+
tensorboard: true
|
114 |
+
wandb: false
|
115 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/005_tomato_soup_can/policy.pt"
|
rl/prepare_groceries/pick/005_tomato_soup_can/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77288352508ea9e9aab0499c0a8a1bfd680cba704c98d36d8bbfbc84be8f7c4c
|
3 |
+
size 55487706
|
rl/prepare_groceries/pick/007_tuna_fish_can/config.yml
ADDED
@@ -0,0 +1,111 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 2337
|
2 |
+
env:
|
3 |
+
env_id: PickSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/007_tuna_fish_can.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
save_video_freq: null
|
18 |
+
info_on_video: false
|
19 |
+
extra_stat_keys: []
|
20 |
+
env_kwargs:
|
21 |
+
robot_force_mult: 0.001
|
22 |
+
robot_force_penalty_min: 0.2
|
23 |
+
target_randomization: false
|
24 |
+
eval_env:
|
25 |
+
env_id: PickSubtaskTrain-v0
|
26 |
+
num_envs: 189
|
27 |
+
max_episode_steps: 200
|
28 |
+
make_env: true
|
29 |
+
continuous_task: true
|
30 |
+
cat_state: true
|
31 |
+
cat_pixels: false
|
32 |
+
frame_stack: 3
|
33 |
+
stationary_base: false
|
34 |
+
stationary_torso: false
|
35 |
+
stationary_head: true
|
36 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/007_tuna_fish_can.json
|
37 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
38 |
+
record_video: false
|
39 |
+
save_video_freq: null
|
40 |
+
info_on_video: true
|
41 |
+
extra_stat_keys: []
|
42 |
+
env_kwargs:
|
43 |
+
robot_force_mult: 0.001
|
44 |
+
robot_force_penalty_min: 0.2
|
45 |
+
target_randomization: false
|
46 |
+
algo:
|
47 |
+
name: sac
|
48 |
+
replay_buffer_capacity: 995400
|
49 |
+
total_timesteps: 50000000
|
50 |
+
num_steps: 100
|
51 |
+
init_steps: 5000
|
52 |
+
batch_size: 512
|
53 |
+
critic_encoder_tau: 0.005
|
54 |
+
cnn_features:
|
55 |
+
- 32
|
56 |
+
- 64
|
57 |
+
- 128
|
58 |
+
- 256
|
59 |
+
cnn_filters:
|
60 |
+
- 3
|
61 |
+
- 3
|
62 |
+
- 3
|
63 |
+
- 3
|
64 |
+
cnn_strides:
|
65 |
+
- 2
|
66 |
+
- 2
|
67 |
+
- 2
|
68 |
+
- 2
|
69 |
+
cnn_padding: valid
|
70 |
+
encoder_pixels_feature_dim: 50
|
71 |
+
encoder_state_feature_dim: 50
|
72 |
+
detach_encoder: false
|
73 |
+
critic_hidden_dims:
|
74 |
+
- 256
|
75 |
+
- 256
|
76 |
+
- 256
|
77 |
+
critic_lr: 0.0003
|
78 |
+
critic_layer_norm: true
|
79 |
+
critic_dropout: null
|
80 |
+
critic_beta: 0.9
|
81 |
+
critic_tau: 0.005
|
82 |
+
critic_target_update_freq: 2
|
83 |
+
actor_hidden_dims:
|
84 |
+
- 256
|
85 |
+
- 256
|
86 |
+
- 256
|
87 |
+
actor_lr: 0.0003
|
88 |
+
actor_beta: 0.9
|
89 |
+
actor_log_std_min: -20
|
90 |
+
actor_log_std_max: 2
|
91 |
+
actor_update_freq: 2
|
92 |
+
gamma: 0.9
|
93 |
+
init_temperature: 0.1
|
94 |
+
alpha_lr: 0.0003
|
95 |
+
alpha_beta: 0.9
|
96 |
+
log_freq: 10000
|
97 |
+
save_freq: 100000000
|
98 |
+
eval_freq: 100000
|
99 |
+
torch_deterministic: true
|
100 |
+
save_backup_ckpts: false
|
101 |
+
eval_episodes: 189
|
102 |
+
num_envs: 63
|
103 |
+
num_eval_envs: 189
|
104 |
+
num_iterations: 793651
|
105 |
+
logger:
|
106 |
+
workspace: mshab_exps
|
107 |
+
exp_name: rcad-prepare_groceries-pick-007_tuna_fish_can
|
108 |
+
clear_out: true
|
109 |
+
tensorboard: true
|
110 |
+
wandb: false
|
111 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/007_tuna_fish_can/policy.pt"
|
rl/prepare_groceries/pick/007_tuna_fish_can/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:caf45664947dc617cc252782f7883395cc1b50472c313864220444ffe9eb2701
|
3 |
+
size 55487432
|
rl/prepare_groceries/pick/008_pudding_box/config.yml
ADDED
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 5227
|
2 |
+
env:
|
3 |
+
env_id: PickSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/008_pudding_box.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
save_video_freq: null
|
19 |
+
info_on_video: false
|
20 |
+
extra_stat_keys: []
|
21 |
+
env_kwargs:
|
22 |
+
robot_force_mult: 0.001
|
23 |
+
robot_force_penalty_min: 0.2
|
24 |
+
target_randomization: false
|
25 |
+
eval_env:
|
26 |
+
env_id: PickSubtaskTrain-v0
|
27 |
+
num_envs: 189
|
28 |
+
max_episode_steps: 200
|
29 |
+
make_env: true
|
30 |
+
continuous_task: true
|
31 |
+
cat_state: true
|
32 |
+
cat_pixels: false
|
33 |
+
frame_stack: 3
|
34 |
+
stationary_base: false
|
35 |
+
stationary_torso: false
|
36 |
+
stationary_head: true
|
37 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/008_pudding_box.json
|
38 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
39 |
+
record_video: false
|
40 |
+
debug_video: false
|
41 |
+
save_video_freq: null
|
42 |
+
info_on_video: true
|
43 |
+
extra_stat_keys: []
|
44 |
+
env_kwargs:
|
45 |
+
robot_force_mult: 0.001
|
46 |
+
robot_force_penalty_min: 0.2
|
47 |
+
target_randomization: false
|
48 |
+
algo:
|
49 |
+
name: sac
|
50 |
+
replay_buffer_capacity: 995400
|
51 |
+
total_timesteps: 50000000
|
52 |
+
num_steps: 100
|
53 |
+
init_steps: 5000
|
54 |
+
batch_size: 512
|
55 |
+
critic_encoder_tau: 0.005
|
56 |
+
cnn_features:
|
57 |
+
- 32
|
58 |
+
- 64
|
59 |
+
- 128
|
60 |
+
- 256
|
61 |
+
cnn_filters:
|
62 |
+
- 3
|
63 |
+
- 3
|
64 |
+
- 3
|
65 |
+
- 3
|
66 |
+
cnn_strides:
|
67 |
+
- 2
|
68 |
+
- 2
|
69 |
+
- 2
|
70 |
+
- 2
|
71 |
+
cnn_padding: valid
|
72 |
+
encoder_pixels_feature_dim: 50
|
73 |
+
encoder_state_feature_dim: 50
|
74 |
+
detach_encoder: false
|
75 |
+
critic_hidden_dims:
|
76 |
+
- 256
|
77 |
+
- 256
|
78 |
+
- 256
|
79 |
+
critic_lr: 0.0003
|
80 |
+
critic_layer_norm: true
|
81 |
+
critic_dropout: null
|
82 |
+
critic_beta: 0.9
|
83 |
+
critic_tau: 0.005
|
84 |
+
critic_target_update_freq: 2
|
85 |
+
actor_hidden_dims:
|
86 |
+
- 256
|
87 |
+
- 256
|
88 |
+
- 256
|
89 |
+
actor_lr: 0.0003
|
90 |
+
actor_beta: 0.9
|
91 |
+
actor_log_std_min: -20
|
92 |
+
actor_log_std_max: 2
|
93 |
+
actor_update_freq: 2
|
94 |
+
gamma: 0.9
|
95 |
+
init_temperature: 0.1
|
96 |
+
alpha_lr: 0.0003
|
97 |
+
alpha_beta: 0.9
|
98 |
+
log_freq: 10000
|
99 |
+
save_freq: 100000000
|
100 |
+
eval_freq: 100000
|
101 |
+
torch_deterministic: true
|
102 |
+
save_backup_ckpts: false
|
103 |
+
eval_episodes: 189
|
104 |
+
num_envs: 63
|
105 |
+
num_eval_envs: 189
|
106 |
+
num_iterations: 793651
|
107 |
+
logger:
|
108 |
+
workspace: mshab_exps
|
109 |
+
exp_name: rcad-prepare_groceries-pick-008_pudding_box
|
110 |
+
clear_out: true
|
111 |
+
tensorboard: true
|
112 |
+
wandb: false
|
113 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/008_pudding_box/policy.pt"
|
rl/prepare_groceries/pick/008_pudding_box/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:092289867d462c7818abc0d452207edb305cf12c4be251b26eba6396377ffdc3
|
3 |
+
size 55487432
|
rl/prepare_groceries/pick/009_gelatin_box/config.yml
ADDED
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 4682
|
2 |
+
env:
|
3 |
+
env_id: PickSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/009_gelatin_box.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
save_video_freq: null
|
19 |
+
info_on_video: false
|
20 |
+
extra_stat_keys: []
|
21 |
+
env_kwargs:
|
22 |
+
robot_force_mult: 0.001
|
23 |
+
robot_force_penalty_min: 0.2
|
24 |
+
target_randomization: false
|
25 |
+
eval_env:
|
26 |
+
env_id: PickSubtaskTrain-v0
|
27 |
+
num_envs: 189
|
28 |
+
max_episode_steps: 200
|
29 |
+
make_env: true
|
30 |
+
continuous_task: true
|
31 |
+
cat_state: true
|
32 |
+
cat_pixels: false
|
33 |
+
frame_stack: 3
|
34 |
+
stationary_base: false
|
35 |
+
stationary_torso: false
|
36 |
+
stationary_head: true
|
37 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/009_gelatin_box.json
|
38 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
39 |
+
record_video: false
|
40 |
+
debug_video: false
|
41 |
+
save_video_freq: null
|
42 |
+
info_on_video: true
|
43 |
+
extra_stat_keys: []
|
44 |
+
env_kwargs:
|
45 |
+
robot_force_mult: 0.001
|
46 |
+
robot_force_penalty_min: 0.2
|
47 |
+
target_randomization: false
|
48 |
+
algo:
|
49 |
+
name: sac
|
50 |
+
replay_buffer_capacity: 995400
|
51 |
+
total_timesteps: 50000000
|
52 |
+
num_steps: 100
|
53 |
+
init_steps: 5000
|
54 |
+
batch_size: 512
|
55 |
+
critic_encoder_tau: 0.005
|
56 |
+
cnn_features:
|
57 |
+
- 32
|
58 |
+
- 64
|
59 |
+
- 128
|
60 |
+
- 256
|
61 |
+
cnn_filters:
|
62 |
+
- 3
|
63 |
+
- 3
|
64 |
+
- 3
|
65 |
+
- 3
|
66 |
+
cnn_strides:
|
67 |
+
- 2
|
68 |
+
- 2
|
69 |
+
- 2
|
70 |
+
- 2
|
71 |
+
cnn_padding: valid
|
72 |
+
encoder_pixels_feature_dim: 50
|
73 |
+
encoder_state_feature_dim: 50
|
74 |
+
detach_encoder: false
|
75 |
+
critic_hidden_dims:
|
76 |
+
- 256
|
77 |
+
- 256
|
78 |
+
- 256
|
79 |
+
critic_lr: 0.0003
|
80 |
+
critic_layer_norm: true
|
81 |
+
critic_dropout: null
|
82 |
+
critic_beta: 0.9
|
83 |
+
critic_tau: 0.005
|
84 |
+
critic_target_update_freq: 2
|
85 |
+
actor_hidden_dims:
|
86 |
+
- 256
|
87 |
+
- 256
|
88 |
+
- 256
|
89 |
+
actor_lr: 0.0003
|
90 |
+
actor_beta: 0.9
|
91 |
+
actor_log_std_min: -20
|
92 |
+
actor_log_std_max: 2
|
93 |
+
actor_update_freq: 2
|
94 |
+
gamma: 0.9
|
95 |
+
init_temperature: 0.1
|
96 |
+
alpha_lr: 0.0003
|
97 |
+
alpha_beta: 0.9
|
98 |
+
log_freq: 10000
|
99 |
+
save_freq: 100000000
|
100 |
+
eval_freq: 100000
|
101 |
+
torch_deterministic: true
|
102 |
+
save_backup_ckpts: false
|
103 |
+
eval_episodes: 189
|
104 |
+
num_envs: 63
|
105 |
+
num_eval_envs: 189
|
106 |
+
num_iterations: 793651
|
107 |
+
logger:
|
108 |
+
workspace: mshab_exps
|
109 |
+
exp_name: rcad-prepare_groceries-pick-009_gelatin_box
|
110 |
+
clear_out: true
|
111 |
+
tensorboard: true
|
112 |
+
wandb: false
|
113 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/009_gelatin_box/policy.pt"
|
rl/prepare_groceries/pick/009_gelatin_box/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:832117171b3829047b6f2f661abd769bb17ef6c47fb580572478d82f8f034ee3
|
3 |
+
size 55487432
|
rl/prepare_groceries/pick/010_potted_meat_can/config.yml
ADDED
@@ -0,0 +1,110 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 2337
|
2 |
+
env:
|
3 |
+
env_id: PickSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/010_potted_meat_can.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
save_video_freq: null
|
18 |
+
info_on_video: false
|
19 |
+
extra_stat_keys: []
|
20 |
+
env_kwargs:
|
21 |
+
robot_force_mult: 0.001
|
22 |
+
robot_force_penalty_min: 0.2
|
23 |
+
target_randomization: false
|
24 |
+
eval_env:
|
25 |
+
env_id: PickSubtaskTrain-v0
|
26 |
+
num_envs: 189
|
27 |
+
max_episode_steps: 200
|
28 |
+
make_env: true
|
29 |
+
continuous_task: true
|
30 |
+
cat_state: true
|
31 |
+
cat_pixels: false
|
32 |
+
frame_stack: 3
|
33 |
+
stationary_base: false
|
34 |
+
stationary_torso: false
|
35 |
+
stationary_head: true
|
36 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/010_potted_meat_can.json
|
37 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
38 |
+
record_video: false
|
39 |
+
save_video_freq: null
|
40 |
+
info_on_video: true
|
41 |
+
extra_stat_keys: []
|
42 |
+
env_kwargs:
|
43 |
+
robot_force_mult: 0.001
|
44 |
+
robot_force_penalty_min: 0.2
|
45 |
+
target_randomization: false
|
46 |
+
algo:
|
47 |
+
name: sac
|
48 |
+
replay_buffer_capacity: 995400
|
49 |
+
total_timesteps: 50000000
|
50 |
+
num_steps: 100
|
51 |
+
init_steps: 5000
|
52 |
+
batch_size: 512
|
53 |
+
critic_encoder_tau: 0.005
|
54 |
+
cnn_features:
|
55 |
+
- 32
|
56 |
+
- 64
|
57 |
+
- 128
|
58 |
+
- 256
|
59 |
+
cnn_filters:
|
60 |
+
- 3
|
61 |
+
- 3
|
62 |
+
- 3
|
63 |
+
- 3
|
64 |
+
cnn_strides:
|
65 |
+
- 2
|
66 |
+
- 2
|
67 |
+
- 2
|
68 |
+
- 2
|
69 |
+
cnn_padding: valid
|
70 |
+
encoder_pixels_feature_dim: 50
|
71 |
+
encoder_state_feature_dim: 50
|
72 |
+
detach_encoder: false
|
73 |
+
critic_hidden_dims:
|
74 |
+
- 256
|
75 |
+
- 256
|
76 |
+
- 256
|
77 |
+
critic_lr: 0.0003
|
78 |
+
critic_layer_norm: true
|
79 |
+
critic_dropout: null
|
80 |
+
critic_beta: 0.9
|
81 |
+
critic_tau: 0.005
|
82 |
+
critic_target_update_freq: 2
|
83 |
+
actor_hidden_dims:
|
84 |
+
- 256
|
85 |
+
- 256
|
86 |
+
- 256
|
87 |
+
actor_lr: 0.0003
|
88 |
+
actor_beta: 0.9
|
89 |
+
actor_log_std_min: -20
|
90 |
+
actor_log_std_max: 2
|
91 |
+
actor_update_freq: 2
|
92 |
+
gamma: 0.9
|
93 |
+
init_temperature: 0.1
|
94 |
+
alpha_lr: 0.0003
|
95 |
+
alpha_beta: 0.9
|
96 |
+
log_freq: 10000
|
97 |
+
save_freq: 100000000
|
98 |
+
eval_freq: 100000
|
99 |
+
torch_deterministic: true
|
100 |
+
eval_episodes: 189
|
101 |
+
num_envs: 63
|
102 |
+
num_eval_envs: 189
|
103 |
+
num_iterations: 793651
|
104 |
+
logger:
|
105 |
+
workspace: mshab_exps
|
106 |
+
exp_name: rcad-prepare_groceries-pick-010_potted_meat_can
|
107 |
+
clear_out: true
|
108 |
+
tensorboard: true
|
109 |
+
wandb: false
|
110 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/010_potted_meat_can/policy.pt"
|
rl/prepare_groceries/pick/010_potted_meat_can/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a04f8e0243b9ba59f50e2ae07d9269f34334d95da45e88897f1cd10d6dab5824
|
3 |
+
size 55487432
|
rl/prepare_groceries/pick/024_bowl/config.yml
ADDED
@@ -0,0 +1,115 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 4682
|
2 |
+
env:
|
3 |
+
env_id: PickSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/024_bowl.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: null
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
eval_env:
|
27 |
+
env_id: PickSubtaskTrain-v0
|
28 |
+
num_envs: 189
|
29 |
+
max_episode_steps: 200
|
30 |
+
make_env: true
|
31 |
+
continuous_task: true
|
32 |
+
cat_state: true
|
33 |
+
cat_pixels: false
|
34 |
+
frame_stack: 3
|
35 |
+
stationary_base: false
|
36 |
+
stationary_torso: false
|
37 |
+
stationary_head: true
|
38 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/024_bowl.json
|
39 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
40 |
+
record_video: false
|
41 |
+
debug_video: false
|
42 |
+
debug_video_gen: false
|
43 |
+
save_video_freq: null
|
44 |
+
info_on_video: true
|
45 |
+
extra_stat_keys: []
|
46 |
+
env_kwargs:
|
47 |
+
robot_force_mult: 0.001
|
48 |
+
robot_force_penalty_min: 0.2
|
49 |
+
target_randomization: false
|
50 |
+
algo:
|
51 |
+
name: sac
|
52 |
+
replay_buffer_capacity: 995400
|
53 |
+
total_timesteps: 50000000
|
54 |
+
num_steps: 100
|
55 |
+
init_steps: 5000
|
56 |
+
batch_size: 512
|
57 |
+
critic_encoder_tau: 0.005
|
58 |
+
cnn_features:
|
59 |
+
- 32
|
60 |
+
- 64
|
61 |
+
- 128
|
62 |
+
- 256
|
63 |
+
cnn_filters:
|
64 |
+
- 3
|
65 |
+
- 3
|
66 |
+
- 3
|
67 |
+
- 3
|
68 |
+
cnn_strides:
|
69 |
+
- 2
|
70 |
+
- 2
|
71 |
+
- 2
|
72 |
+
- 2
|
73 |
+
cnn_padding: valid
|
74 |
+
encoder_pixels_feature_dim: 50
|
75 |
+
encoder_state_feature_dim: 50
|
76 |
+
detach_encoder: false
|
77 |
+
critic_hidden_dims:
|
78 |
+
- 256
|
79 |
+
- 256
|
80 |
+
- 256
|
81 |
+
critic_lr: 0.0003
|
82 |
+
critic_layer_norm: true
|
83 |
+
critic_dropout: null
|
84 |
+
critic_beta: 0.9
|
85 |
+
critic_tau: 0.005
|
86 |
+
critic_target_update_freq: 2
|
87 |
+
actor_hidden_dims:
|
88 |
+
- 256
|
89 |
+
- 256
|
90 |
+
- 256
|
91 |
+
actor_lr: 0.0003
|
92 |
+
actor_beta: 0.9
|
93 |
+
actor_log_std_min: -20
|
94 |
+
actor_log_std_max: 2
|
95 |
+
actor_update_freq: 2
|
96 |
+
gamma: 0.9
|
97 |
+
init_temperature: 0.1
|
98 |
+
alpha_lr: 0.0003
|
99 |
+
alpha_beta: 0.9
|
100 |
+
log_freq: 10000
|
101 |
+
save_freq: 100000
|
102 |
+
eval_freq: 100000
|
103 |
+
torch_deterministic: true
|
104 |
+
save_backup_ckpts: false
|
105 |
+
eval_episodes: 189
|
106 |
+
num_envs: 63
|
107 |
+
num_eval_envs: 189
|
108 |
+
num_iterations: 793651
|
109 |
+
logger:
|
110 |
+
workspace: mshab_exps
|
111 |
+
exp_name: rcad-prepare_groceries-pick-024_bowl
|
112 |
+
clear_out: true
|
113 |
+
tensorboard: true
|
114 |
+
wandb: false
|
115 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/024_bowl/policy.pt"
|
rl/prepare_groceries/pick/024_bowl/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:814686bd77abb5defd041b3ebf8edbdce26701255125843601ab03430e0d8180
|
3 |
+
size 55487706
|
rl/prepare_groceries/pick/all/config.yml
ADDED
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 4682
|
2 |
+
env:
|
3 |
+
env_id: PickSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/all.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
save_video_freq: null
|
19 |
+
info_on_video: false
|
20 |
+
extra_stat_keys: []
|
21 |
+
env_kwargs:
|
22 |
+
robot_force_mult: 0.001
|
23 |
+
robot_force_penalty_min: 0.2
|
24 |
+
target_randomization: false
|
25 |
+
eval_env:
|
26 |
+
env_id: PickSubtaskTrain-v0
|
27 |
+
num_envs: 189
|
28 |
+
max_episode_steps: 200
|
29 |
+
make_env: true
|
30 |
+
continuous_task: true
|
31 |
+
cat_state: true
|
32 |
+
cat_pixels: false
|
33 |
+
frame_stack: 3
|
34 |
+
stationary_base: false
|
35 |
+
stationary_torso: false
|
36 |
+
stationary_head: true
|
37 |
+
task_plan_fp: task_plans/prepare_groceries/pick/train/all.json
|
38 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/pick/train/spawn_data.pt
|
39 |
+
record_video: false
|
40 |
+
debug_video: false
|
41 |
+
save_video_freq: null
|
42 |
+
info_on_video: true
|
43 |
+
extra_stat_keys: []
|
44 |
+
env_kwargs:
|
45 |
+
robot_force_mult: 0.001
|
46 |
+
robot_force_penalty_min: 0.2
|
47 |
+
target_randomization: false
|
48 |
+
algo:
|
49 |
+
name: sac
|
50 |
+
replay_buffer_capacity: 995400
|
51 |
+
total_timesteps: 50000000
|
52 |
+
num_steps: 100
|
53 |
+
init_steps: 5000
|
54 |
+
batch_size: 512
|
55 |
+
critic_encoder_tau: 0.005
|
56 |
+
cnn_features:
|
57 |
+
- 32
|
58 |
+
- 64
|
59 |
+
- 128
|
60 |
+
- 256
|
61 |
+
cnn_filters:
|
62 |
+
- 3
|
63 |
+
- 3
|
64 |
+
- 3
|
65 |
+
- 3
|
66 |
+
cnn_strides:
|
67 |
+
- 2
|
68 |
+
- 2
|
69 |
+
- 2
|
70 |
+
- 2
|
71 |
+
cnn_padding: valid
|
72 |
+
encoder_pixels_feature_dim: 50
|
73 |
+
encoder_state_feature_dim: 50
|
74 |
+
detach_encoder: false
|
75 |
+
critic_hidden_dims:
|
76 |
+
- 256
|
77 |
+
- 256
|
78 |
+
- 256
|
79 |
+
critic_lr: 0.0003
|
80 |
+
critic_layer_norm: true
|
81 |
+
critic_dropout: null
|
82 |
+
critic_beta: 0.9
|
83 |
+
critic_tau: 0.005
|
84 |
+
critic_target_update_freq: 2
|
85 |
+
actor_hidden_dims:
|
86 |
+
- 256
|
87 |
+
- 256
|
88 |
+
- 256
|
89 |
+
actor_lr: 0.0003
|
90 |
+
actor_beta: 0.9
|
91 |
+
actor_log_std_min: -20
|
92 |
+
actor_log_std_max: 2
|
93 |
+
actor_update_freq: 2
|
94 |
+
gamma: 0.9
|
95 |
+
init_temperature: 0.1
|
96 |
+
alpha_lr: 0.0003
|
97 |
+
alpha_beta: 0.9
|
98 |
+
log_freq: 10000
|
99 |
+
save_freq: 100000000
|
100 |
+
eval_freq: 100000
|
101 |
+
torch_deterministic: true
|
102 |
+
save_backup_ckpts: false
|
103 |
+
eval_episodes: 189
|
104 |
+
num_envs: 63
|
105 |
+
num_eval_envs: 189
|
106 |
+
num_iterations: 793651
|
107 |
+
logger:
|
108 |
+
workspace: mshab_exps
|
109 |
+
exp_name: rcad-prepare_groceries-pick-all
|
110 |
+
clear_out: true
|
111 |
+
tensorboard: true
|
112 |
+
wandb: false
|
113 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/pick/all/policy.pt"
|
rl/prepare_groceries/pick/all/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29ae12a7bbac520ae4b0c46abfa955da294b6a09e5467abe6ecfbf9d672de52b
|
3 |
+
size 55487432
|
rl/prepare_groceries/place/002_master_chef_can/config.yml
ADDED
@@ -0,0 +1,115 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 2337
|
2 |
+
env:
|
3 |
+
env_id: PlaceSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/place/train/002_master_chef_can.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: null
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
eval_env:
|
27 |
+
env_id: PlaceSubtaskTrain-v0
|
28 |
+
num_envs: 189
|
29 |
+
max_episode_steps: 200
|
30 |
+
make_env: true
|
31 |
+
continuous_task: true
|
32 |
+
cat_state: true
|
33 |
+
cat_pixels: false
|
34 |
+
frame_stack: 3
|
35 |
+
stationary_base: false
|
36 |
+
stationary_torso: false
|
37 |
+
stationary_head: true
|
38 |
+
task_plan_fp: task_plans/prepare_groceries/place/train/002_master_chef_can.json
|
39 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
|
40 |
+
record_video: false
|
41 |
+
debug_video: false
|
42 |
+
debug_video_gen: false
|
43 |
+
save_video_freq: null
|
44 |
+
info_on_video: true
|
45 |
+
extra_stat_keys: []
|
46 |
+
env_kwargs:
|
47 |
+
robot_force_mult: 0.001
|
48 |
+
robot_force_penalty_min: 0.2
|
49 |
+
target_randomization: false
|
50 |
+
algo:
|
51 |
+
name: sac
|
52 |
+
replay_buffer_capacity: 995400
|
53 |
+
total_timesteps: 50000000
|
54 |
+
num_steps: 100
|
55 |
+
init_steps: 5000
|
56 |
+
batch_size: 512
|
57 |
+
critic_encoder_tau: 0.005
|
58 |
+
cnn_features:
|
59 |
+
- 32
|
60 |
+
- 64
|
61 |
+
- 128
|
62 |
+
- 256
|
63 |
+
cnn_filters:
|
64 |
+
- 3
|
65 |
+
- 3
|
66 |
+
- 3
|
67 |
+
- 3
|
68 |
+
cnn_strides:
|
69 |
+
- 2
|
70 |
+
- 2
|
71 |
+
- 2
|
72 |
+
- 2
|
73 |
+
cnn_padding: valid
|
74 |
+
encoder_pixels_feature_dim: 50
|
75 |
+
encoder_state_feature_dim: 50
|
76 |
+
detach_encoder: false
|
77 |
+
critic_hidden_dims:
|
78 |
+
- 256
|
79 |
+
- 256
|
80 |
+
- 256
|
81 |
+
critic_lr: 0.0003
|
82 |
+
critic_layer_norm: true
|
83 |
+
critic_dropout: null
|
84 |
+
critic_beta: 0.9
|
85 |
+
critic_tau: 0.005
|
86 |
+
critic_target_update_freq: 2
|
87 |
+
actor_hidden_dims:
|
88 |
+
- 256
|
89 |
+
- 256
|
90 |
+
- 256
|
91 |
+
actor_lr: 0.0003
|
92 |
+
actor_beta: 0.9
|
93 |
+
actor_log_std_min: -20
|
94 |
+
actor_log_std_max: 2
|
95 |
+
actor_update_freq: 2
|
96 |
+
gamma: 0.9
|
97 |
+
init_temperature: 0.1
|
98 |
+
alpha_lr: 0.0003
|
99 |
+
alpha_beta: 0.9
|
100 |
+
log_freq: 10000
|
101 |
+
save_freq: 100000
|
102 |
+
eval_freq: 100000
|
103 |
+
torch_deterministic: true
|
104 |
+
save_backup_ckpts: false
|
105 |
+
eval_episodes: 189
|
106 |
+
num_envs: 63
|
107 |
+
num_eval_envs: 189
|
108 |
+
num_iterations: 793651
|
109 |
+
logger:
|
110 |
+
workspace: mshab_exps
|
111 |
+
exp_name: rcad-prepare_groceries-place-002_master_chef_can
|
112 |
+
clear_out: true
|
113 |
+
tensorboard: true
|
114 |
+
wandb: false
|
115 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/place/002_master_chef_can/policy.pt"
|
rl/prepare_groceries/place/002_master_chef_can/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab001cd4b88ee6cf115c6c65a67c40b9953b347610540b17b3d524e3b82f7bde
|
3 |
+
size 55487706
|
rl/prepare_groceries/place/003_cracker_box/config.yml
ADDED
@@ -0,0 +1,115 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 2337
|
2 |
+
env:
|
3 |
+
env_id: PlaceSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/place/train/003_cracker_box.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: null
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
eval_env:
|
27 |
+
env_id: PlaceSubtaskTrain-v0
|
28 |
+
num_envs: 189
|
29 |
+
max_episode_steps: 200
|
30 |
+
make_env: true
|
31 |
+
continuous_task: true
|
32 |
+
cat_state: true
|
33 |
+
cat_pixels: false
|
34 |
+
frame_stack: 3
|
35 |
+
stationary_base: false
|
36 |
+
stationary_torso: false
|
37 |
+
stationary_head: true
|
38 |
+
task_plan_fp: task_plans/prepare_groceries/place/train/003_cracker_box.json
|
39 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
|
40 |
+
record_video: false
|
41 |
+
debug_video: false
|
42 |
+
debug_video_gen: false
|
43 |
+
save_video_freq: null
|
44 |
+
info_on_video: true
|
45 |
+
extra_stat_keys: []
|
46 |
+
env_kwargs:
|
47 |
+
robot_force_mult: 0.001
|
48 |
+
robot_force_penalty_min: 0.2
|
49 |
+
target_randomization: false
|
50 |
+
algo:
|
51 |
+
name: sac
|
52 |
+
replay_buffer_capacity: 995400
|
53 |
+
total_timesteps: 50000000
|
54 |
+
num_steps: 100
|
55 |
+
init_steps: 5000
|
56 |
+
batch_size: 512
|
57 |
+
critic_encoder_tau: 0.005
|
58 |
+
cnn_features:
|
59 |
+
- 32
|
60 |
+
- 64
|
61 |
+
- 128
|
62 |
+
- 256
|
63 |
+
cnn_filters:
|
64 |
+
- 3
|
65 |
+
- 3
|
66 |
+
- 3
|
67 |
+
- 3
|
68 |
+
cnn_strides:
|
69 |
+
- 2
|
70 |
+
- 2
|
71 |
+
- 2
|
72 |
+
- 2
|
73 |
+
cnn_padding: valid
|
74 |
+
encoder_pixels_feature_dim: 50
|
75 |
+
encoder_state_feature_dim: 50
|
76 |
+
detach_encoder: false
|
77 |
+
critic_hidden_dims:
|
78 |
+
- 256
|
79 |
+
- 256
|
80 |
+
- 256
|
81 |
+
critic_lr: 0.0003
|
82 |
+
critic_layer_norm: true
|
83 |
+
critic_dropout: null
|
84 |
+
critic_beta: 0.9
|
85 |
+
critic_tau: 0.005
|
86 |
+
critic_target_update_freq: 2
|
87 |
+
actor_hidden_dims:
|
88 |
+
- 256
|
89 |
+
- 256
|
90 |
+
- 256
|
91 |
+
actor_lr: 0.0003
|
92 |
+
actor_beta: 0.9
|
93 |
+
actor_log_std_min: -20
|
94 |
+
actor_log_std_max: 2
|
95 |
+
actor_update_freq: 2
|
96 |
+
gamma: 0.9
|
97 |
+
init_temperature: 0.1
|
98 |
+
alpha_lr: 0.0003
|
99 |
+
alpha_beta: 0.9
|
100 |
+
log_freq: 10000
|
101 |
+
save_freq: 100000
|
102 |
+
eval_freq: 100000
|
103 |
+
torch_deterministic: true
|
104 |
+
save_backup_ckpts: false
|
105 |
+
eval_episodes: 189
|
106 |
+
num_envs: 63
|
107 |
+
num_eval_envs: 189
|
108 |
+
num_iterations: 793651
|
109 |
+
logger:
|
110 |
+
workspace: mshab_exps
|
111 |
+
exp_name: rcad-prepare_groceries-place-003_cracker_box
|
112 |
+
clear_out: true
|
113 |
+
tensorboard: true
|
114 |
+
wandb: false
|
115 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/place/003_cracker_box/policy.pt"
|
rl/prepare_groceries/place/003_cracker_box/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc5a60777bb9cbbc3287de2b66e908913ffde5ed2c289096bd06702cbcf6f09a
|
3 |
+
size 55487706
|
rl/prepare_groceries/place/004_sugar_box/config.yml
ADDED
@@ -0,0 +1,115 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 4682
|
2 |
+
env:
|
3 |
+
env_id: PlaceSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/place/train/004_sugar_box.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: null
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
eval_env:
|
27 |
+
env_id: PlaceSubtaskTrain-v0
|
28 |
+
num_envs: 189
|
29 |
+
max_episode_steps: 200
|
30 |
+
make_env: true
|
31 |
+
continuous_task: true
|
32 |
+
cat_state: true
|
33 |
+
cat_pixels: false
|
34 |
+
frame_stack: 3
|
35 |
+
stationary_base: false
|
36 |
+
stationary_torso: false
|
37 |
+
stationary_head: true
|
38 |
+
task_plan_fp: task_plans/prepare_groceries/place/train/004_sugar_box.json
|
39 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
|
40 |
+
record_video: false
|
41 |
+
debug_video: false
|
42 |
+
debug_video_gen: false
|
43 |
+
save_video_freq: null
|
44 |
+
info_on_video: true
|
45 |
+
extra_stat_keys: []
|
46 |
+
env_kwargs:
|
47 |
+
robot_force_mult: 0.001
|
48 |
+
robot_force_penalty_min: 0.2
|
49 |
+
target_randomization: false
|
50 |
+
algo:
|
51 |
+
name: sac
|
52 |
+
replay_buffer_capacity: 995400
|
53 |
+
total_timesteps: 25000000
|
54 |
+
num_steps: 100
|
55 |
+
init_steps: 5000
|
56 |
+
batch_size: 512
|
57 |
+
critic_encoder_tau: 0.005
|
58 |
+
cnn_features:
|
59 |
+
- 32
|
60 |
+
- 64
|
61 |
+
- 128
|
62 |
+
- 256
|
63 |
+
cnn_filters:
|
64 |
+
- 3
|
65 |
+
- 3
|
66 |
+
- 3
|
67 |
+
- 3
|
68 |
+
cnn_strides:
|
69 |
+
- 2
|
70 |
+
- 2
|
71 |
+
- 2
|
72 |
+
- 2
|
73 |
+
cnn_padding: valid
|
74 |
+
encoder_pixels_feature_dim: 50
|
75 |
+
encoder_state_feature_dim: 50
|
76 |
+
detach_encoder: false
|
77 |
+
critic_hidden_dims:
|
78 |
+
- 256
|
79 |
+
- 256
|
80 |
+
- 256
|
81 |
+
critic_lr: 0.0003
|
82 |
+
critic_layer_norm: true
|
83 |
+
critic_dropout: null
|
84 |
+
critic_beta: 0.9
|
85 |
+
critic_tau: 0.005
|
86 |
+
critic_target_update_freq: 2
|
87 |
+
actor_hidden_dims:
|
88 |
+
- 256
|
89 |
+
- 256
|
90 |
+
- 256
|
91 |
+
actor_lr: 0.0003
|
92 |
+
actor_beta: 0.9
|
93 |
+
actor_log_std_min: -20
|
94 |
+
actor_log_std_max: 2
|
95 |
+
actor_update_freq: 2
|
96 |
+
gamma: 0.9
|
97 |
+
init_temperature: 0.1
|
98 |
+
alpha_lr: 0.0003
|
99 |
+
alpha_beta: 0.9
|
100 |
+
log_freq: 10000
|
101 |
+
save_freq: 100000
|
102 |
+
eval_freq: 100000
|
103 |
+
torch_deterministic: true
|
104 |
+
save_backup_ckpts: false
|
105 |
+
eval_episodes: 189
|
106 |
+
num_envs: 63
|
107 |
+
num_eval_envs: 189
|
108 |
+
num_iterations: 396826
|
109 |
+
logger:
|
110 |
+
workspace: mshab_exps
|
111 |
+
exp_name: rcad-prepare_groceries-place-004_sugar_box
|
112 |
+
clear_out: true
|
113 |
+
tensorboard: true
|
114 |
+
wandb: false
|
115 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/place/004_sugar_box/policy.pt"
|
rl/prepare_groceries/place/004_sugar_box/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b9cace25d850c05712488fd4cbeb409c08c2f73cd0fcfa253e411b434a7a1c2
|
3 |
+
size 55487706
|
rl/prepare_groceries/place/005_tomato_soup_can/config.yml
ADDED
@@ -0,0 +1,115 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 2337
|
2 |
+
env:
|
3 |
+
env_id: PlaceSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/place/train/005_tomato_soup_can.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: null
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
eval_env:
|
27 |
+
env_id: PlaceSubtaskTrain-v0
|
28 |
+
num_envs: 189
|
29 |
+
max_episode_steps: 200
|
30 |
+
make_env: true
|
31 |
+
continuous_task: true
|
32 |
+
cat_state: true
|
33 |
+
cat_pixels: false
|
34 |
+
frame_stack: 3
|
35 |
+
stationary_base: false
|
36 |
+
stationary_torso: false
|
37 |
+
stationary_head: true
|
38 |
+
task_plan_fp: task_plans/prepare_groceries/place/train/005_tomato_soup_can.json
|
39 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
|
40 |
+
record_video: false
|
41 |
+
debug_video: false
|
42 |
+
debug_video_gen: false
|
43 |
+
save_video_freq: null
|
44 |
+
info_on_video: true
|
45 |
+
extra_stat_keys: []
|
46 |
+
env_kwargs:
|
47 |
+
robot_force_mult: 0.001
|
48 |
+
robot_force_penalty_min: 0.2
|
49 |
+
target_randomization: false
|
50 |
+
algo:
|
51 |
+
name: sac
|
52 |
+
replay_buffer_capacity: 995400
|
53 |
+
total_timesteps: 50000000
|
54 |
+
num_steps: 100
|
55 |
+
init_steps: 5000
|
56 |
+
batch_size: 512
|
57 |
+
critic_encoder_tau: 0.005
|
58 |
+
cnn_features:
|
59 |
+
- 32
|
60 |
+
- 64
|
61 |
+
- 128
|
62 |
+
- 256
|
63 |
+
cnn_filters:
|
64 |
+
- 3
|
65 |
+
- 3
|
66 |
+
- 3
|
67 |
+
- 3
|
68 |
+
cnn_strides:
|
69 |
+
- 2
|
70 |
+
- 2
|
71 |
+
- 2
|
72 |
+
- 2
|
73 |
+
cnn_padding: valid
|
74 |
+
encoder_pixels_feature_dim: 50
|
75 |
+
encoder_state_feature_dim: 50
|
76 |
+
detach_encoder: false
|
77 |
+
critic_hidden_dims:
|
78 |
+
- 256
|
79 |
+
- 256
|
80 |
+
- 256
|
81 |
+
critic_lr: 0.0003
|
82 |
+
critic_layer_norm: true
|
83 |
+
critic_dropout: null
|
84 |
+
critic_beta: 0.9
|
85 |
+
critic_tau: 0.005
|
86 |
+
critic_target_update_freq: 2
|
87 |
+
actor_hidden_dims:
|
88 |
+
- 256
|
89 |
+
- 256
|
90 |
+
- 256
|
91 |
+
actor_lr: 0.0003
|
92 |
+
actor_beta: 0.9
|
93 |
+
actor_log_std_min: -20
|
94 |
+
actor_log_std_max: 2
|
95 |
+
actor_update_freq: 2
|
96 |
+
gamma: 0.9
|
97 |
+
init_temperature: 0.1
|
98 |
+
alpha_lr: 0.0003
|
99 |
+
alpha_beta: 0.9
|
100 |
+
log_freq: 10000
|
101 |
+
save_freq: 100000
|
102 |
+
eval_freq: 100000
|
103 |
+
torch_deterministic: true
|
104 |
+
save_backup_ckpts: false
|
105 |
+
eval_episodes: 189
|
106 |
+
num_envs: 63
|
107 |
+
num_eval_envs: 189
|
108 |
+
num_iterations: 793651
|
109 |
+
logger:
|
110 |
+
workspace: mshab_exps
|
111 |
+
exp_name: rcad-prepare_groceries-place-005_tomato_soup_can
|
112 |
+
clear_out: true
|
113 |
+
tensorboard: true
|
114 |
+
wandb: false
|
115 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/place/005_tomato_soup_can/policy.pt"
|
rl/prepare_groceries/place/005_tomato_soup_can/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbe87309a420c505231a349b10c2d27e25e5cf481f3b485f301e7267244cebfe
|
3 |
+
size 55487706
|
rl/prepare_groceries/place/007_tuna_fish_can/config.yml
ADDED
@@ -0,0 +1,115 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
seed: 2337
|
2 |
+
env:
|
3 |
+
env_id: PlaceSubtaskTrain-v0
|
4 |
+
num_envs: 63
|
5 |
+
max_episode_steps: 100
|
6 |
+
make_env: true
|
7 |
+
continuous_task: true
|
8 |
+
cat_state: true
|
9 |
+
cat_pixels: false
|
10 |
+
frame_stack: 3
|
11 |
+
stationary_base: false
|
12 |
+
stationary_torso: false
|
13 |
+
stationary_head: true
|
14 |
+
task_plan_fp: task_plans/prepare_groceries/place/train/007_tuna_fish_can.json
|
15 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
|
16 |
+
record_video: false
|
17 |
+
debug_video: false
|
18 |
+
debug_video_gen: false
|
19 |
+
save_video_freq: null
|
20 |
+
info_on_video: false
|
21 |
+
extra_stat_keys: []
|
22 |
+
env_kwargs:
|
23 |
+
robot_force_mult: 0.001
|
24 |
+
robot_force_penalty_min: 0.2
|
25 |
+
target_randomization: false
|
26 |
+
eval_env:
|
27 |
+
env_id: PlaceSubtaskTrain-v0
|
28 |
+
num_envs: 189
|
29 |
+
max_episode_steps: 200
|
30 |
+
make_env: true
|
31 |
+
continuous_task: true
|
32 |
+
cat_state: true
|
33 |
+
cat_pixels: false
|
34 |
+
frame_stack: 3
|
35 |
+
stationary_base: false
|
36 |
+
stationary_torso: false
|
37 |
+
stationary_head: true
|
38 |
+
task_plan_fp: task_plans/prepare_groceries/place/train/007_tuna_fish_can.json
|
39 |
+
spawn_data_fp: /arshukla-fast-vol-1/ManiSkill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/place/train/spawn_data.pt
|
40 |
+
record_video: false
|
41 |
+
debug_video: false
|
42 |
+
debug_video_gen: false
|
43 |
+
save_video_freq: null
|
44 |
+
info_on_video: true
|
45 |
+
extra_stat_keys: []
|
46 |
+
env_kwargs:
|
47 |
+
robot_force_mult: 0.001
|
48 |
+
robot_force_penalty_min: 0.2
|
49 |
+
target_randomization: false
|
50 |
+
algo:
|
51 |
+
name: sac
|
52 |
+
replay_buffer_capacity: 995400
|
53 |
+
total_timesteps: 50000000
|
54 |
+
num_steps: 100
|
55 |
+
init_steps: 5000
|
56 |
+
batch_size: 512
|
57 |
+
critic_encoder_tau: 0.005
|
58 |
+
cnn_features:
|
59 |
+
- 32
|
60 |
+
- 64
|
61 |
+
- 128
|
62 |
+
- 256
|
63 |
+
cnn_filters:
|
64 |
+
- 3
|
65 |
+
- 3
|
66 |
+
- 3
|
67 |
+
- 3
|
68 |
+
cnn_strides:
|
69 |
+
- 2
|
70 |
+
- 2
|
71 |
+
- 2
|
72 |
+
- 2
|
73 |
+
cnn_padding: valid
|
74 |
+
encoder_pixels_feature_dim: 50
|
75 |
+
encoder_state_feature_dim: 50
|
76 |
+
detach_encoder: false
|
77 |
+
critic_hidden_dims:
|
78 |
+
- 256
|
79 |
+
- 256
|
80 |
+
- 256
|
81 |
+
critic_lr: 0.0003
|
82 |
+
critic_layer_norm: true
|
83 |
+
critic_dropout: null
|
84 |
+
critic_beta: 0.9
|
85 |
+
critic_tau: 0.005
|
86 |
+
critic_target_update_freq: 2
|
87 |
+
actor_hidden_dims:
|
88 |
+
- 256
|
89 |
+
- 256
|
90 |
+
- 256
|
91 |
+
actor_lr: 0.0003
|
92 |
+
actor_beta: 0.9
|
93 |
+
actor_log_std_min: -20
|
94 |
+
actor_log_std_max: 2
|
95 |
+
actor_update_freq: 2
|
96 |
+
gamma: 0.9
|
97 |
+
init_temperature: 0.1
|
98 |
+
alpha_lr: 0.0003
|
99 |
+
alpha_beta: 0.9
|
100 |
+
log_freq: 10000
|
101 |
+
save_freq: 100000
|
102 |
+
eval_freq: 100000
|
103 |
+
torch_deterministic: true
|
104 |
+
save_backup_ckpts: false
|
105 |
+
eval_episodes: 189
|
106 |
+
num_envs: 63
|
107 |
+
num_eval_envs: 189
|
108 |
+
num_iterations: 793651
|
109 |
+
logger:
|
110 |
+
workspace: mshab_exps
|
111 |
+
exp_name: rcad-prepare_groceries-place-007_tuna_fish_can
|
112 |
+
clear_out: true
|
113 |
+
tensorboard: true
|
114 |
+
wandb: false
|
115 |
+
model_ckpt: "mshab_checkpoints/rl/prepare_groceries/place/007_tuna_fish_can/policy.pt"
|
rl/prepare_groceries/place/007_tuna_fish_can/policy.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a142a4f53b76fa20c185c2b44bb5396f40755d83005b5f2b1a4b3dab25da5d1c
|
3 |
+
size 55487706
|