arth-shukla committed on
Commit
91e96be
·
1 Parent(s): 4e43224

RL nav policies

Browse files
rl/prepare_groceries/navigate/all/config.yml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 2337
2
+ env:
3
+ env_id: NavigateSubtaskTrain-v0
4
+ num_envs: 189
5
+ max_episode_steps: 1000
6
+ make_env: true
7
+ obs_mode: depth
8
+ render_mode: all
9
+ shader_dir: minimal
10
+ sim_backend: gpu
11
+ continuous_task: false
12
+ cat_state: true
13
+ cat_pixels: false
14
+ frame_stack: 3
15
+ stack: null
16
+ stationary_base: false
17
+ stationary_torso: false
18
+ stationary_head: true
19
+ task_plan_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/task_plans/prepare_groceries/navigate/train/all.json
20
+ spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/navigate/train/spawn_data.pt
21
+ record_video: false
22
+ debug_video: false
23
+ debug_video_gen: false
24
+ save_video_freq: null
25
+ info_on_video: false
26
+ extra_stat_keys: []
27
+ env_kwargs:
28
+ robot_force_mult: 0.001
29
+ robot_force_penalty_min: 0.2
30
+ target_randomization: false
31
+ task_cfgs:
32
+ navigate:
33
+ horizon: 1000
34
+ use_rot_rew: false
35
+ eval_env:
36
+ env_id: NavigateSubtaskTrain-v0
37
+ num_envs: 63
38
+ max_episode_steps: 1000
39
+ make_env: true
40
+ obs_mode: depth
41
+ render_mode: all
42
+ shader_dir: minimal
43
+ sim_backend: gpu
44
+ continuous_task: false
45
+ cat_state: true
46
+ cat_pixels: false
47
+ frame_stack: 3
48
+ stack: null
49
+ stationary_base: false
50
+ stationary_torso: false
51
+ stationary_head: true
52
+ task_plan_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/task_plans/prepare_groceries/navigate/train/all.json
53
+ spawn_data_fp: ~/.maniskill/data/scene_datasets/replica_cad_dataset/rearrange/spawn_data/prepare_groceries/navigate/train/spawn_data.pt
54
+ record_video: false
55
+ debug_video: false
56
+ debug_video_gen: false
57
+ save_video_freq: 10
58
+ info_on_video: false
59
+ extra_stat_keys: []
60
+ env_kwargs:
61
+ robot_force_mult: 0.001
62
+ robot_force_penalty_min: 0.2
63
+ target_randomization: false
64
+ task_cfgs:
65
+ navigate:
66
+ horizon: 1000
67
+ use_rot_rew: false
68
+ algo:
69
+ name: ppo
70
+ total_timesteps: 1000000000
71
+ learning_rate: 0.0003
72
+ anneal_lr: false
73
+ gamma: 0.95
74
+ gae_lambda: 0.9
75
+ num_minibatches: 16
76
+ update_epochs: 8
77
+ norm_adv: true
78
+ clip_coef: 0.2
79
+ clip_vloss: false
80
+ ent_coef: 0.0
81
+ vf_coef: 0.5
82
+ max_grad_norm: 0.5
83
+ target_kl: 0.2
84
+ log_freq: 250000
85
+ save_freq: 250000
86
+ eval_freq: null
87
+ finite_horizon_gae: true
88
+ torch_deterministic: true
89
+ save_backup_ckpts: false
90
+ num_steps: 100
91
+ num_envs: 189
92
+ num_eval_envs: 63
93
+ batch_size: 18900
94
+ minibatch_size: 1181
95
+ num_iterations: 52911
96
+ logger:
97
+ workspace: mshab_exps
98
+ exp_name: rcad-prepare_groceries-navigate-all
99
+ clear_out: true
100
+ tensorboard: true
101
+ wandb: false
102
+ model_ckpt: "mshab_checkpoints/rl/prepare_groceries/navigate/all/policy.pt"
rl/prepare_groceries/navigate/all/policy.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:957da18169588d9d7a8b630418d1c5b5a448273c1dcec0ec01daebb650a680ce
3
+ size 68156042
rl/set_table/navigate/all/policy.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:84c8ee51cb27d595f4c318b8c56544a17a79aaf0b4d00bbe43635192f5f40c77
3
  size 68156042
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c31c4a1d16daff9e5ce6eff0760f02da5383ffa242d1e97141261e080cf8e2a
3
  size 68156042