mbreuss commited on
Commit
0b14c68
1 Parent(s): 85dde4e

Create config.yaml

Browse files
Files changed (1) hide show
  1. config.yaml +528 -0
config.yaml ADDED
@@ -0,0 +1,528 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ callbacks:
2
+ rollout_lh:
3
+ tasks:
4
+ _target_: calvin_env.envs.tasks.Tasks
5
+ tasks:
6
+ rotate_red_block_right:
7
+ - rotate_object
8
+ - block_red
9
+ - -60
10
+ rotate_red_block_left:
11
+ - rotate_object
12
+ - block_red
13
+ - 60
14
+ rotate_blue_block_right:
15
+ - rotate_object
16
+ - block_blue
17
+ - -60
18
+ rotate_blue_block_left:
19
+ - rotate_object
20
+ - block_blue
21
+ - 60
22
+ rotate_pink_block_right:
23
+ - rotate_object
24
+ - block_pink
25
+ - -60
26
+ rotate_pink_block_left:
27
+ - rotate_object
28
+ - block_pink
29
+ - 60
30
+ push_red_block_right:
31
+ - push_object
32
+ - block_red
33
+ - 0.1
34
+ - 0
35
+ push_red_block_left:
36
+ - push_object
37
+ - block_red
38
+ - -0.1
39
+ - 0
40
+ push_blue_block_right:
41
+ - push_object
42
+ - block_blue
43
+ - 0.1
44
+ - 0
45
+ push_blue_block_left:
46
+ - push_object
47
+ - block_blue
48
+ - -0.1
49
+ - 0
50
+ push_pink_block_right:
51
+ - push_object
52
+ - block_pink
53
+ - 0.1
54
+ - 0
55
+ push_pink_block_left:
56
+ - push_object
57
+ - block_pink
58
+ - -0.1
59
+ - 0
60
+ move_slider_left:
61
+ - move_door_rel
62
+ - base__slide
63
+ - 0.15
64
+ move_slider_right:
65
+ - move_door_rel
66
+ - base__slide
67
+ - -0.15
68
+ open_drawer:
69
+ - move_door_rel
70
+ - base__drawer
71
+ - 0.12
72
+ close_drawer:
73
+ - move_door_rel
74
+ - base__drawer
75
+ - -0.12
76
+ lift_red_block_table:
77
+ - lift_object
78
+ - block_red
79
+ - 0.05
80
+ - table
81
+ - base_link
82
+ lift_red_block_slider:
83
+ - lift_object
84
+ - block_red
85
+ - 0.03
86
+ - table
87
+ - plank_link
88
+ lift_red_block_drawer:
89
+ - lift_object
90
+ - block_red
91
+ - 0.05
92
+ - table
93
+ - drawer_link
94
+ lift_blue_block_table:
95
+ - lift_object
96
+ - block_blue
97
+ - 0.05
98
+ - table
99
+ - base_link
100
+ lift_blue_block_slider:
101
+ - lift_object
102
+ - block_blue
103
+ - 0.03
104
+ - table
105
+ - plank_link
106
+ lift_blue_block_drawer:
107
+ - lift_object
108
+ - block_blue
109
+ - 0.05
110
+ - table
111
+ - drawer_link
112
+ lift_pink_block_table:
113
+ - lift_object
114
+ - block_pink
115
+ - 0.05
116
+ - table
117
+ - base_link
118
+ lift_pink_block_slider:
119
+ - lift_object
120
+ - block_pink
121
+ - 0.03
122
+ - table
123
+ - plank_link
124
+ lift_pink_block_drawer:
125
+ - lift_object
126
+ - block_pink
127
+ - 0.05
128
+ - table
129
+ - drawer_link
130
+ place_in_slider:
131
+ - place_object
132
+ - table
133
+ - plank_link
134
+ place_in_drawer:
135
+ - place_object
136
+ - table
137
+ - drawer_link
138
+ stack_block:
139
+ - stack_objects
140
+ unstack_block:
141
+ - unstack_objects
142
+ turn_on_lightbulb:
143
+ - toggle_light
144
+ - lightbulb
145
+ - 0
146
+ - 1
147
+ turn_off_lightbulb:
148
+ - toggle_light
149
+ - lightbulb
150
+ - 1
151
+ - 0
152
+ turn_on_led:
153
+ - toggle_light
154
+ - led
155
+ - 0
156
+ - 1
157
+ turn_off_led:
158
+ - toggle_light
159
+ - led
160
+ - 1
161
+ - 0
162
+ push_into_drawer:
163
+ - push_object_into
164
+ - - block_red
165
+ - block_blue
166
+ - block_pink
167
+ - table
168
+ - base_link
169
+ - table
170
+ - drawer_link
171
+ val_annotations:
172
+ rotate_red_block_right:
173
+ - take the red block and rotate it to the right
174
+ rotate_red_block_left:
175
+ - take the red block and rotate it to the left
176
+ rotate_blue_block_right:
177
+ - take the blue block and rotate it to the right
178
+ rotate_blue_block_left:
179
+ - take the blue block and rotate it to the left
180
+ rotate_pink_block_right:
181
+ - take the pink block and rotate it to the right
182
+ rotate_pink_block_left:
183
+ - take the pink block and rotate it to the left
184
+ push_red_block_right:
185
+ - go push the red block right
186
+ push_red_block_left:
187
+ - go push the red block left
188
+ push_blue_block_right:
189
+ - go push the blue block right
190
+ push_blue_block_left:
191
+ - go push the blue block left
192
+ push_pink_block_right:
193
+ - go push the pink block right
194
+ push_pink_block_left:
195
+ - go push the pink block left
196
+ move_slider_left:
197
+ - push the sliding door to the left side
198
+ move_slider_right:
199
+ - push the sliding door to the right side
200
+ open_drawer:
201
+ - pull the handle to open the drawer
202
+ close_drawer:
203
+ - push the handle to close the drawer
204
+ lift_red_block_table:
205
+ - grasp and lift the red block
206
+ lift_blue_block_table:
207
+ - grasp and lift the blue block
208
+ lift_pink_block_table:
209
+ - grasp and lift the pink block
210
+ lift_red_block_slider:
211
+ - lift the red block from the sliding cabinet
212
+ lift_blue_block_slider:
213
+ - lift the blue block from the sliding cabinet
214
+ lift_pink_block_slider:
215
+ - lift the pink block from the sliding cabinet
216
+ lift_red_block_drawer:
217
+ - Take the red block from the drawer
218
+ lift_blue_block_drawer:
219
+ - Take the blue block from the drawer
220
+ lift_pink_block_drawer:
221
+ - Take the pink block from the drawer
222
+ place_in_slider:
223
+ - store the grasped block in the sliding cabinet
224
+ place_in_drawer:
225
+ - store the grasped block in the drawer
226
+ push_into_drawer:
227
+ - slide the block that it falls into the drawer
228
+ stack_block:
229
+ - stack the grasped block
230
+ unstack_block:
231
+ - remove the stacked block
232
+ turn_on_lightbulb:
233
+ - use the switch to turn on the light bulb
234
+ turn_off_lightbulb:
235
+ - use the switch to turn off the light bulb
236
+ turn_on_led:
237
+ - press the button to turn on the led light
238
+ turn_off_led:
239
+ - press the button to turn off the led light
240
+ _target_: mode.rollout.rollout_long_horizon.RolloutLongHorizon
241
+ _recursive_: false
242
+ env_cfg:
243
+ _target_: mode.wrappers.hulc_wrapper.HulcWrapper
244
+ skip_epochs: ${rollout_lh_skip_epochs}
245
+ rollout_freq: 5
246
+ num_videos: 0
247
+ num_sequences: 1000
248
+ replan_freq: 30
249
+ ep_len: 360
250
+ empty_cache: false
251
+ log_video_to_file: false
252
+ save_dir: ./videos
253
+ lang_folder: ${lang_folder}
254
+ debug: false
255
+ ema:
256
+ _target_: mode.callbacks.ema.EMA
257
+ decay: 0.999
258
+ start_step: 0
259
+ save_ema_weights_in_callback_state: true
260
+ evaluate_ema_weights_instead: true
261
+ power: 0.6666666666666666
262
+ inv_gamma: 1.0
263
+ min_value: 0.0
264
+ max_value: 0.9999
265
+ checkpoint:
266
+ _target_: pytorch_lightning.callbacks.ModelCheckpoint
267
+ save_top_k: 1
268
+ verbose: true
269
+ monitor: eval_lh/avg_seq_len
270
+ mode: max
271
+ dirpath: saved_models
272
+ filename: '{epoch:02d}_{eval_lh/avg_seq_len:.2f}'
273
+ every_n_epochs: ${callbacks.rollout_lh.rollout_freq}
274
+ datamodule:
275
+ transforms:
276
+ train:
277
+ rgb_static:
278
+ - _target_: torchvision.transforms.Resize
279
+ size: 224
280
+ antialias: true
281
+ - _target_: mode.utils.transforms.RandomShiftsAug
282
+ pad: 10
283
+ - _target_: mode.utils.transforms.ScaleImageTensor
284
+ - _target_: torchvision.transforms.Normalize
285
+ mean:
286
+ - 0.48145466
287
+ - 0.4578275
288
+ - 0.40821073
289
+ std:
290
+ - 0.26862954
291
+ - 0.26130258
292
+ - 0.27577711
293
+ rgb_gripper:
294
+ - _target_: torchvision.transforms.Resize
295
+ size: 112
296
+ antialias: true
297
+ - _target_: mode.utils.transforms.RandomShiftsAug
298
+ pad: 4
299
+ - _target_: mode.utils.transforms.ScaleImageTensor
300
+ - _target_: torchvision.transforms.Normalize
301
+ mean:
302
+ - 0.48145466
303
+ - 0.4578275
304
+ - 0.40821073
305
+ std:
306
+ - 0.26862954
307
+ - 0.26130258
308
+ - 0.27577711
309
+ robot_obs:
310
+ - _target_: mode.utils.transforms.NormalizeVector
311
+ scene_obs:
312
+ - _target_: mode.utils.transforms.NormalizeVector
313
+ val:
314
+ rgb_static:
315
+ - _target_: torchvision.transforms.Resize
316
+ size: 224
317
+ antialias: true
318
+ - _target_: mode.utils.transforms.ScaleImageTensor
319
+ - _target_: torchvision.transforms.Normalize
320
+ mean:
321
+ - 0.48145466
322
+ - 0.4578275
323
+ - 0.40821073
324
+ std:
325
+ - 0.26862954
326
+ - 0.26130258
327
+ - 0.27577711
328
+ rgb_gripper:
329
+ - _target_: torchvision.transforms.Resize
330
+ size: 112
331
+ antialias: true
332
+ - _target_: mode.utils.transforms.ScaleImageTensor
333
+ - _target_: torchvision.transforms.Normalize
334
+ mean:
335
+ - 0.48145466
336
+ - 0.4578275
337
+ - 0.40821073
338
+ std:
339
+ - 0.26862954
340
+ - 0.26130258
341
+ - 0.27577711
342
+ robot_obs:
343
+ - _target_: mode.utils.transforms.NormalizeVector
344
+ scene_obs:
345
+ - _target_: mode.utils.transforms.NormalizeVector
346
+ _target_: mode.datasets.hulc_data_module.HulcDataModule
347
+ _recursive_: false
348
+ root_data_dir: ${root_data_dir}
349
+ action_space: 7
350
+ action_max:
351
+ - 1.0
352
+ - 1.0
353
+ - 1.0
354
+ - 1.0
355
+ - 1.0
356
+ - 1.0
357
+ - 1.0
358
+ action_min:
359
+ - -1.0
360
+ - -1.0
361
+ - -1.0
362
+ - -1.0
363
+ - -1.0
364
+ - -1.0
365
+ - -1
366
+ shuffle_val: false
367
+ observation_space:
368
+ rgb_obs:
369
+ - rgb_static
370
+ - rgb_gripper
371
+ depth_obs: []
372
+ state_obs:
373
+ - robot_obs
374
+ actions:
375
+ - rel_actions
376
+ language:
377
+ - language
378
+ proprioception_dims:
379
+ n_state_obs: 8
380
+ keep_indices:
381
+ - - 0
382
+ - 7
383
+ - - 14
384
+ - 15
385
+ robot_orientation_idx:
386
+ - 3
387
+ - 6
388
+ normalize: true
389
+ normalize_robot_orientation: true
390
+ datasets:
391
+ lang_dataset:
392
+ _target_: mode.datasets.disk_dataset.ExtendedDiskDataset
393
+ key: lang
394
+ save_format: npz
395
+ batch_size: ${batch_size}
396
+ min_window_size: ${act_seq_len}
397
+ max_window_size: ${act_seq_len}
398
+ proprio_state: ${datamodule.proprioception_dims}
399
+ obs_space: ${datamodule.observation_space}
400
+ skip_frames: 1
401
+ pad: false
402
+ lang_folder: ${lang_folder}
403
+ aux_lang_loss_window: 8
404
+ num_workers: ${num_workers}
405
+ action_seq_len: ${act_seq_len}
406
+ obs_seq_len: ${obs_seq_len}
407
+ future_range: 1
408
+ use_extracted_rel_actions: ${use_extracted_rel_actions}
409
+ model:
410
+ _target_: mode.models.mode_agent.MoDEAgent
411
+ _recursive_: false
412
+ multistep: ${multistep}
413
+ use_lr_scheduler: true
414
+ entropy_gamma: 0.0
415
+ router_z_delta: 0.0
416
+ use_proprio: false
417
+ seed: ${seed}
418
+ sampler_type: ddim
419
+ num_sampling_steps: 10
420
+ sigma_data: 0.5
421
+ sigma_min: 0.001
422
+ sigma_max: 80
423
+ noise_scheduler: exponential
424
+ sigma_sample_density_type: loglogistic
425
+ ckpt_path: /home/hk-project-sustainebot/ft4740/code/MoDE_Diffusion_Policy/pretrained_models/300k
426
+ start_from_pretrained: true
427
+ act_window_size: ${act_seq_len}
428
+ latent_dim: 1024
429
+ obs_enc_dim: ${obs_dim}
430
+ cond_dim: 512
431
+ resnet_type: '50'
432
+ optimizer:
433
+ _target_: torch.optim.AdamW
434
+ transformer_weight_decay: 0.05
435
+ obs_encoder_weight_decay: 0.05
436
+ learning_rate: 0.0001
437
+ betas:
438
+ - 0.9
439
+ - 0.95
440
+ lr_scheduler:
441
+ lr_scheduler:
442
+ init_lr: 0.0001
443
+ init_lr_scale: 0.1
444
+ final_lr_scale: 1.0e-06
445
+ total_steps: 45000
446
+ phase_ratio: (0.02, 0.08, 0.9)
447
+ lr: 0.0001
448
+ model:
449
+ _target_: mode.models.edm_diffusion.score_wrappers.GCDenoiser
450
+ _recursive_: false
451
+ sigma_data: ${model.sigma_data}
452
+ inner_model:
453
+ _target_: mode.models.networks.modedit.MoDeDiT
454
+ action_dim: ${datamodule.action_space}
455
+ goal_dim: ${model.cond_dim}
456
+ obs_dim: 2048
457
+ goal_conditioned: true
458
+ causal: true
459
+ use_custom_attn_mask: false
460
+ use_proprio: ${model.use_proprio}
461
+ state_dim: ${proprio_dims}
462
+ embed_dim: ${model.latent_dim}
463
+ n_layers: 12
464
+ goal_seq_len: 1
465
+ obs_seq_len: ${obs_seq_len}
466
+ action_seq_len: ${act_seq_len}
467
+ embed_pdrob: 0
468
+ goal_drop: 0.1
469
+ attn_pdrop: 0.3
470
+ mlp_pdrop: 0.1
471
+ n_heads: 8
472
+ device: ${device}
473
+ linear_output: true
474
+ cond_router: true
475
+ num_experts: 4
476
+ top_k: 2
477
+ router_normalize: true
478
+ use_goal_in_routing: false
479
+ use_argmax: false
480
+ use_shared_expert: false
481
+ use_noise_token_as_input: true
482
+ init_style: olmoe
483
+ language_goal:
484
+ _target_: mode.models.networks.clip_lang_encoder.LangClip
485
+ _recursive_: false
486
+ model_name: ${clip_lang_model_name}
487
+ root_data_dir: /hkfs/work/workspace/scratch/ft4740-play3/data/task_ABCD_D
488
+ lang_folder: lang_clip_resnet50
489
+ vis_clip_model_name: ViT-B/16
490
+ clip_lang_model_name: ViT-B/32
491
+ log_dir: ./logs
492
+ slurm: false
493
+ seed: 42
494
+ device: cuda
495
+ batch_size: 64
496
+ devices: 4
497
+ act_dim: 7
498
+ proprio_dims: 7
499
+ obs_dim: 512
500
+ goal_dim: 512
501
+ obs_seq_len: 1
502
+ act_seq_len: 10
503
+ multistep: 10
504
+ p_last_state: 0
505
+ gen_img_res: 112
506
+ max_epochs: 20
507
+ rollout_lh_skip_epochs: 4
508
+ num_workers: 12
509
+ benchmark_name: calvin_abcd
510
+ use_extracted_rel_actions: true
511
+ trainer:
512
+ devices: ${devices}
513
+ precision: 16
514
+ max_epochs: ${max_epochs}
515
+ sync_batchnorm: true
516
+ accelerator: gpu
517
+ strategy: ddp
518
+ limit_train_batches: 1000
519
+ limit_val_batches: 4
520
+ logger:
521
+ _target_: pytorch_lightning.loggers.WandbLogger
522
+ save_dir: .
523
+ name: logger
524
+ group: mode
525
+ log_model: false
526
+ project: ${benchmark_name}
527
+ entity: bennoq
528
+ id: ???