liufanfanlff commited on
Commit
2b4e819
·
verified ·
1 Parent(s): 31bee0b

Upload folder using huggingface_hub

Browse files
.DS_Store ADDED
Binary file (6.15 kB). View file
 
checkpoint_D_D/checkpoint_gripper_UVformer_hist_1_state_aug_10_4_traj_cons_ws_12_mpt_dolly_3b_9.pth9.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4781613a67353b6e5fcd60a0f4811f41243ea2f51c5c3ab354d0f2c705c5bc5f
3
+ size 17787834140
checkpoint_D_D/config.yaml ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ fusion_mode: UVformer
2
+ Linear: true
3
+ load_from_checkpoint:
4
+ from_scratch: false
5
+ resume_from_checkpoint: null
6
+ train_uvformer: false
7
+ train_uvformer_gripper: true
8
+ colour_aug: [0, 0, 0, 0]
9
+ occ_loss: false
10
+ occ_loss_weight: [0.5,0.25,0.25,0.25] # occ, r, g, b
11
+ train_action: true
12
+ eval: true
13
+ rotate: true
14
+ data_path_list: []
15
+ loss_weight: {occ: 0, action: 1}
16
+ validation: false
17
+ data_tasks_groups: None
18
+ num_epochs: 20
19
+ window_size: 12
20
+ learning_rate: 0.0001
21
+ lr_scheduler: constant
22
+ calvin_dataset: task_D_D
23
+ batch_size_calvin: 5
24
+ save_dir:
25
+
26
+ original_image_shapes:
27
+ rgb_static: [200, 200, 3]
28
+ rgb_gripper: [84, 84, 3]
29
+ cam_trained: ["rgb_static","rgb_gripper"]
30
+ image_feature_out: [0]
31
+ extrinsic_jitter: 0
32
+ UVformer:
33
+ cam_trained: ["rgb_static","rgb_gripper"]
34
+ original_image_shapes:
35
+ rgb_static: [200, 200, 3]
36
+ rgb_gripper: [84, 84, 3]
37
+ type: DeformableTransformer
38
+ transformer_config:
39
+ task_name: LLD
40
+ hidden_dim: 1024
41
+ nhead: 8
42
+ num_decoder_layers: 2
43
+ dim_feedforward: 1024
44
+ dropout: 0.1
45
+ PreProcessing: {left: 0.5, right: 0.5, front: 0.5 , back: 0.5, dilate: 1}
46
+ grid_resolution: [0.05, 0.05, 0.1]
47
+ ref_z_range: [0.3, 0.8]
48
+ rotate: true
49
+ upsample: 2
50
+ self_attn_type: cosformer
51
+ reuse_ref_point: false
52
+ norm: None
53
+ use_ffn: false
54
+ PETR:
55
+ hidden_dim: 1024
56
+ depth_step: 0.05
57
+ depth_num: 4
58
+ depth_start: 0.05
59
+ position_range: [-0.2, -0.2, -0.05, 0.2, 0.2, 0.3]
60
+
61
+
62
+ vision_encoder_path: ViT-L-14
63
+ replan: -1
64
+ visualize: false
65
+ vision_encoder_pretrained: openai
66
+ lm_path:
67
+ calvin_conf_path:
68
+ batch_size_sim: 1
69
+ calvin_seq_path:
70
+ tokenizer_path:
71
+ reset: false
72
+ diverse_inst: false
73
+ future_act_len: -1
74
+ cross_attn_every_n_layers: 4
75
+ run_name: RobotFlamingoDBG
76
+ use_media_placement_augmentation: false
77
+ offline: false
78
+ logging_steps: 100
79
+ clip_cache_dir:
80
+ gradient_accumulation_steps: 1
81
+ openflamingo_checkpoint:
82
+ delete_previous_checkpoint: false
83
+ seed: 42
84
+ loss_multiplier_calvin: 1.0
85
+ warmup_steps: 5000
86
+ local_rank: 0
87
+ weight_decay: 0.1
88
+ precision: fp32
89
+ workers: 4
90
+ train_num_samples_calvin: 100
91
+ dataset_resampled: true
92
+ dist_url: env://
93
+ dist_backend: nccl
94
+ horovod: false
95
+ no_set_device_rank: false
96
+ report_to_wandb: false
97
+ wandb_project: RoboFlamingo_D2D
98
+ wandb_entity: null
99
+ save_checkpoints_to_wandb: false
100
+ freeze_embed: false
101
+ use_gripper: true
102
+ use_state: true
103
+ hist_window: 1
104
+ eval_hist_size: -1
105
+ sep_resampler: false
106
+ train_params: -1
107
+ rgb_pad: 10
108
+ gripper_pad: 4
109
+ n_timesteps: 150
110
+ predict_epsilon: false
111
+ head_type: lstm
112
+ n_obs_steps: 6
113
+ diff_horizon: 32
114
+ last_action: false
115
+ use_hist: false
116
+ traj_cons: true
117
+ debug: false
118
+ sep_lm_head: false
119
+ clip_state: false
120
+ unfreeze_vit: false
121
+ text_aug: false
122
+ residual: false
123
+ tcp_rel: false
124
+ dif_ws: false
125
+ partial_data: false
126
+ freeze_sampler: false
127
+ fwd_pred: false
128
+ fwd_pred_hand: false
129
+ no_pretrain: false
130
+ real_data: false
131
+ no_image_patch: false
132
+ cotrain: false
133
+ batch_size_vl: 20
134
+ vl_task_weights: 0.005
135
+ global_latent: 1
136
+ save_every_iter: 10000
137
+ pad_length: -1
138
+ hidden_size: 768
139
+ decoder_type: lstm
140
+ data_type: calvin
141
+ min_window_size: 12
142
+ max_window_size: 24
143
+ llm_name: mpt_dolly_3b
144
+ pooling: max
145
+ multi_step_action: 1