File size: 809 Bytes
3eb682b |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 |
# Image, batching and evaluation settings.
# NOTE(review): per-key meanings are inferred from the key names only;
# confirm against the training script before relying on them.
image_res: 224  # presumably the input image side length in pixels
batch_size_train: 8
batch_size_test: 16
k_test: 64
warm_up: true
# Optimizer settings.
# Floats carry an explicit decimal point: YAML 1.1 loaders (e.g. PyYAML)
# resolve a bare `2e-4` as the *string* "2e-4", not a number. `2.0e-4` is
# a float under both YAML 1.1 and YAML 1.2 loaders.
optimizer:
  opt: adamW
  lr: 2.0e-4
  weight_decay: 0.02
  # NOTE(review): presumably a separate learning rate for the prompt
  # parameters; confirm against the optimizer factory.
  prompt_lr: 1.0e-3
# Learning-rate schedule settings.
# NOTE(review): the key is spelled `schedular`; it is kept unchanged because
# consumers presumably look it up by this exact name; confirm before renaming.
# Floats carry an explicit decimal point so YAML 1.1 loaders (e.g. PyYAML)
# resolve them as numbers rather than strings.
schedular:
  sched: cosine
  scheduler_groups: 0
  lr: 2.0e-4  # same value as optimizer.lr
  epochs: 35
  min_lr: 1.0e-5
  decay_rate: 1
  warmup_lr: 1.0e-4
  warmup_epochs: 4
  cooldown_epochs: 0
# Model wiring and generation settings.
# NOTE(review): the groupings below are inferred from key names only;
# confirm against the model code.

# Visual prefix / hidden-state injection
use_vis_prefix: true
start_layer_idx: 19
end_layer_idx: 31
injected_hidden_states: 6
shared_connector: true

# Loss weighting and layer-norm freezing
lm_loss_weight: 0.1
unfreeze_text_layer_norm: false
unfreeze_vision_layer_norm: false

num_workers: 4

# Tokens and caching
special_answer_token: '</a>'
replace_added_tokens: true
use_cache: false

connector_per_text_layer: false
text_step: 1

# Decoding
num_beams: 3
do_sample: false
# Prompt tuning
prompt_tuning: true
prompt_len: 10
mlp: false

# Dataset split names
train_split: 'train'
val_split: 'valid'
# The original line ended with a stray ` |` after the closing quote, which
# is not valid YAML; the value is just the quoted string.
test_split: 'test'