---
# Run configuration: a flat mapping of scalar settings, keys in alphabetical
# order.
# NOTE(review): the sorted, flat layout looks like an automatic dump of a
# training script's arguments -- confirm before hand-editing or reordering.
# All directory values are absolute paths under /home/mog29/compgen_saved_files
# and must be adjusted when the run is moved to another machine or user.
# Empty-string values ('') are kept explicit so they load as strings, not null.

anno_len_threshold: 40
base_folder: /home/mog29/compgen_saved_files/experiments/joint_training
batch_size: 2
checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_baseline/run/checkpoints
comprehension_prompt: verbose_instruction
context_size: 10
data_dir: /home/mog29/compgen_saved_files/kilogram/dataset
deployment_round: 3
evaluation_type: multitask
expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_baseline/run
from_scratch: true
generation_prompt: information_after
gradient_accumulation_steps: 32
gradient_clip_norm: 1
img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs
ips_clip: 5
learning_rate: 0.0001
listener_filter: ''
listener_lambda: 0.5
load_from_checkpoint: false
logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_baseline/run/logging
lora_dropout: 0.05
lora_r: 16
lora_subset: vision_resampler
max_steps: 30
model_family_name: baseline
n_epochs: 15
name: joint and multitask training defaults
name_suffix: ''
no_lora: false
no_shuffling: false
noise_filter: ''
num_samples: 10
num_training_steps: 17500
num_warmup_steps: 0
num_workers: 4
only_seed: false
past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_baseline/run/checkpoints
past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_baseline/run/logging
past_name_suffix: ''
# NOTE(review): -1 here while the past_* paths above point at r2_baseline;
# presumably a sentinel value -- confirm against the code that reads it.
past_round: -1
patience_cutoff: 5
ref_strat: no_ips_for_pos
repetition_penalty: 1
replacement_family_name: ''
sampling_type: nucleus
save_each_epoch: true
seed: 835313
shared_parameters: true
speaker_filter: ''
speaker_lambda: 0.5
split_dir: /home/mog29/compgen_saved_files/split_info/
temperature: 0.7
test_batch_size: 2
top_k: 50
top_p: 1
training_type: multitask
use_separate_dataloaders: false
use_wandb: true
wandb_experiment_name: r3_baseline_may
wandb_project_name: tangram_continual_learning_final
weight_decay: 0.1
|