# File: strexp/configs/train_matrn.yaml
# Web-page header residue, kept for provenance:
#   avatar caption "markytools's picture", commit message "added strexp", commit d61b9c7
# Run-level settings.
# NOTE(review): key meanings are inferred from their names; confirm against the config loader.
global:
  name: train-matrn
  phase: train
  stage: train-super
  # Relative path; presumably where run outputs are written (TODO confirm).
  workdir: results
  # Explicit null (previously written as `~`): no seed value is configured here.
  seed: null
# Dataset roots and per-split batch sizes for the train / test / valid splits,
# followed by settings shared by all splits.
dataset:
  train:
    roots:
      - 'data/training/MJ/MJ_train/'
      - 'data/training/MJ/MJ_test/'
      - 'data/training/MJ/MJ_valid/'
      - 'data/training/ST'
    batch_size: 384
  test:
    # NOTE(review): this root sits under 'datasets/data_lmdb_release/' while the
    # train and valid roots sit under 'data/'; confirm the path is intended.
    roots: ['datasets/data_lmdb_release/evaluation/SVTP']
    batch_size: 1
  valid:
    roots: ['data/validation']
    batch_size: 384
  data_aug: true
  multiscales: false
  # NOTE(review): presumably the data-loader worker count; confirm with the consumer.
  num_workers: 0
# Training-loop schedule.
# NOTE(review): the *_iters values are presumably counted in iterations (logging,
# evaluation and checkpoint intervals); confirm against the trainer.
training:
  epochs: 10
  show_iters: 50
  eval_iters: 3000
  save_iters: 3000
# Optimizer selection, its hyper-parameters, and the learning-rate scheduler.
optimizer:
  type: Adam
  true_wd: false
  wd: 0.0
  bn_wd: false
  clip_grad: 20
  lr: 0.0001
  args:
    # for default Adam
    # `!!python/tuple` is a Python-specific tag: safe loaders (e.g. yaml.safe_load)
    # reject it, so this file needs a loader that supports it.
    betas: !!python/tuple [0.9, 0.999]
  scheduler:
    # NOTE(review): the periods sum to 10, the same value as `epochs` in the
    # training section; presumably epochs per learning-rate stage (confirm).
    periods: [6, 4]
    gamma: 0.1
# Model definition: the dotted path of the model class plus settings for its
# vision, language and alignment sub-sections.
model:
  # NOTE(review): looks like a dotted import path to the model class; confirm.
  name: 'modules_matrn.model_matrn_iter.MATRN'
  iter_size: 3
  # Empty string, not null.
  ensemble: ''
  use_vision: false
  vision:
    checkpoint: 'pretrained/best-pretrain-vision-model.pth'
    loss_weight: 1.0
    attention: 'position'
    backbone: 'transformer'
    backbone_ln: 3
  language:
    checkpoint: 'pretrained/pretrain-language-model.pth'
    num_layers: 4
    loss_weight: 1.0
    detach: true
    use_self_attn: false
  alignment:
    # Explicit null (previously written as `~`): no checkpoint path is given.
    checkpoint: null
    num_layers: 2
    loss_weight: 1.0
    use_self_attn: false