# ansr-models / v8.0 / train.yaml
# Author: psaegert
# Commit message: Add v8.0
# Commit: 83807c8 (unverified)
# Training configuration.
#
# The nesting under `optimizer` and `lr_scheduler` is restored here: with every
# key at column 0, `name` and `kwargs` were duplicated at the top level (most
# parsers silently keep only the last one) and `optimizer` / `lr_scheduler`
# themselves were left empty.

# Path to the model configuration file.
model: ./nsr.yaml

optimizer:
  name: AdamW
  kwargs:
    # NOTE(review): lr is 1 while the scheduler below peaks at 1e-4 —
    # presumably the scheduler overrides or scales this base value; confirm
    # against the training code before changing either number.
    lr: 1
    weight_decay: 0.01
    amsgrad: true

lr_scheduler:
  name: WarmupLinearAnnealing
  kwargs:
    min_lr: 0
    # Written with an explicit mantissa dot so that YAML 1.1 loaders (e.g.
    # PyYAML) resolve it as a float; a bare `1e-4` is loaded as a string there.
    max_lr: 1.0e-4
    warmup_steps: 10000
    # Same value as the top-level `steps` below; presumably the two must be
    # kept in sync — confirm.
    total_steps: 1500000

# Training and validation data.
batch_size: 128
train_dataset: ./dataset_train.yaml
val_dataset: ./dataset_val.yaml
val_batch_size: 128
val_size: 100000

# Contrastive objective settings.
contrastive_n_per_class: 4
contrastive_margin: 0.0
contrastive_temperature: 0.5

# Loss weights.
# NOTE(review): a weight of 0 presumably disables the numeric prediction loss
# term — confirm against the training code.
numeric_prediction_loss_weight: 0
contrastive_loss_weight: 0.2

# Run length and target device.
steps: 1500000
device: cuda