# Training configuration.
# NOTE(review): the nesting below was reconstructed from key order (the
# repeated name/kwargs pairs under `optimizer` and `lr_scheduler`) after the
# original indentation was lost — confirm against the code that loads this file.

# Path to the model configuration file.
model: ./nsr.yaml

optimizer:
  name: AdamW
  kwargs:
    # NOTE(review): base lr is 1 while the scheduler's max_lr is 1e-4;
    # presumably the scheduler determines the effective rate — confirm.
    lr: 1
    weight_decay: 0.01
    amsgrad: true

lr_scheduler:
  name: WarmupLinearAnnealing
  kwargs:
    min_lr: 0
    # Written with an explicit decimal point: YAML 1.1 loaders (e.g. PyYAML)
    # resolve a bare `1e-4` as a string, not a float.
    max_lr: 1.0e-4
    warmup_steps: 10000
    # Same value as the top-level `steps` key below.
    total_steps: 1500000

batch_size: 128

# Paths to the dataset configuration files.
train_dataset: ./dataset_train.yaml
val_dataset: ./dataset_val.yaml
val_batch_size: 128
val_size: 100000

# Contrastive-loss settings.
contrastive_n_per_class: 4
contrastive_margin: 0.0
contrastive_temperature: 0.5

# Loss weights.
# NOTE(review): a weight of 0 presumably disables the numeric prediction
# loss term — confirm against the training code.
numeric_prediction_loss_weight: 0
contrastive_loss_weight: 0.2

steps: 1500000
device: cuda