Spaces:
Sleeping
Sleeping
seed: 42 | |
monitor: pearson | |
metric_mode: max | |
early_stopping: True | |
patience: 1 | |
min_delta: 0.0 | |
save_top_k: 2 | |
save_weights_only: False | |
min_epochs: 1 | |
max_epochs: 100 | |
gradient_clip_val: 1.0 | |
gpus: 1 | |
precision: 32 | |
batch_size: 64 | |
accumulate_grad_batches: 4 | |
loader_workers: 4 | |
optimizer: Adam | |
learning_rate: 3.0e-05 | |
encoder_learning_rate: 1.0e-05 | |
layerwise_decay: 0.95 | |
nr_frozen_epochs: 100000 | |
scheduler: constant | |
train_path: data_en/polaris/polaris_train.csv | |
val_path: data_en/polaris/polaris_val.csv | |
test_path: data_en/polaris/polaris_test.csv | |
train_img_dir_path: data_en/polaris/images | |
val_img_dir_path: data_en/polaris/images | |
test_img_dir_path: data_en/polaris/images | |
model: PolosEstimator | |
loss: mse | |
encoder_model: BERT | |
# pretrained_model: princeton-nlp/sup-simcse-roberta-large | |
pretrained_model: princeton-nlp/sup-simcse-roberta-base | |
layer: mix | |
scalar_mix_dropout: 0.1 | |
pool: cls | |
dropout: 0.1 | |
activations: Tanh | |
hidden_sizes: "2304,1152" | |
final_activation: False | |