File size: 621 Bytes
fbb7c63
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
# Configuration for one run of the "sts" trainer using the "cosent" loss.

trainer: "sts"

# model_name is base_model_name with "-sts-cosent20" inserted before the
# trailing "-v1".
# NOTE(review): the name says "cosent20" while `epochs` below is 10 — confirm
# the suffix is not meant to track the epoch count.
model_name: "albertina-900m-ptpt-europarl-eubookshop-ted2020-tatoeba-ct1-nli-gist10-sts-cosent20-v1"
base_model_name: "albertina-900m-ptpt-europarl-eubookshop-ted2020-tatoeba-ct1-nli-gist10-v1"
loss_function: "cosent"

seed: 1

# Optimizer settings.
# The mantissa carries an explicit ".0": YAML 1.1 loaders such as PyYAML
# resolve a dot-less `1e-6` as the *string* "1e-6" rather than a float.
learning_rate: 1.0e-6
warmup_ratio: 0.1
weight_decay: 0.01

batch_size: 16
# Canonical lowercase boolean; loads identically under YAML 1.1 and 1.2.
use_amp: true

epochs: 10
validations_per_epoch: 10

# Hyperparameters (HPs) used by JRodrigues to train albertina-100m-portuguese-ptpt-encoder:
# learning_rate 1e-5
# lr_scheduler_type linear
# weight_decay 0.01
# per_device_train_batch_size 192
# gradient_accumulation_steps 1
# num_train_epochs 150
# num_warmup_steps 10000