{
  "lr_encoder": "1e-5",
  "lr_others": "5e-5",
  "num_steps": 30000,
  "warmup_ratio": 0.1,
  "train_batch_size": 8,
  "eval_every": 5000,
  "max_width": 1,
  "model_name": "allenai/longformer-large-4096",
  "fine_tune": true,
  "subtoken_pooling": "first",
  "hidden_size": 768,
  "span_mode": "marker",
  "dropout": 0.4,
  "root_dir": "ablation_backbone",
  "train_data": "NuMinds_custom_data_mix.json",
  "prev_path": "none",
  "size_sup": -1,
  "max_types": 25,
  "shuffle_types": true,
  "random_drop": true,
  "max_neg_type_ratio": 1,
  "max_len": 384,
  "name": "large",
  "log_dir": "logs"
}