File size: 616 Bytes
83d0e56 02619ac 83d0e56 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 |
{
"output_dir": "./results",
"overwrite_output_dir": true,
"max_steps": 200000,
"per_device_train_batch_size": 32,
"per_device_eval_batch_size": 32,
"gradient_accumulation_steps": 1,
"learning_rate": 0.0001,
"weight_decay": 0.0,
"adam_beta1": 0.9,
"adam_beta2": 0.999,
"adam_epsilon": 1e-08,
"max_grad_norm": 1.0,
"num_train_epochs": 20,
"warmup_steps": 500,
"logging_steps": 1000,
"save_steps": 5000,
"eval_steps": 5000,
"load_best_model_at_end": true,
"metric_for_best_model": "eval_loss",
"greater_is_better": false,
"fp16": true,
"fp16_backend": "auto",
"seed": 42
}