shibing624
committed on
Commit
·
416c468
1
Parent(s):
f2b975b
Update README.md
Browse files
README.md
CHANGED
@@ -33,18 +33,30 @@ The overall performance of model on QA **test**:
|
|
33 |
training args:
|
34 |
|
35 |
```
|
36 |
-
{"per_device_train_batch_size": 8,
|
37 |
-
"
|
38 |
-
"
|
39 |
-
"
|
40 |
-
"
|
41 |
-
"
|
42 |
-
"
|
43 |
-
"
|
44 |
-
"
|
45 |
-
"
|
46 |
-
"
|
47 |
-
"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
48 |
```
|
49 |
|
50 |
train loss:
|
|
|
33 |
training args:
|
34 |
|
35 |
```
|
36 |
+
{"per_device_train_batch_size": 8,
|
37 |
+
"per_device_eval_batch_size": 8,
|
38 |
+
"gradient_accumulation_steps": 1,
|
39 |
+
"learning_rate": 2e-05,
|
40 |
+
"num_train_epochs": 10.0,
|
41 |
+
"max_steps": -1,
|
42 |
+
"lr_scheduler_type": "linear",
|
43 |
+
"warmup_ratio": 0.0,
|
44 |
+
"warmup_steps": 50,
|
45 |
+
"save_strategy": "steps",
|
46 |
+
"save_steps": 500,
|
47 |
+
"save_total_limit": 13,
|
48 |
+
"seed": 42,
|
49 |
+
"bf16": false,
|
50 |
+
"fp16": true,
|
51 |
+
"eval_steps": 50,
|
52 |
+
"remove_unused_columns": false,
|
53 |
+
"load_best_model_at_end": true,
|
54 |
+
"metric_for_best_model": "loss",
|
55 |
+
"optim": "adamw_torch",
|
56 |
+
"report_to": [ "tensorboard" ],
|
57 |
+
"ddp_timeout": 1800,
|
58 |
+
"torch_compile": false
|
59 |
+
}
|
60 |
```
|
61 |
|
62 |
train loss:
|