Training in progress, step 657, checkpoint
Browse files- checkpoint-657/1_AdvancedWeightedPooling/config.json +3 -3
- checkpoint-657/1_AdvancedWeightedPooling/pytorch_model.bin +2 -2
- checkpoint-657/README.md +0 -0
- checkpoint-657/optimizer.pt +2 -2
- checkpoint-657/rng_state.pth +1 -1
- checkpoint-657/trainer_state.json +0 -0
- checkpoint-657/training_args.bin +1 -1
checkpoint-657/1_AdvancedWeightedPooling/config.json
CHANGED
@@ -3,8 +3,8 @@
|
|
3 |
"num_heads": 8,
|
4 |
"dropout": 0.05,
|
5 |
"bias": true,
|
6 |
-
"use_layernorm":
|
7 |
-
"use_MLP":
|
8 |
-
"MLP_h_size":
|
9 |
"use_residual": false
|
10 |
}
|
|
|
3 |
"num_heads": 8,
|
4 |
"dropout": 0.05,
|
5 |
"bias": true,
|
6 |
+
"use_layernorm": true,
|
7 |
+
"use_MLP": true,
|
8 |
+
"MLP_h_size": 2048,
|
9 |
"use_residual": false
|
10 |
}
|
checkpoint-657/1_AdvancedWeightedPooling/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a26a4f2a6305818bd12baebbe68a1a142d6d525f04c79a2203424a386926cd92
|
3 |
+
size 33595276
|
checkpoint-657/README.md
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
checkpoint-657/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fdc5b203c890ef3d8838bfdc9ba4e03953104addd70ad5950507e6fcc3db9801
|
3 |
+
size 67191488
|
checkpoint-657/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea74daec0f7adbf6f2b3fb952e20e57279aed18c8fe54a44d2b3f0252a07ec8f
|
3 |
size 14244
|
checkpoint-657/trainer_state.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
checkpoint-657/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:845321cafd8553e30026f9c6fea66eb5820d6f58e9ea4a0042d4e1d71fd924e8
|
3 |
size 5880
|