bobox committed on
Commit
f2f8d1d
·
verified ·
1 Parent(s): fbe6786

Training in progress, step 657, checkpoint

Browse files
checkpoint-657/1_AdvancedWeightedPooling/config.json CHANGED
@@ -3,8 +3,8 @@
3
  "num_heads": 8,
4
  "dropout": 0.05,
5
  "bias": true,
6
- "use_layernorm": false,
7
- "use_MLP": false,
8
- "MLP_h_size": 1024,
9
  "use_residual": false
10
  }
 
3
  "num_heads": 8,
4
  "dropout": 0.05,
5
  "bias": true,
6
+ "use_layernorm": true,
7
+ "use_MLP": true,
8
+ "MLP_h_size": 2048,
9
  "use_residual": false
10
  }
checkpoint-657/1_AdvancedWeightedPooling/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:192031eaa51e6c7e16d624ce1ecf51c07d10e2497f42917ba584b010b704897a
3
- size 16795776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a26a4f2a6305818bd12baebbe68a1a142d6d525f04c79a2203424a386926cd92
3
+ size 33595276
checkpoint-657/README.md CHANGED
The diff for this file is too large to render. See raw diff
 
checkpoint-657/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea45d56f6bf0c5f88c1c88e3d7878fa8e4e4aabc99f6e28772d6284c38aa8208
3
- size 33591506
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdc5b203c890ef3d8838bfdc9ba4e03953104addd70ad5950507e6fcc3db9801
3
+ size 67191488
checkpoint-657/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53528fda7876f4fd66afde130a1e9bfa327dc9073de838efad40ae811ca44f16
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea74daec0f7adbf6f2b3fb952e20e57279aed18c8fe54a44d2b3f0252a07ec8f
3
  size 14244
checkpoint-657/trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff
 
checkpoint-657/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc4e2f1b0b6ec0b954c31a7a2d7392e2f2f817d60f3db0f6f0a80bdf431c25bc
3
  size 5880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:845321cafd8553e30026f9c6fea66eb5820d6f58e9ea4a0042d4e1d71fd924e8
3
  size 5880