bobox committed on
Commit
b189472
·
verified ·
1 Parent(s): 68ca138

Training in progress, step 438, checkpoint

Browse files
checkpoint-438/1_AdvancedWeightedPooling/config.json CHANGED
@@ -3,8 +3,8 @@
3
  "num_heads": 8,
4
  "dropout": 0.05,
5
  "bias": true,
6
- "use_layernorm": false,
7
- "use_MLP": false,
8
- "MLP_h_size": 1024,
9
  "use_residual": false
10
  }
 
3
  "num_heads": 8,
4
  "dropout": 0.05,
5
  "bias": true,
6
+ "use_layernorm": true,
7
+ "use_MLP": true,
8
+ "MLP_h_size": 2048,
9
  "use_residual": false
10
  }
checkpoint-438/1_AdvancedWeightedPooling/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21b456a8c72f1889e87a06cae425b1efd8812bc3f1ee5250ea98bb0a52d9d083
3
- size 16795776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3db2e46ab4e158c1001283cae0babde1168851bee1ccd0c2b51b2ab32b6df4bc
3
+ size 33595276
checkpoint-438/README.md CHANGED
The diff for this file is too large to render. See raw diff
 
checkpoint-438/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a282a7cab76b925a0b1fa9fde5249fcd7fc34b00745c368338e9fe225d1e4ad
3
- size 33591506
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e79351fdb02817e5b9041624651305a5eee7d534dcd97a5cd6f40887ac3f751
3
+ size 67191488
checkpoint-438/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:63b4d9d674854b1885bcc0cd458d694df71630ad65a46be2f43987f0d38042b8
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b526e61c2b6d6ebe2c29fa4b351a23a0cb0f992c6064f8a4a5bb5c078731ffff
3
  size 14244
checkpoint-438/trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff
 
checkpoint-438/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc4e2f1b0b6ec0b954c31a7a2d7392e2f2f817d60f3db0f6f0a80bdf431c25bc
3
  size 5880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:845321cafd8553e30026f9c6fea66eb5820d6f58e9ea4a0042d4e1d71fd924e8
3
  size 5880