ZongqianLi committed on
Commit
a56b5cd
1 Parent(s): 9d5a956

Upload 130 files

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. config.json +32 -0
  2. global_step550/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  3. global_step550/zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  4. global_step550/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
  5. global_step550/zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
  6. global_step550/zero_pp_rank_11_mp_rank_00_model_states.pt +3 -0
  7. global_step550/zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
  8. global_step550/zero_pp_rank_12_mp_rank_00_model_states.pt +3 -0
  9. global_step550/zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
  10. global_step550/zero_pp_rank_13_mp_rank_00_model_states.pt +3 -0
  11. global_step550/zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
  12. global_step550/zero_pp_rank_14_mp_rank_00_model_states.pt +3 -0
  13. global_step550/zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
  14. global_step550/zero_pp_rank_15_mp_rank_00_model_states.pt +3 -0
  15. global_step550/zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
  16. global_step550/zero_pp_rank_16_mp_rank_00_model_states.pt +3 -0
  17. global_step550/zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
  18. global_step550/zero_pp_rank_17_mp_rank_00_model_states.pt +3 -0
  19. global_step550/zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
  20. global_step550/zero_pp_rank_18_mp_rank_00_model_states.pt +3 -0
  21. global_step550/zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
  22. global_step550/zero_pp_rank_19_mp_rank_00_model_states.pt +3 -0
  23. global_step550/zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
  24. global_step550/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
  25. global_step550/zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  26. global_step550/zero_pp_rank_20_mp_rank_00_model_states.pt +3 -0
  27. global_step550/zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
  28. global_step550/zero_pp_rank_21_mp_rank_00_model_states.pt +3 -0
  29. global_step550/zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
  30. global_step550/zero_pp_rank_22_mp_rank_00_model_states.pt +3 -0
  31. global_step550/zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
  32. global_step550/zero_pp_rank_23_mp_rank_00_model_states.pt +3 -0
  33. global_step550/zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
  34. global_step550/zero_pp_rank_24_mp_rank_00_model_states.pt +3 -0
  35. global_step550/zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
  36. global_step550/zero_pp_rank_25_mp_rank_00_model_states.pt +3 -0
  37. global_step550/zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
  38. global_step550/zero_pp_rank_26_mp_rank_00_model_states.pt +3 -0
  39. global_step550/zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
  40. global_step550/zero_pp_rank_27_mp_rank_00_model_states.pt +3 -0
  41. global_step550/zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
  42. global_step550/zero_pp_rank_28_mp_rank_00_model_states.pt +3 -0
  43. global_step550/zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
  44. global_step550/zero_pp_rank_29_mp_rank_00_model_states.pt +3 -0
  45. global_step550/zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
  46. global_step550/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
  47. global_step550/zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  48. global_step550/zero_pp_rank_30_mp_rank_00_model_states.pt +3 -0
  49. global_step550/zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
  50. global_step550/zero_pp_rank_31_mp_rank_00_model_states.pt +3 -0
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "ZongqianLi/bert_large_cased_scsmall",
3
+ "architectures": [
4
+ "BertForQuestionAnswering"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "directionality": "bidi",
9
+ "gradient_checkpointing": false,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 1024,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 4096,
15
+ "layer_norm_eps": 1e-12,
16
+ "max_position_embeddings": 512,
17
+ "model_type": "bert",
18
+ "num_attention_heads": 16,
19
+ "num_hidden_layers": 24,
20
+ "pad_token_id": 0,
21
+ "pooler_fc_size": 768,
22
+ "pooler_num_attention_heads": 12,
23
+ "pooler_num_fc_layers": 3,
24
+ "pooler_size_per_head": 128,
25
+ "pooler_type": "first_token_transform",
26
+ "position_embedding_type": "absolute",
27
+ "torch_dtype": "float32",
28
+ "transformers_version": "4.25.1",
29
+ "type_vocab_size": 2,
30
+ "use_cache": true,
31
+ "vocab_size": 28996
32
+ }
global_step550/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f9fd38703d3c6f408fa5c29faa7dce4dda2c084a31fad629383ac4031684298
3
+ size 170673
global_step550/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76aee7ec3cca702269b9a3bd66e33417fad96ec6c661580590776091b46c6264
3
+ size 99764579
global_step550/zero_pp_rank_10_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bc3f1eeb69eb870e5bd0dc9bad1c982d5812c731e8eb81296c287bef8073f3b
3
+ size 170673
global_step550/zero_pp_rank_10_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1958dc81bdbd1ca7f401645ab16d0037d86df8a8ba4d368895eb5047124607a6
3
+ size 99764579
global_step550/zero_pp_rank_11_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5809dd56bb17f832e36a041234bf9bbe5cf27f0acfd212a8cbf9ac8795dfd0e
3
+ size 170673
global_step550/zero_pp_rank_11_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:105f487103c3deb0634506c22004add971634f2375a062cd19c18dbd4ca33689
3
+ size 99764579
global_step550/zero_pp_rank_12_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f9fd38703d3c6f408fa5c29faa7dce4dda2c084a31fad629383ac4031684298
3
+ size 170673
global_step550/zero_pp_rank_12_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e756cd81538d8938c203cedd6f6086e5c9c9b3185cdd0bc7d76277529cf6e494
3
+ size 99764579
global_step550/zero_pp_rank_13_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5b1085c5d6661fa0bae886f9db6d3ce7f9a185c5a8d6de8ba433d3245518405
3
+ size 170673
global_step550/zero_pp_rank_13_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5320fac2ca1e0596b57e4e62e6b483f8d020e52f321a7fff7e76c3e76dcadfb
3
+ size 99764579
global_step550/zero_pp_rank_14_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bc3f1eeb69eb870e5bd0dc9bad1c982d5812c731e8eb81296c287bef8073f3b
3
+ size 170673
global_step550/zero_pp_rank_14_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37564a778f523a27f687ba0cc0daa16fe6711989e9cfbf1ec97f87b33c58085b
3
+ size 99764579
global_step550/zero_pp_rank_15_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5809dd56bb17f832e36a041234bf9bbe5cf27f0acfd212a8cbf9ac8795dfd0e
3
+ size 170673
global_step550/zero_pp_rank_15_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:330f452e643fed9411007f56e382643ccf3b53a295410554b1676081d4d5ce88
3
+ size 99764579
global_step550/zero_pp_rank_16_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f9fd38703d3c6f408fa5c29faa7dce4dda2c084a31fad629383ac4031684298
3
+ size 170673
global_step550/zero_pp_rank_16_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b52a97eebcfa1d50d583070d9a8b6809bc362c8f977d3baf63ceefa05004c054
3
+ size 99764579
global_step550/zero_pp_rank_17_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5b1085c5d6661fa0bae886f9db6d3ce7f9a185c5a8d6de8ba433d3245518405
3
+ size 170673
global_step550/zero_pp_rank_17_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be4363a8c17a776b0e9bf2168dc1ed5c83783d6f9bc6137482b583b78a6c4df2
3
+ size 99764579
global_step550/zero_pp_rank_18_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bc3f1eeb69eb870e5bd0dc9bad1c982d5812c731e8eb81296c287bef8073f3b
3
+ size 170673
global_step550/zero_pp_rank_18_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e606c470c7b5f40d7476c7444549983da4174e1160cf65c10e9f2c771349652
3
+ size 99764579
global_step550/zero_pp_rank_19_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5809dd56bb17f832e36a041234bf9bbe5cf27f0acfd212a8cbf9ac8795dfd0e
3
+ size 170673
global_step550/zero_pp_rank_19_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3cf8384772725d0cbaaa0216ad87c9bb3924101d68c0128e20b75199c28172a
3
+ size 99764579
global_step550/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5b1085c5d6661fa0bae886f9db6d3ce7f9a185c5a8d6de8ba433d3245518405
3
+ size 170673
global_step550/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:530d37a391a007601b711d9048e4a08fbea29a94e13ea7494a6fd6f3f8ebfe7f
3
+ size 99764579
global_step550/zero_pp_rank_20_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f9fd38703d3c6f408fa5c29faa7dce4dda2c084a31fad629383ac4031684298
3
+ size 170673
global_step550/zero_pp_rank_20_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a5e90b03039c9daf9b65fdb337084fb616f490e347aa222d3c13854b5ac7809
3
+ size 99764579
global_step550/zero_pp_rank_21_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5b1085c5d6661fa0bae886f9db6d3ce7f9a185c5a8d6de8ba433d3245518405
3
+ size 170673
global_step550/zero_pp_rank_21_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebb1aa4c09dce863c75fddda6debd8dc82f690ef55b56e9510257d88bdef0445
3
+ size 99764579
global_step550/zero_pp_rank_22_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bc3f1eeb69eb870e5bd0dc9bad1c982d5812c731e8eb81296c287bef8073f3b
3
+ size 170673
global_step550/zero_pp_rank_22_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e61ed5dc6990d2ff9568183cb0db8be3ca3c542260b523bc684421c6372c5fd0
3
+ size 99764579
global_step550/zero_pp_rank_23_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5809dd56bb17f832e36a041234bf9bbe5cf27f0acfd212a8cbf9ac8795dfd0e
3
+ size 170673
global_step550/zero_pp_rank_23_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aca07d91731c4ea932f6f146bc8607c808b2ecde0d960ad5c556502b62ad385e
3
+ size 99764579
global_step550/zero_pp_rank_24_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f9fd38703d3c6f408fa5c29faa7dce4dda2c084a31fad629383ac4031684298
3
+ size 170673
global_step550/zero_pp_rank_24_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99f1452886ba7a68633c2393314bce467eeb46d5ace6075454f8de9ea67f4af9
3
+ size 99764579
global_step550/zero_pp_rank_25_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5b1085c5d6661fa0bae886f9db6d3ce7f9a185c5a8d6de8ba433d3245518405
3
+ size 170673
global_step550/zero_pp_rank_25_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2045283bcc78b3ed4504f1b8ff42378399d94300818d82919742ac45913edc65
3
+ size 99764579
global_step550/zero_pp_rank_26_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bc3f1eeb69eb870e5bd0dc9bad1c982d5812c731e8eb81296c287bef8073f3b
3
+ size 170673
global_step550/zero_pp_rank_26_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32075f2db2044979e7e737576915b5ed18eca8497c6bae525572dad0e66ae130
3
+ size 99764579
global_step550/zero_pp_rank_27_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5809dd56bb17f832e36a041234bf9bbe5cf27f0acfd212a8cbf9ac8795dfd0e
3
+ size 170673
global_step550/zero_pp_rank_27_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d825026e747c36f2729e22e8e5dfad0b20d545e30677d618412ff95796705ed
3
+ size 99764579
global_step550/zero_pp_rank_28_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f9fd38703d3c6f408fa5c29faa7dce4dda2c084a31fad629383ac4031684298
3
+ size 170673
global_step550/zero_pp_rank_28_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98948dd501c1a6cc9dcb141e3fb17754b743533cf59aafcd77a31047265e4547
3
+ size 99764579
global_step550/zero_pp_rank_29_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5b1085c5d6661fa0bae886f9db6d3ce7f9a185c5a8d6de8ba433d3245518405
3
+ size 170673
global_step550/zero_pp_rank_29_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0e20f2a0a233bbc61a5a7d4fdc2d2f404952f1f784e7759578781e8b774c877
3
+ size 99764579
global_step550/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bc3f1eeb69eb870e5bd0dc9bad1c982d5812c731e8eb81296c287bef8073f3b
3
+ size 170673
global_step550/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbd21899859e600059caf60139823c6940c65e42dae7455ab0b659cea51ebcb6
3
+ size 99764579
global_step550/zero_pp_rank_30_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bc3f1eeb69eb870e5bd0dc9bad1c982d5812c731e8eb81296c287bef8073f3b
3
+ size 170673
global_step550/zero_pp_rank_30_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be02b1e9bf816a3a6827a2c48984f293e75c44309c009da5ee34ea6abeed1c2b
3
+ size 99764579
global_step550/zero_pp_rank_31_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5809dd56bb17f832e36a041234bf9bbe5cf27f0acfd212a8cbf9ac8795dfd0e
3
+ size 170673