ZongqianLi commited on
Commit
85ee1ae
·
1 Parent(s): 42fe4c6

Upload 130 files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. config.json +32 -0
  2. global_step19200/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  3. global_step19200/zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  4. global_step19200/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
  5. global_step19200/zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
  6. global_step19200/zero_pp_rank_11_mp_rank_00_model_states.pt +3 -0
  7. global_step19200/zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
  8. global_step19200/zero_pp_rank_12_mp_rank_00_model_states.pt +3 -0
  9. global_step19200/zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
  10. global_step19200/zero_pp_rank_13_mp_rank_00_model_states.pt +3 -0
  11. global_step19200/zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
  12. global_step19200/zero_pp_rank_14_mp_rank_00_model_states.pt +3 -0
  13. global_step19200/zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
  14. global_step19200/zero_pp_rank_15_mp_rank_00_model_states.pt +3 -0
  15. global_step19200/zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
  16. global_step19200/zero_pp_rank_16_mp_rank_00_model_states.pt +3 -0
  17. global_step19200/zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
  18. global_step19200/zero_pp_rank_17_mp_rank_00_model_states.pt +3 -0
  19. global_step19200/zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
  20. global_step19200/zero_pp_rank_18_mp_rank_00_model_states.pt +3 -0
  21. global_step19200/zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
  22. global_step19200/zero_pp_rank_19_mp_rank_00_model_states.pt +3 -0
  23. global_step19200/zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
  24. global_step19200/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
  25. global_step19200/zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  26. global_step19200/zero_pp_rank_20_mp_rank_00_model_states.pt +3 -0
  27. global_step19200/zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
  28. global_step19200/zero_pp_rank_21_mp_rank_00_model_states.pt +3 -0
  29. global_step19200/zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
  30. global_step19200/zero_pp_rank_22_mp_rank_00_model_states.pt +3 -0
  31. global_step19200/zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
  32. global_step19200/zero_pp_rank_23_mp_rank_00_model_states.pt +3 -0
  33. global_step19200/zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
  34. global_step19200/zero_pp_rank_24_mp_rank_00_model_states.pt +3 -0
  35. global_step19200/zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
  36. global_step19200/zero_pp_rank_25_mp_rank_00_model_states.pt +3 -0
  37. global_step19200/zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
  38. global_step19200/zero_pp_rank_26_mp_rank_00_model_states.pt +3 -0
  39. global_step19200/zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
  40. global_step19200/zero_pp_rank_27_mp_rank_00_model_states.pt +3 -0
  41. global_step19200/zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
  42. global_step19200/zero_pp_rank_28_mp_rank_00_model_states.pt +3 -0
  43. global_step19200/zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
  44. global_step19200/zero_pp_rank_29_mp_rank_00_model_states.pt +3 -0
  45. global_step19200/zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
  46. global_step19200/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
  47. global_step19200/zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  48. global_step19200/zero_pp_rank_30_mp_rank_00_model_states.pt +3 -0
  49. global_step19200/zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
  50. global_step19200/zero_pp_rank_31_mp_rank_00_model_states.pt +3 -0
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "bert-large-cased",
3
+ "architectures": [
4
+ "BertForMaskedLM"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "directionality": "bidi",
9
+ "gradient_checkpointing": false,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 1024,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 4096,
15
+ "layer_norm_eps": 1e-12,
16
+ "max_position_embeddings": 512,
17
+ "model_type": "bert",
18
+ "num_attention_heads": 16,
19
+ "num_hidden_layers": 24,
20
+ "pad_token_id": 0,
21
+ "pooler_fc_size": 768,
22
+ "pooler_num_attention_heads": 12,
23
+ "pooler_num_fc_layers": 3,
24
+ "pooler_size_per_head": 128,
25
+ "pooler_type": "first_token_transform",
26
+ "position_embedding_type": "absolute",
27
+ "torch_dtype": "float32",
28
+ "transformers_version": "4.25.1",
29
+ "type_vocab_size": 2,
30
+ "use_cache": true,
31
+ "vocab_size": 28996
32
+ }
global_step19200/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a25cf8581a0dea6082ced7e9aefaf10e0bf8b8788c72cef9015d201b17bf4ae3
3
+ size 172267
global_step19200/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27642a019ae0f07ae93ee182778418d64d62b37e3157ad96a95351f4c3b06de3
3
+ size 100088099
global_step19200/zero_pp_rank_10_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d231f729a2e4c08a244fbeee1291e9bb6d000a926942cbf8f0dd0842548ffcd
3
+ size 172267
global_step19200/zero_pp_rank_10_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9afed5b5353342b511c466f7e403fa3ef0ded92b4baa887b66fc0a61780a0ce5
3
+ size 100088099
global_step19200/zero_pp_rank_11_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89fd47acea1858c613afc22c47736bb424ec00bc68a242852019c8e4d431ffc7
3
+ size 172267
global_step19200/zero_pp_rank_11_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4f2a18111468ac17749db28df9c3e8269c2e178ff4566ed3ad73a3f8da5993e
3
+ size 100088099
global_step19200/zero_pp_rank_12_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a25cf8581a0dea6082ced7e9aefaf10e0bf8b8788c72cef9015d201b17bf4ae3
3
+ size 172267
global_step19200/zero_pp_rank_12_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f14eb58f41303ed0fe47fbb096a80fd121ca40294b08591995bc1c158b9534c2
3
+ size 100088099
global_step19200/zero_pp_rank_13_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb1d064e34038ce735f02dfd115e63382a9010d924979e970ecb3822c90dddc8
3
+ size 172267
global_step19200/zero_pp_rank_13_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:708e58e622a25ba621aa67a98bb310efa2170af14b56aaf1ac3cb3bac82fdfca
3
+ size 100088099
global_step19200/zero_pp_rank_14_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d231f729a2e4c08a244fbeee1291e9bb6d000a926942cbf8f0dd0842548ffcd
3
+ size 172267
global_step19200/zero_pp_rank_14_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdbefd4ca36fcbdf03c82ad7e5fa157b268eaf1de79f2d44585203d0d02894c9
3
+ size 100088099
global_step19200/zero_pp_rank_15_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89fd47acea1858c613afc22c47736bb424ec00bc68a242852019c8e4d431ffc7
3
+ size 172267
global_step19200/zero_pp_rank_15_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97b308f74e4aed314dc41b5faff392d251773af8e42b6b9fc42b97ac88ceb3e0
3
+ size 100088099
global_step19200/zero_pp_rank_16_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a25cf8581a0dea6082ced7e9aefaf10e0bf8b8788c72cef9015d201b17bf4ae3
3
+ size 172267
global_step19200/zero_pp_rank_16_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d44d9804a6354063a6b424101439f0d9086c37ffd80a196a8bea6133854eb2e
3
+ size 100088099
global_step19200/zero_pp_rank_17_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb1d064e34038ce735f02dfd115e63382a9010d924979e970ecb3822c90dddc8
3
+ size 172267
global_step19200/zero_pp_rank_17_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2c30308562b9c394ee94ad363002f0fab0a4ba10637a69f8501d3270798492e
3
+ size 100088099
global_step19200/zero_pp_rank_18_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d231f729a2e4c08a244fbeee1291e9bb6d000a926942cbf8f0dd0842548ffcd
3
+ size 172267
global_step19200/zero_pp_rank_18_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:377857a24095962590c2ca8c8a996438ea620a0e65ccc742a70e77017c4ba189
3
+ size 100088099
global_step19200/zero_pp_rank_19_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89fd47acea1858c613afc22c47736bb424ec00bc68a242852019c8e4d431ffc7
3
+ size 172267
global_step19200/zero_pp_rank_19_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b3499cbae2f5b8182e47d853075871bd686dc33929f6ebb216df84ce1f00b0f
3
+ size 100088099
global_step19200/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb1d064e34038ce735f02dfd115e63382a9010d924979e970ecb3822c90dddc8
3
+ size 172267
global_step19200/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b96a9a72fb4d163c3d578d223e9b90f828b3804bfbca2f8023086678e4563b6a
3
+ size 100088099
global_step19200/zero_pp_rank_20_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a25cf8581a0dea6082ced7e9aefaf10e0bf8b8788c72cef9015d201b17bf4ae3
3
+ size 172267
global_step19200/zero_pp_rank_20_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e415fd19af01e88f3c0942e117d7cc706ad59d47917ff51a3408ec9fb78e2b7f
3
+ size 100088099
global_step19200/zero_pp_rank_21_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb1d064e34038ce735f02dfd115e63382a9010d924979e970ecb3822c90dddc8
3
+ size 172267
global_step19200/zero_pp_rank_21_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ef6d48c927f4fe318be23d090a222c9e69886ed771ae147b598a01ec4ffc892
3
+ size 100088099
global_step19200/zero_pp_rank_22_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d231f729a2e4c08a244fbeee1291e9bb6d000a926942cbf8f0dd0842548ffcd
3
+ size 172267
global_step19200/zero_pp_rank_22_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:984400a333f4b3a3d5282fdf0292b222ca72d42c177d203315be017e9cd2a35e
3
+ size 100088099
global_step19200/zero_pp_rank_23_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89fd47acea1858c613afc22c47736bb424ec00bc68a242852019c8e4d431ffc7
3
+ size 172267
global_step19200/zero_pp_rank_23_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43da5c6105fea51e413f9e3d92de9c47f3a6eeb73207e33cdaca202b3a025039
3
+ size 100088099
global_step19200/zero_pp_rank_24_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a25cf8581a0dea6082ced7e9aefaf10e0bf8b8788c72cef9015d201b17bf4ae3
3
+ size 172267
global_step19200/zero_pp_rank_24_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d738a5953a3002ef523090b7f3c195d315ae222a6f4c5b0bc4f792b6a537cc0
3
+ size 100088099
global_step19200/zero_pp_rank_25_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb1d064e34038ce735f02dfd115e63382a9010d924979e970ecb3822c90dddc8
3
+ size 172267
global_step19200/zero_pp_rank_25_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1454d4dfaf8e20d976e0e04abbc012a6556c9deaaa441a7c0eaf4564ced04855
3
+ size 100088099
global_step19200/zero_pp_rank_26_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d231f729a2e4c08a244fbeee1291e9bb6d000a926942cbf8f0dd0842548ffcd
3
+ size 172267
global_step19200/zero_pp_rank_26_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6b37988237f146d3e1af023b83c16443522632125c913d88146e1df1d186f38
3
+ size 100088099
global_step19200/zero_pp_rank_27_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89fd47acea1858c613afc22c47736bb424ec00bc68a242852019c8e4d431ffc7
3
+ size 172267
global_step19200/zero_pp_rank_27_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d40a29f7aa0cb13011e2a95c087f2786aa25f7ac9b24e5738f1e7f38ed271f9
3
+ size 100088099
global_step19200/zero_pp_rank_28_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a25cf8581a0dea6082ced7e9aefaf10e0bf8b8788c72cef9015d201b17bf4ae3
3
+ size 172267
global_step19200/zero_pp_rank_28_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d12f9a798748d3ee5c75dc31669412f6700e9217f731f249e68a017ba4ae25e
3
+ size 100088099
global_step19200/zero_pp_rank_29_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb1d064e34038ce735f02dfd115e63382a9010d924979e970ecb3822c90dddc8
3
+ size 172267
global_step19200/zero_pp_rank_29_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a482a363db9fb58f520e8c450b9f53e46cdcd70f97a816d01b5f9fca7a26dfb7
3
+ size 100088099
global_step19200/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d231f729a2e4c08a244fbeee1291e9bb6d000a926942cbf8f0dd0842548ffcd
3
+ size 172267
global_step19200/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d98c35034e12dc2b737239424d62ced04cbe597d5b2dfb39fa99c34c4f23c526
3
+ size 100088099
global_step19200/zero_pp_rank_30_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d231f729a2e4c08a244fbeee1291e9bb6d000a926942cbf8f0dd0842548ffcd
3
+ size 172267
global_step19200/zero_pp_rank_30_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54da3c735c00397e0ba604441c65e66ae296688ab4b19a5c3d889354295451a5
3
+ size 100088099
global_step19200/zero_pp_rank_31_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89fd47acea1858c613afc22c47736bb424ec00bc68a242852019c8e4d431ffc7
3
+ size 172267