diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..85d0f77d513a4bac90a6a25951e3f0e1a0b6e29e 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,13 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +compiled/42892ca1835c7f1ee360.neff filter=lfs diff=lfs merge=lfs -text +compiled/5f563a8109c06154fd1a.neff filter=lfs diff=lfs merge=lfs -text +compiled/81e045aa41db6708aa20.neff filter=lfs diff=lfs merge=lfs -text +compiled/9e156236317bf9a3f88c.neff filter=lfs diff=lfs merge=lfs -text +compiled/a5a606ee7f9b51e4eb22.neff filter=lfs diff=lfs merge=lfs -text +compiled/ba2c6f82564581eac7de.neff filter=lfs diff=lfs merge=lfs -text +compiled/bc1b3efbe17382b052dc.neff filter=lfs diff=lfs merge=lfs -text +compiled/c13580424e448f3adb62.neff filter=lfs diff=lfs merge=lfs -text +compiled/cd7da042b94df6a02f61.neff filter=lfs diff=lfs merge=lfs -text +compiled/d0dad260213be0bab13e.neff filter=lfs diff=lfs merge=lfs -text diff --git a/checkpoint/config.json b/checkpoint/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3d91c6d77a499f5d75ee7d5ad4f018866e9c194d --- /dev/null +++ b/checkpoint/config.json @@ -0,0 +1,26 @@ +{ + "_name_or_path": "Mistral-7B-Instruct-v0.2", + "architectures": [ + "MistralForCausalLM" + ], + "attention_dropout": 0.0, + "bos_token_id": 1, + "eos_token_id": 2, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 32768, + "model_type": "mistral", + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-05, + "rope_theta": 1000000.0, + "sliding_window": 4096, + "tie_word_embeddings": false, + "torch_dtype": "float32", + "transformers_version": "4.36.2", + "use_cache": true, + "vocab_size": 32000 +} diff --git a/checkpoint/generation_config.json b/checkpoint/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c533f934c6359393a56a3ea067a0df118c14797e --- /dev/null +++ b/checkpoint/generation_config.json @@ -0,0 +1,6 @@ +{ + "_from_model_config": true, + "bos_token_id": 1, + "eos_token_id": 2, + "transformers_version": "4.36.2" +} diff --git a/checkpoint/pytorch_model.bin/key_to_filename.json b/checkpoint/pytorch_model.bin/key_to_filename.json new file mode 100644 index 0000000000000000000000000000000000000000..39fadb632bb7b865701d2e790c233178a7fc6c33 --- /dev/null +++ b/checkpoint/pytorch_model.bin/key_to_filename.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:825d20f4a18183eff3963e805edd13ef7eb35b0aff7a850e8153ca1eeeb37970 +size 26397 diff --git a/checkpoint/pytorch_model.bin/p0.model.embed_tokens.weight b/checkpoint/pytorch_model.bin/p0.model.embed_tokens.weight new file mode 100644 index 0000000000000000000000000000000000000000..8ae350d87dba5e579002a98351394f2db73d4f86 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p0.model.embed_tokens.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f84f240f56b9b91a4eb546cf2763b9669ab2322e7a4d11ec408029f1e0ccf3f +size 524288789 diff --git a/checkpoint/pytorch_model.bin/p1.model.layers.0.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p1.model.layers.0.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..16b76671492b944a0adcdbe11bb9e656eaa9d6ba --- /dev/null +++ b/checkpoint/pytorch_model.bin/p1.model.layers.0.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b9f59084e4ae45d0b66bb22229aae343297240dae5f6e4cbc43c6359e6bb6b1 +size 67109756 diff --git a/checkpoint/pytorch_model.bin/p10.model.layers.1.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p10.model.layers.1.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..23628d4dd20ca6ed8ac11f8d39b1329513e39bdb --- /dev/null +++ b/checkpoint/pytorch_model.bin/p10.model.layers.1.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62eead0f0fb665ee7d32dba7ab975aa0b363384d1a282d9f5979d9b3f4f83a79 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p100.model.layers.11.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p100.model.layers.11.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..60d6d5cea5c7d00993e6d09cd47b014d2b32de27 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p100.model.layers.11.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a590c98c41d2bfc4031baba4a682ea0dec309a11332a64af3a61b95046c5941a +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p101.model.layers.11.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p101.model.layers.11.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..7d18cb2a74d036aa67177441bb630486b4931bfa --- /dev/null +++ b/checkpoint/pytorch_model.bin/p101.model.layers.11.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8e53f21af0b3434d12d6265df2d228b179fdddbda2a125d549c669d54847631 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p102.model.layers.11.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p102.model.layers.11.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..ba10a38dee53b4e1069db4ef622cba2e314b2980 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p102.model.layers.11.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9316efe8dc37ab8c49c95904f0a9897a4589457f7a4432cb642c02cc84d8823 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p103.model.layers.11.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p103.model.layers.11.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..4855cf35c834179d13c44592323f046fca8091ff --- /dev/null +++ b/checkpoint/pytorch_model.bin/p103.model.layers.11.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2d08d5319c0e0bf37103ece966f1bc576090c12366fe1f4631f2e1ba1678038 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p104.model.layers.11.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p104.model.layers.11.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..c3aced7f6b4374ecdce93d869b807e69b659b69a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p104.model.layers.11.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ab7fa48bd4b58319e976722893fb464ad0cd6b2b51afad3217604885c5b6419 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p105.model.layers.11.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p105.model.layers.11.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..e376ccfbb986251de5ac2dcb31fce191fcd72e86 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p105.model.layers.11.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:704c2e3eeecb7412a1716b1923910c38d06fde684cdd9a85b75305ca6b131b1a +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p106.model.layers.11.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p106.model.layers.11.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..c3821013e5dd3d0f81af16307eb18390e0e467e6 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p106.model.layers.11.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c25fed67c919b8cf27459ac82f1b08ac24ef52d495c224d44ce062c68547b9e1 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p107.model.layers.11.input_layernorm.weight b/checkpoint/pytorch_model.bin/p107.model.layers.11.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..fec906952a2a85b9b77faa0cb886ff94bfd015ad --- /dev/null +++ b/checkpoint/pytorch_model.bin/p107.model.layers.11.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8872587aa5a7c6b09a03ad8978ebc59736a87a6409a7252e26e838a91988bb4d +size 17282 diff --git a/checkpoint/pytorch_model.bin/p108.model.layers.11.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p108.model.layers.11.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..bf19f4f5c07f77b2d30e221f9fb446002f918480 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p108.model.layers.11.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9e6e5654ffc98758d06bbc75a504312e5b2d8c9f6b5d044d95a14b012c677a3 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p109.model.layers.12.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p109.model.layers.12.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..8e4d8343c6744cbda45db3b6a7fe9a0e9dc87e40 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p109.model.layers.12.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6041795aa0bfb94f5456728f83172735b06189fac06f328f3f78261f319eff3 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p11.model.layers.1.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p11.model.layers.1.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..101c32f2bd3f468db03e44609940ec740d6eda8f --- /dev/null +++ b/checkpoint/pytorch_model.bin/p11.model.layers.1.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5d238915253ae0c29b2d3ece0956c782bf7b1b52030ce39b4460a61e8f23d1b +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p110.model.layers.12.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p110.model.layers.12.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..cd0b2807445260b8f75f93e3e18eee5d854e6a12 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p110.model.layers.12.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d228cf0d1c86750b7a01b5d8373de88283b8ae118f29a7b2a1fe8693beeb48 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p111.model.layers.12.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p111.model.layers.12.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..7eca6b4bb8bbe4edc8de8576025bb88577f84ecb --- /dev/null +++ b/checkpoint/pytorch_model.bin/p111.model.layers.12.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a04709843b44812e3076d64e28b01daad070e4443e8cd4d0d53ecbfec9ce4af8 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p112.model.layers.12.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p112.model.layers.12.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..1a6c67bde51289182c8ed4419861412e7cb8b5cc --- /dev/null +++ b/checkpoint/pytorch_model.bin/p112.model.layers.12.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17aea5825bdea74baaba107e5e2c3d71716a4946dab45ed6484dcae2dfbed235 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p113.model.layers.12.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p113.model.layers.12.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..faf07e7dd65aa8e993bf36e678ec6829c26622ac --- /dev/null +++ b/checkpoint/pytorch_model.bin/p113.model.layers.12.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b251efe132fa6b87abb0e992a46dba3f8e1187b23f9317eaa36f360c64b78d58 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p114.model.layers.12.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p114.model.layers.12.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..616f1b9882ca7fd2b9bdb4a73092de9c9b78f16c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p114.model.layers.12.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fdabd007a345c86d4e2fbcd77ea30fffeab79517a8ade0c57265fef2bd66659 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p115.model.layers.12.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p115.model.layers.12.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..27577ba338656f1b15bc7f6bb9efd18c4a27fed2 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p115.model.layers.12.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84a85ca739da1bb6b1b642d59970922321ada55aaa82d2e55fe1ad4e9528b2df +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p116.model.layers.12.input_layernorm.weight b/checkpoint/pytorch_model.bin/p116.model.layers.12.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..740f7452fa993c061132c4d9047f9a10ad6451fe --- /dev/null +++ b/checkpoint/pytorch_model.bin/p116.model.layers.12.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc57b41119719f656e00736c3708bf3f3c89d00d0e63a029f52ad244ba3c4033 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p117.model.layers.12.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p117.model.layers.12.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..81e7ba22ada645f7c36680b6831a57674a64d336 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p117.model.layers.12.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49f5304f577a21fe639d08a41d3e9d46d551aef598862913aa73d41d9f2a34f5 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p118.model.layers.13.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p118.model.layers.13.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..46fcf31262ed9b4e415c609d0039251c283e02f4 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p118.model.layers.13.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d68a10556d04faeac301ded813048a862a56b31a068477cb9fd1d86f3123e3ce +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p119.model.layers.13.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p119.model.layers.13.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..b89495a07eaf2c4e85726b6b3ddfeea9bda198de --- /dev/null +++ b/checkpoint/pytorch_model.bin/p119.model.layers.13.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33d4c306f8a78598d6ddca36f090da91d738c73479c8eb5073d2de99b12334f5 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p12.model.layers.1.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p12.model.layers.1.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..8e4fe77f891090902b29d99f690aeaa05702585d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p12.model.layers.1.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b19bac51a905ba98439c0eac4317a0ee2dad2fe0b577b659e1a1f444f50ff7 +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p120.model.layers.13.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p120.model.layers.13.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..c5036e50026b3f498ebb803a16205ad52fb808d5 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p120.model.layers.13.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95e061ad1934cde197aa5b1ae5e600e0a4672b85f56ffafef223447abbdae195 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p121.model.layers.13.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p121.model.layers.13.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..f6bf27df8f613e2a813f884fcfec742d161a0d47 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p121.model.layers.13.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd36c78812b8e037752c1945431d735838ad03d552663adeaeae83cb27e7037 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p122.model.layers.13.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p122.model.layers.13.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..15eabae9372c035359d267e4f85386d2797115f4 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p122.model.layers.13.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b4846100d0117dfb6293fb572f453fa0447d4364ebd9bc82c3fae8f4101f16 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p123.model.layers.13.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p123.model.layers.13.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..3ce1256c6bb07cf6e08b89cb05b357f463d5f770 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p123.model.layers.13.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2be8fd1e0646432367e3338e05f01f122b7fb11d18e83a01388e9f099457098d +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p124.model.layers.13.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p124.model.layers.13.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..7a353e695390b6bf411423a08629f87ee0b7e49f --- /dev/null +++ b/checkpoint/pytorch_model.bin/p124.model.layers.13.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2f41f19c9e6edabf008ac4c85da948f740df87650f1b3ba0e9f60112b4da382 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p125.model.layers.13.input_layernorm.weight b/checkpoint/pytorch_model.bin/p125.model.layers.13.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..a8faeb69f4e25b239f915e5502a09fe87b6acb8e --- /dev/null +++ b/checkpoint/pytorch_model.bin/p125.model.layers.13.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d3331559688a98ceeed6cbf1ee29c5899db446329c119b4a884d3c8d96f80a0 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p126.model.layers.13.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p126.model.layers.13.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..a96aef6b9ae564cc261bd073427f7138cbb58f83 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p126.model.layers.13.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a7c500dc6dd58b0e553f9cd6760e05ea3aadd415fc33f656cc3fbfe4f400cc0 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p127.model.layers.14.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p127.model.layers.14.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..68c51ceb7eeeb68a8125009ed3a5148ed0c95827 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p127.model.layers.14.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44ec278fdccab7b272a9083aaa41eba9f29b79b0bb1034a2dcffa9c7b22dddf9 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p128.model.layers.14.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p128.model.layers.14.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..cd9db4ace1c02dd600cf5c6e66581d9399cef090 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p128.model.layers.14.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98ea84530fbdcc894eb45f135a93254a309fcb9e0006c76e646206aa88d42f85 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p129.model.layers.14.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p129.model.layers.14.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..88acd57140fea82538ab2dcdd276a90909494318 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p129.model.layers.14.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0d549756460be23ba39a57ab0e533a2117f2b94803b63b8f866b59aee1aa668 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p13.model.layers.1.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p13.model.layers.1.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..339c661d4017702917a56015bd49fa5befd0d2ba --- /dev/null +++ b/checkpoint/pytorch_model.bin/p13.model.layers.1.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:779faaa4e467d843ff63a2f137874854ffcfb76bb0be69e37158daf1ae5127ef +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p130.model.layers.14.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p130.model.layers.14.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..6dd8ed82edfe1e489e90cb4c24113ed33ee6ba52 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p130.model.layers.14.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:468d73e2f7c2f5e7b230331eee3866d1c3e9752b631021dd3d7fe807b8f61fcf +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p131.model.layers.14.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p131.model.layers.14.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..6a124dd8897decb4f9c11ba5f6185c3c4a2619fd --- /dev/null +++ b/checkpoint/pytorch_model.bin/p131.model.layers.14.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80b4cb11ca22558acc9e96e379727b65f439759ecfff61c130cf85f797269c1c +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p132.model.layers.14.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p132.model.layers.14.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..72184b86fdfab4b865d790a49ca7f9ca1a7becf3 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p132.model.layers.14.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b674d69dc8a866a5880af698eaadc457064c83fa813ef830aea1316bae652d81 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p133.model.layers.14.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p133.model.layers.14.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..eadd0617d386c9c5a280ceeb7cdb7f89fc143a5e --- /dev/null +++ b/checkpoint/pytorch_model.bin/p133.model.layers.14.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dc5b1c495f19f8072f14a2b6ea066bbd4b6df4b2debce6cc452903943172298 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p134.model.layers.14.input_layernorm.weight b/checkpoint/pytorch_model.bin/p134.model.layers.14.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..dbc8a62e9fc900e58a998878b9d3d394d598b485 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p134.model.layers.14.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf3849b044aba6f6d937023c864817611e0e99a8ec6aa3601bfc29456ec3c845 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p135.model.layers.14.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p135.model.layers.14.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..6d9c1c5f94a11b0a77941121cfd6d716567ff0c5 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p135.model.layers.14.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:727af7bdd339f9f3ddd4443e262b1af70a1c45918d70af38070b8c161ab68ac5 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p136.model.layers.15.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p136.model.layers.15.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..16b0ef8d9fa15c28a6dfda03b072a0ddbcaa3aaa --- /dev/null +++ b/checkpoint/pytorch_model.bin/p136.model.layers.15.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:584d2de0f4e3fa08b858aebaba495c7a4d6cc4e887034558da2a3c323d13b252 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p137.model.layers.15.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p137.model.layers.15.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..39104df26107310ad53dbcb646c36e6566f2c75c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p137.model.layers.15.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c65dbad15ee15952caa17360d8aa3a13d2e0f3116b2858766145b27afd40d019 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p138.model.layers.15.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p138.model.layers.15.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..a786d562583ecc8291c0797dd4a70ced9c8f4a83 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p138.model.layers.15.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d994d1e43e7ff4cf5d46ff0a953de0f70ddd0119e3e9d5370298b221accbd94 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p139.model.layers.15.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p139.model.layers.15.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..eaa68a2227524f8133b98bccc025021bcbddb0ca --- /dev/null +++ b/checkpoint/pytorch_model.bin/p139.model.layers.15.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17a3c0719f72d70ae5d5350d9a879353f9cd78e590a46bc2b145a6fb242fee8c +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p14.model.layers.1.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p14.model.layers.1.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..943f94fdf7de4ae6f1d6df939d478ea2ef9c2a3d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p14.model.layers.1.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:586198e8817e6a33711becbf518aada2bc908a1afa4c49c89a84795d5330d35a +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p140.model.layers.15.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p140.model.layers.15.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..db35256494556fc84740ee7253762c1e8315e5df --- /dev/null +++ b/checkpoint/pytorch_model.bin/p140.model.layers.15.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e819c7a8b7e83698aa0b0330008fdd48e31b06424482fd2bc64e10d66d33eb00 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p141.model.layers.15.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p141.model.layers.15.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..80c7ce0ec58d7d37a60dfe7733b8d366e0699f00 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p141.model.layers.15.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a15113477d5d132ccf14f10aea37d57cd61f57f0a48d398076a0d9ff3521bf0f +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p142.model.layers.15.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p142.model.layers.15.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..5c71ba05e888be3980ea12955740c0e482bdad64 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p142.model.layers.15.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b44d6fcb824134e3c76a5eaad52d71d71bd827f1f21ac38ec7a0412dcd19ce25 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p143.model.layers.15.input_layernorm.weight b/checkpoint/pytorch_model.bin/p143.model.layers.15.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..4c35dd271fbc1c0bb78d8e01c506ef25aa0986ca --- /dev/null +++ b/checkpoint/pytorch_model.bin/p143.model.layers.15.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c434b226eb8abab564bc3d06591142dac1c290d82f66a6bf8b88813011d9c108 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p144.model.layers.15.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p144.model.layers.15.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..d7dd7bb5a4a45c7c780072691be1bdec831efc1a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p144.model.layers.15.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12ddcfa4bfbfba0bf16c0d96111514f136f312ff7f23553d2b3c0c73bfaa481c +size 17309 diff --git a/checkpoint/pytorch_model.bin/p145.model.layers.16.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p145.model.layers.16.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..4e0a2f9d9f28ba85c27a9716683c2148cf3c02cc --- /dev/null +++ b/checkpoint/pytorch_model.bin/p145.model.layers.16.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96dd22e952a7486f2e7b772b61881a4daa86bb69077db55cf00a0fac1df8c99f +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p146.model.layers.16.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p146.model.layers.16.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..0e4756bcabf1e846ed674c6f93db7da5f4e1d246 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p146.model.layers.16.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:239129cb03c8003414e1afc2fa1351999ac56dc49175ad3b6f33b26ae9ec8519 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p147.model.layers.16.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p147.model.layers.16.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..2aeae7e8611f9cd33c0b002097161fba8c8ea61a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p147.model.layers.16.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d8090cfcf500c51e217ebc494491d8ba13b1d1caf57703a4fd13bc30f80b8c2 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p148.model.layers.16.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p148.model.layers.16.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..42038a9f69947dc75f056d7b44a5b0a4a975b6f0 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p148.model.layers.16.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e956666e3040feaa1f700b00956df8c7f0c4fbb190a7e6195550fc1a88e0def3 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p149.model.layers.16.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p149.model.layers.16.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..16fd3c08d3ddba0ef4627fb54fdb1184960994b4 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p149.model.layers.16.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8edfe2be48111ab647f0ce4a6e9e1b5debe14c66322462c5a39c2bd7eae7d88 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p15.model.layers.1.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p15.model.layers.1.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..bfc7fe02a0826ee38261d0eaf811b2b60e3818b4 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p15.model.layers.1.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:909e60112e40ab765231d66ff8d035dce7a19f01d34071d3ba27a38a5362930c +size 234881904 diff --git a/checkpoint/pytorch_model.bin/p150.model.layers.16.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p150.model.layers.16.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..b8da1f0ec472916ec57da7a787a26b72fa02daec --- /dev/null +++ b/checkpoint/pytorch_model.bin/p150.model.layers.16.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e82743c006df27b88100e2f93159cffff58fef4107728efbfd8d35289510486 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p151.model.layers.16.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p151.model.layers.16.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..427fe65a63f708abc1c554a1fa89928f0e5c3c10 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p151.model.layers.16.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ef5484aa62ed64b9373797e73faa1d6ea1edb32b7cdbc554f0c265ce20227f6 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p152.model.layers.16.input_layernorm.weight b/checkpoint/pytorch_model.bin/p152.model.layers.16.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..2a2b28826f758d9dd60e90e1b743d945f507387c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p152.model.layers.16.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a466577b05450bd315b89464527c4c5ccf1cee3cf6959508554e222afcdee199 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p153.model.layers.16.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p153.model.layers.16.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..6e96747433c2951f3c18c3a26579713b8a3f1bdd --- /dev/null +++ b/checkpoint/pytorch_model.bin/p153.model.layers.16.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87f7ec1793faf30ea1cf12f45f55d8522d9f02fc1a108f87589a6b3e2c0c5462 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p154.model.layers.17.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p154.model.layers.17.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..d45426bab05eacca54e2ebe96a16be7ed52f21ed --- /dev/null +++ b/checkpoint/pytorch_model.bin/p154.model.layers.17.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aa3cca3b815e095cdd932d4f2bac50ed0e93b34fe1d60dba5697ae98c68e69a +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p155.model.layers.17.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p155.model.layers.17.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..9afc999b2164e5c454f3398866e90ba825b0129a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p155.model.layers.17.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03c92c8ee5716b38c26c031b3a0e0a319aa8ccc0473d056019fbf63f3337c288 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p156.model.layers.17.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p156.model.layers.17.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..6ce26d91d78cd1d310167e64302deb9720e48e17 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p156.model.layers.17.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a5fafdf28ed9cf58e44a8f4b5a1da8ad00813d0599c6a0bcd23f6a588525fb5 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p157.model.layers.17.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p157.model.layers.17.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..0d94a8b4ad31b3f0df66d93b3b9286a58e1340e3 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p157.model.layers.17.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c11af06d1b502d8074b4c1df73da73c603395c02331f28b957865ba1b42118 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p158.model.layers.17.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p158.model.layers.17.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..bd68968a71ee2e72cdee41b1feb6ce20a044231d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p158.model.layers.17.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b9f4bbcef9b59722ef778d68e3e1c22410419e6308521aefecce59db6f3291 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p159.model.layers.17.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p159.model.layers.17.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..e17c0666fa823ae064e7cbdfdce641d72fbcb865 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p159.model.layers.17.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:745847a5b6c2a4768132362a45a21f9124c4567882c446d5311f171b8179bf4e +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p16.model.layers.1.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p16.model.layers.1.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..ad06f49d905e7c32034743c1ebdbc4385d30a9cc --- /dev/null +++ b/checkpoint/pytorch_model.bin/p16.model.layers.1.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d82520ac8b209e1a7bc15118761a7382f34a48c78c370e4a53d763a0cc5bdf8b +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p160.model.layers.17.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p160.model.layers.17.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..2ae0dc8c9efc45cac2b758fe67cf2c2ee684f2ae --- /dev/null +++ b/checkpoint/pytorch_model.bin/p160.model.layers.17.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6386cb9604f564ed2f4ffcd77d876e1a26d9493eca5e1939ad432d663c48c91 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p161.model.layers.17.input_layernorm.weight b/checkpoint/pytorch_model.bin/p161.model.layers.17.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..c4f3379b7ea9a03b209d37f5196f5758a86589b4 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p161.model.layers.17.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:747a3c74f7ec4f4f9266d89701f5a5701411b8465411a666c74f7178040a15d8 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p162.model.layers.17.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p162.model.layers.17.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..a0d2856648d2dd1971abea14d72d12e9a96e06cc --- /dev/null +++ b/checkpoint/pytorch_model.bin/p162.model.layers.17.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61bb132ad598a3a9fd4a3d258a41073a6ee82fdbf386fbbfe371b2327bd9f9c7 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p163.model.layers.18.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p163.model.layers.18.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..8353ffe7be75738d66ac4eec95ee63140c669d4c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p163.model.layers.18.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed623e7146c7a18af1e42ce8f6e99b86cb21d38aa2407fa4c10ae905249d51e7 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p164.model.layers.18.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p164.model.layers.18.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..3b1e63bbf369909ded7ef50070cb018f5f42db7d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p164.model.layers.18.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaf8c7bb3749130be526776f4c68c648d321e7d6571c1d0cbae88754a053b1de +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p165.model.layers.18.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p165.model.layers.18.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..e94091606d1b37bb714d1de70466fe3da9a4e850 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p165.model.layers.18.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f7b5112c3153df4110489d23cdc8656e10148b40dcbb5d3d51001e753e4418 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p166.model.layers.18.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p166.model.layers.18.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..dbfda739ffcda32f23fa6ee39c9121bc19ef4724 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p166.model.layers.18.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db480112cdaef821f410ccbb3fd8659d89583fcdfbe904295ba6d83614b07c8b +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p167.model.layers.18.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p167.model.layers.18.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..ef3db58395ab5ca9b058d09ddf68567ce0ee8a3d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p167.model.layers.18.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12888a425b0b51dac79d9ccd645b0b0f7750ff51f1da0594aec12f63eec94a18 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p168.model.layers.18.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p168.model.layers.18.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..28a395399122291e9a0d7dee5ece7437848129d5 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p168.model.layers.18.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b899a0ed5c9b26a0963f37ee726385677eec950803580dd345401e56d6fa4858 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p169.model.layers.18.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p169.model.layers.18.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..143f4ad9d9907734fc3546a5645707429f6b1407 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p169.model.layers.18.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29251ae5440a6f9ce9d9cc547183f0e1a88afc75dac8d4491c13fc1099c4f33c +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p17.model.layers.1.input_layernorm.weight b/checkpoint/pytorch_model.bin/p17.model.layers.1.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..7e94dd237c4b173e6de75c54eebefcac1d14d01c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p17.model.layers.1.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d20ee6e40ef19e49b5280395f4da43d0c43ae27a7e2da30a414a0e3c99e454e +size 17276 diff --git a/checkpoint/pytorch_model.bin/p170.model.layers.18.input_layernorm.weight b/checkpoint/pytorch_model.bin/p170.model.layers.18.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..d2b878b202a09078d708cd8a4571924db62ea199 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p170.model.layers.18.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25d523135f2d17f6b3ee92b2acd550378914bbace88da2629bf46933475c45c0 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p171.model.layers.18.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p171.model.layers.18.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..4583832dde53b573e68e1d0f0859df4e6c2bb770 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p171.model.layers.18.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63857e390be1fa1445b09276ac6e87d4bb0b691277e9bd15f25bdb7ab40aaea9 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p172.model.layers.19.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p172.model.layers.19.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..c5eb8eae8adb892b1a25ee69a84063b61124f682 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p172.model.layers.19.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6125daac8995760c32663f75cb96a54b2a415c4fb019a51ae996de71132b5eab +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p173.model.layers.19.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p173.model.layers.19.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..d38d934b8d8ce212c1735d6c8b904a5a93359691 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p173.model.layers.19.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f6ad68b25ed4e47fbda42f8b3350093c16df6d1b98b045ffb7a2de77c3b3be +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p174.model.layers.19.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p174.model.layers.19.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..793ecc2977900a5f857ed8c2ae20c7d6199bc32c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p174.model.layers.19.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:403c81d77a705101dde98115677ea8980c78ab20544b07c5b5f218c12711e262 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p175.model.layers.19.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p175.model.layers.19.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..04897909669b116feed6d37aae24ee1505fbb35b --- /dev/null +++ b/checkpoint/pytorch_model.bin/p175.model.layers.19.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90dbd40c4cb557df23de10304fd58ccdef0843b29547ccb95835a8f7c84ae4d6 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p176.model.layers.19.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p176.model.layers.19.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..1f30fa497b24d97643d360cfd53a5824ad487545 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p176.model.layers.19.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cf0b332a22cac5e52aa59da96b28b15ce9cbbbb1e3f5e1599ea057e26c3810c +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p177.model.layers.19.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p177.model.layers.19.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..80a1c65040751919f3997a924a4ccf337939d02f --- /dev/null +++ b/checkpoint/pytorch_model.bin/p177.model.layers.19.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:379f5d1cf9fdc6b8723cc61ba9417d47fe6c10ef2df423002d72370a5b586aed +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p178.model.layers.19.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p178.model.layers.19.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..c1a30dd9b515fcab3c86e34b8ea202b3fde1f47a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p178.model.layers.19.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7079db721c02e7ee4886bac35ffd2625ab6cb84b8024739efbe03648804b0faa +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p179.model.layers.19.input_layernorm.weight b/checkpoint/pytorch_model.bin/p179.model.layers.19.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..3601d8c929140fd7a842c8c6dc3566a359bdd9f1 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p179.model.layers.19.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c62ba817a636e55c969c5f2f4c7c1e78bb19db63db1d99be0cfde2fc25c173b4 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p18.model.layers.1.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p18.model.layers.1.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..d919d5ed57cd47b9c567ba5323e59503019f8dac --- /dev/null +++ b/checkpoint/pytorch_model.bin/p18.model.layers.1.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58c04ddabcba1d533bc820849435b7440ce76e699e87518eee06d16e512ca1a5 +size 17303 diff --git a/checkpoint/pytorch_model.bin/p180.model.layers.19.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p180.model.layers.19.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..e8e36868e81f29e839acf37bc57de98345c88cc1 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p180.model.layers.19.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55500131d43e8db9d470acce44be36b702dee32ee129847e35b3e1f0e54b7212 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p181.model.layers.20.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p181.model.layers.20.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..b475e335274129e534d4b03a10582d2061d824bd --- /dev/null +++ b/checkpoint/pytorch_model.bin/p181.model.layers.20.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a4f3626f4b6b06af694501c0e1a20566d9eb25f23a77d8b13ad82d19fdb1547 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p182.model.layers.20.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p182.model.layers.20.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..3093abf44a041b167ed9e13ff762cbb4a844eae3 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p182.model.layers.20.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7f67f5b72665addf2fe1afadc836f9c49304c5c0bcbddf3502441db9adb3eef +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p183.model.layers.20.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p183.model.layers.20.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..ff2f3f6c236c9372cb61ed0293367af19731abdf --- /dev/null +++ b/checkpoint/pytorch_model.bin/p183.model.layers.20.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35da3c4b4f87b4b1d59c7e838798f62a252952e8a98611ca6541e16f8a43f808 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p184.model.layers.20.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p184.model.layers.20.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..1fde69cd4359db28b82b5fb4a7c5fb9fba9196b0 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p184.model.layers.20.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55aad615b826b528357c61e974a84c8fa1e13688632fbfffb3e450495407f27f +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p185.model.layers.20.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p185.model.layers.20.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..f02442be82eb2866c447adf4fefc016ca85c14aa --- /dev/null +++ b/checkpoint/pytorch_model.bin/p185.model.layers.20.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7c3db75f17bfdfac46890a78a6c1975bb4258c9679bf088712b7ab651c8a250 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p186.model.layers.20.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p186.model.layers.20.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..6178052c8a2d6836bacba503e55305df5f093b7a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p186.model.layers.20.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bd0192129917358ccf09472239f2b8f3e82f81aa8abcafc7d630d54b41d64bb +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p187.model.layers.20.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p187.model.layers.20.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..6b10212249888d43268d35f7b2f4807afd7b505c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p187.model.layers.20.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee6a940e94b62bcbade391cb510a84d9eb3b9c554095af50acd1a1c6bb3b1b6e +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p188.model.layers.20.input_layernorm.weight b/checkpoint/pytorch_model.bin/p188.model.layers.20.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..023a4c74545ec8b307fc6327db1113be943e7825 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p188.model.layers.20.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ad2b5a8be53f3e6abdc0ab3fc5a2d96a5b072c11b147dd2a2805a9c728eb8ea +size 17282 diff --git a/checkpoint/pytorch_model.bin/p189.model.layers.20.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p189.model.layers.20.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..f1749d62d3c336f9c07ea3b56b4bd245887cfc41 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p189.model.layers.20.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:169f2cb1056d8cc12e0a83b4965a50c5793d4ef7b7b0041881700f50e11c7cdb +size 17309 diff --git a/checkpoint/pytorch_model.bin/p19.model.layers.2.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p19.model.layers.2.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..3f2f47ea81a55dbd20d9916312f51c3bc9888b0e --- /dev/null +++ b/checkpoint/pytorch_model.bin/p19.model.layers.2.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88d6dae944dc04364bf1f088655ce896605768633594a5edd1679261036e4612 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p190.model.layers.21.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p190.model.layers.21.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..17389f39098518231197183694c0a82ff23f15f6 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p190.model.layers.21.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b894e2c30fa9bfaaa0e7e1d1f68edd009a6503ddc36c3b3150e7f70d37be627 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p191.model.layers.21.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p191.model.layers.21.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..938edb5b58679a687500f6bc78774832ba59d923 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p191.model.layers.21.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb702e708e8313c2cb1ad36ac13adbbacc4c0eb4ff4c056333b83c85bb3f55f2 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p192.model.layers.21.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p192.model.layers.21.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..a157da9996a1e693c139a47e975bd1ab1d256e63 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p192.model.layers.21.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6490c74443487a12dda2dd3d6a038ec679d41612734efcec1e9ecd55514dde74 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p193.model.layers.21.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p193.model.layers.21.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..790b6070a92bf7224d0d793f35c5fb56518f2c96 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p193.model.layers.21.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36928b9da5721034560f52940f7c2f388adc69417b797d524ea04960d7c7fcba +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p194.model.layers.21.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p194.model.layers.21.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..9832572dbc1cde237aa628b7ce17858b12435231 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p194.model.layers.21.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43cfb7e5a00875f47d4a61d450aa10c91f9d29f92c9e5173c51734bfcd952ca4 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p195.model.layers.21.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p195.model.layers.21.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..151d036606f8fb8ec7470cab04e86afa33595b42 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p195.model.layers.21.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ded413807b79810bb276d1d572acadbb212674c915056f8d82b8777a1b4eca04 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p196.model.layers.21.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p196.model.layers.21.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..a787ce888ffe4f0ac9e1da8d892652d82fa1b9f1 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p196.model.layers.21.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee5631e7f346b55fc040b445861ea58f6b1ab1d439bf3c7b0d248f25fc547434 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p197.model.layers.21.input_layernorm.weight b/checkpoint/pytorch_model.bin/p197.model.layers.21.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..f4954c7199e1a347c1bc5db93065d0618388b3b9 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p197.model.layers.21.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd1bc5630612678c90d3b41b9cdb4fa06fd32730eff5f8d21622ad1af4710f11 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p198.model.layers.21.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p198.model.layers.21.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..c78411a58f502a54f29702960797f12b66c45c90 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p198.model.layers.21.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8741f4d2bb2046b15d090fde282227f8924cfc227b1aa25ed09f8d84b49840f6 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p199.model.layers.22.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p199.model.layers.22.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..7c003f20d9dcabd17449d7e60065f1102c67452a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p199.model.layers.22.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c5c1f8c6aab40d690a8e3fc8a718a812556c155b7b3f5167e1759d84bcc9dd4 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p2.model.layers.0.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p2.model.layers.0.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..e854adafba575c725432d1c8f5b096bdf6765082 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p2.model.layers.0.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d1e67479cdb37ff42b21560e0cc2153c2e91d8ff178acc13af8142483265f49 +size 16778108 diff --git a/checkpoint/pytorch_model.bin/p20.model.layers.2.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p20.model.layers.2.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..2144afd940a24f5235e0b607387991498a074127 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p20.model.layers.2.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6db9848e7fbf678a05324eebda01305eebac878c00eff46576356891d1009e1a +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p200.model.layers.22.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p200.model.layers.22.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..71f017f5e2f0e57114d6c6fa915f303e7eecb1e6 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p200.model.layers.22.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08e9c6246cc22189b874e50883e5692953e5048c1f403cb50547ce59cdad707f +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p201.model.layers.22.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p201.model.layers.22.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..8c277a52bca1b859e79d98107ddca58d04ff2435 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p201.model.layers.22.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbfcf65316042c9734f916cc370ec413d7af682f9ed59cf16ae7a9be9b9fcd01 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p202.model.layers.22.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p202.model.layers.22.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..5e93812baa0e697c7942411627b926f2a2178b64 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p202.model.layers.22.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a2613bd25c8df61596c8d715d9401a691a1db9b307b71ef860b2dc90010d72c +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p203.model.layers.22.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p203.model.layers.22.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..e8f60813453b71713554c489d94a6f68ea5ab4bd --- /dev/null +++ b/checkpoint/pytorch_model.bin/p203.model.layers.22.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a43c10864ac999f59cf1fa45fe8e841bb958c67a2d876c9842c52cf5d9b1ca1e +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p204.model.layers.22.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p204.model.layers.22.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..3eceedbff6f1fb4c08db515885cf6f366679455b --- /dev/null +++ b/checkpoint/pytorch_model.bin/p204.model.layers.22.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c16fab3a161ff793d362c308645beec424225592318cd5d163b34d981937e91 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p205.model.layers.22.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p205.model.layers.22.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..fd068263bcfb74382c594fa8a754abdd701dfc67 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p205.model.layers.22.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f9555cc5fddeb6ef22ca4cf41b23137afe246c493e1346cdf760db562524a0a +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p206.model.layers.22.input_layernorm.weight b/checkpoint/pytorch_model.bin/p206.model.layers.22.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..1f1838e35879dfe8969c694b9e1f9f589c4dd359 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p206.model.layers.22.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69a1ec0350d0df44864e09526a21860450f0d2e8d53a8055ff4128c744358e69 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p207.model.layers.22.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p207.model.layers.22.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..b2ed7c87d544f37cfcad738287906203ccb2c8b4 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p207.model.layers.22.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8051158c07f2a85ae6ac6f7e1c49c5d93428c2a6a833ecac2ff917349c16170c +size 17309 diff --git a/checkpoint/pytorch_model.bin/p208.model.layers.23.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p208.model.layers.23.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..17b644404e14e740fa890ff6724ca22f5b50140c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p208.model.layers.23.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f9e88eb9972c3e26fb03083d59152875d372df510912be237b2bf761cde7f0 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p209.model.layers.23.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p209.model.layers.23.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..a499ee7da7b4fd49851311384e41d7842c13bc77 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p209.model.layers.23.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7ab3b98fd2caf1b50e6340354f4815e27c32000639548c812075514c5f518ef +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p21.model.layers.2.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p21.model.layers.2.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..77f5ce697b2c1a29c4bddc7a485fa7667149da3f --- /dev/null +++ b/checkpoint/pytorch_model.bin/p21.model.layers.2.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b31b6b263d0598c288bb145eb3add2f5a63209c26968fba4d64974dae36f104 +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p210.model.layers.23.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p210.model.layers.23.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..50f7448fce5012e56b0c9bfd58e8679d35b12465 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p210.model.layers.23.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7517d3291dc489b55e0021317b5ed3a1b9b13f514d3f9d7f6e6797a9e215026 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p211.model.layers.23.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p211.model.layers.23.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..7ec9a581b773406c54caef88dfb92d7fcda62c5a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p211.model.layers.23.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f29e75a7a2bb3ef97c7df8502c9fa8526f976e41d31bbdadfadba8702a718e71 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p212.model.layers.23.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p212.model.layers.23.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..9ed740d64d3b1bb12cb34cbcdc0b9e53bb1292e7 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p212.model.layers.23.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71f2068c6070b46ff5584eaecba27242e223124a057420880273e79d238b542d +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p213.model.layers.23.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p213.model.layers.23.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..ce218431208509a971519774dd4c4beca6f945bc --- /dev/null +++ b/checkpoint/pytorch_model.bin/p213.model.layers.23.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeb54bf97815e01602e1218ddc4b7ffbaebd77330c8c438002a28aeb451e8930 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p214.model.layers.23.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p214.model.layers.23.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..b251189319acbdfaab57b8786f3a3ded35eb1796 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p214.model.layers.23.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:148d633c61b1d2f367af508cf57cf600ae2e5dac6fb85d93808d64dde676d725 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p215.model.layers.23.input_layernorm.weight b/checkpoint/pytorch_model.bin/p215.model.layers.23.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..fb7975cdfa6d49e76779fd7ee1b174c7bc3adade --- /dev/null +++ b/checkpoint/pytorch_model.bin/p215.model.layers.23.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34f0f7bce9adfc1ceb03a292920747bed3de921802c35a0481fddd387e3fb6fe +size 17282 diff --git a/checkpoint/pytorch_model.bin/p216.model.layers.23.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p216.model.layers.23.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..4929472234e050864a8437075b8063b0fbeebe8f --- /dev/null +++ b/checkpoint/pytorch_model.bin/p216.model.layers.23.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e202112b52b1b9ae8909528367568a6764c2a6f2677be1e9a0b66ec12512aaee +size 17309 diff --git a/checkpoint/pytorch_model.bin/p217.model.layers.24.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p217.model.layers.24.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..0a08f0b3d4e397f596d9b270b13458313c8cece3 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p217.model.layers.24.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d390a159267648ff7e49f8f410da29a5ff167107971be6ce6d8f488f4463513 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p218.model.layers.24.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p218.model.layers.24.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..14e6e5ff6c72e4898c5fe9e3395b74fb76d1b1cb --- /dev/null +++ b/checkpoint/pytorch_model.bin/p218.model.layers.24.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81e8c3f8ddd81043a03d2431d1536381782198ca45919fd02328129d7e82abcd +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p219.model.layers.24.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p219.model.layers.24.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..42c7c8820b835f69c075b1192bf6155367a45594 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p219.model.layers.24.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d98a6b4ad4fde6f158b555cfae0a218431fa72cbe1f4a97b016f3773ac02685 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p22.model.layers.2.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p22.model.layers.2.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..95367e0e5416495382270f1ced4a5d7335de197c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p22.model.layers.2.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16360853d658a7288ef7fa38fe560aa02a07741889a5e3172d118f265f2e7f05 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p220.model.layers.24.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p220.model.layers.24.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..75bb037545a34997370bcfe5b996ee47f24d330a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p220.model.layers.24.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b94777363ba4225b7d4adb2a477db97b6e301ac8bde11d989caee0d9f3773873 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p221.model.layers.24.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p221.model.layers.24.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..588ae48db91fc4851405f099a37a7404402cdee3 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p221.model.layers.24.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b17e4862cdb2bc6f95a47837496a343974c50df2a9a753d1b8f1cf239f148ee +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p222.model.layers.24.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p222.model.layers.24.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..c5cd395cb3df3d1eb680e8d6db56e38ee89e93b3 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p222.model.layers.24.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b00e0d0c6604516319ef5e30f647a6e49262f3d20b52ac5dc7334cfa58df97e +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p223.model.layers.24.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p223.model.layers.24.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..cf1115f1786b732491a910ed1a49c197b3815d63 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p223.model.layers.24.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d49b6d3291af390ad594c4503f05a5184a14035302471a228f0c29bf207b6a2c +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p224.model.layers.24.input_layernorm.weight b/checkpoint/pytorch_model.bin/p224.model.layers.24.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..ed575b5f668cd17fe430e69650e0e8348a1ff4e1 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p224.model.layers.24.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc7dacab917176f079765334a5188f3ef7417a22bde48f81d37a9c60a21324a7 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p225.model.layers.24.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p225.model.layers.24.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..1eef089f34a6de8feff9d6286a37e31188758085 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p225.model.layers.24.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a6090f364ab1260b43a819e886d3291258bb7ca9b613786366975622bb8764b +size 17309 diff --git a/checkpoint/pytorch_model.bin/p226.model.layers.25.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p226.model.layers.25.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..bee73141b71937e8f77a3d55629069950742b335 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p226.model.layers.25.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4f18c7a548267fd6947d96abbfd165acd12e16eaffd5ec1ece3596cac6ff83b +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p227.model.layers.25.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p227.model.layers.25.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..960ee4bf2bce542d6b07955b4175361ae51fc27d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p227.model.layers.25.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f1f5d37cdb8d87d34d7721fe07e169a9cc18ce0f23db7886fb910fde4173505 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p228.model.layers.25.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p228.model.layers.25.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..532b7aab67126ee2986d88ee3993fe61c5f8b03a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p228.model.layers.25.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2afc6090bb0c78becceb76c9e901a997de24f39dde58d7583989143128e1bde4 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p229.model.layers.25.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p229.model.layers.25.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..fd2c5f2088ac63598e199546cb15f350b87f2ee2 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p229.model.layers.25.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44af518949656357ec8dab9db407b6b60767ca8d2d7a8a59769547f9cf2e346e +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p23.model.layers.2.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p23.model.layers.2.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..d3d60c28b7e98f2c0af702429752715b1753f87a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p23.model.layers.2.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ff44bbb71043d87bdd5d1cd9e898b8802af62f3b67e010f750bdb6400f96f4e +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p230.model.layers.25.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p230.model.layers.25.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..f4980b1830066eda75d94d384c8a679cb4e87143 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p230.model.layers.25.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:862ef21245b1dfbcc1194f20e257c7c99ee78b480373372993715bd2036ef6e0 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p231.model.layers.25.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p231.model.layers.25.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..5782042a702fa9b882bbd70b28f720e75ef395c4 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p231.model.layers.25.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b378398612abd69845bd2171884ada4584b6097d8b66edf38f66e7f29d210c75 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p232.model.layers.25.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p232.model.layers.25.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..9c1356d79e81fec6040971efbf4ad1e65a69b1b7 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p232.model.layers.25.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ab050e948dc2350d208f68db8b4af5f8b3a48ddf4ffeb58f5079e47a5aefa05 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p233.model.layers.25.input_layernorm.weight b/checkpoint/pytorch_model.bin/p233.model.layers.25.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..a1d744bb3d54a30f4a36b3d6af54f6d912b7ee23 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p233.model.layers.25.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:153645548b3d67719eb849bac077490f0438692403d9b578f19f1008ac6a7fb5 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p234.model.layers.25.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p234.model.layers.25.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..2afd7f1dad1445a78aa4c15b8cf1bf961288d840 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p234.model.layers.25.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bde42d6adec7336eb813160997e7661f991454f70a391e1626392a39d91533a6 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p235.model.layers.26.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p235.model.layers.26.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..3df32117782f4dac1f3913bd4d06fba8549b65ab --- /dev/null +++ b/checkpoint/pytorch_model.bin/p235.model.layers.26.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d78cc82cc014eb01fba82b12b049266c563ab02d676c9d901f453caf1e738c6 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p236.model.layers.26.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p236.model.layers.26.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..7d26b2715edf97cce0c30f34402c2b9f9975a60a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p236.model.layers.26.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:472951fcb41a937bd2b0b786f4a8e7556a8a8c30156b60c2f8dd04f9f874fc77 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p237.model.layers.26.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p237.model.layers.26.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..2cdc5af07988acd53141fabf1c33966f7d2671ee --- /dev/null +++ b/checkpoint/pytorch_model.bin/p237.model.layers.26.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4376033577df50f157671c38fcaf9bc709ddff69c4d84030bfc221ce544ceca +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p238.model.layers.26.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p238.model.layers.26.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..ed34d862739694b214b45ead3103f226d6e5e21a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p238.model.layers.26.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:076827473eaa08c857bea3335bfd1b0e3e6ec3cf6be6a9891702ceced0dd4a5a +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p239.model.layers.26.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p239.model.layers.26.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..fd91ba2ee9aada151f97872cebe6134785504138 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p239.model.layers.26.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99308ed59ca6945f94be99763b4a936cde7367ad03d1eb17b3a765b0f116d1bb +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p24.model.layers.2.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p24.model.layers.2.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..c342b25b984ff222799619c9f96dfea7ac65b0b5 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p24.model.layers.2.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ee667abdfda416bc1e655edba121ae860e7020e64d2eb84def7e2daccd9d7b6 +size 234881904 diff --git a/checkpoint/pytorch_model.bin/p240.model.layers.26.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p240.model.layers.26.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..988d9b85f8a68459dc1cc4ac1632374006fa9fa1 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p240.model.layers.26.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5cf66a9ad6e35594a7bff81b82ed55798cecf75684deec2ee03cd820b9e4f5 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p241.model.layers.26.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p241.model.layers.26.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..a5f0754267c8d095ad0b732436daee1d50456f1a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p241.model.layers.26.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e04d717b1189441c2a5ea6da0b3b2c09c87cfb2133761af985549594368ea8da +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p242.model.layers.26.input_layernorm.weight b/checkpoint/pytorch_model.bin/p242.model.layers.26.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..0994ca8fc8e443f752e3c9674c8f98615f95d6e1 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p242.model.layers.26.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5140efd61006fabbba38331585d077327b0bc73b17c5b1d6b3cf2bc20ce3da96 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p243.model.layers.26.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p243.model.layers.26.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..7b2d2d6447fe6973134b8aa09ceaa69d67c59d1d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p243.model.layers.26.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f378ec419d870d2e77fc76040702755711656d7547211fa787588f0cac2ca61 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p244.model.layers.27.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p244.model.layers.27.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..44b21eb615a8d8c4d34846fcbcd56d0889fb3faf --- /dev/null +++ b/checkpoint/pytorch_model.bin/p244.model.layers.27.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b577925ec0a18cf584463c2f3219469cacd0300b08332909febbc425b60fdf2 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p245.model.layers.27.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p245.model.layers.27.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..861f825a222cde2963876b069b61f257ac042f6f --- /dev/null +++ b/checkpoint/pytorch_model.bin/p245.model.layers.27.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63e631064d7cbc5ee91348e1b7ae8c2cfd60a317b0d86d2720766b5df9c0bb79 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p246.model.layers.27.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p246.model.layers.27.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..40bb24cc5545bb2cc295cddab5d1512694dfa228 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p246.model.layers.27.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7234bcb7d9ea77cbc4729002321b34859276dadc739765e7ee047018a4e5d78c +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p247.model.layers.27.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p247.model.layers.27.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..a583d424199168d4860c17bacba1e92a7bc824ee --- /dev/null +++ b/checkpoint/pytorch_model.bin/p247.model.layers.27.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db2e40013d9b17fc35ce3025c11cb245f967f86376e1493630f688a9b6157680 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p248.model.layers.27.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p248.model.layers.27.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..098b6f21d72677f0af03ac08cde599d98da034fb --- /dev/null +++ b/checkpoint/pytorch_model.bin/p248.model.layers.27.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f56bad65ac08ffe836217ce9c4e9a27d7ec4449da6a1bbe3e6d28a73662ca8ea +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p249.model.layers.27.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p249.model.layers.27.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..e1ac94ab5e21ae9d132306c3a8d317f4b8cdc49b --- /dev/null +++ b/checkpoint/pytorch_model.bin/p249.model.layers.27.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef48636d5d0b91c8d775fdd5cfc70d53b70fc909cb133dd6d9f7b8a2f529e8e2 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p25.model.layers.2.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p25.model.layers.2.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..f3a3bb7fa08079f76a3ff4ee9ca33e3485549b80 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p25.model.layers.2.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:526a4326832fb3b8921e8c8e6efd93c14c1f3a4e6180341381f2edb81ec90d8b +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p250.model.layers.27.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p250.model.layers.27.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..f91115a156e8f5f629f75d9bbecaa8cb5eba0c73 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p250.model.layers.27.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a66143cb81d37c9e39241b9c45ad70644ae323188859ce007cf6aca15612366 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p251.model.layers.27.input_layernorm.weight b/checkpoint/pytorch_model.bin/p251.model.layers.27.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..eeffb0aafcbff880c33ebda31a02e51796c3e4c0 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p251.model.layers.27.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c76edd5005a0610b1b1f5c1f46630cb4155ec0ec8757faf01efc73b2b5cccc9 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p252.model.layers.27.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p252.model.layers.27.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..62bf1ca193b0958db38e51e3316a7c70857a8f31 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p252.model.layers.27.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4625d94274a604fbe861f821803d6af56cd9d3476b38b28adf74dd13251037ea +size 17309 diff --git a/checkpoint/pytorch_model.bin/p253.model.layers.28.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p253.model.layers.28.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..bfe5b0c52fb02b8b5751474bf4a5b3f1249fcce0 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p253.model.layers.28.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edbb4104517a44ddd310a0cef50750cb5c39827caba89830cf5309eb0d78c439 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p254.model.layers.28.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p254.model.layers.28.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..ce57d19ce82003e6c3d3a36e08ca968118e39ead --- /dev/null +++ b/checkpoint/pytorch_model.bin/p254.model.layers.28.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e48cff0548761e678d7b9409108a7729adc3d5e90f401b995d1d6fba7cc6ab5a +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p255.model.layers.28.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p255.model.layers.28.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..fec9921b2a08ddff2aa63795aeb5b966c37cfae3 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p255.model.layers.28.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3acfd3bf5a63d2ff50eba6c2473f16a921f43f94f743977f8924f32d5465701b +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p256.model.layers.28.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p256.model.layers.28.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..4ecf5c5530e12e09825f6c4b1bea9a0e01ac66e4 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p256.model.layers.28.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30063f6fbdeac99bf30278fbca79b8c1a5eab72d1c7a5c6bdb704191db0593dd +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p257.model.layers.28.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p257.model.layers.28.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..5c42d4e9f27a21a7b537c6bfb08724c816dad3e3 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p257.model.layers.28.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e6d6c9c3caa50101560a3dfd86f87368cd16ebfe7aa65e91a6ce7fabc5b334b +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p258.model.layers.28.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p258.model.layers.28.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..3596c97312172172141a9c15d5ba619d20905c96 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p258.model.layers.28.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7976f25e29ada18d7e28364acef75e5558e8f7f6a80cd0021d92b57474498cc4 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p259.model.layers.28.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p259.model.layers.28.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..f63ab444966b4eef57eda284d3b19faf187b39f8 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p259.model.layers.28.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0d6df37acace1e880b21b8d1ca787388d087da9257583bcf9d55fce25be1181 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p26.model.layers.2.input_layernorm.weight b/checkpoint/pytorch_model.bin/p26.model.layers.2.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..763e0cd014670d506e340b58d5c3df4040423fc9 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p26.model.layers.2.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38715db73eaac1e0f1c3b04da8a6ef854f138cbda00e2ad5500d60d1c5cdf901 +size 17276 diff --git a/checkpoint/pytorch_model.bin/p260.model.layers.28.input_layernorm.weight b/checkpoint/pytorch_model.bin/p260.model.layers.28.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..6c252936773e9a72b7aad5dc1c4958d825484081 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p260.model.layers.28.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4f1d5d08f37bcef701c33848f321a10a6504ccc929cb572517b0d44c67af5eb +size 17282 diff --git a/checkpoint/pytorch_model.bin/p261.model.layers.28.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p261.model.layers.28.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..6a3f39f593a84c80ff3b211e06d94ac728f6ce45 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p261.model.layers.28.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ee60cbea7d41192be0dfb8b5aab42da3213ad2a202216022744956ce9d24f9d +size 17309 diff --git a/checkpoint/pytorch_model.bin/p262.model.layers.29.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p262.model.layers.29.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..4768b5e9461bfde3db10df518b2fae37e8d82838 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p262.model.layers.29.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:927c6f88d2edfaf0d2c6a269798285282871566ed72aa91431baa8c98049b963 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p263.model.layers.29.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p263.model.layers.29.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..f7de53aeed2442e59aeb987db14ab16eb041decf --- /dev/null +++ b/checkpoint/pytorch_model.bin/p263.model.layers.29.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b564db2fce7c05e1a4f6330ae1bff497eb604c6cc36ad5875807a9253e0c1e3 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p264.model.layers.29.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p264.model.layers.29.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..56e2c1acc777d07bbc63e62a48e0432778ddb23f --- /dev/null +++ b/checkpoint/pytorch_model.bin/p264.model.layers.29.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc79bac1ee19125bb1f4dd9417b2126bf342a93a8cb7059d9da1a0b1accb54a6 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p265.model.layers.29.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p265.model.layers.29.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..ac611851a7ab0cf9862b79253a21cdfddedb9dda --- /dev/null +++ b/checkpoint/pytorch_model.bin/p265.model.layers.29.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:972858618eb2976b19436854599c32b6dd928744da311a0883cbf1dacc6cbf75 +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p266.model.layers.29.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p266.model.layers.29.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..907cf56918df3c0752f4550dd0c3d5881cbbc29b --- /dev/null +++ b/checkpoint/pytorch_model.bin/p266.model.layers.29.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:036cb6f60ccc813051ab7734d443bc074f5ebc428e6cbcfd139e4e710816fcc8 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p267.model.layers.29.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p267.model.layers.29.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..f988581b8a86b55137f51a681f52c45f1635096b --- /dev/null +++ b/checkpoint/pytorch_model.bin/p267.model.layers.29.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1970df52599ab4b958cd61e14cc233c25ba0e32d49d223d680f6d1d998c4efd6 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p268.model.layers.29.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p268.model.layers.29.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..4428a79244cbcbd0ef7e946d1a90cf85c3dfaecc --- /dev/null +++ b/checkpoint/pytorch_model.bin/p268.model.layers.29.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17a9b811f4f1a8d155c1ff83529872a94a31c77b46dc47f43acd829f9c776f5a +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p269.model.layers.29.input_layernorm.weight b/checkpoint/pytorch_model.bin/p269.model.layers.29.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..687fb09618ce01e3e76eb059e7e5709d6059749b --- /dev/null +++ b/checkpoint/pytorch_model.bin/p269.model.layers.29.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51ac7227c0873c6ce8fb17210d593d6f08eba4c4853a843caf55737d1569aea2 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p27.model.layers.2.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p27.model.layers.2.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..45e3e336cb21e15dbb64d79b4678c524982d093d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p27.model.layers.2.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b632034035a23958f1e19aad3fe0c87ae1b8876528ea9eefd88baf5d77ada21 +size 17303 diff --git a/checkpoint/pytorch_model.bin/p270.model.layers.29.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p270.model.layers.29.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..b64d572a5ce7271516a8dfabd14ed2bfba2c9f87 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p270.model.layers.29.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c0dcef1e1632c229e4fa16c738978e97965f921ef2892d7e7c2794fcaa29280 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p271.model.layers.30.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p271.model.layers.30.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..5bb2c0277f8833a58c5995a20208e51ef72ef40b --- /dev/null +++ b/checkpoint/pytorch_model.bin/p271.model.layers.30.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5497bc9181f9f7b229238788a08b0c8f6ca06c9616b98f3d1da395338a5578b +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p272.model.layers.30.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p272.model.layers.30.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..6a55095714214f43dfff929e8025c04a18caf243 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p272.model.layers.30.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e07142a200c139978135125a2c6dc4035fb1d79aeb5177cb0a4c6c05ce71ceb2 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p273.model.layers.30.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p273.model.layers.30.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..3e829a9565e27920eaef068ddc5fc6d7dd95645d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p273.model.layers.30.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be9103efe33c289626c1ee89909291616fde2c3a19fba800e6b90602e164caad +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p274.model.layers.30.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p274.model.layers.30.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..59a8d8b2bb8a65f540c7e7843e369a5435018da6 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p274.model.layers.30.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d03109af8b694a23e84457f9c933041d8d9b541c2f1f88761280d82ffacafcfe +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p275.model.layers.30.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p275.model.layers.30.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..bf1e4bccad79c452118f4d0a56333e501958fad4 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p275.model.layers.30.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26db524fa2d97b9f6b7cfb56d6435e0245c5fffac39673ff1b633e40f5f0fb26 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p276.model.layers.30.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p276.model.layers.30.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..51e03162a8a2a8f7f6410cff5917bb8da7cb1f4c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p276.model.layers.30.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c354c734df8cb9cede3bc0f02625fcee30556d110bac12d3c7a0388c884aa7e3 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p277.model.layers.30.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p277.model.layers.30.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..66fc2b5d3dffdaacdf23bd25e5411abcf9cb4fa2 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p277.model.layers.30.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef4dc455bbfc00a5b5bd18dc31e839fbbe52e14f06184757529a51539dedba55 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p278.model.layers.30.input_layernorm.weight b/checkpoint/pytorch_model.bin/p278.model.layers.30.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..6c5f004ac989e3f3d74d3b93cf3f707a2e8e83c8 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p278.model.layers.30.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:690042eb390cee960eaeb4b4e93f4a0c4b606a346aacb4c9035a2742070b9ec2 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p279.model.layers.30.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p279.model.layers.30.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..cc7b8ac0bc6f991292ef1f1e64a295d40c13eccf --- /dev/null +++ b/checkpoint/pytorch_model.bin/p279.model.layers.30.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebf73d2caf0d09e5c290d0c4475510b3503e7ff1f600d509f9cf7fbd045b5545 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p28.model.layers.3.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p28.model.layers.3.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..2afc27c6678b5617227ae1fa6a88371afb85fe50 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p28.model.layers.3.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4be0b6259b40c334027ed3197fd16f8a02a4dd35c667073a301f0a74d7955d3 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p280.model.layers.31.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p280.model.layers.31.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..528c607db33941d4094b111ed3bfd5268ec59006 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p280.model.layers.31.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4b7e4d827071499958140bf31b483c9aeb25997bc068d3dbc5d43d1a3e7a6af +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p281.model.layers.31.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p281.model.layers.31.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..8fe48a036a9513ef3ed8dd4852965ee5fad4a3e5 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p281.model.layers.31.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:072a68039d9244d8117eb4f9aa5a65bc355ce4ccf4ad56cdac6e8f547f9557e6 +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p282.model.layers.31.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p282.model.layers.31.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..6f3e41edd76ced657ef03fca17c2f9f9a174eb27 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p282.model.layers.31.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdaaca877453dff4e86a1071a44f0cb3ccc749cf7f0ad3c2f53861e53ac8fc6f +size 16778117 diff --git a/checkpoint/pytorch_model.bin/p283.model.layers.31.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p283.model.layers.31.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..34d8be02648429283e73dbd32857054797e0d305 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p283.model.layers.31.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8da2afe160a49a5d3104b26bec7aa42e3141d9b21223467e695b30c7e4510fd +size 67109765 diff --git a/checkpoint/pytorch_model.bin/p284.model.layers.31.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p284.model.layers.31.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..aceb8f6b67058f28e309b11521f52a1dbeeb6b55 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p284.model.layers.31.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf447d6d0a4ed94342ba1f4d5022ed7169d4d57ccd55dfc5fb5010abbd446c9 +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p285.model.layers.31.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p285.model.layers.31.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..9126b007f9294f0cbb16def9852d662a52267139 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p285.model.layers.31.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22cb5c096317c9c1d0a0ce41ad03d9084ea97f2e7bae86c3d1871ad71299b50b +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p286.model.layers.31.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p286.model.layers.31.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..a20c0e03332cdab4efc4a0adfdab816eacc91ebc --- /dev/null +++ b/checkpoint/pytorch_model.bin/p286.model.layers.31.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bddcce6c90091307ee0ddbdf8a34b530371828d23038e6b3df3c0ceb968347dd +size 234881916 diff --git a/checkpoint/pytorch_model.bin/p287.model.layers.31.input_layernorm.weight b/checkpoint/pytorch_model.bin/p287.model.layers.31.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..64dcb76bb47cf1958dfd80baf8ea6547547a9534 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p287.model.layers.31.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ceeb5462b0052ad6d61efcac3b9710ee338b40840e3f345abdc7767ab604fa4 +size 17282 diff --git a/checkpoint/pytorch_model.bin/p288.model.layers.31.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p288.model.layers.31.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..e493466cf7e460dcf9d3d56940e0c8741aaf124d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p288.model.layers.31.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7aba6dc88628b1cdf7be05dc86bb679ee41ac1a5db7ff1553ac46a0c612ac98 +size 17309 diff --git a/checkpoint/pytorch_model.bin/p289.model.norm.weight b/checkpoint/pytorch_model.bin/p289.model.norm.weight new file mode 100644 index 0000000000000000000000000000000000000000..aa87701aa4252c07414dfe3aeeb842a03db9111b --- /dev/null +++ b/checkpoint/pytorch_model.bin/p289.model.norm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0823f2fb24b8143b2aad532aea8362f42471fdd0c45bd8115af2c475bca6590b +size 17155 diff --git a/checkpoint/pytorch_model.bin/p29.model.layers.3.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p29.model.layers.3.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..3b4004fa976000a43bc8e8df3e4989b04e7bc906 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p29.model.layers.3.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee19110c6d5b6ca94979ec5783f915f970949b306f7a03483671365804ddd709 +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p290.lm_head.weight b/checkpoint/pytorch_model.bin/p290.lm_head.weight new file mode 100644 index 0000000000000000000000000000000000000000..e4374710fc718da2c4696cc89a5d5e8d16ac63bf --- /dev/null +++ b/checkpoint/pytorch_model.bin/p290.lm_head.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e5f8818f0f5e4e37feaad7e000489afe1cb99ea974155ab80c0231b6655146 +size 524288762 diff --git a/checkpoint/pytorch_model.bin/p3.model.layers.0.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p3.model.layers.0.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..cc2df6af8ee68b63d73564e2ce9c8285db59b0de --- /dev/null +++ b/checkpoint/pytorch_model.bin/p3.model.layers.0.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872901360c6f3dccf7096ab9bf9949e4a8798a17be2641a5c3b241857e834d53 +size 16778108 diff --git a/checkpoint/pytorch_model.bin/p30.model.layers.3.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p30.model.layers.3.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..7f4a934d059e0f02688dc6934348b622843cf378 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p30.model.layers.3.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d575fd78a7061bce8bd5dc07b94d239d6bc6243ddc02998a90b033bf403eb28 +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p31.model.layers.3.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p31.model.layers.3.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..24a450c934bc1d79380631ca513e909c66e12369 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p31.model.layers.3.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc9e5be263c8a3f5ce182deb8923b3a1744c0d55c48a7a25e7f88c3349e590a0 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p32.model.layers.3.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p32.model.layers.3.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..29b4c7983ccf4aa958f3d129ce2366c958de392e --- /dev/null +++ b/checkpoint/pytorch_model.bin/p32.model.layers.3.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b92853652403a4ba1916eccef6be8b3b5a54dd38f72dbd991dd646c0339e8a4b +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p33.model.layers.3.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p33.model.layers.3.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..1ba865a46d9d75d13ae9fc779e7d8d25fbdd3892 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p33.model.layers.3.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9c60c2a4ce1bc8aabf22e0a9426d64f7309b1278105bfb6a1f617a371014973 +size 234881904 diff --git a/checkpoint/pytorch_model.bin/p34.model.layers.3.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p34.model.layers.3.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..7ec2e3d47ad912b92ba5088d903b984dcccf5520 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p34.model.layers.3.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d60b54006f85de0b1f87cfde6f3567a59576337a749fe19e09381da5daf11427 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p35.model.layers.3.input_layernorm.weight b/checkpoint/pytorch_model.bin/p35.model.layers.3.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..98c58bf8d70c1b3ccdd6b67d544a5fa857d45407 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p35.model.layers.3.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e800e7aca5d65977ca139e5a5ed46c520ba305d9b22f046b7ac82d10e6a14808 +size 17276 diff --git a/checkpoint/pytorch_model.bin/p36.model.layers.3.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p36.model.layers.3.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..9869ab5ea9efbd29c01a23830b434d61bf79c9cf --- /dev/null +++ b/checkpoint/pytorch_model.bin/p36.model.layers.3.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9701b538371a6db93185522cdcdea12edcf9dce3b0dae3ec21957bfe07980f8 +size 17303 diff --git a/checkpoint/pytorch_model.bin/p37.model.layers.4.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p37.model.layers.4.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..a01e894df444ebe3c12f570ec304bc0663bf18d7 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p37.model.layers.4.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bca333ac1dea16d72de5eef93384752be9859a03e99374348c90994af10c5eb8 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p38.model.layers.4.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p38.model.layers.4.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..8a6ef9bba5ae1eead51b157d76887fe7957e30b4 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p38.model.layers.4.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9200b669d615e0b6358639b477a49b2009ec406ec7d20c251e5f7c7ab16d36c +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p39.model.layers.4.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p39.model.layers.4.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..04113a73965f8288932b9a4bc926f11a61ac3216 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p39.model.layers.4.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd2dda95c5a3ac2d6989208dfb4aec623ec034b5ad70b869fd22dc69db9b0a0f +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p4.model.layers.0.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p4.model.layers.0.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..8963eab207a7d07e9033146f973a12728f0b2fb2 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p4.model.layers.0.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3026ee4c6a18ed59667ca3a8786c9759f06b7f2b0cd8b0a03007bca52c3a568b +size 67109756 diff --git a/checkpoint/pytorch_model.bin/p40.model.layers.4.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p40.model.layers.4.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..495b7e7038e617f9331f52ff2ef57ba00044aac3 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p40.model.layers.4.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09496ed58db33c4fbcd551c33ee815579781d2f932d57af8126a85590d3873cd +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p41.model.layers.4.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p41.model.layers.4.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..9dcf99a02f5372179e92ff6aa6493776a1b9cc3d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p41.model.layers.4.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e30a4cf1887195bf2195d2f8abfe59279265692d2c848d364e14b96f751fafdc +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p42.model.layers.4.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p42.model.layers.4.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..b6914c655f91ca5ec2b24986b8bdd9172dd0a3b9 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p42.model.layers.4.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f5cb9c1289315f26ea8635d18c5cf54f1fbeca26d4b782bd81522b68f8de440 +size 234881904 diff --git a/checkpoint/pytorch_model.bin/p43.model.layers.4.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p43.model.layers.4.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..e2a9fadcfde5d857d60a15a38bf7e3ab534bd063 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p43.model.layers.4.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b464a79df431c80009a1fd02094cf3dc38d690a608276b28411008c13826529 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p44.model.layers.4.input_layernorm.weight b/checkpoint/pytorch_model.bin/p44.model.layers.4.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..c6e71931ccc4c26feb6a019f2c935cc617a7778d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p44.model.layers.4.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b67f7fd221644d2dc03ffc691e70104d506c0779434d12fc23faa136d4b1de0 +size 17276 diff --git a/checkpoint/pytorch_model.bin/p45.model.layers.4.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p45.model.layers.4.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..1d98129bafa8fb241db4b74c2d182d99045ea04a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p45.model.layers.4.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d75c8580537b74405ec44b9c3f0a2313dc19b60f2ec9d10bfdd2c056de2675f9 +size 17303 diff --git a/checkpoint/pytorch_model.bin/p46.model.layers.5.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p46.model.layers.5.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..1430547959e695654b916f99d9225b61ce9a254c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p46.model.layers.5.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3047572c0a6b555dc5d0c437a8415d6113f52aab6621796b0de6fdce2f007900 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p47.model.layers.5.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p47.model.layers.5.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..a6eed95900b865c6d897838a3412f19e12548e5d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p47.model.layers.5.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c561366b8cdd07c763e53f0847eadf9c10c5255bb739224cf56c8c12a94074d7 +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p48.model.layers.5.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p48.model.layers.5.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..c2c92ec6d6b135d3c273d72fe75733c0bed7dfb0 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p48.model.layers.5.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9ba115f5a63444f637daddbbaad06cf34df4c2cbc88508492f0469fea005380 +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p49.model.layers.5.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p49.model.layers.5.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..77538f5661c9286fe4ca4bd7cba70ef7d0a5e004 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p49.model.layers.5.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fa33b2d3f7fe4017315c30a77a2a8a8addb23a6bc4a4dacb6d2ff0b34fa5744 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p5.model.layers.0.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p5.model.layers.0.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..ab91a5c7e19506c8b75cedd8fcf0c9c73fdff946 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p5.model.layers.0.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:107ef85ba31af6c68e107574ec007322c2a9aa492517bf68163c4d38b18da990 +size 234881907 diff --git a/checkpoint/pytorch_model.bin/p50.model.layers.5.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p50.model.layers.5.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..cb5c357deccf525f05ae0eb91f1c928a630e7548 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p50.model.layers.5.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d6c758a02a3c02c1801d8b214b7c36491edda74ecfae9d470d90b610c95518 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p51.model.layers.5.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p51.model.layers.5.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..83e4a58de7a90a5f569d2b72f7fa1cb684cc96fe --- /dev/null +++ b/checkpoint/pytorch_model.bin/p51.model.layers.5.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7400d5c216243e4da6ae01000a5b9daea08df2929f952fcfa3cd42385b2e5efd +size 234881904 diff --git a/checkpoint/pytorch_model.bin/p52.model.layers.5.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p52.model.layers.5.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..cf021dddfd70c3ebb9c2fb09e4c9a64848e20f0b --- /dev/null +++ b/checkpoint/pytorch_model.bin/p52.model.layers.5.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7de8724204efe0ad8a47a01a9ca693d570b910d8396734a56f064d7f29524aa3 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p53.model.layers.5.input_layernorm.weight b/checkpoint/pytorch_model.bin/p53.model.layers.5.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..7f10297410fa1456b085a3d7647f628895ada529 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p53.model.layers.5.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfa8c1dac7bfa0919229a850341e6399560752e7f4d2acd79b880dca4bd8c61d +size 17276 diff --git a/checkpoint/pytorch_model.bin/p54.model.layers.5.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p54.model.layers.5.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..06680b1af24f1cde05f2c9c0befd4fe0ecd9a47c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p54.model.layers.5.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8271141727186934ec04365884d5ec2ca0e8ffae6f779506de1c342d17d0c11d +size 17303 diff --git a/checkpoint/pytorch_model.bin/p55.model.layers.6.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p55.model.layers.6.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..0646b3bd165f6eee3210192992bb3b275bd10e4c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p55.model.layers.6.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ead4b679506e36fc4eacacd44cc594db1d80877b452948c8056eff9664f205 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p56.model.layers.6.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p56.model.layers.6.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..3753445a05920581ff0f0f589bab31253ec29aa2 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p56.model.layers.6.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:459f3e85c2ad1e89990eda29be99770d473c3fc17fa60c5e191b838527f41c6f +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p57.model.layers.6.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p57.model.layers.6.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..3a94f5dfee026c7f963b9f6458b2fe03480f4283 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p57.model.layers.6.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4a2b3a2066e4334d1e0a41999f8d9b835a5e5dc0a18a842bd14d44c6a63e723 +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p58.model.layers.6.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p58.model.layers.6.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..35a6f7c72d1beecb084f20b45e5282040bc91c5a --- /dev/null +++ b/checkpoint/pytorch_model.bin/p58.model.layers.6.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b2d9e43837eb485e6844cfd94b5988d5e20b09f193457c9301a64208042d7a6 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p59.model.layers.6.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p59.model.layers.6.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..bd70fba87c302ef4a1860826bde6355094ff3517 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p59.model.layers.6.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44fe29246e72e9dffa244eb1cffd415c729b43306bb4a8e759f9c8e3b9d4d4e1 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p6.model.layers.0.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p6.model.layers.0.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..60c217e46eb65fac115d8d6049e2d598b14be3ee --- /dev/null +++ b/checkpoint/pytorch_model.bin/p6.model.layers.0.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce3cbc045a92da00d37c7c270612c8ec6fe6e3ef13ba2b4c1cbf2212be350511 +size 234881901 diff --git a/checkpoint/pytorch_model.bin/p60.model.layers.6.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p60.model.layers.6.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..960a0396ffd67824dd370a63a6d001295036fa21 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p60.model.layers.6.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63553a6a3cb3d9b86876fcf57d4d629741f2b4db17635d9ceca085668db6fcfd +size 234881904 diff --git a/checkpoint/pytorch_model.bin/p61.model.layers.6.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p61.model.layers.6.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..dbcf569d8f93d3cc6145b1d5a9711d9efc0f1eba --- /dev/null +++ b/checkpoint/pytorch_model.bin/p61.model.layers.6.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8016edc1b7d3ed82403ab7106471bcd664b506f81bf35400a090b747f5b026a2 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p62.model.layers.6.input_layernorm.weight b/checkpoint/pytorch_model.bin/p62.model.layers.6.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..41372d4e7fa7d00be00ce2c7f0ac29c51e3c121e --- /dev/null +++ b/checkpoint/pytorch_model.bin/p62.model.layers.6.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d3290473c62028bf6927bf204dd92baab7253a1ef5cefe4e3776dfc4ff36f2c +size 17276 diff --git a/checkpoint/pytorch_model.bin/p63.model.layers.6.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p63.model.layers.6.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..2ef3b19dcbef920455bc81053abf61c5fa4a3640 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p63.model.layers.6.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86995eceee10fc04457618de91f7a55e63e1f193078aa87dccd7132601a952b0 +size 17303 diff --git a/checkpoint/pytorch_model.bin/p64.model.layers.7.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p64.model.layers.7.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..f7b48fa0549e63f03eebdde957e7c97bd9b1a6af --- /dev/null +++ b/checkpoint/pytorch_model.bin/p64.model.layers.7.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:058d44315759983c287fa4cbc9b55dcf435bcf0094ee68c1118d065d4a9623e5 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p65.model.layers.7.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p65.model.layers.7.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..7069cd50d7c3ca264cca9e4e3e8a3e414491fa75 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p65.model.layers.7.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e14c049cf918002c1a530dd8e88fd4ada13f3e290a5f6f2ba384fe3b7dfafcb +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p66.model.layers.7.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p66.model.layers.7.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..6d27cb81a0584b3144f0d48a8e953731f7c443b9 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p66.model.layers.7.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:241e9a2e92ee598619a6f79e75820475ccdd3cc5e7205d9e208bc18ea3046b2c +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p67.model.layers.7.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p67.model.layers.7.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..bbf3f369447cc57fb7c16bf680461e7458289131 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p67.model.layers.7.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f76b6aa74f175619b660d878ba7862aafd18e7f2675e97f6c7b9b02426b00992 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p68.model.layers.7.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p68.model.layers.7.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..2b0b8d5b756303559a365f08aae8c1e611e849a0 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p68.model.layers.7.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9cd2ab4f32cb671e591a2db539c90cd290444aa74fb836b2566e1dd649e8156 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p69.model.layers.7.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p69.model.layers.7.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..26e10c5411b5aa21422ee796674592069c30710b --- /dev/null +++ b/checkpoint/pytorch_model.bin/p69.model.layers.7.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17fcdee443613486486feccdaae009fe7a67b2ee488b84347c65a6e647448692 +size 234881904 diff --git a/checkpoint/pytorch_model.bin/p7.model.layers.0.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p7.model.layers.0.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..dd6002507cc35d979c05f2978b73b20cd0853a47 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p7.model.layers.0.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d83269426ea2148c0ecb892c41b7cbd14ef18a1f1c0660a0fd3860fbf040e13 +size 234881907 diff --git a/checkpoint/pytorch_model.bin/p70.model.layers.7.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p70.model.layers.7.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..f54ad575410bbeeed04e384dac46c58d136d0cf3 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p70.model.layers.7.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b157befa018fa018e4a57009fa35dc66db8a1f4ce3a39485c117d3d6ad64999 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p71.model.layers.7.input_layernorm.weight b/checkpoint/pytorch_model.bin/p71.model.layers.7.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..9b0377921b000da108f40e2c588b6a0ebb2f5358 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p71.model.layers.7.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc36b626ab57054952e1ac3e120f740e33dbdf6f33307f0ce62311a2131abf23 +size 17276 diff --git a/checkpoint/pytorch_model.bin/p72.model.layers.7.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p72.model.layers.7.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..59395b0e60cef530b85a7dfde71d25f4ff30bcd9 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p72.model.layers.7.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0ed36a395f0b03d3522e73ebad59c2dc25c007439c9cb607a54d36395a49887 +size 17303 diff --git a/checkpoint/pytorch_model.bin/p73.model.layers.8.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p73.model.layers.8.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..ef96fe086f9d4f44e65bc8cdb08dcbc96453e182 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p73.model.layers.8.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfd87b959bfa41d8d6f112904fc579d0f46e608895c453fa0dabe8e108828faf +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p74.model.layers.8.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p74.model.layers.8.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..293f43f4d8fe19ceabbb07b7c325807447fe94e8 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p74.model.layers.8.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea2d5c3de961821e24fee1d8b8b56a78e8b445258d6fdc176f68808bd66b1f65 +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p75.model.layers.8.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p75.model.layers.8.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..faf1181507adb1ccf0cbdbc9eebadf80efea56b1 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p75.model.layers.8.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ff2dad4ddc679532d7353bff3ca471aadbffa9293800c4374b08317daf0e035 +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p76.model.layers.8.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p76.model.layers.8.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..1da82207babe6c598771374e39c07a3599167c6c --- /dev/null +++ b/checkpoint/pytorch_model.bin/p76.model.layers.8.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9bea7591adfd87b759a743616c1f0e3d4da5e8382dd6b087aa89932943c8f2a +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p77.model.layers.8.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p77.model.layers.8.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..a7fa2318cfc75a6e95244a8a6e284cd4c90575b5 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p77.model.layers.8.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57810360420d6dd749af28cd1f3dbf8e7c84d5c4868bb5fb3f07c1ae33037597 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p78.model.layers.8.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p78.model.layers.8.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..0bb54e89bc0fd4aa6d153389f9ff496d8c159c74 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p78.model.layers.8.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c3fd5fccadfce643e9d1ad00e3dc6fe3ac029594ce6e81b416beb0abf1de99c +size 234881904 diff --git a/checkpoint/pytorch_model.bin/p79.model.layers.8.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p79.model.layers.8.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..54a3adc4b608b9a37741ab6e34bc4de99fdf5fa5 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p79.model.layers.8.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c84b02f147f88c17bc33978f1d05dfad4d51db4982e32429c8e909d1d7118387 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p8.model.layers.0.input_layernorm.weight b/checkpoint/pytorch_model.bin/p8.model.layers.0.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..a0796e1256dc0724b10867ae37121ff414b87c00 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p8.model.layers.0.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db8a85891dba6e37d35dfe3ffd5f18305ccdcc104d8941ac0632b0178f5e912 +size 17273 diff --git a/checkpoint/pytorch_model.bin/p80.model.layers.8.input_layernorm.weight b/checkpoint/pytorch_model.bin/p80.model.layers.8.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..56854dba6f74b8809daa365a51c6a9889a5d5f97 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p80.model.layers.8.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fe1decf2e21cbc4bf713f5547c2a6083a3b6fccc471a153fcdca823b7a27e2b +size 17276 diff --git a/checkpoint/pytorch_model.bin/p81.model.layers.8.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p81.model.layers.8.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..9fbb3083ed0cc56f23a417a09ce14bb80e79d564 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p81.model.layers.8.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb869042178f1c6d38c58f9e4d5b03a820e281c6d6724655348772bebb339c74 +size 17303 diff --git a/checkpoint/pytorch_model.bin/p82.model.layers.9.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p82.model.layers.9.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..ec53b2ddab5a7fe80b0f056d62df4a6ed6b99ca9 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p82.model.layers.9.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0087663a717093d04070251b7cb915c30db412e30f7cf69b8a3cfb83df8cddf9 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p83.model.layers.9.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p83.model.layers.9.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..9a4f7a0fdd60e9441b10ea2d4c75c615e13a2671 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p83.model.layers.9.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ffc879f39aa4702a2b389f7aa4af124b4a4f6de7a1d8580755508298666914d +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p84.model.layers.9.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p84.model.layers.9.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..5bdd8f263c7509baa5a501863c2d7f3ddd8d8830 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p84.model.layers.9.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4792b60c188ccd7f66d98da639657f680fcac783eebb2e7266bd649dbde98163 +size 16778111 diff --git a/checkpoint/pytorch_model.bin/p85.model.layers.9.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p85.model.layers.9.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..8d90018f97dfb447b6a5c3e3f4d6572a8e553e14 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p85.model.layers.9.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f7273d61ae39ae46ae3018c8aef85c393da1bd1b047fcddaf43481f1d15b054 +size 67109759 diff --git a/checkpoint/pytorch_model.bin/p86.model.layers.9.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p86.model.layers.9.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..5924fdbfed96568aea3ae4fbda374067288deab0 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p86.model.layers.9.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cac3c7bc30164e413385a8d9dfefe6b40464452ce68946abccb9cc7a107767d8 +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p87.model.layers.9.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p87.model.layers.9.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..2f54b17f444cd45aee7b08151000fa8172e336eb --- /dev/null +++ b/checkpoint/pytorch_model.bin/p87.model.layers.9.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6a365bbf7d0f13b5b174733d29784289d2b5724155a81f5c38d961019435779 +size 234881904 diff --git a/checkpoint/pytorch_model.bin/p88.model.layers.9.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p88.model.layers.9.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..7f3893676eff2416c56538dfad9ce02090bd80ae --- /dev/null +++ b/checkpoint/pytorch_model.bin/p88.model.layers.9.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ed6ee9edfbe4b96f4c453779128b3d99077453accbcbc35ad7ff613bae97d4f +size 234881910 diff --git a/checkpoint/pytorch_model.bin/p89.model.layers.9.input_layernorm.weight b/checkpoint/pytorch_model.bin/p89.model.layers.9.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..65b37cc5cc337efc16b194ebd7b8ad63cbb314b5 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p89.model.layers.9.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f56900faba8b4fb13a14c1714f4f370479685e1bc52d35e4378a35ea8365ffaf +size 17276 diff --git a/checkpoint/pytorch_model.bin/p9.model.layers.0.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p9.model.layers.0.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..478488636fc2dc884e720c0d415d839e62ce4049 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p9.model.layers.0.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39bf5930bc9d6a6dd149c66bd6e6387fb756d62a93222dab3e2b9807e071f17f +size 17300 diff --git a/checkpoint/pytorch_model.bin/p90.model.layers.9.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p90.model.layers.9.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..5c04711c8f8ecccd4c8ad19e3356d9552672438d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p90.model.layers.9.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38814ec421354a60fcb43474ffb00700eb1e7b594a4e5aaa7e2f864eb41b241f +size 17303 diff --git a/checkpoint/pytorch_model.bin/p91.model.layers.10.self_attn.q_proj.weight b/checkpoint/pytorch_model.bin/p91.model.layers.10.self_attn.q_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..b6ab45b086368ecc24cdb2fa21e547b2b891c9e0 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p91.model.layers.10.self_attn.q_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe3b8e9df28b3118b02a0c69ab44948b3c66732b04038ecbc72c61cce520ff78 +size 67109762 diff --git a/checkpoint/pytorch_model.bin/p92.model.layers.10.self_attn.k_proj.weight b/checkpoint/pytorch_model.bin/p92.model.layers.10.self_attn.k_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..671f00aa5fcc06489b2bd612a88698eb301c6ab4 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p92.model.layers.10.self_attn.k_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e09e8ffe98f0eff3f6569b55f2529d877d836961fa55661b5978c624381f63d +size 16778114 diff --git a/checkpoint/pytorch_model.bin/p93.model.layers.10.self_attn.v_proj.weight b/checkpoint/pytorch_model.bin/p93.model.layers.10.self_attn.v_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..ee930eabd044b382ce406747512572c922f6a1ba --- /dev/null +++ b/checkpoint/pytorch_model.bin/p93.model.layers.10.self_attn.v_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2be7ee00920dca57679f2ee541d36831dfe815ba5460fcd069eed1d9064e8445 +size 16778114 diff --git a/checkpoint/pytorch_model.bin/p94.model.layers.10.self_attn.o_proj.weight b/checkpoint/pytorch_model.bin/p94.model.layers.10.self_attn.o_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..213b91f13cf374e2c5b36a80a0236351129aaaf5 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p94.model.layers.10.self_attn.o_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaa95ddc69c23b3d7728827662d6b8a70af6e88be469dc737dbf273153bbaef1 +size 67109762 diff --git a/checkpoint/pytorch_model.bin/p95.model.layers.10.mlp.gate_proj.weight b/checkpoint/pytorch_model.bin/p95.model.layers.10.mlp.gate_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..cbf36c4c71df41f7560806d3e9d626e2b57c553d --- /dev/null +++ b/checkpoint/pytorch_model.bin/p95.model.layers.10.mlp.gate_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc62e091ac24078b9ad1fd987b37bd602cd716046f56bafd2c5390128a9082c5 +size 234881913 diff --git a/checkpoint/pytorch_model.bin/p96.model.layers.10.mlp.up_proj.weight b/checkpoint/pytorch_model.bin/p96.model.layers.10.mlp.up_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..ca34b3035a23cd0d24c44cb665a6ccae35b61293 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p96.model.layers.10.mlp.up_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44ddcf0fdc37c330e1e4b95f04ef2438e1280d7c27b050fb1a27fa3b1fdd65e9 +size 234881907 diff --git a/checkpoint/pytorch_model.bin/p97.model.layers.10.mlp.down_proj.weight b/checkpoint/pytorch_model.bin/p97.model.layers.10.mlp.down_proj.weight new file mode 100644 index 0000000000000000000000000000000000000000..63abda731886733bd7373a2b5c9e3729e6ed4a47 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p97.model.layers.10.mlp.down_proj.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f14b99d819888161a9c1ff3f501ae31baa362f769fc6d99f2c07ee0ea7a2b86 +size 234881913 diff --git a/checkpoint/pytorch_model.bin/p98.model.layers.10.input_layernorm.weight b/checkpoint/pytorch_model.bin/p98.model.layers.10.input_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..1919f15a2bb40875e41a47971bc0b7e818d67f66 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p98.model.layers.10.input_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4787f2932a6f6e1b19067a860815a6dd488b45f411035cc3084a7a0df8896d82 +size 17279 diff --git a/checkpoint/pytorch_model.bin/p99.model.layers.10.post_attention_layernorm.weight b/checkpoint/pytorch_model.bin/p99.model.layers.10.post_attention_layernorm.weight new file mode 100644 index 0000000000000000000000000000000000000000..9b53fc161a14f673cbe60031fb8ca82bd8696874 --- /dev/null +++ b/checkpoint/pytorch_model.bin/p99.model.layers.10.post_attention_layernorm.weight @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1129e2dedc5186a59a3ecb2582634b4e20dfffcbd24ed09444c75d2dcdd0135c +size 17306 diff --git a/compiled/42892ca1835c7f1ee360.neff b/compiled/42892ca1835c7f1ee360.neff new file mode 100644 index 0000000000000000000000000000000000000000..ccfecd5212cae67b12b464196c1a377e3a8d10d5 --- /dev/null +++ b/compiled/42892ca1835c7f1ee360.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2360b5a2fbcc8f95842dd05d82d0a33e314c4255b16a1bb4e3ded98aa1ebd619 +size 26829824 diff --git a/compiled/5f563a8109c06154fd1a.neff b/compiled/5f563a8109c06154fd1a.neff new file mode 100644 index 0000000000000000000000000000000000000000..571f9f1ea54754673a27105f1b650766b7721811 --- /dev/null +++ b/compiled/5f563a8109c06154fd1a.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:955ae6b6a812e0f92a9ef0f773f76f459b00df2cd20dd83d76c18cf28610710c +size 11367424 diff --git a/compiled/81e045aa41db6708aa20.neff b/compiled/81e045aa41db6708aa20.neff new file mode 100644 index 0000000000000000000000000000000000000000..82ae71a84cc0767c9fd1603e9404b03aca8289fd --- /dev/null +++ b/compiled/81e045aa41db6708aa20.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0ac6027ce5c9b520f2bb0ab380a6cc350195f33be0c96d6d006ad6d3ba22b27 +size 7947264 diff --git a/compiled/9e156236317bf9a3f88c.neff b/compiled/9e156236317bf9a3f88c.neff new file mode 100644 index 0000000000000000000000000000000000000000..833fe9ce229f3995a1100253a4fe3423c99d1f12 --- /dev/null +++ b/compiled/9e156236317bf9a3f88c.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f89c094db7ed55c0db17abf5ee08bdad14b0c02f67fa1c30d6198a46edc9620 +size 7988224 diff --git a/compiled/a5a606ee7f9b51e4eb22.neff b/compiled/a5a606ee7f9b51e4eb22.neff new file mode 100644 index 0000000000000000000000000000000000000000..dc0a59f248f6f4ec550358d08c8f2514ad2009de --- /dev/null +++ b/compiled/a5a606ee7f9b51e4eb22.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08fec642d1ecac1f81dfc60018abec3b3d3c6135fdb71e45c7d4ec43303b5390 +size 9042944 diff --git a/compiled/ba2c6f82564581eac7de.neff b/compiled/ba2c6f82564581eac7de.neff new file mode 100644 index 0000000000000000000000000000000000000000..e26d6b40206f0e4db9848e6a987992e151fa2d87 --- /dev/null +++ b/compiled/ba2c6f82564581eac7de.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42519f9424c5f94aaf9b006d42f3c02925a44db85140b240bc0dab5b519100ba +size 7640064 diff --git a/compiled/bc1b3efbe17382b052dc.neff b/compiled/bc1b3efbe17382b052dc.neff new file mode 100644 index 0000000000000000000000000000000000000000..5cdef8597d0782f4c10754f45d94e6736ce180d5 --- /dev/null +++ b/compiled/bc1b3efbe17382b052dc.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:655eb5bb5ef10c66fc10131cbede36ff06d7d3f05633bd5023fbee1bcf0171a9 +size 7681024 diff --git a/compiled/c13580424e448f3adb62.neff b/compiled/c13580424e448f3adb62.neff new file mode 100644 index 0000000000000000000000000000000000000000..d3e8fc98f4a7c45efe5d4472f0f0ff86bcd3f895 --- /dev/null +++ b/compiled/c13580424e448f3adb62.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93d3345a258c792d64b5b732a2ef8d3ca1d483c991b110e6f876e98a129d0913 +size 8459264 diff --git a/compiled/cd7da042b94df6a02f61.neff b/compiled/cd7da042b94df6a02f61.neff new file mode 100644 index 0000000000000000000000000000000000000000..54498957deeb8e025f97207336fbe3ccec418d7c --- /dev/null +++ b/compiled/cd7da042b94df6a02f61.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48db029b385ad0c8af8c3d22562565e61043f96747de7ae137a0b282873daa93 +size 7742464 diff --git a/compiled/d0dad260213be0bab13e.neff b/compiled/d0dad260213be0bab13e.neff new file mode 100644 index 0000000000000000000000000000000000000000..0b37e355d31617f4fe2c1e3372a84529ced723f1 --- /dev/null +++ b/compiled/d0dad260213be0bab13e.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3127242cd45689e7c0e45e892dc0e0d53420039cb98470916287b9ce92df56bb +size 7558144 diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e633c79736a6025ec6736f0f6cc1fe8eb021cd17 --- /dev/null +++ b/config.json @@ -0,0 +1,37 @@ +{ + "_name_or_path": "Mistral-7B-Instruct-v0.2/config.json", + "architectures": [ + "MistralForCausalLM" + ], + "attention_dropout": 0.0, + "bos_token_id": 1, + "eos_token_id": 2, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 32768, + "model_type": "mistral", + "neuron": { + "auto_cast_type": "fp16", + "batch_size": 1, + "checkpoint_id": null, + "checkpoint_revision": null, + "compiler_type": "neuronx-cc", + "compiler_version": "2.12.68.0+4480452af", + "num_cores": 2, + "sequence_length": 2048, + "task": "text-generation" + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-05, + "rope_theta": 1000000.0, + "sliding_window": 4096, + "tie_word_embeddings": false, + "torch_dtype": "bfloat16", + "transformers_version": "4.36.2", + "use_cache": true, + "vocab_size": 32000 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c533f934c6359393a56a3ea067a0df118c14797e --- /dev/null +++ b/generation_config.json @@ -0,0 +1,6 @@ +{ + "_from_model_config": true, + "bos_token_id": 1, + "eos_token_id": 2, + "transformers_version": "4.36.2" +}