zembers committed on
Commit
e483980
·
0 Parent(s):
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +35 -0
  2. config.json +30 -0
  3. generation_config.json +6 -0
  4. pytorch_model-00001-of-00098.bin +3 -0
  5. pytorch_model-00002-of-00098.bin +3 -0
  6. pytorch_model-00003-of-00098.bin +3 -0
  7. pytorch_model-00004-of-00098.bin +3 -0
  8. pytorch_model-00005-of-00098.bin +3 -0
  9. pytorch_model-00006-of-00098.bin +3 -0
  10. pytorch_model-00007-of-00098.bin +3 -0
  11. pytorch_model-00008-of-00098.bin +3 -0
  12. pytorch_model-00009-of-00098.bin +3 -0
  13. pytorch_model-00010-of-00098.bin +3 -0
  14. pytorch_model-00011-of-00098.bin +3 -0
  15. pytorch_model-00012-of-00098.bin +3 -0
  16. pytorch_model-00014-of-00098.bin +3 -0
  17. pytorch_model-00015-of-00098.bin +3 -0
  18. pytorch_model-00016-of-00098.bin +3 -0
  19. pytorch_model-00017-of-00098.bin +3 -0
  20. pytorch_model-00018-of-00098.bin +3 -0
  21. pytorch_model-00019-of-00098.bin +3 -0
  22. pytorch_model-00020-of-00098.bin +3 -0
  23. pytorch_model-00021-of-00098.bin +3 -0
  24. pytorch_model-00022-of-00098.bin +3 -0
  25. pytorch_model-00023-of-00098.bin +3 -0
  26. pytorch_model-00024-of-00098.bin +3 -0
  27. pytorch_model-00025-of-00098.bin +3 -0
  28. pytorch_model-00026-of-00098.bin +3 -0
  29. pytorch_model-00027-of-00098.bin +3 -0
  30. pytorch_model-00028-of-00098.bin +3 -0
  31. pytorch_model-00029-of-00098.bin +3 -0
  32. pytorch_model-00030-of-00098.bin +3 -0
  33. pytorch_model-00031-of-00098.bin +3 -0
  34. pytorch_model-00032-of-00098.bin +3 -0
  35. pytorch_model-00033-of-00098.bin +3 -0
  36. pytorch_model-00034-of-00098.bin +3 -0
  37. pytorch_model-00035-of-00098.bin +3 -0
  38. pytorch_model-00036-of-00098.bin +3 -0
  39. pytorch_model-00037-of-00098.bin +3 -0
  40. pytorch_model-00038-of-00098.bin +3 -0
  41. pytorch_model-00039-of-00098.bin +3 -0
  42. pytorch_model-00040-of-00098.bin +3 -0
  43. pytorch_model-00041-of-00098.bin +3 -0
  44. pytorch_model-00042-of-00098.bin +3 -0
  45. pytorch_model-00043-of-00098.bin +3 -0
  46. pytorch_model-00044-of-00098.bin +3 -0
  47. pytorch_model-00045-of-00098.bin +3 -0
  48. pytorch_model-00046-of-00098.bin +3 -0
  49. pytorch_model-00047-of-00098.bin +3 -0
  50. pytorch_model-00048-of-00098.bin +3 -0
.gitattributes ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/NFS/models/mistralai/Mixtral-8x7B-Instruct-v0.1",
3
+ "architectures": [
4
+ "MixtralForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 4096,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 14336,
13
+ "max_position_embeddings": 32768,
14
+ "model_type": "mixtral",
15
+ "num_attention_heads": 32,
16
+ "num_experts_per_tok": 2,
17
+ "num_hidden_layers": 32,
18
+ "num_key_value_heads": 8,
19
+ "num_local_experts": 8,
20
+ "output_router_logits": false,
21
+ "rms_norm_eps": 1e-05,
22
+ "rope_theta": 1000000.0,
23
+ "router_aux_loss_coef": 0.02,
24
+ "sliding_window": null,
25
+ "tie_word_embeddings": false,
26
+ "torch_dtype": "bfloat16",
27
+ "transformers_version": "4.36.2",
28
+ "use_cache": true,
29
+ "vocab_size": 32000
30
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "transformers_version": "4.36.2"
6
+ }
pytorch_model-00001-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c2c0476a2f2f33538300d96d608294aa5062fd1b9285fa2c8465aaca863b1d3
3
+ size 933302768
pytorch_model-00002-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:248ebc6d41a163305f6f9d088a02264130ce16f25bca3ca8dd95bb4076e15a1f
3
+ size 939527804
pytorch_model-00003-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:180025e77c6c8e8bf84abb3579fb665411c0c7e09dea7757e1a42cce1d4fce1e
3
+ size 939527804
pytorch_model-00004-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:015b464d5d85902b1f256da917a0ce025427c10350433d59d59c006f497c7552
3
+ size 906057190
pytorch_model-00005-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3e6737993b044fd550ec4a9a496faeac60a80e4179b2269fb7262ef248a6ddc
3
+ size 939527804
pytorch_model-00006-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be993201935c4b7f5044b2c0fc8897cbb9dc0f10a3bd67e5256540ee427bd66f
3
+ size 939527804
pytorch_model-00007-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca1d0d0a3d18f516625b11b986b14bcf7a71f9e145cea3dd7a7ea14bffa64cd1
3
+ size 906057190
pytorch_model-00008-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c0807aa215d79d55096ed321ecc7fbc86467d8e5e09b880ac4def317284acfe
3
+ size 939527804
pytorch_model-00009-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11f769117df63150808e8662d48bcdd3c19afd2695cccb7f72f69465d4026d90
3
+ size 939527804
pytorch_model-00010-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25066bd2de14ca157fc2d55275a87c5135f243838b54fccae65f3a4d222f2661
3
+ size 906057190
pytorch_model-00011-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:170e8eb20b1c3b5dd67515cd660daef830cd5089e212dadf4daebf3ca4cdf016
3
+ size 939527804
pytorch_model-00012-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e319965d719370a6933d99c4ca352e66ae2231d6c97bb57d5c5f7afc1b3d85a
3
+ size 939527804
pytorch_model-00014-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6068aa7a2426e384ba7ec2e56b7aa5a8b55a6478151447ee8dad6e65afd012d0
3
+ size 939527804
pytorch_model-00015-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82932e07a66f68f6d9958504a8f02516cdaaeaa66a757b0c3104c19787eb3316
3
+ size 939527804
pytorch_model-00016-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9655fb9223fba76a6fdeebe737f667e193493930446fdc3efa8e5e76ab050d91
3
+ size 906057190
pytorch_model-00017-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b6cbcb5dd895c4af14f1aac60ffa54b9d8fca18942b8532a68996e0551c0b9c
3
+ size 939527804
pytorch_model-00018-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd80ac97a16c1b7505e92ee176429f41c0d907aefeebe56f548a95aa70514d0b
3
+ size 939527804
pytorch_model-00019-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a75613cfcad1b45790658b0ea150a88b75582a61e1c7986577dd6905158a3967
3
+ size 989877396
pytorch_model-00020-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:756dc2aa6d324c2ccf97f5c8d4ac4f47896063862b025dbaacb0d5682c4a9835
3
+ size 973148382
pytorch_model-00021-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c9bb53091d9453b25f72506b567696e4164aeee97304744348be00e2dba7bfe
3
+ size 939527804
pytorch_model-00022-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:742b2d3fb4e723e487010ad66cd5afca0dd3ca417ab7e530ac7d9772cc4dd05a
3
+ size 989877396
pytorch_model-00023-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38e9f38786f29caa36fe5db46b692740e7297e53b34cbc1c0bf6eb75bd35b159
3
+ size 973148382
pytorch_model-00024-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afc011c33ff4c617cb4f6aa8ba5301ec59586e95648a52d2c991546e5f06017b
3
+ size 939527804
pytorch_model-00025-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:096bff31b851362095ab8c0fcb30b4fd666433cc194951a60ac65786f615d905
3
+ size 989877396
pytorch_model-00026-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5cc2ec37bd9f9f672ea1caadbc070cd2c280966dfac7fc8f86ce506c2cd0b7c
3
+ size 973148382
pytorch_model-00027-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:038bba896b515d4d5ddacd3d0ed3187cf8ea9d22a1fe8b3225719ecbdbd7459e
3
+ size 939527804
pytorch_model-00028-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02fdae8ba9625a9f705eb90a5bcc5fb49239ffa51b10891f9bc2dc182d216c7b
3
+ size 989877396
pytorch_model-00029-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62568fc189b93d61653aa14bc83f9799a69df10701af5045969ee959ea486dfd
3
+ size 973148382
pytorch_model-00030-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83f04304aed095bc0af09c471deb33e0eadec7ac7559f55f039854262e27886f
3
+ size 939527804
pytorch_model-00031-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9adffdf2e0189319c8c97d1cd04fcca208c1cea509598560ef3e7697748b0cbd
3
+ size 989877396
pytorch_model-00032-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4466c099fb62237641d8d3e7eb8ecc9db88ebef3a7aa2354d917c25c78d454e
3
+ size 973148446
pytorch_model-00033-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8ab55eda2b1d6df2c516631b781aa447043265026506e63df9088312a3e0f49
3
+ size 939527804
pytorch_model-00034-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fae83b39f6f649b08af841c344a55f1a2d6ee4f826cbd1449776d56a94b873a
3
+ size 989877396
pytorch_model-00035-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cec83f6c391a41c94e8a0793724d0248e25d0ec5d437e269112526bf81bce416
3
+ size 973148446
pytorch_model-00036-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3b5e7fc20db845f94f4c05af70af5d1e34a1da0657328e7086a9d473537d477
3
+ size 939527804
pytorch_model-00037-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da4fc8c7f2f8a0b04b3be1fd34325e1b84eeb6ba0d87a573971ec733bcd261cf
3
+ size 989877396
pytorch_model-00038-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7a755ac7ee34f34e1067ccea7111f3dd6f89253f0ae4100f05af2adb2b45f21
3
+ size 973148446
pytorch_model-00039-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e90480d963210881d8f771eff6da71ca87b61ad379132f6441696e31ef5a63c3
3
+ size 939527804
pytorch_model-00040-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cc0f3e6ec165a4f698ee4b851b08d039e4e912d2f7cd22ea551f2a37423d35d
3
+ size 989877396
pytorch_model-00041-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1182ef8f7e069b17a62e0199e8bc609686e6980795893cb37d83aecfbba4ed0a
3
+ size 973148446
pytorch_model-00042-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e00f41dcf8fd09c95c75d1cc3d473e6a03ff4ac3020e5621654d413f859e752c
3
+ size 939527804
pytorch_model-00043-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:366327a3333be2572a1be038d7779f566247ffa7c14e37945c7a3ec5851e149a
3
+ size 989877396
pytorch_model-00044-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d16ccd90827329155dd8d1d21f2c3f1f33bb27cfd89ed73a409ea6d5b4b12e12
3
+ size 973148446
pytorch_model-00045-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aeb1b1b70afea85431be52135c85de4f5a2d2ad7319de7aab30ce5dbfc5d720a
3
+ size 939527804
pytorch_model-00046-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cee3222e9623c3d0c5123d945d5f5b64d6c0d02f834628d4432752970ac1da9
3
+ size 989877396
pytorch_model-00047-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61768c9d3f0f9db76ea536cd96f27fda8378c661913144f9c1137e28f0850e23
3
+ size 973148446
pytorch_model-00048-of-00098.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d215ce5248d72d8e1950190873b4469e8dfb630d44f392276069174d2e15633
3
+ size 939527804