yahavb committed on
Commit
59835e9
·
verified ·
1 Parent(s): dfff87c

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,13 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ compiled/09637ea11ae6545f05c3.neff filter=lfs diff=lfs merge=lfs -text
37
+ compiled/58855406abc6bff25a24.neff filter=lfs diff=lfs merge=lfs -text
38
+ compiled/5a7c0239f2ab37cc9b31.neff filter=lfs diff=lfs merge=lfs -text
39
+ compiled/68c6b8f316592f7e9781.neff filter=lfs diff=lfs merge=lfs -text
40
+ compiled/6cf5f6929761b153bdd8.neff filter=lfs diff=lfs merge=lfs -text
41
+ compiled/79096725e6d9ed8363b8.neff filter=lfs diff=lfs merge=lfs -text
42
+ compiled/a0546f57e080fe6c147a.neff filter=lfs diff=lfs merge=lfs -text
43
+ compiled/b12667ab0698d566d36f.neff filter=lfs diff=lfs merge=lfs -text
44
+ compiled/d8bda12e438ae4ea0439.neff filter=lfs diff=lfs merge=lfs -text
45
+ compiled/ea25b05a9d522255e601.neff filter=lfs diff=lfs merge=lfs -text
compiled/09637ea11ae6545f05c3.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a1f438c7c8699e90e03c40cab81351aea81e07cde7f9207bc219550815034b0
3
+ size 4281344
compiled/58855406abc6bff25a24.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5b586cf6169504bbe123bd1b68d39bd55c06e2926742d897e01c02cfdb71a52
3
+ size 9769984
compiled/5a7c0239f2ab37cc9b31.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73ec9be37aea6c62f8abd11adbde227fe87cb5aea306d17709d556b1d2f1a3d3
3
+ size 5182464
compiled/68c6b8f316592f7e9781.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1aa0c4bf6f3a60168962311ecb7d60ebeec42a6a2973cb7cc3dd5db206d5298e
3
+ size 2704384
compiled/6cf5f6929761b153bdd8.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65aedc14c0df80fff4ae6002ae4ddbb9bff83a72fc1f405922a599eb4917bde3
3
+ size 3769344
compiled/79096725e6d9ed8363b8.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1b3fc4e9347f3ce75dcd2120248c49e391d09dab84679b3747c9572398c9a3b
3
+ size 2796544
compiled/a0546f57e080fe6c147a.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:057fb997ea604818f5b3a898ebfebfea606dd122c8ec432791b7fcc8a50a9cb0
3
+ size 3462144
compiled/b12667ab0698d566d36f.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa055442e1cb839d6533f0c3bdc110140472d3d4e8f204784bf27e0a2230d4b1
3
+ size 2663424
compiled/d8bda12e438ae4ea0439.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d887a22a2fd452f06a9e7b52fa7853ea65f8108bbf90fe3c41bb4aa4b1ef1d5
3
+ size 2653184
compiled/ea25b05a9d522255e601.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1c2faa5a22bbd5eeb31e50b35b7d8bf50835c72b9927ceb8749520c508a16c4
3
+ size 2960384
config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "NousResearch/Llama-2-13b-chat-hf",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 5120,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 13824,
14
+ "max_position_embeddings": 4096,
15
+ "mlp_bias": false,
16
+ "model_type": "llama",
17
+ "neuron": {
18
+ "auto_cast_type": "fp16",
19
+ "batch_size": 1,
20
+ "checkpoint_id": "NousResearch/Llama-2-13b-chat-hf",
21
+ "checkpoint_revision": "d73f5fa9c4bc135502e04c27b39660747172d76b",
22
+ "compiler_type": "neuronx-cc",
23
+ "compiler_version": "2.13.72.0+78a426937",
24
+ "num_cores": 12,
25
+ "sequence_length": 2048,
26
+ "task": "text-generation"
27
+ },
28
+ "num_attention_heads": 40,
29
+ "num_hidden_layers": 40,
30
+ "num_key_value_heads": 40,
31
+ "pad_token_id": 0,
32
+ "pretraining_tp": 1,
33
+ "rms_norm_eps": 1e-05,
34
+ "rope_scaling": null,
35
+ "rope_theta": 10000.0,
36
+ "tie_word_embeddings": false,
37
+ "torch_dtype": "float16",
38
+ "transformers_version": "4.41.1",
39
+ "use_cache": true,
40
+ "vocab_size": 32000
41
+ }
generation_config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "do_sample": true,
5
+ "eos_token_id": 2,
6
+ "pad_token_id": 0,
7
+ "temperature": 0.9,
8
+ "top_p": 0.6,
9
+ "transformers_version": "4.41.1"
10
+ }