sequelbox committed on
Commit
6cb5253
1 Parent(s): e437c6c

Upload folder using huggingface_hub (#6)

Browse files

- ce11cb39746f65a3b25cb3836e5ed8d0c59819df371d85a091f2fde5c2d21f7a (367ecbcbec6ca2f476860486290413401bde7e18)
- 7168041f528559ac83dc644ffbf4c4c108b396bd6af11bc01e0f651dcc545ae9 (b69d904fb3977e706849673486e0190d6df24871)
- 13b4469dd304c5cdaf3584d78eab74bd5e8064f932a01f59c157961f241dd023 (f8a72d3bb3e8a79ce28af69790565d3c08edc4e2)
- 38abfef6d41c50686989dec2b885f0f3e795f50a740a74a1a8f6dec5fb3e5e53 (50a7d0ba15377582af435ad4f6ae7d69f29df410)
- bbd47b901e0a856e04fc4d0d12e091cc50085c7931a2ff7813ddccd390e84d60 (01e1d4ea19c59fb8bab44ae83b46f98e0d4fe524)
- c73695c23396308c4b6cbd50283083058836e1bb9835acad174c70e7d9e6bca6 (c13a3c55851981890b03bf2bb600faaf9bfdb9ec)
- 099fe363c7613cde44d35c6c177863f3fb828105759891585bcd174d024d1232 (e7959126b68f5d436b7a706d91225f28ecaedc2e)

.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -25,101 +25,6 @@ datasets:
25
  - sequelbox/Tachibana
26
  - sequelbox/Supernova
27
  model_type: llama
28
- model-index:
29
- - name: Llama3.1-8B-Enigma
30
- results:
31
- - task:
32
- type: text-generation
33
- name: Text Generation
34
- dataset:
35
- name: IFEval (0-Shot)
36
- type: HuggingFaceH4/ifeval
37
- args:
38
- num_few_shot: 0
39
- metrics:
40
- - type: inst_level_strict_acc and prompt_level_strict_acc
41
- value: 55.39
42
- name: strict accuracy
43
- source:
44
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-Enigma
45
- name: Open LLM Leaderboard
46
- - task:
47
- type: text-generation
48
- name: Text Generation
49
- dataset:
50
- name: BBH (3-Shot)
51
- type: BBH
52
- args:
53
- num_few_shot: 3
54
- metrics:
55
- - type: acc_norm
56
- value: 28.47
57
- name: normalized accuracy
58
- source:
59
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-Enigma
60
- name: Open LLM Leaderboard
61
- - task:
62
- type: text-generation
63
- name: Text Generation
64
- dataset:
65
- name: MATH Lvl 5 (4-Shot)
66
- type: hendrycks/competition_math
67
- args:
68
- num_few_shot: 4
69
- metrics:
70
- - type: exact_match
71
- value: 10.12
72
- name: exact match
73
- source:
74
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-Enigma
75
- name: Open LLM Leaderboard
76
- - task:
77
- type: text-generation
78
- name: Text Generation
79
- dataset:
80
- name: GPQA (0-shot)
81
- type: Idavidrein/gpqa
82
- args:
83
- num_few_shot: 0
84
- metrics:
85
- - type: acc_norm
86
- value: 1.57
87
- name: acc_norm
88
- source:
89
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-Enigma
90
- name: Open LLM Leaderboard
91
- - task:
92
- type: text-generation
93
- name: Text Generation
94
- dataset:
95
- name: MuSR (0-shot)
96
- type: TAUR-Lab/MuSR
97
- args:
98
- num_few_shot: 0
99
- metrics:
100
- - type: acc_norm
101
- value: 11.41
102
- name: acc_norm
103
- source:
104
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-Enigma
105
- name: Open LLM Leaderboard
106
- - task:
107
- type: text-generation
108
- name: Text Generation
109
- dataset:
110
- name: MMLU-PRO (5-shot)
111
- type: TIGER-Lab/MMLU-Pro
112
- config: main
113
- split: test
114
- args:
115
- num_few_shot: 5
116
- metrics:
117
- - type: acc
118
- value: 26.2
119
- name: accuracy
120
- source:
121
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-Enigma
122
- name: Open LLM Leaderboard
123
  license: llama3.1
124
  ---
125
 
@@ -135,13 +40,13 @@ Enigma is a code-instruct model built on Llama 3.1 8b.
135
 
136
  ## Version
137
 
138
- This is the **2024-09-04** release of Enigma for Llama 3.1 8b, enhancing code-instruct and general chat capabilities.
139
 
140
  [**Enigma is now available for Llama 3.2 3b** - get it here!](https://huggingface.co/ValiantLabs/Llama3.2-3B-Enigma)
141
 
142
  Help us and recommend Enigma to your friends! We're excited for more Enigma releases in the future.
143
 
144
- Right now, we're working on more new Build Tools to come very soon, built on Llama 3.1 :)
145
 
146
 
147
  ## Prompting Guide
@@ -167,7 +72,7 @@ messages = [
167
 
168
  outputs = pipeline(
169
  messages,
170
- max_new_tokens=1024,
171
  )
172
 
173
  print(outputs[0]["generated_text"][-1])
 
25
  - sequelbox/Tachibana
26
  - sequelbox/Supernova
27
  model_type: llama
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
28
  license: llama3.1
29
  ---
30
 
 
40
 
41
  ## Version
42
 
43
+ This is the **2024-10-02** release of Enigma for Llama 3.1 8b, enhancing code-instruct and general chat capabilities.
44
 
45
  [**Enigma is now available for Llama 3.2 3b** - get it here!](https://huggingface.co/ValiantLabs/Llama3.2-3B-Enigma)
46
 
47
  Help us and recommend Enigma to your friends! We're excited for more Enigma releases in the future.
48
 
49
+ Right now, we're working on more new Build Tools to come very soon, built on Llama 3.1 and 3.2 :)
50
 
51
 
52
  ## Prompting Guide
 
72
 
73
  outputs = pipeline(
74
  messages,
75
+ max_new_tokens=2048,
76
  )
77
 
78
  print(outputs[0]["generated_text"][-1])
config.json CHANGED
@@ -11,6 +11,7 @@
11
  128008,
12
  128009
13
  ],
 
14
  "hidden_act": "silu",
15
  "hidden_size": 4096,
16
  "initializer_range": 0.02,
@@ -33,7 +34,7 @@
33
  "rope_theta": 500000.0,
34
  "tie_word_embeddings": false,
35
  "torch_dtype": "float32",
36
- "transformers_version": "4.44.2",
37
  "use_cache": true,
38
  "vocab_size": 128256
39
  }
 
11
  128008,
12
  128009
13
  ],
14
+ "head_dim": 128,
15
  "hidden_act": "silu",
16
  "hidden_size": 4096,
17
  "initializer_range": 0.02,
 
34
  "rope_theta": 500000.0,
35
  "tie_word_embeddings": false,
36
  "torch_dtype": "float32",
37
+ "transformers_version": "4.45.1",
38
  "use_cache": true,
39
  "vocab_size": 128256
40
  }
generation_config.json CHANGED
@@ -8,5 +8,5 @@
8
  ],
9
  "temperature": 0.6,
10
  "top_p": 0.9,
11
- "transformers_version": "4.44.2"
12
  }
 
8
  ],
9
  "temperature": 0.6,
10
  "top_p": 0.9,
11
+ "transformers_version": "4.45.1"
12
  }
model-00001-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08dff18399f4082cd4af329673d8e5f05ba976529cd4b2fd3eaa8a198ad48a0c
3
  size 4886466168
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68aff9f2136b3d6262cd029b78a809dfab52da300fe341850cf0262a0e1ae098
3
  size 4886466168
model-00002-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93734a9e3f00cbded5bb06644d1a5a8a247c14f383e61ad49ad0c671e350f262
3
  size 4832007448
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29f7d1769f923f139ac4a9d770cd9c042e900a4701088faf88e38d3f1607e8eb
3
  size 4832007448
model-00003-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d58a3870696db28abed0917760f77a5cf11322674209263462ff08935f87ea7e
3
  size 4999813112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef3d1ed8d5a12c5037f45657b420a16cfabf20369b7037f9777735eeb0f6539f
3
  size 4999813112
model-00004-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52bddb21602fc8f2ce0f79d011b6f6280dcf65f659142766b84f9a375524d364
3
  size 4999813128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34778dce4c45e5e45061897d9b0656e07dec836eaffdc31c067e54f13c16cc7f
3
  size 4999813128
model-00005-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f67914bd40d6b748669032e06fd2c36eb83c5354da989052174a97270c3dd1b
3
  size 4832007496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10f8e71c56d0f618b4562fd159a21807c7cde8bc6fff596bc63d7fc615ef0d1f
3
  size 4832007496
model-00006-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:74a7c7fc0cc3074b7eb787ef4ede238dd0733565edadbb137c497615122e8080
3
  size 4999813120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d0425fea1a6bdd650e6bb22171acfa73e875fde27b70e9f8f6801ed71a0c2cf
3
  size 4999813120
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff