sequelbox committed on
Commit
e795912
1 Parent(s): c13a3c5

099fe363c7613cde44d35c6c177863f3fb828105759891585bcd174d024d1232

Browse files
Files changed (5) hide show
  1. .gitattributes +1 -0
  2. README.md +3 -98
  3. config.json +2 -1
  4. generation_config.json +1 -1
  5. tokenizer.json +0 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -25,101 +25,6 @@ datasets:
25
  - sequelbox/Tachibana
26
  - sequelbox/Supernova
27
  model_type: llama
28
- model-index:
29
- - name: Llama3.1-8B-Enigma
30
- results:
31
- - task:
32
- type: text-generation
33
- name: Text Generation
34
- dataset:
35
- name: IFEval (0-Shot)
36
- type: HuggingFaceH4/ifeval
37
- args:
38
- num_few_shot: 0
39
- metrics:
40
- - type: inst_level_strict_acc and prompt_level_strict_acc
41
- value: 55.39
42
- name: strict accuracy
43
- source:
44
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-Enigma
45
- name: Open LLM Leaderboard
46
- - task:
47
- type: text-generation
48
- name: Text Generation
49
- dataset:
50
- name: BBH (3-Shot)
51
- type: BBH
52
- args:
53
- num_few_shot: 3
54
- metrics:
55
- - type: acc_norm
56
- value: 28.47
57
- name: normalized accuracy
58
- source:
59
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-Enigma
60
- name: Open LLM Leaderboard
61
- - task:
62
- type: text-generation
63
- name: Text Generation
64
- dataset:
65
- name: MATH Lvl 5 (4-Shot)
66
- type: hendrycks/competition_math
67
- args:
68
- num_few_shot: 4
69
- metrics:
70
- - type: exact_match
71
- value: 10.12
72
- name: exact match
73
- source:
74
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-Enigma
75
- name: Open LLM Leaderboard
76
- - task:
77
- type: text-generation
78
- name: Text Generation
79
- dataset:
80
- name: GPQA (0-shot)
81
- type: Idavidrein/gpqa
82
- args:
83
- num_few_shot: 0
84
- metrics:
85
- - type: acc_norm
86
- value: 1.57
87
- name: acc_norm
88
- source:
89
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-Enigma
90
- name: Open LLM Leaderboard
91
- - task:
92
- type: text-generation
93
- name: Text Generation
94
- dataset:
95
- name: MuSR (0-shot)
96
- type: TAUR-Lab/MuSR
97
- args:
98
- num_few_shot: 0
99
- metrics:
100
- - type: acc_norm
101
- value: 11.41
102
- name: acc_norm
103
- source:
104
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-Enigma
105
- name: Open LLM Leaderboard
106
- - task:
107
- type: text-generation
108
- name: Text Generation
109
- dataset:
110
- name: MMLU-PRO (5-shot)
111
- type: TIGER-Lab/MMLU-Pro
112
- config: main
113
- split: test
114
- args:
115
- num_few_shot: 5
116
- metrics:
117
- - type: acc
118
- value: 26.2
119
- name: accuracy
120
- source:
121
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-Enigma
122
- name: Open LLM Leaderboard
123
  license: llama3.1
124
  ---
125
 
@@ -135,13 +40,13 @@ Enigma is a code-instruct model built on Llama 3.1 8b.
135
 
136
  ## Version
137
 
138
- This is the **2024-09-04** release of Enigma for Llama 3.1 8b, enhancing code-instruct and general chat capabilities.
139
 
140
  [**Enigma is now available for Llama 3.2 3b** - get it here!](https://huggingface.co/ValiantLabs/Llama3.2-3B-Enigma)
141
 
142
  Help us and recommend Enigma to your friends! We're excited for more Enigma releases in the future.
143
 
144
- Right now, we're working on more new Build Tools to come very soon, built on Llama 3.1 :)
145
 
146
 
147
  ## Prompting Guide
@@ -167,7 +72,7 @@ messages = [
167
 
168
  outputs = pipeline(
169
  messages,
170
- max_new_tokens=1024,
171
  )
172
 
173
  print(outputs[0]["generated_text"][-1])
 
25
  - sequelbox/Tachibana
26
  - sequelbox/Supernova
27
  model_type: llama
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
28
  license: llama3.1
29
  ---
30
 
 
40
 
41
  ## Version
42
 
43
+ This is the **2024-10-02** release of Enigma for Llama 3.1 8b, enhancing code-instruct and general chat capabilities.
44
 
45
  [**Enigma is now available for Llama 3.2 3b** - get it here!](https://huggingface.co/ValiantLabs/Llama3.2-3B-Enigma)
46
 
47
  Help us and recommend Enigma to your friends! We're excited for more Enigma releases in the future.
48
 
49
+ Right now, we're working on more new Build Tools to come very soon, built on Llama 3.1 and 3.2 :)
50
 
51
 
52
  ## Prompting Guide
 
72
 
73
  outputs = pipeline(
74
  messages,
75
+ max_new_tokens=2048,
76
  )
77
 
78
  print(outputs[0]["generated_text"][-1])
config.json CHANGED
@@ -11,6 +11,7 @@
11
  128008,
12
  128009
13
  ],
 
14
  "hidden_act": "silu",
15
  "hidden_size": 4096,
16
  "initializer_range": 0.02,
@@ -33,7 +34,7 @@
33
  "rope_theta": 500000.0,
34
  "tie_word_embeddings": false,
35
  "torch_dtype": "float32",
36
- "transformers_version": "4.44.2",
37
  "use_cache": true,
38
  "vocab_size": 128256
39
  }
 
11
  128008,
12
  128009
13
  ],
14
+ "head_dim": 128,
15
  "hidden_act": "silu",
16
  "hidden_size": 4096,
17
  "initializer_range": 0.02,
 
34
  "rope_theta": 500000.0,
35
  "tie_word_embeddings": false,
36
  "torch_dtype": "float32",
37
+ "transformers_version": "4.45.1",
38
  "use_cache": true,
39
  "vocab_size": 128256
40
  }
generation_config.json CHANGED
@@ -8,5 +8,5 @@
8
  ],
9
  "temperature": 0.6,
10
  "top_p": 0.9,
11
- "transformers_version": "4.44.2"
12
  }
 
8
  ],
9
  "temperature": 0.6,
10
  "top_p": 0.9,
11
+ "transformers_version": "4.45.1"
12
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff