morriszms commited on
Commit
05fccf5
1 Parent(s): 1522b8c

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,18 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ Llama3-70B-Fireplace-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
37
+ Llama3-70B-Fireplace-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
38
+ Llama3-70B-Fireplace-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
39
+ Llama3-70B-Fireplace-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
40
+ Llama3-70B-Fireplace-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
41
+ Llama3-70B-Fireplace-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
42
+ Llama3-70B-Fireplace-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
43
+ Llama3-70B-Fireplace-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
44
+ Llama3-70B-Fireplace-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
45
+ Llama3-70B-Fireplace-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
46
+ Llama3-70B-Fireplace-Q6_K/Llama3-70B-Fireplace-Q6_K-00001-of-00002.gguf filter=lfs diff=lfs merge=lfs -text
47
+ Llama3-70B-Fireplace-Q6_K/Llama3-70B-Fireplace-Q6_K-00002-of-00002.gguf filter=lfs diff=lfs merge=lfs -text
48
+ Llama3-70B-Fireplace-Q8_0/Llama3-70B-Fireplace-Q8_0-00001-of-00003.gguf filter=lfs diff=lfs merge=lfs -text
49
+ Llama3-70B-Fireplace-Q8_0/Llama3-70B-Fireplace-Q8_0-00002-of-00003.gguf filter=lfs diff=lfs merge=lfs -text
50
+ Llama3-70B-Fireplace-Q8_0/Llama3-70B-Fireplace-Q8_0-00003-of-00003.gguf filter=lfs diff=lfs merge=lfs -text
Llama3-70B-Fireplace-Q2_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba8e23c32685c1381901ddfc87e26cc181261d65884ffdacd5b734a0b122e464
3
+ size 26375108672
Llama3-70B-Fireplace-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2062232ac7e92e0d1d348af202f7af3e383bfa28b338cbdf89352031cadb455e
3
+ size 37140592704
Llama3-70B-Fireplace-Q3_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27afdce1cc763960a6d18321446908025a85be603e05af34622fa0c49441e2c4
3
+ size 34267494464
Llama3-70B-Fireplace-Q3_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:526ef8e1e4166b7848011e6e4e06b6a468022538d6d036132a457da5fe7be9d3
3
+ size 30912051264
Llama3-70B-Fireplace-Q4_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba1f2ce6ce3fc7f58dabcd74b64c181d9b924c11ca37bfce89c38bb218eb031e
3
+ size 39969732672
Llama3-70B-Fireplace-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e12ef047b1879f7cffdb696d914b13632bd68144cdaae3e03a3af4ef345713d
3
+ size 42520393792
Llama3-70B-Fireplace-Q4_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:436084ff690e6ab840ba21de6175582663a470812d9cf0b9c20a4ff487ed654e
3
+ size 40347220032
Llama3-70B-Fireplace-Q5_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a17dbf8962b2d863e6c363e1d54c940279ee65741ce34296e16414fd0b17a8ef
3
+ size 48657446976
Llama3-70B-Fireplace-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba5a622771a94215cf207757f1b73d03f5c37722714623ffba87f089ef4af9d1
3
+ size 49949816896
Llama3-70B-Fireplace-Q5_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c95f27490e27d6c7d3529cc98a5712087334d1a258a7a6f93c71ee5dc9a6ce7
3
+ size 48657446976
Llama3-70B-Fireplace-Q6_K/Llama3-70B-Fireplace-Q6_K-00001-of-00002.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38e322e28d7f64f9890290171e5821e22ef7b611c40053f4775d5afa41e8e99f
3
+ size 34847470688
Llama3-70B-Fireplace-Q6_K/Llama3-70B-Fireplace-Q6_K-00002-of-00002.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb8f0224ddef82603ed1ff0406ba80831d1862976053f5cfc76efe185872ac94
3
+ size 23040672928
Llama3-70B-Fireplace-Q8_0/Llama3-70B-Fireplace-Q8_0-00001-of-00003.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:476b534ae580c7209fa859b17aa03396577db1250cce1ef3b26d9caebbba2862
3
+ size 34980011136
Llama3-70B-Fireplace-Q8_0/Llama3-70B-Fireplace-Q8_0-00002-of-00003.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1e9421250c80df15f09d53bcfc9a64639cd4d49c4c992fc1199b7adb381e06a
3
+ size 34949976384
Llama3-70B-Fireplace-Q8_0/Llama3-70B-Fireplace-Q8_0-00003-of-00003.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94d54f7e2c08f3bf6a5115950c5264609f4d3a3f49bf8e833005b124066bed32
3
+ size 5045062560
README.md ADDED
@@ -0,0 +1,191 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - en
4
+ license: llama3
5
+ tags:
6
+ - fireplace
7
+ - valiant
8
+ - valiant-labs
9
+ - llama
10
+ - llama-3
11
+ - llama-3-instruct
12
+ - llama-3-instruct-70b
13
+ - 70b
14
+ - function-calling
15
+ - conversational
16
+ - chat
17
+ - instruct
18
+ - TensorBlock
19
+ - GGUF
20
+ pipeline_tag: text-generation
21
+ model_type: llama
22
+ base_model: ValiantLabs/Llama3-70B-Fireplace
23
+ model-index:
24
+ - name: Llama3-70B-Fireplace
25
+ results:
26
+ - task:
27
+ type: text-generation
28
+ name: Text Generation
29
+ dataset:
30
+ name: IFEval (0-Shot)
31
+ type: HuggingFaceH4/ifeval
32
+ args:
33
+ num_few_shot: 0
34
+ metrics:
35
+ - type: inst_level_strict_acc and prompt_level_strict_acc
36
+ value: 77.74
37
+ name: strict accuracy
38
+ source:
39
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3-70B-Fireplace
40
+ name: Open LLM Leaderboard
41
+ - task:
42
+ type: text-generation
43
+ name: Text Generation
44
+ dataset:
45
+ name: BBH (3-Shot)
46
+ type: BBH
47
+ args:
48
+ num_few_shot: 3
49
+ metrics:
50
+ - type: acc_norm
51
+ value: 49.56
52
+ name: normalized accuracy
53
+ source:
54
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3-70B-Fireplace
55
+ name: Open LLM Leaderboard
56
+ - task:
57
+ type: text-generation
58
+ name: Text Generation
59
+ dataset:
60
+ name: MATH Lvl 5 (4-Shot)
61
+ type: hendrycks/competition_math
62
+ args:
63
+ num_few_shot: 4
64
+ metrics:
65
+ - type: exact_match
66
+ value: 19.64
67
+ name: exact match
68
+ source:
69
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3-70B-Fireplace
70
+ name: Open LLM Leaderboard
71
+ - task:
72
+ type: text-generation
73
+ name: Text Generation
74
+ dataset:
75
+ name: GPQA (0-shot)
76
+ type: Idavidrein/gpqa
77
+ args:
78
+ num_few_shot: 0
79
+ metrics:
80
+ - type: acc_norm
81
+ value: 13.98
82
+ name: acc_norm
83
+ source:
84
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3-70B-Fireplace
85
+ name: Open LLM Leaderboard
86
+ - task:
87
+ type: text-generation
88
+ name: Text Generation
89
+ dataset:
90
+ name: MuSR (0-shot)
91
+ type: TAUR-Lab/MuSR
92
+ args:
93
+ num_few_shot: 0
94
+ metrics:
95
+ - type: acc_norm
96
+ value: 16.77
97
+ name: acc_norm
98
+ source:
99
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3-70B-Fireplace
100
+ name: Open LLM Leaderboard
101
+ - task:
102
+ type: text-generation
103
+ name: Text Generation
104
+ dataset:
105
+ name: MMLU-PRO (5-shot)
106
+ type: TIGER-Lab/MMLU-Pro
107
+ config: main
108
+ split: test
109
+ args:
110
+ num_few_shot: 5
111
+ metrics:
112
+ - type: acc
113
+ value: 43.25
114
+ name: accuracy
115
+ source:
116
+ url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3-70B-Fireplace
117
+ name: Open LLM Leaderboard
118
+ ---
119
+
120
+ <div style="width: auto; margin-left: auto; margin-right: auto">
121
+ <img src="https://i.imgur.com/jC7kdl8.jpeg" alt="TensorBlock" style="width: 100%; min-width: 400px; display: block; margin: auto;">
122
+ </div>
123
+ <div style="display: flex; justify-content: space-between; width: 100%;">
124
+ <div style="display: flex; flex-direction: column; align-items: flex-start;">
125
+ <p style="margin-top: 0.5em; margin-bottom: 0em;">
126
+ Feedback and support: TensorBlock's <a href="https://x.com/tensorblock_aoi">Twitter/X</a>, <a href="https://t.me/TensorBlock">Telegram Group</a> and <a href="https://x.com/tensorblock_aoi">Discord server</a>
127
+ </p>
128
+ </div>
129
+ </div>
130
+
131
+ ## ValiantLabs/Llama3-70B-Fireplace - GGUF
132
+
133
+ This repo contains GGUF format model files for [ValiantLabs/Llama3-70B-Fireplace](https://huggingface.co/ValiantLabs/Llama3-70B-Fireplace).
134
+
135
+ The files were quantized using machines provided by [TensorBlock](https://tensorblock.co/), and they are compatible with llama.cpp as of [commit b4242](https://github.com/ggerganov/llama.cpp/commit/a6744e43e80f4be6398fc7733a01642c846dce1d).
136
+
137
+ <div style="text-align: left; margin: 20px 0;">
138
+ <a href="https://tensorblock.co/waitlist/client" style="display: inline-block; padding: 10px 20px; background-color: #007bff; color: white; text-decoration: none; border-radius: 5px; font-weight: bold;">
139
+ Run them on the TensorBlock client using your local machine ↗
140
+ </a>
141
+ </div>
142
+
143
+ ## Prompt template
144
+
145
+ ```
146
+ <|begin_of_text|><|start_header_id|>system<|end_header_id|>
147
+
148
+ {system_prompt}<|eot_id|><|start_header_id|>user<|end_header_id|>
149
+
150
+ {prompt}<|eot_id|><|start_header_id|>assistant<|end_header_id|>
151
+ ```
152
+
153
+ ## Model file specification
154
+
155
+ | Filename | Quant type | File Size | Description |
156
+ | -------- | ---------- | --------- | ----------- |
157
+ | [Llama3-70B-Fireplace-Q2_K.gguf](https://huggingface.co/tensorblock/Llama3-70B-Fireplace-GGUF/blob/main/Llama3-70B-Fireplace-Q2_K.gguf) | Q2_K | 26.375 GB | smallest, significant quality loss - not recommended for most purposes |
158
+ | [Llama3-70B-Fireplace-Q3_K_S.gguf](https://huggingface.co/tensorblock/Llama3-70B-Fireplace-GGUF/blob/main/Llama3-70B-Fireplace-Q3_K_S.gguf) | Q3_K_S | 30.912 GB | very small, high quality loss |
159
+ | [Llama3-70B-Fireplace-Q3_K_M.gguf](https://huggingface.co/tensorblock/Llama3-70B-Fireplace-GGUF/blob/main/Llama3-70B-Fireplace-Q3_K_M.gguf) | Q3_K_M | 34.267 GB | very small, high quality loss |
160
+ | [Llama3-70B-Fireplace-Q3_K_L.gguf](https://huggingface.co/tensorblock/Llama3-70B-Fireplace-GGUF/blob/main/Llama3-70B-Fireplace-Q3_K_L.gguf) | Q3_K_L | 37.141 GB | small, substantial quality loss |
161
+ | [Llama3-70B-Fireplace-Q4_0.gguf](https://huggingface.co/tensorblock/Llama3-70B-Fireplace-GGUF/blob/main/Llama3-70B-Fireplace-Q4_0.gguf) | Q4_0 | 39.970 GB | legacy; small, very high quality loss - prefer using Q3_K_M |
162
+ | [Llama3-70B-Fireplace-Q4_K_S.gguf](https://huggingface.co/tensorblock/Llama3-70B-Fireplace-GGUF/blob/main/Llama3-70B-Fireplace-Q4_K_S.gguf) | Q4_K_S | 40.347 GB | small, greater quality loss |
163
+ | [Llama3-70B-Fireplace-Q4_K_M.gguf](https://huggingface.co/tensorblock/Llama3-70B-Fireplace-GGUF/blob/main/Llama3-70B-Fireplace-Q4_K_M.gguf) | Q4_K_M | 42.520 GB | medium, balanced quality - recommended |
164
+ | [Llama3-70B-Fireplace-Q5_0.gguf](https://huggingface.co/tensorblock/Llama3-70B-Fireplace-GGUF/blob/main/Llama3-70B-Fireplace-Q5_0.gguf) | Q5_0 | 48.657 GB | legacy; medium, balanced quality - prefer using Q4_K_M |
165
+ | [Llama3-70B-Fireplace-Q5_K_S.gguf](https://huggingface.co/tensorblock/Llama3-70B-Fireplace-GGUF/blob/main/Llama3-70B-Fireplace-Q5_K_S.gguf) | Q5_K_S | 48.657 GB | large, low quality loss - recommended |
166
+ | [Llama3-70B-Fireplace-Q5_K_M.gguf](https://huggingface.co/tensorblock/Llama3-70B-Fireplace-GGUF/blob/main/Llama3-70B-Fireplace-Q5_K_M.gguf) | Q5_K_M | 49.950 GB | large, very low quality loss - recommended |
167
+ | [Llama3-70B-Fireplace-Q8_0](https://huggingface.co/tensorblock/Llama3-70B-Fireplace-GGUF/blob/main/Llama3-70B-Fireplace-Q8_0) | Q8_0 | 74.975 GB | very large, extremely low quality loss - not recommended |
168
+ | [Llama3-70B-Fireplace-Q6_K](https://huggingface.co/tensorblock/Llama3-70B-Fireplace-GGUF/blob/main/Llama3-70B-Fireplace-Q6_K) | Q6_K | 57.888 GB | very large, extremely low quality loss |
169
+
170
+
171
+ ## Download instructions
172
+
173
+ ### Command line
174
+
175
+ First, install the Hugging Face Hub command-line client:
176
+
177
+ ```shell
178
+ pip install -U "huggingface_hub[cli]"
179
+ ```
180
+
181
+ Then, download an individual model file to a local directory:
182
+
183
+ ```shell
184
+ huggingface-cli download tensorblock/Llama3-70B-Fireplace-GGUF --include "Llama3-70B-Fireplace-Q2_K.gguf" --local-dir MY_LOCAL_DIR
185
+ ```
186
+
187
+ If you want to download multiple model files matching a pattern (e.g., `*Q4_K*gguf`), you can try:
188
+
189
+ ```shell
190
+ huggingface-cli download tensorblock/Llama3-70B-Fireplace-GGUF --local-dir MY_LOCAL_DIR --local-dir-use-symlinks False --include='*Q4_K*gguf'
191
+ ```