Spaces:
Running
Running
refactor(quant factors): linearize the factors
Browse files- src/core/scoring.py +9 -9
src/core/scoring.py
CHANGED
@@ -14,15 +14,15 @@ from dataclasses import dataclass, field
|
|
14 |
def get_default_quant_tiers() -> Dict[str, float]:
|
15 |
"""Default quantization tiers with quality factors"""
|
16 |
return {
|
17 |
-
"F16": 1.0, # Full precision
|
18 |
-
"F32": 1.0, # Full precision
|
19 |
-
"Q8": 0.
|
20 |
-
"Q6": 0.
|
21 |
-
"Q5": 0.
|
22 |
-
"Q4": 0.
|
23 |
-
"Q3": 0.
|
24 |
-
"Q2": 0.
|
25 |
-
"Q1": 0.
|
26 |
}
|
27 |
|
28 |
|
|
|
14 |
def get_default_quant_tiers() -> Dict[str, float]:
    """Default quantization tiers with quality factors.

    The factors are linear in the tier number: each ``Q<n>`` tier maps to
    ``n / 10`` (``Q8`` -> 0.8 down to ``Q1`` -> 0.1), while the full-precision
    tiers ``F16`` and ``F32`` both map to 1.0.

    Returns:
        A freshly built dict mapping tier name to quality factor, so callers
        may mutate the result without affecting later calls.
    """
    return {
        "F16": 1.0,  # Full precision (skewed towards quantizations)
        "F32": 1.0,  # Full precision (skewed towards quantizations)
        "Q8": 0.8,  # Almost perfect
        "Q6": 0.6,  # Still fancy
        "Q5": 0.5,  # The "medium rare" of quantization
        "Q4": 0.4,  # Gets the job done
        "Q3": 0.3,  # Nice try
        "Q2": 0.2,  # eh
        "Q1": 0.1,  # At this point, just use a Magic 8-Ball
    }
|
27 |
|
28 |
|