agh123 committed on
Commit
9b9ba95
·
1 Parent(s): e9a2b9d

refactor(quant factors): linearize the factors

Browse files
Files changed (1) hide show
  1. src/core/scoring.py +9 -9
src/core/scoring.py CHANGED
@@ -14,15 +14,15 @@ from dataclasses import dataclass, field
14
  def get_default_quant_tiers() -> Dict[str, float]:
15
  """Default quantization tiers with quality factors"""
16
  return {
17
- "F16": 1.0, # Full precision
18
- "F32": 1.0, # Full precision
19
- "Q8": 0.95, # Extremely high quality
20
- "Q6": 0.85, # Very high quality
21
- "Q5": 0.75, # High quality
22
- "Q4": 0.65, # Good quality
23
- "Q3": 0.55, # Lower quality
24
- "Q2": 0.45, # Very low quality
25
- "Q1": 0.35, # Low quality
26
  }
27
 
28
 
 
14
  def get_default_quant_tiers() -> Dict[str, float]:
15
  """Default quantization tiers with quality factors"""
16
  return {
17
+ "F16": 1.0, # Full precision (skewed towards quantizations)
18
+ "F32": 1.0, # Full precision (skewed towards quantizations)
19
+ "Q8": 0.8, # Almost perfect
20
+ "Q6": 0.6, # Still fancy
21
+ "Q5": 0.5, # The "medium rare" of quantization
22
+ "Q4": 0.4, # Gets the job done
23
+ "Q3": 0.3, # Nice try
24
+ "Q2": 0.2, # eh
25
+ "Q1": 0.1, # At this point, just use a Magic 8-Ball
26
  }
27
 
28