baptistecolle HF staff committed on
Commit
39105fc
·
1 Parent(s): d2401bd

add intel results to leaderboard

Browse files
Files changed (4) hide show
  1. app.py +2 -2
  2. hardware.yml +8 -4
  3. src/hardware.py +2 -1
  4. src/panel.py +4 -4
app.py CHANGED
@@ -37,7 +37,7 @@ with demo:
37
  optimization_checkboxes,
38
  quantization_checkboxes,
39
  kernels_checkboxes,
40
- ) = create_control_panel(machine=config.machine, subsets=config.subsets, hardware_type=config.hardware_type)
41
  ####################### HARDWARE SUBTABS #######################
42
  with gr.Tabs(elem_classes="subtabs"):
43
  open_llm_perf_df = get_llm_perf_df(machine=config.machine, subsets=config.subsets)
@@ -46,7 +46,7 @@ with demo:
46
  search_bar, columns_checkboxes, leaderboard_table = (
47
  create_leaderboard_table(open_llm_perf_df)
48
  )
49
- if config.hardware_type != "intel": # TODO intel CPU does not measure the memory requirements correctly, so disable the graph feature until we fix the underlying issue
50
  with gr.TabItem("Find Your Best Model 🧭", id=1):
51
  lat_score_mem_plot = create_lat_score_mem_plot(open_llm_perf_df)
52
  ###################### ATTENTIONS SPEEDUP TAB #######################
 
37
  optimization_checkboxes,
38
  quantization_checkboxes,
39
  kernels_checkboxes,
40
+ ) = create_control_panel(machine=config.machine, subsets=config.subsets, hardware_provider=config.hardware_provider)
41
  ####################### HARDWARE SUBTABS #######################
42
  with gr.Tabs(elem_classes="subtabs"):
43
  open_llm_perf_df = get_llm_perf_df(machine=config.machine, subsets=config.subsets)
 
46
  search_bar, columns_checkboxes, leaderboard_table = (
47
  create_leaderboard_table(open_llm_perf_df)
48
  )
49
+ if config.hardware_provider != "intel": # TODO intel CPU does not measure the memory requirements correctly, so disable the graph feature until we fix the underlying issue
50
  with gr.TabItem("Find Your Best Model 🧭", id=1):
51
  lat_score_mem_plot = create_lat_score_mem_plot(open_llm_perf_df)
52
  ###################### ATTENTIONS SPEEDUP TAB #######################
hardware.yml CHANGED
@@ -1,6 +1,7 @@
1
  - machine: 1xA10
2
  description: A10-24GB-150W 🖥️
3
- hardware_type: cuda
 
4
  subsets:
5
  - unquantized
6
  - awq
@@ -11,7 +12,8 @@
11
 
12
  - machine: 1xA100
13
  description: A100-80GB-275W 🖥️
14
- hardware_type: cuda
 
15
  subsets:
16
  - unquantized
17
  - awq
@@ -22,7 +24,8 @@
22
 
23
  - machine: 1xT4
24
  description: T4-16GB-70W 🖥️
25
- hardware_type: cuda
 
26
  subsets:
27
  - unquantized
28
  - awq
@@ -33,7 +36,8 @@
33
 
34
  - machine: c7i
35
  description: 4th-Gen-Intel-Xeon-385W 🖥️
36
- hardware_type: intel
 
37
  subsets:
38
  - unquantized
39
  backends:
 
1
  - machine: 1xA10
2
  description: A10-24GB-150W 🖥️
3
+ hardware_provider: nvidia
4
+ hardware_type: gpu
5
  subsets:
6
  - unquantized
7
  - awq
 
12
 
13
  - machine: 1xA100
14
  description: A100-80GB-275W 🖥️
15
+ hardware_provider: nvidia
16
+ hardware_type: gpu
17
  subsets:
18
  - unquantized
19
  - awq
 
24
 
25
  - machine: 1xT4
26
  description: T4-16GB-70W 🖥️
27
+ hardware_provider: nvidia
28
+ hardware_type: gpu
29
  subsets:
30
  - unquantized
31
  - awq
 
36
 
37
  - machine: c7i
38
  description: 4th-Gen-Intel-Xeon-385W 🖥️
39
+ hardware_provider: intel
40
+ hardware_type: cpu
41
  subsets:
42
  - unquantized
43
  backends:
src/hardware.py CHANGED
@@ -7,6 +7,7 @@ class HardwareConfig:
7
  def __init__(self, data: Dict[str, Any]):
8
  self.machine = data["machine"]
9
  self.description = data["description"]
 
10
  self.hardware_type = data["hardware_type"]
11
  self.subsets = data["subsets"]
12
  self.backends = data["backends"]
@@ -14,7 +15,7 @@ class HardwareConfig:
14
  def __repr__(self):
15
  return (
16
  f"HardwareConfig(machine='{self.machine}', description='{self.description}', "
17
- f"hardware_type={self.hardware_type}, subsets={self.subsets}, backends={self.backends})"
18
  )
19
 
20
 
 
7
  def __init__(self, data: Dict[str, Any]):
8
  self.machine = data["machine"]
9
  self.description = data["description"]
10
+ self.hardware_provider = data["hardware_provider"]
11
  self.hardware_type = data["hardware_type"]
12
  self.subsets = data["subsets"]
13
  self.backends = data["backends"]
 
15
  def __repr__(self):
16
  return (
17
  f"HardwareConfig(machine='{self.machine}', description='{self.description}', "
18
+ f"hardware_provider={self.hardware_provider}, hardware_type={self.hardware_type}, subsets={self.subsets}, backends={self.backends})"
19
  )
20
 
21
 
src/panel.py CHANGED
@@ -10,14 +10,14 @@ from src.llm_perf import get_llm_perf_df
10
  from src.map import get_lat_score_mem_fig
11
 
12
 
13
- def create_control_panel(machine: str, subsets: List[str], hardware_type: str):
14
  # controls
15
  machine_textbox = gr.Textbox(value=machine, visible=False)
16
  subsets_values = gr.State(value=subsets)
17
 
18
 
19
- match hardware_type:
20
- case "cuda":
21
  backends = ["pytorch"]
22
  attention_implementations = ["Eager", "SDPA", "FAv2"]
23
  quantizations = ["Unquantized", "BnB.4bit", "BnB.8bit", "AWQ.4bit", "GPTQ.4bit"]
@@ -28,7 +28,7 @@ def create_control_panel(machine: str, subsets: List[str], hardware_type: str):
28
  quantizations = ["Unquantized"]
29
  kernels = ["No Kernel"]
30
  case _:
31
- raise ValueError(f"Unknown hardware type: {hardware_type}")
32
 
33
 
34
  with gr.Accordion("Control Panel 🎛️", open=False, elem_id="control-panel"):
 
10
  from src.map import get_lat_score_mem_fig
11
 
12
 
13
+ def create_control_panel(machine: str, subsets: List[str], hardware_provider: str):
14
  # controls
15
  machine_textbox = gr.Textbox(value=machine, visible=False)
16
  subsets_values = gr.State(value=subsets)
17
 
18
 
19
+ match hardware_provider:
20
+ case "nvidia":
21
  backends = ["pytorch"]
22
  attention_implementations = ["Eager", "SDPA", "FAv2"]
23
  quantizations = ["Unquantized", "BnB.4bit", "BnB.8bit", "AWQ.4bit", "GPTQ.4bit"]
 
28
  quantizations = ["Unquantized"]
29
  kernels = ["No Kernel"]
30
  case _:
31
+ raise ValueError(f"Unknown hardware provider: {hardware_provider}")
32
 
33
 
34
  with gr.Accordion("Control Panel 🎛️", open=False, elem_id="control-panel"):