Spaces:
Running
Running
Commit
·
39105fc
1
Parent(s):
d2401bd
add intel results to leaderboard
Browse files- app.py +2 -2
- hardware.yml +8 -4
- src/hardware.py +2 -1
- src/panel.py +4 -4
app.py
CHANGED
@@ -37,7 +37,7 @@ with demo:
|
|
37 |
optimization_checkboxes,
|
38 |
quantization_checkboxes,
|
39 |
kernels_checkboxes,
|
40 |
-
) = create_control_panel(machine=config.machine, subsets=config.subsets,
|
41 |
####################### HARDWARE SUBTABS #######################
|
42 |
with gr.Tabs(elem_classes="subtabs"):
|
43 |
open_llm_perf_df = get_llm_perf_df(machine=config.machine, subsets=config.subsets)
|
@@ -46,7 +46,7 @@ with demo:
|
|
46 |
search_bar, columns_checkboxes, leaderboard_table = (
|
47 |
create_leaderboard_table(open_llm_perf_df)
|
48 |
)
|
49 |
-
if config.
|
50 |
with gr.TabItem("Find Your Best Model 🧭", id=1):
|
51 |
lat_score_mem_plot = create_lat_score_mem_plot(open_llm_perf_df)
|
52 |
###################### ATTENTIONS SPEEDUP TAB #######################
|
|
|
37 |
optimization_checkboxes,
|
38 |
quantization_checkboxes,
|
39 |
kernels_checkboxes,
|
40 |
+
) = create_control_panel(machine=config.machine, subsets=config.subsets, hardware_provider=config.hardware_provider)
|
41 |
####################### HARDWARE SUBTABS #######################
|
42 |
with gr.Tabs(elem_classes="subtabs"):
|
43 |
open_llm_perf_df = get_llm_perf_df(machine=config.machine, subsets=config.subsets)
|
|
|
46 |
search_bar, columns_checkboxes, leaderboard_table = (
|
47 |
create_leaderboard_table(open_llm_perf_df)
|
48 |
)
|
49 |
+
if config.hardware_provider != "intel": # TODO intel CPU does not measure the memory requirements correctly, so disable the graph feature until we fix the underlying issue
|
50 |
with gr.TabItem("Find Your Best Model 🧭", id=1):
|
51 |
lat_score_mem_plot = create_lat_score_mem_plot(open_llm_perf_df)
|
52 |
###################### ATTENTIONS SPEEDUP TAB #######################
|
hardware.yml
CHANGED
@@ -1,6 +1,7 @@
|
|
1 |
- machine: 1xA10
|
2 |
description: A10-24GB-150W 🖥️
|
3 |
-
|
|
|
4 |
subsets:
|
5 |
- unquantized
|
6 |
- awq
|
@@ -11,7 +12,8 @@
|
|
11 |
|
12 |
- machine: 1xA100
|
13 |
description: A100-80GB-275W 🖥️
|
14 |
-
|
|
|
15 |
subsets:
|
16 |
- unquantized
|
17 |
- awq
|
@@ -22,7 +24,8 @@
|
|
22 |
|
23 |
- machine: 1xT4
|
24 |
description: T4-16GB-70W 🖥️
|
25 |
-
|
|
|
26 |
subsets:
|
27 |
- unquantized
|
28 |
- awq
|
@@ -33,7 +36,8 @@
|
|
33 |
|
34 |
- machine: c7i
|
35 |
description: 4th-Gen-Intel-Xeon-385W 🖥️
|
36 |
-
|
|
|
37 |
subsets:
|
38 |
- unquantized
|
39 |
backends:
|
|
|
1 |
- machine: 1xA10
|
2 |
description: A10-24GB-150W 🖥️
|
3 |
+
hardware_provider: nvidia
|
4 |
+
hardware_type: gpu
|
5 |
subsets:
|
6 |
- unquantized
|
7 |
- awq
|
|
|
12 |
|
13 |
- machine: 1xA100
|
14 |
description: A100-80GB-275W 🖥️
|
15 |
+
hardware_provider: nvidia
|
16 |
+
hardware_type: gpu
|
17 |
subsets:
|
18 |
- unquantized
|
19 |
- awq
|
|
|
24 |
|
25 |
- machine: 1xT4
|
26 |
description: T4-16GB-70W 🖥️
|
27 |
+
hardware_provider: nvidia
|
28 |
+
hardware_type: gpu
|
29 |
subsets:
|
30 |
- unquantized
|
31 |
- awq
|
|
|
36 |
|
37 |
- machine: c7i
|
38 |
description: 4th-Gen-Intel-Xeon-385W 🖥️
|
39 |
+
hardware_provider: intel
|
40 |
+
hardware_type: cpu
|
41 |
subsets:
|
42 |
- unquantized
|
43 |
backends:
|
src/hardware.py
CHANGED
@@ -7,6 +7,7 @@ class HardwareConfig:
|
|
7 |
def __init__(self, data: Dict[str, Any]):
|
8 |
self.machine = data["machine"]
|
9 |
self.description = data["description"]
|
|
|
10 |
self.hardware_type = data["hardware_type"]
|
11 |
self.subsets = data["subsets"]
|
12 |
self.backends = data["backends"]
|
@@ -14,7 +15,7 @@ class HardwareConfig:
|
|
14 |
def __repr__(self):
|
15 |
return (
|
16 |
f"HardwareConfig(machine='{self.machine}', description='{self.description}', "
|
17 |
-
f"hardware_type={self.hardware_type}, subsets={self.subsets}, backends={self.backends})"
|
18 |
)
|
19 |
|
20 |
|
|
|
7 |
def __init__(self, data: Dict[str, Any]):
|
8 |
self.machine = data["machine"]
|
9 |
self.description = data["description"]
|
10 |
+
self.hardware_provider = data["hardware_provider"]
|
11 |
self.hardware_type = data["hardware_type"]
|
12 |
self.subsets = data["subsets"]
|
13 |
self.backends = data["backends"]
|
|
|
15 |
def __repr__(self):
|
16 |
return (
|
17 |
f"HardwareConfig(machine='{self.machine}', description='{self.description}', "
|
18 |
+
f"hardware_provider={self.hardware_provider}, hardware_type={self.hardware_type}, subsets={self.subsets}, backends={self.backends})"
|
19 |
)
|
20 |
|
21 |
|
src/panel.py
CHANGED
@@ -10,14 +10,14 @@ from src.llm_perf import get_llm_perf_df
|
|
10 |
from src.map import get_lat_score_mem_fig
|
11 |
|
12 |
|
13 |
-
def create_control_panel(machine: str, subsets: List[str], hardware_type: str):
|
14 |
# controls
|
15 |
machine_textbox = gr.Textbox(value=machine, visible=False)
|
16 |
subsets_values = gr.State(value=subsets)
|
17 |
|
18 |
|
19 |
-
match
|
20 |
-
case "
|
21 |
backends = ["pytorch"]
|
22 |
attention_implementations = ["Eager", "SDPA", "FAv2"]
|
23 |
quantizations = ["Unquantized", "BnB.4bit", "BnB.8bit", "AWQ.4bit", "GPTQ.4bit"]
|
@@ -28,7 +28,7 @@ def create_control_panel(machine: str, subsets: List[str], hardware_type: str):
|
|
28 |
quantizations = ["Unquantized"]
|
29 |
kernels = ["No Kernel"]
|
30 |
case _:
|
31 |
-
raise ValueError(f"Unknown hardware
|
32 |
|
33 |
|
34 |
with gr.Accordion("Control Panel 🎛️", open=False, elem_id="control-panel"):
|
|
|
10 |
from src.map import get_lat_score_mem_fig
|
11 |
|
12 |
|
13 |
+
def create_control_panel(machine: str, subsets: List[str], hardware_provider: str):
|
14 |
# controls
|
15 |
machine_textbox = gr.Textbox(value=machine, visible=False)
|
16 |
subsets_values = gr.State(value=subsets)
|
17 |
|
18 |
|
19 |
+
match hardware_provider:
|
20 |
+
case "nvidia":
|
21 |
backends = ["pytorch"]
|
22 |
attention_implementations = ["Eager", "SDPA", "FAv2"]
|
23 |
quantizations = ["Unquantized", "BnB.4bit", "BnB.8bit", "AWQ.4bit", "GPTQ.4bit"]
|
|
|
28 |
quantizations = ["Unquantized"]
|
29 |
kernels = ["No Kernel"]
|
30 |
case _:
|
31 |
+
raise ValueError(f"Unknown hardware provider: {hardware_provider}")
|
32 |
|
33 |
|
34 |
with gr.Accordion("Control Panel 🎛️", open=False, elem_id="control-panel"):
|