baptistecolle HF staff committed on
Commit
504caea
•
1 Parent(s): d7880b2

add documentation about the intel hardware

Browse files
Files changed (4) hide show
  1. app.py +6 -0
  2. hardware.yml +2 -0
  3. src/hardware.py +1 -0
  4. src/panel.py +12 -13
app.py CHANGED
@@ -25,6 +25,12 @@ with demo:
25
  with gr.Tabs(elem_classes="tabs"):
26
  for id, config in enumerate(configs):
27
  with gr.TabItem(config.description, id=id):
 
 
 
 
 
 
28
  # ####################### CONTROL PANEL #######################
29
  (
30
  filter_button,
 
25
  with gr.Tabs(elem_classes="tabs"):
26
  for id, config in enumerate(configs):
27
  with gr.TabItem(config.description, id=id):
28
+ ####################### HARDWARE DETAILS #######################
29
+ if config.detail:
30
+ gr.Markdown(config.detail, elem_classes="descriptive-text")
31
+
32
+
33
+
34
  # ####################### CONTROL PANEL #######################
35
  (
36
  filter_button,
hardware.yml CHANGED
@@ -36,6 +36,8 @@
36
 
37
  - machine: 32vCPU-C7i
38
  description: 4th-Gen-Intel-Xeon-385W 🖥️
 
 
39
  hardware_provider: intel
40
  hardware_type: cpu
41
  subsets:
 
36
 
37
  - machine: 32vCPU-C7i
38
  description: 4th-Gen-Intel-Xeon-385W 🖥️
39
+ detail: |
40
+ We tested the [32vCPU AWS C7i](https://aws.amazon.com/ec2/instance-types/c7i/) instance for the benchmark.
41
  hardware_provider: intel
42
  hardware_type: cpu
43
  subsets:
src/hardware.py CHANGED
@@ -11,6 +11,7 @@ class HardwareConfig:
11
  self.hardware_type = data["hardware_type"]
12
  self.subsets = data["subsets"]
13
  self.backends = data["backends"]
 
14
 
15
  def __repr__(self):
16
  return (
 
11
  self.hardware_type = data["hardware_type"]
12
  self.subsets = data["subsets"]
13
  self.backends = data["backends"]
14
+ self.detail = data.get("detail", None)
15
 
16
  def __repr__(self):
17
  return (
src/panel.py CHANGED
@@ -16,19 +16,18 @@ def create_control_panel(machine: str, subsets: List[str], hardware_provider: st
16
  subsets_values = gr.State(value=subsets)
17
 
18
 
19
- match hardware_provider:
20
- case "nvidia":
21
- backends = ["pytorch"]
22
- attention_implementations = ["Eager", "SDPA", "FAv2"]
23
- quantizations = ["Unquantized", "BnB.4bit", "BnB.8bit", "AWQ.4bit", "GPTQ.4bit"]
24
- kernels = ["No Kernel", "GPTQ.ExllamaV1", "GPTQ.ExllamaV2", "AWQ.GEMM", "AWQ.GEMV"]
25
- case "intel":
26
- backends = ["pytorch", "onnxruntime", "openvino"]
27
- attention_implementations = ["Eager"]
28
- quantizations = ["Unquantized"]
29
- kernels = ["No Kernel"]
30
- case _:
31
- raise ValueError(f"Unknown hardware provider: {hardware_provider}")
32
 
33
 
34
  with gr.Accordion("Control Panel 🎛️", open=False, elem_id="control-panel"):
 
16
  subsets_values = gr.State(value=subsets)
17
 
18
 
19
+ if hardware_provider == "nvidia":
20
+ backends = ["pytorch"]
21
+ attention_implementations = ["Eager", "SDPA", "FAv2"]
22
+ quantizations = ["Unquantized", "BnB.4bit", "BnB.8bit", "AWQ.4bit", "GPTQ.4bit"]
23
+ kernels = ["No Kernel", "GPTQ.ExllamaV1", "GPTQ.ExllamaV2", "AWQ.GEMM", "AWQ.GEMV"]
24
+ elif hardware_provider == "intel":
25
+ backends = ["pytorch", "onnxruntime", "openvino"]
26
+ attention_implementations = ["Eager"]
27
+ quantizations = ["Unquantized"]
28
+ kernels = ["No Kernel"]
29
+ else:
30
+ raise ValueError(f"Unknown hardware provider: {hardware_provider}")
 
31
 
32
 
33
  with gr.Accordion("Control Panel 🎛️", open=False, elem_id="control-panel"):