File size: 924 Bytes
e47d0b2
 
 
51a4daf
e47d0b2
 
 
 
 
 
 
 
 
 
 
51a4daf
e47d0b2
 
 
 
 
3795233
e47d0b2
 
 
 
 
 
51a4daf
e47d0b2
 
 
 
 
371c49c
e47d0b2
 
 
 
 
 
 
 
 
 
 
 
51a4daf
 
3795233
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
# Machine entry "1xA10": provider nvidia, hardware type cuda.
- machine: 1xA10
  # Display label; ends with the desktop-computer emoji (U+1F5A5 U+FE0F).
  # Save this file as UTF-8 so the emoji is not garbled again.
  description: A10-24GB-150W 🖥️
  hardware_provider: nvidia
  hardware_type: cuda
  # Subsets listed for this machine (presumably quantization schemes —
  # confirm against the consumer of this file).
  # NOTE(review): the 1xA100 and 1xT4 entries in this file also list
  # `torchao`; confirm that its absence here is intentional.
  subsets:
    - unquantized
    - awq
    - bnb
    - gptq
  # Backends listed for this machine.
  backends:
    - pytorch

# Machine entry "1xA100": provider nvidia, hardware type cuda.
- machine: 1xA100
  # Display label; ends with the desktop-computer emoji (U+1F5A5 U+FE0F).
  # Save this file as UTF-8 so the emoji is not garbled again.
  description: A100-80GB-275W 🖥️
  hardware_provider: nvidia
  hardware_type: cuda
  # Subsets listed for this machine (presumably quantization schemes —
  # confirm against the consumer of this file).
  subsets:
    - unquantized
    - awq
    - bnb
    - gptq
    - torchao
  # Backends listed for this machine.
  backends:
    - pytorch

# Machine entry "1xT4": provider nvidia, hardware type cuda.
- machine: 1xT4
  # Display label; ends with the desktop-computer emoji (U+1F5A5 U+FE0F).
  # Save this file as UTF-8 so the emoji is not garbled again.
  description: T4-16GB-70W 🖥️
  hardware_provider: nvidia
  hardware_type: cuda
  # Subsets listed for this machine (presumably quantization schemes —
  # confirm against the consumer of this file).
  subsets:
    - unquantized
    - awq
    - bnb
    - gptq
    - torchao
  # Backends listed for this machine.
  backends:
    - pytorch

# Machine entry "32vCPU-C7i": provider intel, hardware type cpu.
- machine: 32vCPU-C7i
  # Display label; ends with the desktop-computer emoji (U+1F5A5 U+FE0F).
  # Save this file as UTF-8 so the emoji is not garbled again.
  description: Intel-Xeon-SPR-385W 🖥️
  # Literal block scalar (`|`): the value is the Markdown line below followed
  # by a single trailing newline.
  detail: |
    We tested the [32vCPU AWS C7i](https://aws.amazon.com/ec2/instance-types/c7i/) instance for the benchmark.
  hardware_provider: intel
  hardware_type: cpu
  # Only the unquantized subset is listed for this machine.
  subsets:
    - unquantized
  # Backends listed for this machine.
  backends:
    - pytorch
    - openvino
    - onnxruntime