File size: 703 Bytes
10318fd
 
 
 
 
f011c00
 
 
 
 
 
 
 
 
a02734e
 
 
 
 
 
 
 
f011c00
10318fd
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
"""Module containing performance results for the Virtuoso-Small model."""

# Performance record for the Virtuoso-Small model. Every value below,
# including the tokens-per-second figures, is stored as a string.
results_virtuoso_small = dict(
    name="Virtuoso-Small",
    modelType="Qwen2.5 14B",
    configurations=[
        # Unquantized entry measured with the LMI + vLLM container.
        dict(
            instanceType="g6e.48xlarge",
            quantization="none",
            container="LMI 0.30+vLLM 0.6.2",
            status="OK",
            tokensPerSecond="78",
            notes="",
        ),
        # Q4_0 (repacked) entry measured with the llama.cpp container.
        dict(
            instanceType="r8g.8xlarge",
            quantization="Q4_0 (repacked)",
            container="llama.cpp 1/17/25",
            status="OK",
            tokensPerSecond="32",
            notes="with Flash Attention",
        ),
    ],
)