|
|
@@ -1,401 +1,89 @@
|
|
|
{
|
|
|
"all_metrics": {
|
|
|
- "codellama:13b-instruct-q5_K_M": {
|
|
|
- "avg_tok_per_sec": 4.1,
|
|
|
+ "deepseek-coder-v2": {
|
|
|
+ "avg_tok_per_sec": 19.8,
|
|
|
"category": "general",
|
|
|
- "coding_composite": 0.568,
|
|
|
- "coding_quality": 0.804,
|
|
|
- "general_composite": 0.508,
|
|
|
- "general_quality": 0.671,
|
|
|
- "latency_ms": 1126.4,
|
|
|
- "latency_score": 0.775,
|
|
|
- "toks_norm": 0.041
|
|
|
- },
|
|
|
- "codestral:22b-v0.1-q4_K_M": {
|
|
|
- "avg_tok_per_sec": 2.3,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.32,
|
|
|
- "coding_quality": 0.696,
|
|
|
- "general_composite": 0.406,
|
|
|
- "general_quality": 0.887,
|
|
|
- "latency_ms": 58429.3,
|
|
|
- "latency_score": 0,
|
|
|
- "toks_norm": 0.023
|
|
|
- },
|
|
|
- "deepseek-coder-v2:16b-lite-instruct-q4_K_M": {
|
|
|
- "avg_tok_per_sec": 21.3,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.618,
|
|
|
- "coding_quality": 0.855,
|
|
|
- "general_composite": 0.683,
|
|
|
- "general_quality": 1.0,
|
|
|
- "latency_ms": 1617.0,
|
|
|
- "latency_score": 0.677,
|
|
|
- "toks_norm": 0.213
|
|
|
- },
|
|
|
- "deepseek-r1:14b": {
|
|
|
- "avg_tok_per_sec": 6.4,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.519,
|
|
|
- "coding_quality": 0.853,
|
|
|
- "general_composite": 0.562,
|
|
|
+ "coding_composite": 0.602,
|
|
|
+ "coding_quality": 0.55,
|
|
|
+ "general_composite": 0.781,
|
|
|
"general_quality": 0.948,
|
|
|
- "latency_ms": 2677.7,
|
|
|
- "latency_score": 0.464,
|
|
|
- "toks_norm": 0.064
|
|
|
- },
|
|
|
- "dolphin-mixtral:8x7b": {
|
|
|
- "avg_tok_per_sec": 4.8,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.451,
|
|
|
- "coding_quality": 0.755,
|
|
|
- "general_composite": 0.437,
|
|
|
- "general_quality": 0.725,
|
|
|
- "latency_ms": 3065.7,
|
|
|
- "latency_score": 0.387,
|
|
|
- "toks_norm": 0.048
|
|
|
- },
|
|
|
- "gpt-oss:20b": {
|
|
|
- "avg_tok_per_sec": 10.3,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.471,
|
|
|
- "coding_quality": 0.978,
|
|
|
- "general_composite": 0.447,
|
|
|
- "general_quality": 0.925,
|
|
|
- "latency_ms": 8158.0,
|
|
|
- "latency_score": 0,
|
|
|
- "toks_norm": 0.103
|
|
|
- },
|
|
|
- "mistral:7b-instruct": {
|
|
|
- "avg_tok_per_sec": 12.1,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.417,
|
|
|
- "coding_quality": 0.846,
|
|
|
- "general_composite": 0.359,
|
|
|
- "general_quality": 0.717,
|
|
|
- "latency_ms": 6696.2,
|
|
|
- "latency_score": 0,
|
|
|
- "toks_norm": 0.121
|
|
|
- },
|
|
|
- "phi4:14b": {
|
|
|
- "avg_tok_per_sec": 6.6,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.457,
|
|
|
- "coding_quality": 0.904,
|
|
|
- "general_composite": 0.469,
|
|
|
- "general_quality": 0.931,
|
|
|
- "latency_ms": 4394.9,
|
|
|
- "latency_score": 0.121,
|
|
|
- "toks_norm": 0.066
|
|
|
+ "latency_ms": 1875.8,
|
|
|
+ "latency_score": 0.625,
|
|
|
+ "toks_norm": 0.661
|
|
|
},
|
|
|
- "qwen2.5-coder:14b-instruct-q4_K_M": {
|
|
|
- "avg_tok_per_sec": 4.9,
|
|
|
+ "llama3.2:3b": {
|
|
|
+ "avg_tok_per_sec": 21.8,
|
|
|
"category": "general",
|
|
|
- "coding_composite": 0.393,
|
|
|
- "coding_quality": 0.84,
|
|
|
- "general_composite": 0.396,
|
|
|
- "general_quality": 0.848,
|
|
|
- "latency_ms": 6865.3,
|
|
|
- "latency_score": 0,
|
|
|
- "toks_norm": 0.049
|
|
|
- },
|
|
|
- "qwen2.5-coder:7b-instruct-q4_K_M": {
|
|
|
- "avg_tok_per_sec": 11.5,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.593,
|
|
|
- "coding_quality": 0.83,
|
|
|
- "general_composite": 0.619,
|
|
|
- "general_quality": 0.887,
|
|
|
- "latency_ms": 1301.7,
|
|
|
- "latency_score": 0.74,
|
|
|
- "toks_norm": 0.115
|
|
|
- },
|
|
|
- "qwen2.5-coder:7b-instruct-q5_K_M": {
|
|
|
- "avg_tok_per_sec": 9.0,
|
|
|
+ "coding_composite": 0.748,
|
|
|
+ "coding_quality": 0.7,
|
|
|
+ "general_composite": 0.86,
|
|
|
+ "general_quality": 0.949,
|
|
|
+ "latency_ms": 697.1,
|
|
|
+ "latency_score": 0.861,
|
|
|
+ "toks_norm": 0.728
|
|
|
+ },
|
|
|
+ "qwen2.5-coder:7b": {
|
|
|
+ "avg_tok_per_sec": 12.3,
|
|
|
"category": "general",
|
|
|
- "coding_composite": 0.496,
|
|
|
- "coding_quality": 0.81,
|
|
|
- "general_composite": 0.548,
|
|
|
- "general_quality": 0.925,
|
|
|
- "latency_ms": 2900.9,
|
|
|
- "latency_score": 0.42,
|
|
|
- "toks_norm": 0.09
|
|
|
- },
|
|
|
- "qwen2.5-coder:7b-instruct-q6_K": {
|
|
|
- "avg_tok_per_sec": 5.9,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.536,
|
|
|
- "coding_quality": 0.832,
|
|
|
- "general_composite": 0.576,
|
|
|
- "general_quality": 0.919,
|
|
|
- "latency_ms": 2112.8,
|
|
|
- "latency_score": 0.577,
|
|
|
- "toks_norm": 0.059
|
|
|
- },
|
|
|
- "qwen3-coder-next:latest": {
|
|
|
- "avg_tok_per_sec": 4.6,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.444,
|
|
|
- "coding_quality": 0.785,
|
|
|
- "general_composite": 0.492,
|
|
|
- "general_quality": 0.892,
|
|
|
- "latency_ms": 3462.7,
|
|
|
- "latency_score": 0.307,
|
|
|
- "toks_norm": 0.046
|
|
|
- },
|
|
|
- "qwen3-coder:30b": {
|
|
|
- "avg_tok_per_sec": 7.9,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.584,
|
|
|
- "coding_quality": 0.885,
|
|
|
- "general_composite": 0.578,
|
|
|
- "general_quality": 0.872,
|
|
|
- "latency_ms": 1769.0,
|
|
|
- "latency_score": 0.646,
|
|
|
- "toks_norm": 0.079
|
|
|
- },
|
|
|
- "qwen3.5:35b": {
|
|
|
- "avg_tok_per_sec": 5.3,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.411,
|
|
|
- "coding_quality": 0.879,
|
|
|
- "general_composite": 0.466,
|
|
|
- "general_quality": 1.0,
|
|
|
- "latency_ms": 133176.0,
|
|
|
- "latency_score": 0,
|
|
|
- "toks_norm": 0.053
|
|
|
+ "coding_composite": 0.518,
|
|
|
+ "coding_quality": 0.6,
|
|
|
+ "general_composite": 0.65,
|
|
|
+ "general_quality": 0.895,
|
|
|
+ "latency_ms": 2501.0,
|
|
|
+ "latency_score": 0.5,
|
|
|
+ "toks_norm": 0.41
|
|
|
}
|
|
|
},
|
|
|
"coding_ranking": [],
|
|
|
"general_ranking": [
|
|
|
{
|
|
|
- "composite": 0.683,
|
|
|
+ "composite": 0.86,
|
|
|
"metrics": {
|
|
|
- "avg_tok_per_sec": 21.3,
|
|
|
+ "avg_tok_per_sec": 21.8,
|
|
|
"category": "general",
|
|
|
- "coding_composite": 0.618,
|
|
|
- "coding_quality": 0.855,
|
|
|
- "general_composite": 0.683,
|
|
|
- "general_quality": 1.0,
|
|
|
- "latency_ms": 1617.0,
|
|
|
- "latency_score": 0.677,
|
|
|
- "toks_norm": 0.213
|
|
|
+ "coding_composite": 0.748,
|
|
|
+ "coding_quality": 0.7,
|
|
|
+ "general_composite": 0.86,
|
|
|
+ "general_quality": 0.949,
|
|
|
+ "latency_ms": 697.1,
|
|
|
+ "latency_score": 0.861,
|
|
|
+ "toks_norm": 0.728
|
|
|
},
|
|
|
- "name": "deepseek-coder-v2:16b-lite-instruct-q4_K_M"
|
|
|
+ "name": "llama3.2:3b"
|
|
|
},
|
|
|
{
|
|
|
- "composite": 0.619,
|
|
|
+ "composite": 0.781,
|
|
|
"metrics": {
|
|
|
- "avg_tok_per_sec": 11.5,
|
|
|
+ "avg_tok_per_sec": 19.8,
|
|
|
"category": "general",
|
|
|
- "coding_composite": 0.593,
|
|
|
- "coding_quality": 0.83,
|
|
|
- "general_composite": 0.619,
|
|
|
- "general_quality": 0.887,
|
|
|
- "latency_ms": 1301.7,
|
|
|
- "latency_score": 0.74,
|
|
|
- "toks_norm": 0.115
|
|
|
- },
|
|
|
- "name": "qwen2.5-coder:7b-instruct-q4_K_M"
|
|
|
- },
|
|
|
- {
|
|
|
- "composite": 0.578,
|
|
|
- "metrics": {
|
|
|
- "avg_tok_per_sec": 7.9,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.584,
|
|
|
- "coding_quality": 0.885,
|
|
|
- "general_composite": 0.578,
|
|
|
- "general_quality": 0.872,
|
|
|
- "latency_ms": 1769.0,
|
|
|
- "latency_score": 0.646,
|
|
|
- "toks_norm": 0.079
|
|
|
- },
|
|
|
- "name": "qwen3-coder:30b"
|
|
|
- },
|
|
|
- {
|
|
|
- "composite": 0.576,
|
|
|
- "metrics": {
|
|
|
- "avg_tok_per_sec": 5.9,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.536,
|
|
|
- "coding_quality": 0.832,
|
|
|
- "general_composite": 0.576,
|
|
|
- "general_quality": 0.919,
|
|
|
- "latency_ms": 2112.8,
|
|
|
- "latency_score": 0.577,
|
|
|
- "toks_norm": 0.059
|
|
|
- },
|
|
|
- "name": "qwen2.5-coder:7b-instruct-q6_K"
|
|
|
- },
|
|
|
- {
|
|
|
- "composite": 0.562,
|
|
|
- "metrics": {
|
|
|
- "avg_tok_per_sec": 6.4,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.519,
|
|
|
- "coding_quality": 0.853,
|
|
|
- "general_composite": 0.562,
|
|
|
+ "coding_composite": 0.602,
|
|
|
+ "coding_quality": 0.55,
|
|
|
+ "general_composite": 0.781,
|
|
|
"general_quality": 0.948,
|
|
|
- "latency_ms": 2677.7,
|
|
|
- "latency_score": 0.464,
|
|
|
- "toks_norm": 0.064
|
|
|
- },
|
|
|
- "name": "deepseek-r1:14b"
|
|
|
- },
|
|
|
- {
|
|
|
- "composite": 0.548,
|
|
|
- "metrics": {
|
|
|
- "avg_tok_per_sec": 9.0,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.496,
|
|
|
- "coding_quality": 0.81,
|
|
|
- "general_composite": 0.548,
|
|
|
- "general_quality": 0.925,
|
|
|
- "latency_ms": 2900.9,
|
|
|
- "latency_score": 0.42,
|
|
|
- "toks_norm": 0.09
|
|
|
- },
|
|
|
- "name": "qwen2.5-coder:7b-instruct-q5_K_M"
|
|
|
- },
|
|
|
- {
|
|
|
- "composite": 0.508,
|
|
|
- "metrics": {
|
|
|
- "avg_tok_per_sec": 4.1,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.568,
|
|
|
- "coding_quality": 0.804,
|
|
|
- "general_composite": 0.508,
|
|
|
- "general_quality": 0.671,
|
|
|
- "latency_ms": 1126.4,
|
|
|
- "latency_score": 0.775,
|
|
|
- "toks_norm": 0.041
|
|
|
- },
|
|
|
- "name": "codellama:13b-instruct-q5_K_M"
|
|
|
- },
|
|
|
- {
|
|
|
- "composite": 0.492,
|
|
|
- "metrics": {
|
|
|
- "avg_tok_per_sec": 4.6,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.444,
|
|
|
- "coding_quality": 0.785,
|
|
|
- "general_composite": 0.492,
|
|
|
- "general_quality": 0.892,
|
|
|
- "latency_ms": 3462.7,
|
|
|
- "latency_score": 0.307,
|
|
|
- "toks_norm": 0.046
|
|
|
- },
|
|
|
- "name": "qwen3-coder-next:latest"
|
|
|
- },
|
|
|
- {
|
|
|
- "composite": 0.469,
|
|
|
- "metrics": {
|
|
|
- "avg_tok_per_sec": 6.6,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.457,
|
|
|
- "coding_quality": 0.904,
|
|
|
- "general_composite": 0.469,
|
|
|
- "general_quality": 0.931,
|
|
|
- "latency_ms": 4394.9,
|
|
|
- "latency_score": 0.121,
|
|
|
- "toks_norm": 0.066
|
|
|
- },
|
|
|
- "name": "phi4:14b"
|
|
|
- },
|
|
|
- {
|
|
|
- "composite": 0.466,
|
|
|
- "metrics": {
|
|
|
- "avg_tok_per_sec": 5.3,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.411,
|
|
|
- "coding_quality": 0.879,
|
|
|
- "general_composite": 0.466,
|
|
|
- "general_quality": 1.0,
|
|
|
- "latency_ms": 133176.0,
|
|
|
- "latency_score": 0,
|
|
|
- "toks_norm": 0.053
|
|
|
- },
|
|
|
- "name": "qwen3.5:35b"
|
|
|
- },
|
|
|
- {
|
|
|
- "composite": 0.447,
|
|
|
- "metrics": {
|
|
|
- "avg_tok_per_sec": 10.3,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.471,
|
|
|
- "coding_quality": 0.978,
|
|
|
- "general_composite": 0.447,
|
|
|
- "general_quality": 0.925,
|
|
|
- "latency_ms": 8158.0,
|
|
|
- "latency_score": 0,
|
|
|
- "toks_norm": 0.103
|
|
|
- },
|
|
|
- "name": "gpt-oss:20b"
|
|
|
- },
|
|
|
- {
|
|
|
- "composite": 0.437,
|
|
|
- "metrics": {
|
|
|
- "avg_tok_per_sec": 4.8,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.451,
|
|
|
- "coding_quality": 0.755,
|
|
|
- "general_composite": 0.437,
|
|
|
- "general_quality": 0.725,
|
|
|
- "latency_ms": 3065.7,
|
|
|
- "latency_score": 0.387,
|
|
|
- "toks_norm": 0.048
|
|
|
- },
|
|
|
- "name": "dolphin-mixtral:8x7b"
|
|
|
- },
|
|
|
- {
|
|
|
- "composite": 0.406,
|
|
|
- "metrics": {
|
|
|
- "avg_tok_per_sec": 2.3,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.32,
|
|
|
- "coding_quality": 0.696,
|
|
|
- "general_composite": 0.406,
|
|
|
- "general_quality": 0.887,
|
|
|
- "latency_ms": 58429.3,
|
|
|
- "latency_score": 0,
|
|
|
- "toks_norm": 0.023
|
|
|
- },
|
|
|
- "name": "codestral:22b-v0.1-q4_K_M"
|
|
|
- },
|
|
|
- {
|
|
|
- "composite": 0.396,
|
|
|
- "metrics": {
|
|
|
- "avg_tok_per_sec": 4.9,
|
|
|
- "category": "general",
|
|
|
- "coding_composite": 0.393,
|
|
|
- "coding_quality": 0.84,
|
|
|
- "general_composite": 0.396,
|
|
|
- "general_quality": 0.848,
|
|
|
- "latency_ms": 6865.3,
|
|
|
- "latency_score": 0,
|
|
|
- "toks_norm": 0.049
|
|
|
+ "latency_ms": 1875.8,
|
|
|
+ "latency_score": 0.625,
|
|
|
+ "toks_norm": 0.661
|
|
|
},
|
|
|
- "name": "qwen2.5-coder:14b-instruct-q4_K_M"
|
|
|
+ "name": "deepseek-coder-v2"
|
|
|
},
|
|
|
{
|
|
|
- "composite": 0.359,
|
|
|
+ "composite": 0.65,
|
|
|
"metrics": {
|
|
|
- "avg_tok_per_sec": 12.1,
|
|
|
+ "avg_tok_per_sec": 12.3,
|
|
|
"category": "general",
|
|
|
- "coding_composite": 0.417,
|
|
|
- "coding_quality": 0.846,
|
|
|
- "general_composite": 0.359,
|
|
|
- "general_quality": 0.717,
|
|
|
- "latency_ms": 6696.2,
|
|
|
- "latency_score": 0,
|
|
|
- "toks_norm": 0.121
|
|
|
+ "coding_composite": 0.518,
|
|
|
+ "coding_quality": 0.6,
|
|
|
+ "general_composite": 0.65,
|
|
|
+ "general_quality": 0.895,
|
|
|
+ "latency_ms": 2501.0,
|
|
|
+ "latency_score": 0.5,
|
|
|
+ "toks_norm": 0.41
|
|
|
},
|
|
|
- "name": "mistral:7b-instruct"
|
|
|
+ "name": "qwen2.5-coder:7b"
|
|
|
}
|
|
|
],
|
|
|
- "slot1_general": "deepseek-coder-v2:16b-lite-instruct-q4_K_M",
|
|
|
- "slot2_general": "qwen2.5-coder:7b-instruct-q4_K_M",
|
|
|
- "slot3_coding": "deepseek-coder-v2:16b-lite-instruct-q4_K_M",
|
|
|
+ "slot1_general": "llama3.2:3b",
|
|
|
+ "slot2_general": "deepseek-coder-v2",
|
|
|
+ "slot3_coding": "llama3.2:3b",
|
|
|
"slot4_coding": "none"
|
|
|
}
|