|
@@ -0,0 +1,401 @@
|
|
|
|
|
+{
|
|
|
|
|
+ "all_metrics": {
|
|
|
|
|
+ "codellama:13b-instruct-q5_K_M": {
|
|
|
|
|
+ "avg_tok_per_sec": 4.1,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.568,
|
|
|
|
|
+ "coding_quality": 0.804,
|
|
|
|
|
+ "general_composite": 0.508,
|
|
|
|
|
+ "general_quality": 0.671,
|
|
|
|
|
+ "latency_ms": 1126.4,
|
|
|
|
|
+ "latency_score": 0.775,
|
|
|
|
|
+ "toks_norm": 0.041
|
|
|
|
|
+ },
|
|
|
|
|
+ "codestral:22b-v0.1-q4_K_M": {
|
|
|
|
|
+ "avg_tok_per_sec": 2.3,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.32,
|
|
|
|
|
+ "coding_quality": 0.696,
|
|
|
|
|
+ "general_composite": 0.406,
|
|
|
|
|
+ "general_quality": 0.887,
|
|
|
|
|
+ "latency_ms": 58429.3,
|
|
|
|
|
+ "latency_score": 0,
|
|
|
|
|
+ "toks_norm": 0.023
|
|
|
|
|
+ },
|
|
|
|
|
+ "deepseek-coder-v2:16b-lite-instruct-q4_K_M": {
|
|
|
|
|
+ "avg_tok_per_sec": 21.3,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.618,
|
|
|
|
|
+ "coding_quality": 0.855,
|
|
|
|
|
+ "general_composite": 0.683,
|
|
|
|
|
+ "general_quality": 1.0,
|
|
|
|
|
+ "latency_ms": 1617.0,
|
|
|
|
|
+ "latency_score": 0.677,
|
|
|
|
|
+ "toks_norm": 0.213
|
|
|
|
|
+ },
|
|
|
|
|
+ "deepseek-r1:14b": {
|
|
|
|
|
+ "avg_tok_per_sec": 6.4,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.519,
|
|
|
|
|
+ "coding_quality": 0.853,
|
|
|
|
|
+ "general_composite": 0.562,
|
|
|
|
|
+ "general_quality": 0.948,
|
|
|
|
|
+ "latency_ms": 2677.7,
|
|
|
|
|
+ "latency_score": 0.464,
|
|
|
|
|
+ "toks_norm": 0.064
|
|
|
|
|
+ },
|
|
|
|
|
+ "dolphin-mixtral:8x7b": {
|
|
|
|
|
+ "avg_tok_per_sec": 4.8,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.451,
|
|
|
|
|
+ "coding_quality": 0.755,
|
|
|
|
|
+ "general_composite": 0.437,
|
|
|
|
|
+ "general_quality": 0.725,
|
|
|
|
|
+ "latency_ms": 3065.7,
|
|
|
|
|
+ "latency_score": 0.387,
|
|
|
|
|
+ "toks_norm": 0.048
|
|
|
|
|
+ },
|
|
|
|
|
+ "gpt-oss:20b": {
|
|
|
|
|
+ "avg_tok_per_sec": 10.3,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.471,
|
|
|
|
|
+ "coding_quality": 0.978,
|
|
|
|
|
+ "general_composite": 0.447,
|
|
|
|
|
+ "general_quality": 0.925,
|
|
|
|
|
+ "latency_ms": 8158.0,
|
|
|
|
|
+ "latency_score": 0,
|
|
|
|
|
+ "toks_norm": 0.103
|
|
|
|
|
+ },
|
|
|
|
|
+ "mistral:7b-instruct": {
|
|
|
|
|
+ "avg_tok_per_sec": 12.1,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.417,
|
|
|
|
|
+ "coding_quality": 0.846,
|
|
|
|
|
+ "general_composite": 0.359,
|
|
|
|
|
+ "general_quality": 0.717,
|
|
|
|
|
+ "latency_ms": 6696.2,
|
|
|
|
|
+ "latency_score": 0,
|
|
|
|
|
+ "toks_norm": 0.121
|
|
|
|
|
+ },
|
|
|
|
|
+ "phi4:14b": {
|
|
|
|
|
+ "avg_tok_per_sec": 6.6,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.457,
|
|
|
|
|
+ "coding_quality": 0.904,
|
|
|
|
|
+ "general_composite": 0.469,
|
|
|
|
|
+ "general_quality": 0.931,
|
|
|
|
|
+ "latency_ms": 4394.9,
|
|
|
|
|
+ "latency_score": 0.121,
|
|
|
|
|
+ "toks_norm": 0.066
|
|
|
|
|
+ },
|
|
|
|
|
+ "qwen2.5-coder:14b-instruct-q4_K_M": {
|
|
|
|
|
+ "avg_tok_per_sec": 4.9,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.393,
|
|
|
|
|
+ "coding_quality": 0.84,
|
|
|
|
|
+ "general_composite": 0.396,
|
|
|
|
|
+ "general_quality": 0.848,
|
|
|
|
|
+ "latency_ms": 6865.3,
|
|
|
|
|
+ "latency_score": 0,
|
|
|
|
|
+ "toks_norm": 0.049
|
|
|
|
|
+ },
|
|
|
|
|
+ "qwen2.5-coder:7b-instruct-q4_K_M": {
|
|
|
|
|
+ "avg_tok_per_sec": 11.5,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.593,
|
|
|
|
|
+ "coding_quality": 0.83,
|
|
|
|
|
+ "general_composite": 0.619,
|
|
|
|
|
+ "general_quality": 0.887,
|
|
|
|
|
+ "latency_ms": 1301.7,
|
|
|
|
|
+ "latency_score": 0.74,
|
|
|
|
|
+ "toks_norm": 0.115
|
|
|
|
|
+ },
|
|
|
|
|
+ "qwen2.5-coder:7b-instruct-q5_K_M": {
|
|
|
|
|
+ "avg_tok_per_sec": 9.0,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.496,
|
|
|
|
|
+ "coding_quality": 0.81,
|
|
|
|
|
+ "general_composite": 0.548,
|
|
|
|
|
+ "general_quality": 0.925,
|
|
|
|
|
+ "latency_ms": 2900.9,
|
|
|
|
|
+ "latency_score": 0.42,
|
|
|
|
|
+ "toks_norm": 0.09
|
|
|
|
|
+ },
|
|
|
|
|
+ "qwen2.5-coder:7b-instruct-q6_K": {
|
|
|
|
|
+ "avg_tok_per_sec": 5.9,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.536,
|
|
|
|
|
+ "coding_quality": 0.832,
|
|
|
|
|
+ "general_composite": 0.576,
|
|
|
|
|
+ "general_quality": 0.919,
|
|
|
|
|
+ "latency_ms": 2112.8,
|
|
|
|
|
+ "latency_score": 0.577,
|
|
|
|
|
+ "toks_norm": 0.059
|
|
|
|
|
+ },
|
|
|
|
|
+ "qwen3-coder-next:latest": {
|
|
|
|
|
+ "avg_tok_per_sec": 4.6,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.444,
|
|
|
|
|
+ "coding_quality": 0.785,
|
|
|
|
|
+ "general_composite": 0.492,
|
|
|
|
|
+ "general_quality": 0.892,
|
|
|
|
|
+ "latency_ms": 3462.7,
|
|
|
|
|
+ "latency_score": 0.307,
|
|
|
|
|
+ "toks_norm": 0.046
|
|
|
|
|
+ },
|
|
|
|
|
+ "qwen3-coder:30b": {
|
|
|
|
|
+ "avg_tok_per_sec": 7.9,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.584,
|
|
|
|
|
+ "coding_quality": 0.885,
|
|
|
|
|
+ "general_composite": 0.578,
|
|
|
|
|
+ "general_quality": 0.872,
|
|
|
|
|
+ "latency_ms": 1769.0,
|
|
|
|
|
+ "latency_score": 0.646,
|
|
|
|
|
+ "toks_norm": 0.079
|
|
|
|
|
+ },
|
|
|
|
|
+ "qwen3.5:35b": {
|
|
|
|
|
+ "avg_tok_per_sec": 5.3,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.411,
|
|
|
|
|
+ "coding_quality": 0.879,
|
|
|
|
|
+ "general_composite": 0.466,
|
|
|
|
|
+ "general_quality": 1.0,
|
|
|
|
|
+ "latency_ms": 133176.0,
|
|
|
|
|
+ "latency_score": 0,
|
|
|
|
|
+ "toks_norm": 0.053
|
|
|
|
|
+ }
|
|
|
|
|
+ },
|
|
|
|
|
+ "coding_ranking": [],
|
|
|
|
|
+ "general_ranking": [
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.683,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 21.3,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.618,
|
|
|
|
|
+ "coding_quality": 0.855,
|
|
|
|
|
+ "general_composite": 0.683,
|
|
|
|
|
+ "general_quality": 1.0,
|
|
|
|
|
+ "latency_ms": 1617.0,
|
|
|
|
|
+ "latency_score": 0.677,
|
|
|
|
|
+ "toks_norm": 0.213
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "deepseek-coder-v2:16b-lite-instruct-q4_K_M"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.619,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 11.5,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.593,
|
|
|
|
|
+ "coding_quality": 0.83,
|
|
|
|
|
+ "general_composite": 0.619,
|
|
|
|
|
+ "general_quality": 0.887,
|
|
|
|
|
+ "latency_ms": 1301.7,
|
|
|
|
|
+ "latency_score": 0.74,
|
|
|
|
|
+ "toks_norm": 0.115
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "qwen2.5-coder:7b-instruct-q4_K_M"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.578,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 7.9,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.584,
|
|
|
|
|
+ "coding_quality": 0.885,
|
|
|
|
|
+ "general_composite": 0.578,
|
|
|
|
|
+ "general_quality": 0.872,
|
|
|
|
|
+ "latency_ms": 1769.0,
|
|
|
|
|
+ "latency_score": 0.646,
|
|
|
|
|
+ "toks_norm": 0.079
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "qwen3-coder:30b"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.576,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 5.9,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.536,
|
|
|
|
|
+ "coding_quality": 0.832,
|
|
|
|
|
+ "general_composite": 0.576,
|
|
|
|
|
+ "general_quality": 0.919,
|
|
|
|
|
+ "latency_ms": 2112.8,
|
|
|
|
|
+ "latency_score": 0.577,
|
|
|
|
|
+ "toks_norm": 0.059
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "qwen2.5-coder:7b-instruct-q6_K"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.562,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 6.4,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.519,
|
|
|
|
|
+ "coding_quality": 0.853,
|
|
|
|
|
+ "general_composite": 0.562,
|
|
|
|
|
+ "general_quality": 0.948,
|
|
|
|
|
+ "latency_ms": 2677.7,
|
|
|
|
|
+ "latency_score": 0.464,
|
|
|
|
|
+ "toks_norm": 0.064
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "deepseek-r1:14b"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.548,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 9.0,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.496,
|
|
|
|
|
+ "coding_quality": 0.81,
|
|
|
|
|
+ "general_composite": 0.548,
|
|
|
|
|
+ "general_quality": 0.925,
|
|
|
|
|
+ "latency_ms": 2900.9,
|
|
|
|
|
+ "latency_score": 0.42,
|
|
|
|
|
+ "toks_norm": 0.09
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "qwen2.5-coder:7b-instruct-q5_K_M"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.508,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 4.1,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.568,
|
|
|
|
|
+ "coding_quality": 0.804,
|
|
|
|
|
+ "general_composite": 0.508,
|
|
|
|
|
+ "general_quality": 0.671,
|
|
|
|
|
+ "latency_ms": 1126.4,
|
|
|
|
|
+ "latency_score": 0.775,
|
|
|
|
|
+ "toks_norm": 0.041
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "codellama:13b-instruct-q5_K_M"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.492,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 4.6,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.444,
|
|
|
|
|
+ "coding_quality": 0.785,
|
|
|
|
|
+ "general_composite": 0.492,
|
|
|
|
|
+ "general_quality": 0.892,
|
|
|
|
|
+ "latency_ms": 3462.7,
|
|
|
|
|
+ "latency_score": 0.307,
|
|
|
|
|
+ "toks_norm": 0.046
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "qwen3-coder-next:latest"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.469,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 6.6,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.457,
|
|
|
|
|
+ "coding_quality": 0.904,
|
|
|
|
|
+ "general_composite": 0.469,
|
|
|
|
|
+ "general_quality": 0.931,
|
|
|
|
|
+ "latency_ms": 4394.9,
|
|
|
|
|
+ "latency_score": 0.121,
|
|
|
|
|
+ "toks_norm": 0.066
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "phi4:14b"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.466,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 5.3,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.411,
|
|
|
|
|
+ "coding_quality": 0.879,
|
|
|
|
|
+ "general_composite": 0.466,
|
|
|
|
|
+ "general_quality": 1.0,
|
|
|
|
|
+ "latency_ms": 133176.0,
|
|
|
|
|
+ "latency_score": 0,
|
|
|
|
|
+ "toks_norm": 0.053
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "qwen3.5:35b"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.447,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 10.3,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.471,
|
|
|
|
|
+ "coding_quality": 0.978,
|
|
|
|
|
+ "general_composite": 0.447,
|
|
|
|
|
+ "general_quality": 0.925,
|
|
|
|
|
+ "latency_ms": 8158.0,
|
|
|
|
|
+ "latency_score": 0,
|
|
|
|
|
+ "toks_norm": 0.103
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "gpt-oss:20b"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.437,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 4.8,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.451,
|
|
|
|
|
+ "coding_quality": 0.755,
|
|
|
|
|
+ "general_composite": 0.437,
|
|
|
|
|
+ "general_quality": 0.725,
|
|
|
|
|
+ "latency_ms": 3065.7,
|
|
|
|
|
+ "latency_score": 0.387,
|
|
|
|
|
+ "toks_norm": 0.048
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "dolphin-mixtral:8x7b"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.406,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 2.3,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.32,
|
|
|
|
|
+ "coding_quality": 0.696,
|
|
|
|
|
+ "general_composite": 0.406,
|
|
|
|
|
+ "general_quality": 0.887,
|
|
|
|
|
+ "latency_ms": 58429.3,
|
|
|
|
|
+ "latency_score": 0,
|
|
|
|
|
+ "toks_norm": 0.023
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "codestral:22b-v0.1-q4_K_M"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.396,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 4.9,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.393,
|
|
|
|
|
+ "coding_quality": 0.84,
|
|
|
|
|
+ "general_composite": 0.396,
|
|
|
|
|
+ "general_quality": 0.848,
|
|
|
|
|
+ "latency_ms": 6865.3,
|
|
|
|
|
+ "latency_score": 0,
|
|
|
|
|
+ "toks_norm": 0.049
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "qwen2.5-coder:14b-instruct-q4_K_M"
|
|
|
|
|
+ },
|
|
|
|
|
+ {
|
|
|
|
|
+ "composite": 0.359,
|
|
|
|
|
+ "metrics": {
|
|
|
|
|
+ "avg_tok_per_sec": 12.1,
|
|
|
|
|
+ "category": "general",
|
|
|
|
|
+ "coding_composite": 0.417,
|
|
|
|
|
+ "coding_quality": 0.846,
|
|
|
|
|
+ "general_composite": 0.359,
|
|
|
|
|
+ "general_quality": 0.717,
|
|
|
|
|
+ "latency_ms": 6696.2,
|
|
|
|
|
+ "latency_score": 0,
|
|
|
|
|
+ "toks_norm": 0.121
|
|
|
|
|
+ },
|
|
|
|
|
+ "name": "mistral:7b-instruct"
|
|
|
|
|
+ }
|
|
|
|
|
+ ],
|
|
|
|
|
+ "slot1_general": "deepseek-coder-v2:16b-lite-instruct-q4_K_M",
|
|
|
|
|
+ "slot2_general": "qwen2.5-coder:7b-instruct-q4_K_M",
|
|
|
|
|
+ "slot3_coding": "deepseek-coder-v2:16b-lite-instruct-q4_K_M",
|
|
|
|
|
+ "slot4_coding": "none"
|
|
|
|
|
+}
|