237 lines
8.7 KiB
Plaintext
237 lines
8.7 KiB
Plaintext
Benchmark Run: 20250303_174821
|
||
Server: http://localhost:11434
|
||
|
||
CPU Information:
|
||
python_version: 3.10.16.final.0 (64 bit)
|
||
cpuinfo_version: [9, 0, 0]
|
||
cpuinfo_version_string: 9.0.0
|
||
arch: ARM_8
|
||
bits: 64
|
||
count: 10
|
||
arch_string_raw: arm64
|
||
brand_raw: Apple M1 Pro
|
||
|
||
Benchmark Results:
|
||
|
||
[38;5;147m[1m🏆 Final Model Leaderboard:[0m
|
||
|
||
[1m[38;5;221mqwen2.5-coder:7b-instruct-q4_K_M[0m
|
||
[1mOverall Success Rate:[0m 100.0% (72/72 cases)
|
||
[1mAverage Tokens/sec:[0m 19.33 (18.75 - 19.58)
|
||
[1mAverage Duration:[0m 17.32s
|
||
[1mMin/Max Avg Duration:[0m 8.67s / 17.99s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ✅ 18/18 cases (100.0%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ✅ 18/18 cases (100.0%)
|
||
- Anagram Check: ✅ 18/18 cases (100.0%)
|
||
|
||
[1m[38;5;221mfalcon3:10b[0m
|
||
[1mOverall Success Rate:[0m 100.0% (72/72 cases)
|
||
[1mAverage Tokens/sec:[0m 13.21 (12.53 - 13.31)
|
||
[1mAverage Duration:[0m 13.46s
|
||
[1mMin/Max Avg Duration:[0m 6.76s / 13.46s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ✅ 18/18 cases (100.0%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ✅ 18/18 cases (100.0%)
|
||
- Anagram Check: ✅ 18/18 cases (100.0%)
|
||
|
||
[1m[38;5;221mqwen2.5:14b[0m
|
||
[1mOverall Success Rate:[0m 100.0% (72/72 cases)
|
||
[1mAverage Tokens/sec:[0m 9.78 (9.78 - 9.88)
|
||
[1mAverage Duration:[0m 35.25s
|
||
[1mMin/Max Avg Duration:[0m 30.09s / 35.25s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ✅ 18/18 cases (100.0%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ✅ 18/18 cases (100.0%)
|
||
- Anagram Check: ✅ 18/18 cases (100.0%)
|
||
|
||
[1m[38;5;221mqwen2.5-coder:14b-instruct-q4_K_M[0m
|
||
[1mOverall Success Rate:[0m 100.0% (72/72 cases)
|
||
[1mAverage Tokens/sec:[0m 9.68 (9.65 - 9.88)
|
||
[1mAverage Duration:[0m 37.18s
|
||
[1mMin/Max Avg Duration:[0m 23.06s / 37.18s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ✅ 18/18 cases (100.0%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ✅ 18/18 cases (100.0%)
|
||
- Anagram Check: ✅ 18/18 cases (100.0%)
|
||
|
||
[1m[38;5;221mphi4:latest[0m
|
||
[1mOverall Success Rate:[0m 100.0% (72/72 cases)
|
||
[1mAverage Tokens/sec:[0m 9.01 (8.96 - 9.32)
|
||
[1mAverage Duration:[0m 23.44s
|
||
[1mMin/Max Avg Duration:[0m 23.44s / 38.82s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ✅ 18/18 cases (100.0%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ✅ 18/18 cases (100.0%)
|
||
- Anagram Check: ✅ 18/18 cases (100.0%)
|
||
|
||
[1m[38;5;221mdeepseek-r1:14b[0m
|
||
[1mOverall Success Rate:[0m 97.2% (70/72 cases)
|
||
[1mAverage Tokens/sec:[0m 9.05 (8.90 - 9.38)
|
||
[1mAverage Duration:[0m 278.32s
|
||
[1mMin/Max Avg Duration:[0m 174.30s / 482.10s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ✅ 18/18 cases (100.0%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ❌ 16/18 cases (88.9%)
|
||
- Anagram Check: ✅ 18/18 cases (100.0%)
|
||
|
||
[1m[38;5;221mllama3.2-vision:11b-instruct-q4_K_M[0m
|
||
[1mOverall Success Rate:[0m 95.8% (69/72 cases)
|
||
[1mAverage Tokens/sec:[0m 15.68 (14.92 - 15.92)
|
||
[1mAverage Duration:[0m 22.33s
|
||
[1mMin/Max Avg Duration:[0m 16.31s / 28.85s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ❌ 16/18 cases (88.9%)
|
||
- Binary Search: ❌ 17/18 cases (94.4%)
|
||
- Palindrome: ✅ 18/18 cases (100.0%)
|
||
- Anagram Check: ✅ 18/18 cases (100.0%)
|
||
|
||
[1m[38;5;221mllama3.2:3b[0m
|
||
[1mOverall Success Rate:[0m 94.4% (68/72 cases)
|
||
[1mAverage Tokens/sec:[0m 36.09 (30.85 - 37.53)
|
||
[1mAverage Duration:[0m 2.67s
|
||
[1mMin/Max Avg Duration:[0m 1.04s / 2.76s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ❌ 14/18 cases (77.8%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ✅ 18/18 cases (100.0%)
|
||
- Anagram Check: ✅ 18/18 cases (100.0%)
|
||
|
||
[1m[38;5;221mllama3.1:8b[0m
|
||
[1mOverall Success Rate:[0m 94.4% (68/72 cases)
|
||
[1mAverage Tokens/sec:[0m 17.92 (17.92 - 18.45)
|
||
[1mAverage Duration:[0m 18.04s
|
||
[1mMin/Max Avg Duration:[0m 14.68s / 19.56s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ❌ 14/18 cases (77.8%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ✅ 18/18 cases (100.0%)
|
||
- Anagram Check: ✅ 18/18 cases (100.0%)
|
||
|
||
[1m[38;5;221mhhao/qwen2.5-coder-tools:7b[0m
|
||
[1mOverall Success Rate:[0m 91.7% (66/72 cases)
|
||
[1mAverage Tokens/sec:[0m 17.75 (16.05 - 17.75)
|
||
[1mAverage Duration:[0m 9.35s
|
||
[1mMin/Max Avg Duration:[0m 4.17s / 9.35s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ❌ 12/18 cases (66.7%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ✅ 18/18 cases (100.0%)
|
||
- Anagram Check: ✅ 18/18 cases (100.0%)
|
||
|
||
[1m[38;5;221mQwen2.5-Coder-7B-Instruct-s1k:latest[0m
|
||
[1mOverall Success Rate:[0m 88.9% (64/72 cases)
|
||
[1mAverage Tokens/sec:[0m 18.38 (18.38 - 18.94)
|
||
[1mAverage Duration:[0m 9.95s
|
||
[1mMin/Max Avg Duration:[0m 9.06s / 12.91s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ❌ 16/18 cases (88.9%)
|
||
- Binary Search: ❌ 12/18 cases (66.7%)
|
||
- Palindrome: ✅ 18/18 cases (100.0%)
|
||
- Anagram Check: ✅ 18/18 cases (100.0%)
|
||
|
||
[1m[38;5;221mdeepseek-r1:8b[0m
|
||
[1mOverall Success Rate:[0m 86.1% (62/72 cases)
|
||
[1mAverage Tokens/sec:[0m 17.43 (17.29 - 18.01)
|
||
[1mAverage Duration:[0m 168.97s
|
||
[1mMin/Max Avg Duration:[0m 107.91s / 168.97s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ✅ 18/18 cases (100.0%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ❌ 16/18 cases (88.9%)
|
||
- Anagram Check: ❌ 10/18 cases (55.6%)
|
||
|
||
[1m[38;5;221mllama3.2:1b-instruct-q4_K_M[0m
|
||
[1mOverall Success Rate:[0m 81.9% (59/72 cases)
|
||
[1mAverage Tokens/sec:[0m 88.24 (88.24 - 88.93)
|
||
[1mAverage Duration:[0m 3.64s
|
||
[1mMin/Max Avg Duration:[0m 1.87s / 4.93s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ❌ 5/18 cases (27.8%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ✅ 18/18 cases (100.0%)
|
||
- Anagram Check: ✅ 18/18 cases (100.0%)
|
||
|
||
[1m[38;5;221msamantha-mistral:latest[0m
|
||
[1mOverall Success Rate:[0m 80.6% (58/72 cases)
|
||
[1mAverage Tokens/sec:[0m 23.92 (23.91 - 24.79)
|
||
[1mAverage Duration:[0m 12.21s
|
||
[1mMin/Max Avg Duration:[0m 7.59s / 12.21s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ❌ 8/18 cases (44.4%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ❌ 16/18 cases (88.9%)
|
||
- Anagram Check: ❌ 16/18 cases (88.9%)
|
||
|
||
[1m[38;5;221mmarco-o1:latest[0m
|
||
[1mOverall Success Rate:[0m 80.6% (58/72 cases)
|
||
[1mAverage Tokens/sec:[0m 19.19 (19.19 - 19.39)
|
||
[1mAverage Duration:[0m 41.14s
|
||
[1mMin/Max Avg Duration:[0m 33.28s / 51.50s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ✅ 18/18 cases (100.0%)
|
||
- Binary Search: ❌ 6/18 cases (33.3%)
|
||
- Palindrome: ✅ 18/18 cases (100.0%)
|
||
- Anagram Check: ❌ 16/18 cases (88.9%)
|
||
|
||
[1m[38;5;221mdeepseek-r1:7b[0m
|
||
[1mOverall Success Rate:[0m 80.6% (58/72 cases)
|
||
[1mAverage Tokens/sec:[0m 18.01 (18.01 - 19.07)
|
||
[1mAverage Duration:[0m 336.87s
|
||
[1mMin/Max Avg Duration:[0m 78.71s / 336.87s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ❌ 10/18 cases (55.6%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ❌ 12/18 cases (66.7%)
|
||
- Anagram Check: ✅ 18/18 cases (100.0%)
|
||
|
||
[1m[38;5;221mdeepseek-r1:1.5b-qwen-distill-q8_0[0m
|
||
[1mOverall Success Rate:[0m 52.8% (38/72 cases)
|
||
[1mAverage Tokens/sec:[0m 57.37 (53.88 - 59.60)
|
||
[1mAverage Duration:[0m 137.59s
|
||
[1mMin/Max Avg Duration:[0m 41.38s / 371.13s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ❌ 11/18 cases (61.1%)
|
||
- Binary Search: ❌ 12/18 cases (66.7%)
|
||
- Palindrome: ❌ 6/18 cases (33.3%)
|
||
- Anagram Check: ❌ 9/18 cases (50.0%)
|
||
|
||
[1m[38;5;221mopenthinker:7b[0m
|
||
[1mOverall Success Rate:[0m 47.2% (34/72 cases)
|
||
[1mAverage Tokens/sec:[0m 18.16 (17.98 - 18.29)
|
||
[1mAverage Duration:[0m 263.00s
|
||
[1mMin/Max Avg Duration:[0m 168.91s / 302.79s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ❌ 0/18 cases (0.0%)
|
||
- Binary Search: ✅ 18/18 cases (100.0%)
|
||
- Palindrome: ❌ 12/18 cases (66.7%)
|
||
- Anagram Check: ❌ 4/18 cases (22.2%)
|
||
|
||
[1m[38;5;221mwizard-vicuna-uncensored:latest[0m
|
||
[1mOverall Success Rate:[0m 9.7% (7/72 cases)
|
||
[1mAverage Tokens/sec:[0m 22.01 (22.01 - 24.42)
|
||
[1mAverage Duration:[0m 9.06s
|
||
[1mMin/Max Avg Duration:[0m 5.60s / 11.45s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ❌ 0/18 cases (0.0%)
|
||
- Binary Search: ❌ 0/18 cases (0.0%)
|
||
- Palindrome: ❌ 6/18 cases (33.3%)
|
||
- Anagram Check: ❌ 1/18 cases (5.6%)
|
||
|
||
[1m[38;5;221mmxbai-embed-large:latest[0m
|
||
[1mOverall Success Rate:[0m 0.0% (0/72 cases)
|
||
[1mAverage Tokens/sec:[0m 0.00 (0.00 - 0.00)
|
||
[1mAverage Duration:[0m 0.00s
|
||
[1mMin/Max Avg Duration:[0m 0.00s / 0.00s
|
||
[1mTest Results:[0m
|
||
- Fibonacci: ❌ 0/18 cases (0.0%)
|
||
- Binary Search: ❌ 0/18 cases (0.0%)
|
||
- Palindrome: ❌ 0/18 cases (0.0%)
|
||
- Anagram Check: ❌ 0/18 cases (0.0%)
|