{
  "version": "2026-04-04",
  "count": 109,
  "methodology": "Q4_K_M quantization, 256-token input, 512-token output, 3 runs averaged, freshly booted system",
  "reference_hardware": "M5 Max 128GB Unified Memory",
  "benchmarks": [
    {
      "model": "Phi-4 Mini",
      "params": "3.8B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 142,
      "ttft": 0.3,
      "date": "2026-03"
    },
    {
      "model": "Phi-4 Mini",
      "params": "3.8B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "Ollama",
      "tps": 108,
      "ttft": 0.4,
      "date": "2026-03"
    },
    {
      "model": "Phi-4 Mini",
      "params": "3.8B",
      "quant": "Q4_K_M",
      "chip": "M3",
      "ram": 16,
      "engine": "MLX",
      "tps": 95,
      "ttft": 0.3,
      "date": "2026-02"
    },
    {
      "model": "Phi-4 Mini",
      "params": "3.8B",
      "quant": "Q4_K_M",
      "chip": "M2",
      "ram": 8,
      "engine": "Ollama",
      "tps": 72,
      "ttft": 0.5,
      "date": "2026-01"
    },
    {
      "model": "Phi-4 Mini",
      "params": "3.8B",
      "quant": "Q4_K_M",
      "chip": "M1",
      "ram": 16,
      "engine": "Ollama",
      "tps": 58,
      "ttft": 0.6,
      "date": "2025-12"
    },
    {
      "model": "Qwen 3.5 4B",
      "params": "4B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "MLX",
      "tps": 148,
      "ttft": 0.2,
      "date": "2026-03"
    },
    {
      "model": "Qwen 3.5 4B",
      "params": "4B",
      "quant": "Q4_K_M",
      "chip": "M4",
      "ram": 16,
      "engine": "Ollama",
      "tps": 92,
      "ttft": 0.4,
      "date": "2026-02"
    },
    {
      "model": "Qwen 3 4B",
      "params": "4B",
      "quant": "Q4_K_M",
      "chip": "M2",
      "ram": 8,
      "engine": "Ollama",
      "tps": 52,
      "ttft": 0.7,
      "date": "2026-01"
    },
    {
      "model": "Qwen 3 4B",
      "params": "4B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "MLX",
      "tps": 118,
      "ttft": 0.3,
      "date": "2026-02"
    },
    {
      "model": "Gemma 4 E2B",
      "params": "2.3B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "MLX",
      "tps": 158,
      "ttft": 0.1,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 E2B",
      "params": "2.3B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "Ollama",
      "tps": 95,
      "ttft": 0.2,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 E2B",
      "params": "2.3B",
      "quant": "Q4_K_M",
      "chip": "M3",
      "ram": 16,
      "engine": "Ollama",
      "tps": 82,
      "ttft": 0.3,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 E2B",
      "params": "2.3B",
      "quant": "Q4_K_M",
      "chip": "M1",
      "ram": 8,
      "engine": "Ollama",
      "tps": 58,
      "ttft": 0.5,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 E4B",
      "params": "4B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "MLX",
      "tps": 128,
      "ttft": 0.2,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 E4B",
      "params": "4B",
      "quant": "Q4_K_M",
      "chip": "M5 Pro",
      "ram": 24,
      "engine": "Ollama",
      "tps": 92,
      "ttft": 0.3,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 E4B",
      "params": "4B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "MLX",
      "tps": 78,
      "ttft": 0.3,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 E4B",
      "params": "4B",
      "quant": "Q4_K_M",
      "chip": "M3",
      "ram": 16,
      "engine": "Ollama",
      "tps": 62,
      "ttft": 0.4,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 E4B",
      "params": "4B",
      "quant": "Q4_K_M",
      "chip": "M1",
      "ram": 8,
      "engine": "Ollama",
      "tps": 42,
      "ttft": 0.6,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 26B-A4B",
      "params": "26B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "MLX",
      "tps": 50,
      "ttft": 0.5,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 26B-A4B",
      "params": "26B",
      "quant": "Q4_K_M",
      "chip": "M5 Pro",
      "ram": 24,
      "engine": "Ollama",
      "tps": 35,
      "ttft": 0.8,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 26B-A4B",
      "params": "26B",
      "quant": "Q4_K_M",
      "chip": "M4 Max",
      "ram": 48,
      "engine": "MLX",
      "tps": 40,
      "ttft": 0.7,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 26B-A4B",
      "params": "26B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "Ollama",
      "tps": 28,
      "ttft": 1.0,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 31B",
      "params": "31B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "MLX",
      "tps": 26,
      "ttft": 0.7,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 31B",
      "params": "31B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 22,
      "ttft": 0.9,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 31B",
      "params": "31B",
      "quant": "Q4_K_M",
      "chip": "M4 Max",
      "ram": 48,
      "engine": "MLX",
      "tps": 18,
      "ttft": 1.1,
      "date": "2026-04"
    },
    {
      "model": "Gemma 4 31B",
      "params": "31B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "Ollama",
      "tps": 14,
      "ttft": 1.4,
      "date": "2026-04"
    },
    {
      "model": "Gemma 3 4B",
      "params": "4B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 132,
      "ttft": 0.3,
      "date": "2026-03"
    },
    {
      "model": "Gemma 3 4B",
      "params": "4B",
      "quant": "Q4_K_M",
      "chip": "M1",
      "ram": 8,
      "engine": "Ollama",
      "tps": 48,
      "ttft": 0.8,
      "date": "2025-12"
    },
    {
      "model": "Gemma 3 4B",
      "params": "4B",
      "quant": "Q4_K_M",
      "chip": "M3 Pro",
      "ram": 18,
      "engine": "MLX",
      "tps": 88,
      "ttft": 0.4,
      "date": "2026-01"
    },
    {
      "model": "Qwen 3.5 9B",
      "params": "9B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 105,
      "ttft": 0.5,
      "date": "2026-03"
    },
    {
      "model": "Qwen 3.5 9B",
      "params": "9B",
      "quant": "Q4_K_M",
      "chip": "M4",
      "ram": 16,
      "engine": "LM Studio",
      "tps": 72,
      "ttft": 0.6,
      "date": "2026-02"
    },
    {
      "model": "Qwen 3.5 9B",
      "params": "9B",
      "quant": "Q4_K_M",
      "chip": "M3",
      "ram": 16,
      "engine": "Ollama",
      "tps": 58,
      "ttft": 0.7,
      "date": "2026-01"
    },
    {
      "model": "Qwen 3.5 9B",
      "params": "9B",
      "quant": "Q4_K_M",
      "chip": "M1",
      "ram": 16,
      "engine": "Ollama",
      "tps": 35,
      "ttft": 1.1,
      "date": "2025-12"
    },
    {
      "model": "Qwen 3 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "Ollama",
      "tps": 98,
      "ttft": 0.4,
      "date": "2026-03"
    },
    {
      "model": "Qwen 3 8B",
      "params": "8B",
      "quant": "Q8_0",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "MLX",
      "tps": 68,
      "ttft": 0.5,
      "date": "2026-02"
    },
    {
      "model": "Qwen 3 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M2",
      "ram": 16,
      "engine": "Ollama",
      "tps": 55,
      "ttft": 0.7,
      "date": "2026-01"
    },
    {
      "model": "DeepSeek R1 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 97,
      "ttft": 0.5,
      "date": "2026-03"
    },
    {
      "model": "DeepSeek R1 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M4",
      "ram": 16,
      "engine": "MLX",
      "tps": 78,
      "ttft": 0.5,
      "date": "2026-02"
    },
    {
      "model": "DeepSeek R1 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M2",
      "ram": 16,
      "engine": "Ollama",
      "tps": 58,
      "ttft": 0.8,
      "date": "2026-01"
    },
    {
      "model": "DeepSeek R1 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M1",
      "ram": 16,
      "engine": "Ollama",
      "tps": 38,
      "ttft": 1.2,
      "date": "2025-11"
    },
    {
      "model": "Mistral 7B",
      "params": "7B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 122,
      "ttft": 0.3,
      "date": "2026-03"
    },
    {
      "model": "Mistral 7B",
      "params": "7B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "MLX",
      "tps": 98,
      "ttft": 0.4,
      "date": "2026-02"
    },
    {
      "model": "Mistral 7B",
      "params": "7B",
      "quant": "Q4_K_M",
      "chip": "M3",
      "ram": 16,
      "engine": "Ollama",
      "tps": 62,
      "ttft": 0.6,
      "date": "2026-01"
    },
    {
      "model": "Mistral 7B",
      "params": "7B",
      "quant": "Q4_K_M",
      "chip": "M1",
      "ram": 16,
      "engine": "Ollama",
      "tps": 42,
      "ttft": 1.2,
      "date": "2025-12"
    },
    {
      "model": "Llama 3.1 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "MLX",
      "tps": 138,
      "ttft": 0.3,
      "date": "2026-03"
    },
    {
      "model": "Llama 3.1 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M4",
      "ram": 16,
      "engine": "Ollama",
      "tps": 75,
      "ttft": 0.6,
      "date": "2026-02"
    },
    {
      "model": "Llama 3.1 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M3 Pro",
      "ram": 18,
      "engine": "Ollama",
      "tps": 62,
      "ttft": 0.7,
      "date": "2026-01"
    },
    {
      "model": "Llama 3.1 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M1",
      "ram": 16,
      "engine": "Ollama",
      "tps": 40,
      "ttft": 1.1,
      "date": "2025-12"
    },
    {
      "model": "Ministral 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 98,
      "ttft": 0.4,
      "date": "2026-03"
    },
    {
      "model": "Ministral 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M3",
      "ram": 16,
      "engine": "LM Studio",
      "tps": 55,
      "ttft": 0.7,
      "date": "2026-01"
    },
    {
      "model": "Gemma 3 12B",
      "params": "12B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 68,
      "ttft": 0.6,
      "date": "2026-03"
    },
    {
      "model": "Gemma 3 12B",
      "params": "12B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "MLX",
      "tps": 52,
      "ttft": 0.7,
      "date": "2026-02"
    },
    {
      "model": "Gemma 3 12B",
      "params": "12B",
      "quant": "Q4_K_M",
      "chip": "M3",
      "ram": 16,
      "engine": "Ollama",
      "tps": 38,
      "ttft": 1.1,
      "date": "2026-01"
    },
    {
      "model": "Gemma 3 12B",
      "params": "12B",
      "quant": "Q4_K_M",
      "chip": "M2",
      "ram": 16,
      "engine": "Ollama",
      "tps": 32,
      "ttft": 1.3,
      "date": "2025-12"
    },
    {
      "model": "Qwen 3 14B",
      "params": "14B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 58,
      "ttft": 0.8,
      "date": "2026-03"
    },
    {
      "model": "Qwen 3 14B",
      "params": "14B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "LM Studio",
      "tps": 38,
      "ttft": 1.0,
      "date": "2026-02"
    },
    {
      "model": "Qwen 3 14B",
      "params": "14B",
      "quant": "Q4_K_M",
      "chip": "M3",
      "ram": 16,
      "engine": "Ollama",
      "tps": 30,
      "ttft": 1.2,
      "date": "2026-01"
    },
    {
      "model": "Phi-4 14B",
      "params": "14B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "MLX",
      "tps": 62,
      "ttft": 0.6,
      "date": "2026-03"
    },
    {
      "model": "Phi-4 14B",
      "params": "14B",
      "quant": "Q4_K_M",
      "chip": "M4",
      "ram": 16,
      "engine": "Ollama",
      "tps": 38,
      "ttft": 1.0,
      "date": "2026-02"
    },
    {
      "model": "Phi-4 14B",
      "params": "14B",
      "quant": "Q4_K_M",
      "chip": "M2",
      "ram": 16,
      "engine": "MLX",
      "tps": 28,
      "ttft": 1.3,
      "date": "2026-01"
    },
    {
      "model": "Ministral 14B",
      "params": "14B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 58,
      "ttft": 0.7,
      "date": "2026-03"
    },
    {
      "model": "Ministral 14B",
      "params": "14B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "Ollama",
      "tps": 40,
      "ttft": 0.9,
      "date": "2026-02"
    },
    {
      "model": "Gemma 3 27B",
      "params": "27B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 42,
      "ttft": 0.9,
      "date": "2026-03"
    },
    {
      "model": "Gemma 3 27B",
      "params": "27B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "LM Studio",
      "tps": 25,
      "ttft": 1.5,
      "date": "2026-02"
    },
    {
      "model": "Gemma 3 27B",
      "params": "27B",
      "quant": "Q4_K_M",
      "chip": "M4 Max",
      "ram": 48,
      "engine": "MLX",
      "tps": 35,
      "ttft": 1.1,
      "date": "2026-02"
    },
    {
      "model": "Qwen 3 30B-A3B",
      "params": "30B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 62,
      "ttft": 0.7,
      "date": "2026-03"
    },
    {
      "model": "Qwen 3 30B-A3B",
      "params": "30B",
      "quant": "Q4_K_M",
      "chip": "M4 Max",
      "ram": 48,
      "engine": "Ollama",
      "tps": 42,
      "ttft": 0.9,
      "date": "2026-02"
    },
    {
      "model": "Qwen 3 30B-A3B",
      "params": "30B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "MLX",
      "tps": 35,
      "ttft": 1.0,
      "date": "2026-02"
    },
    {
      "model": "Qwen 3 30B-A3B",
      "params": "30B",
      "quant": "Q4_K_M",
      "chip": "M3 Max",
      "ram": 36,
      "engine": "Ollama",
      "tps": 28,
      "ttft": 1.3,
      "date": "2026-01"
    },
    {
      "model": "Qwen 3.5 35B",
      "params": "35B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "MLX",
      "tps": 52,
      "ttft": 0.9,
      "date": "2026-03"
    },
    {
      "model": "Qwen 3.5 35B",
      "params": "35B",
      "quant": "Q4_K_M",
      "chip": "M4 Max",
      "ram": 48,
      "engine": "Ollama",
      "tps": 34,
      "ttft": 1.2,
      "date": "2026-02"
    },
    {
      "model": "Qwen 3.5 35B",
      "params": "35B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "Ollama",
      "tps": 48,
      "ttft": 0.9,
      "date": "2026-03"
    },
    {
      "model": "Qwen 3 32B",
      "params": "32B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "Ollama",
      "tps": 28,
      "ttft": 1.1,
      "date": "2026-03"
    },
    {
      "model": "Qwen 3 32B",
      "params": "32B",
      "quant": "Q4_K_M",
      "chip": "M4 Max",
      "ram": 64,
      "engine": "MLX",
      "tps": 22,
      "ttft": 1.4,
      "date": "2026-02"
    },
    {
      "model": "Qwen 3 32B",
      "params": "32B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 32,
      "engine": "Ollama",
      "tps": 15,
      "ttft": 1.8,
      "date": "2026-01"
    },
    {
      "model": "DeepSeek R1 32B",
      "params": "32B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 27,
      "ttft": 1.2,
      "date": "2026-03"
    },
    {
      "model": "DeepSeek R1 32B",
      "params": "32B",
      "quant": "Q4_K_M",
      "chip": "M4 Max",
      "ram": 48,
      "engine": "LM Studio",
      "tps": 18,
      "ttft": 1.8,
      "date": "2026-01"
    },
    {
      "model": "DeepSeek R1 32B",
      "params": "32B",
      "quant": "Q4_K_M",
      "chip": "M3 Max",
      "ram": 36,
      "engine": "Ollama",
      "tps": 14,
      "ttft": 2.0,
      "date": "2025-12"
    },
    {
      "model": "Llama 3.3 70B",
      "params": "70B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "Ollama",
      "tps": 12,
      "ttft": 2.8,
      "date": "2026-03"
    },
    {
      "model": "Llama 3.3 70B",
      "params": "70B",
      "quant": "Q4_K_M",
      "chip": "M4 Ultra",
      "ram": 192,
      "engine": "MLX",
      "tps": 18,
      "ttft": 2.0,
      "date": "2026-02"
    },
    {
      "model": "Llama 3.3 70B",
      "params": "70B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "MLX",
      "tps": 15,
      "ttft": 2.4,
      "date": "2026-03"
    },
    {
      "model": "DeepSeek R1 70B",
      "params": "70B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "Ollama",
      "tps": 11,
      "ttft": 3.0,
      "date": "2026-03"
    },
    {
      "model": "DeepSeek R1 70B",
      "params": "70B",
      "quant": "Q4_K_M",
      "chip": "M4 Ultra",
      "ram": 192,
      "engine": "MLX",
      "tps": 16,
      "ttft": 2.2,
      "date": "2026-02"
    },
    {
      "model": "Qwen 2.5 72B",
      "params": "72B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "Ollama",
      "tps": 10,
      "ttft": 3.2,
      "date": "2026-03"
    },
    {
      "model": "Qwen 2.5 72B",
      "params": "72B",
      "quant": "Q4_K_M",
      "chip": "M4 Ultra",
      "ram": 192,
      "engine": "Ollama",
      "tps": 15,
      "ttft": 2.5,
      "date": "2026-02"
    },
    {
      "model": "GPT-oss 120B",
      "params": "120B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "Ollama",
      "tps": 7,
      "ttft": 5.5,
      "date": "2026-03"
    },
    {
      "model": "GPT-oss 120B",
      "params": "120B",
      "quant": "Q4_K_M",
      "chip": "M4 Ultra",
      "ram": 192,
      "engine": "MLX",
      "tps": 10,
      "ttft": 4.2,
      "date": "2026-02"
    },
    {
      "model": "Llama 4 Scout",
      "params": "109B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "Ollama",
      "tps": 22,
      "ttft": 1.8,
      "date": "2026-03"
    },
    {
      "model": "Llama 4 Scout",
      "params": "109B",
      "quant": "Q4_K_M",
      "chip": "M4 Ultra",
      "ram": 192,
      "engine": "MLX",
      "tps": 30,
      "ttft": 1.3,
      "date": "2026-02"
    },
    {
      "model": "Llama 4 Scout",
      "params": "109B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "MLX",
      "tps": 26,
      "ttft": 1.5,
      "date": "2026-03"
    },
    {
      "model": "Mistral 7B",
      "params": "7B",
      "quant": "Q8_0",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "MLX",
      "tps": 88,
      "ttft": 0.4,
      "date": "2026-03"
    },
    {
      "model": "Mistral 7B",
      "params": "7B",
      "quant": "Q8_0",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "Ollama",
      "tps": 65,
      "ttft": 0.5,
      "date": "2026-02"
    },
    {
      "model": "Qwen 3.5 9B",
      "params": "9B",
      "quant": "Q8_0",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "MLX",
      "tps": 78,
      "ttft": 0.5,
      "date": "2026-03"
    },
    {
      "model": "Llama 3.1 8B",
      "params": "8B",
      "quant": "Q8_0",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 82,
      "ttft": 0.4,
      "date": "2026-03"
    },
    {
      "model": "Qwen 3 14B",
      "params": "14B",
      "quant": "Q8_0",
      "chip": "M5 Max",
      "ram": 128,
      "engine": "MLX",
      "tps": 42,
      "ttft": 0.9,
      "date": "2026-03"
    },
    {
      "model": "Phi-4 Mini",
      "params": "3.8B",
      "quant": "Q8_0",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "MLX",
      "tps": 112,
      "ttft": 0.3,
      "date": "2026-03"
    },
    {
      "model": "Phi-4 Mini",
      "params": "3.8B",
      "quant": "Q4_K_M",
      "chip": "M4 Max",
      "ram": 48,
      "engine": "MLX",
      "tps": 125,
      "ttft": 0.3,
      "date": "2026-02"
    },
    {
      "model": "Gemma 3 4B",
      "params": "4B",
      "quant": "Q8_0",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "MLX",
      "tps": 95,
      "ttft": 0.3,
      "date": "2026-02"
    },
    {
      "model": "Qwen 3.5 35B",
      "params": "35B",
      "quant": "Q4_K_M",
      "chip": "M3 Max",
      "ram": 96,
      "engine": "Ollama",
      "tps": 22,
      "ttft": 1.5,
      "date": "2026-01"
    },
    {
      "model": "DeepSeek R1 8B",
      "params": "8B",
      "quant": "Q8_0",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "MLX",
      "tps": 75,
      "ttft": 0.5,
      "date": "2026-03"
    },
    {
      "model": "Qwen 3 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "Ollama",
      "tps": 82,
      "ttft": 0.5,
      "date": "2026-02"
    },
    {
      "model": "Qwen 3 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M1",
      "ram": 16,
      "engine": "Ollama",
      "tps": 38,
      "ttft": 1.0,
      "date": "2025-12"
    },
    {
      "model": "Ministral 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M4",
      "ram": 16,
      "engine": "MLX",
      "tps": 72,
      "ttft": 0.5,
      "date": "2026-02"
    },
    {
      "model": "Ministral 14B",
      "params": "14B",
      "quant": "Q4_K_M",
      "chip": "M3",
      "ram": 16,
      "engine": "LM Studio",
      "tps": 30,
      "ttft": 1.2,
      "date": "2026-01"
    },
    {
      "model": "Gemma 3 27B",
      "params": "27B",
      "quant": "Q4_K_M",
      "chip": "M3 Max",
      "ram": 96,
      "engine": "MLX",
      "tps": 28,
      "ttft": 1.3,
      "date": "2026-01"
    },
    {
      "model": "Qwen 3 32B",
      "params": "32B",
      "quant": "Q4_K_M",
      "chip": "M4 Ultra",
      "ram": 192,
      "engine": "Ollama",
      "tps": 32,
      "ttft": 1.0,
      "date": "2026-02"
    },
    {
      "model": "Llama 3.1 8B",
      "params": "8B",
      "quant": "Q4_K_M",
      "chip": "M2",
      "ram": 8,
      "engine": "Ollama",
      "tps": 48,
      "ttft": 0.8,
      "date": "2025-12"
    },
    {
      "model": "Qwen 3.5 9B",
      "params": "9B",
      "quant": "Q4_K_M",
      "chip": "M4 Pro",
      "ram": 24,
      "engine": "MLX",
      "tps": 92,
      "ttft": 0.4,
      "date": "2026-03"
    },
    {
      "model": "Qwen 3 4B",
      "params": "4B",
      "quant": "Q4_K_M",
      "chip": "M5 Max",
      "ram": 64,
      "engine": "Ollama",
      "tps": 135,
      "ttft": 0.2,
      "date": "2026-03"
    }
  ]
}