{
 "version": 1,
 "generated_at": "2026-06-09T22:12:37+00:00",
 "count": 83,
 "entries": [
  {
   "key": "qwen3-0.6b",
   "family": "llm",
   "name": "Qwen3 0.6B",
   "repo_id": "Qwen/Qwen3-0.6B",
   "params_b": 0.75,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Qwen3-0.6B-GGUF",
   "ollama_tag": "qwen3:0.6b",
   "good_for": "Quick simple chat and text tidy-up. Runs on almost anything.",
   "aliases": [
    "Qwen/Qwen3-0.6B-Base"
   ],
   "stale": false,
   "gated": false,
   "downloads_30d": 21649861,
   "arch": {
    "n_layers": 28,
    "hidden": 1024,
    "n_heads": 16,
    "n_kv_heads": 8
   },
   "context_len": 40960,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 0.64,
     "source_repo": "unsloth/Qwen3-0.6B-GGUF",
     "filename": "Qwen3-0.6B-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 0.5,
     "source_repo": "unsloth/Qwen3-0.6B-GGUF",
     "filename": "Qwen3-0.6B-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 0.44,
     "source_repo": "unsloth/Qwen3-0.6B-GGUF",
     "filename": "Qwen3-0.6B-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 0.4,
     "source_repo": "unsloth/Qwen3-0.6B-GGUF",
     "filename": "Qwen3-0.6B-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 0.37,
     "source_repo": "unsloth/Qwen3-0.6B-GGUF",
     "filename": "Qwen3-0.6B-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 0.35,
     "source_repo": "unsloth/Qwen3-0.6B-GGUF",
     "filename": "Qwen3-0.6B-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 0.3,
     "source_repo": "unsloth/Qwen3-0.6B-GGUF",
     "filename": "Qwen3-0.6B-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-0.6B",
    "gguf": "https://huggingface.co/unsloth/Qwen3-0.6B-GGUF",
    "ollama": "https://ollama.com/library/qwen3"
   },
   "run": {
    "ollama": "ollama run qwen3:0.6b",
    "llamacpp": "llama-server -hf unsloth/Qwen3-0.6B-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "qwen3-1.7b",
   "family": "llm",
   "name": "Qwen3 1.7B",
   "repo_id": "Qwen/Qwen3-1.7B",
   "params_b": 2.03,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Qwen3-1.7B-GGUF",
   "ollama_tag": "qwen3:1.7b",
   "good_for": "Light everyday chat and summarising on weak hardware.",
   "aliases": [
    "Qwen/Qwen3-1.7B-Base"
   ],
   "stale": false,
   "gated": false,
   "downloads_30d": 4452758,
   "arch": {
    "n_layers": 28,
    "hidden": 2048,
    "n_heads": 16,
    "n_kv_heads": 8
   },
   "context_len": 40960,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 1.83,
     "source_repo": "unsloth/Qwen3-1.7B-GGUF",
     "filename": "Qwen3-1.7B-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 1.42,
     "source_repo": "unsloth/Qwen3-1.7B-GGUF",
     "filename": "Qwen3-1.7B-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 1.26,
     "source_repo": "unsloth/Qwen3-1.7B-GGUF",
     "filename": "Qwen3-1.7B-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 1.11,
     "source_repo": "unsloth/Qwen3-1.7B-GGUF",
     "filename": "Qwen3-1.7B-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 1.01,
     "source_repo": "unsloth/Qwen3-1.7B-GGUF",
     "filename": "Qwen3-1.7B-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 0.94,
     "source_repo": "unsloth/Qwen3-1.7B-GGUF",
     "filename": "Qwen3-1.7B-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 0.78,
     "source_repo": "unsloth/Qwen3-1.7B-GGUF",
     "filename": "Qwen3-1.7B-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-1.7B",
    "gguf": "https://huggingface.co/unsloth/Qwen3-1.7B-GGUF",
    "ollama": "https://ollama.com/library/qwen3"
   },
   "run": {
    "ollama": "ollama run qwen3:1.7b",
    "llamacpp": "llama-server -hf unsloth/Qwen3-1.7B-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "qwen3-4b",
   "family": "llm",
   "name": "Qwen3 4B Instruct (2507)",
   "repo_id": "Qwen/Qwen3-4B-Instruct-2507",
   "params_b": 4.02,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF",
   "ollama_tag": "qwen3:4b",
   "good_for": "Surprisingly capable everyday assistant: chat, summarising, light coding.",
   "aliases": [
    "Qwen/Qwen3-4B",
    "Qwen/Qwen3-4B-Base",
    "Qwen/Qwen3-4B-Thinking-2507"
   ],
   "stale": false,
   "gated": false,
   "downloads_30d": 4349929,
   "arch": {
    "n_layers": 36,
    "hidden": 2560,
    "n_heads": 32,
    "n_kv_heads": 8
   },
   "context_len": 262144,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 4.28,
     "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF",
     "filename": "Qwen3-4B-Instruct-2507-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 3.31,
     "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF",
     "filename": "Qwen3-4B-Instruct-2507-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 2.89,
     "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF",
     "filename": "Qwen3-4B-Instruct-2507-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 2.5,
     "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF",
     "filename": "Qwen3-4B-Instruct-2507-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 2.27,
     "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF",
     "filename": "Qwen3-4B-Instruct-2507-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 2.08,
     "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF",
     "filename": "Qwen3-4B-Instruct-2507-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 1.67,
     "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF",
     "filename": "Qwen3-4B-Instruct-2507-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-4B-Instruct-2507",
    "gguf": "https://huggingface.co/unsloth/Qwen3-4B-Instruct-2507-GGUF",
    "ollama": "https://ollama.com/library/qwen3"
   },
   "run": {
    "ollama": "ollama run qwen3:4b",
    "llamacpp": "llama-server -hf unsloth/Qwen3-4B-Instruct-2507-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "qwen3-8b",
   "family": "llm",
   "name": "Qwen3 8B",
   "repo_id": "Qwen/Qwen3-8B",
   "params_b": 8.19,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Qwen3-8B-GGUF",
   "ollama_tag": "qwen3:8b",
   "good_for": "A solid all-rounder: good chat, real coding help, decent reasoning.",
   "aliases": [
    "Qwen/Qwen3-8B-Base"
   ],
   "stale": false,
   "gated": false,
   "downloads_30d": 10950977,
   "arch": {
    "n_layers": 36,
    "hidden": 4096,
    "n_heads": 32,
    "n_kv_heads": 8
   },
   "context_len": 40960,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 8.71,
     "source_repo": "unsloth/Qwen3-8B-GGUF",
     "filename": "Qwen3-8B-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 6.73,
     "source_repo": "unsloth/Qwen3-8B-GGUF",
     "filename": "Qwen3-8B-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 5.85,
     "source_repo": "unsloth/Qwen3-8B-GGUF",
     "filename": "Qwen3-8B-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 5.03,
     "source_repo": "unsloth/Qwen3-8B-GGUF",
     "filename": "Qwen3-8B-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 4.58,
     "source_repo": "unsloth/Qwen3-8B-GGUF",
     "filename": "Qwen3-8B-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 4.12,
     "source_repo": "unsloth/Qwen3-8B-GGUF",
     "filename": "Qwen3-8B-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 3.28,
     "source_repo": "unsloth/Qwen3-8B-GGUF",
     "filename": "Qwen3-8B-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-8B",
    "gguf": "https://huggingface.co/unsloth/Qwen3-8B-GGUF",
    "ollama": "https://ollama.com/library/qwen3"
   },
   "run": {
    "ollama": "ollama run qwen3:8b",
    "llamacpp": "llama-server -hf unsloth/Qwen3-8B-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "qwen3-14b",
   "family": "llm",
   "name": "Qwen3 14B",
   "repo_id": "Qwen/Qwen3-14B",
   "params_b": 14.77,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Qwen3-14B-GGUF",
   "ollama_tag": "qwen3:14b",
   "good_for": "Noticeably smarter and more reliable. Wants a real graphics card.",
   "aliases": [
    "Qwen/Qwen3-14B-Base"
   ],
   "stale": false,
   "gated": false,
   "downloads_30d": 1640580,
   "arch": {
    "n_layers": 40,
    "hidden": 5120,
    "n_heads": 40,
    "n_kv_heads": 8
   },
   "context_len": 40960,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 15.7,
     "source_repo": "unsloth/Qwen3-14B-GGUF",
     "filename": "Qwen3-14B-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 12.12,
     "source_repo": "unsloth/Qwen3-14B-GGUF",
     "filename": "Qwen3-14B-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 10.51,
     "source_repo": "unsloth/Qwen3-14B-GGUF",
     "filename": "Qwen3-14B-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 9.0,
     "source_repo": "unsloth/Qwen3-14B-GGUF",
     "filename": "Qwen3-14B-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 8.14,
     "source_repo": "unsloth/Qwen3-14B-GGUF",
     "filename": "Qwen3-14B-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 7.32,
     "source_repo": "unsloth/Qwen3-14B-GGUF",
     "filename": "Qwen3-14B-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 5.75,
     "source_repo": "unsloth/Qwen3-14B-GGUF",
     "filename": "Qwen3-14B-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-14B",
    "gguf": "https://huggingface.co/unsloth/Qwen3-14B-GGUF",
    "ollama": "https://ollama.com/library/qwen3"
   },
   "run": {
    "ollama": "ollama run qwen3:14b",
    "llamacpp": "llama-server -hf unsloth/Qwen3-14B-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "qwen3-32b",
   "family": "llm",
   "name": "Qwen3 32B",
   "repo_id": "Qwen/Qwen3-32B",
   "params_b": 32.76,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Qwen3-32B-GGUF",
   "ollama_tag": "qwen3:32b",
   "good_for": "Near-premium quality. Needs a strong GPU or a lot of memory.",
   "stale": false,
   "gated": false,
   "downloads_30d": 3167218,
   "arch": {
    "n_layers": 64,
    "hidden": 5120,
    "n_heads": 64,
    "n_kv_heads": 8
   },
   "context_len": 40960,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 34.82,
     "source_repo": "unsloth/Qwen3-32B-GGUF",
     "filename": "Qwen3-32B-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 26.88,
     "source_repo": "unsloth/Qwen3-32B-GGUF",
     "filename": "Qwen3-32B-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 23.21,
     "source_repo": "unsloth/Qwen3-32B-GGUF",
     "filename": "Qwen3-32B-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 19.76,
     "source_repo": "unsloth/Qwen3-32B-GGUF",
     "filename": "Qwen3-32B-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 17.71,
     "source_repo": "unsloth/Qwen3-32B-GGUF",
     "filename": "Qwen3-32B-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 15.97,
     "source_repo": "unsloth/Qwen3-32B-GGUF",
     "filename": "Qwen3-32B-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 12.34,
     "source_repo": "unsloth/Qwen3-32B-GGUF",
     "filename": "Qwen3-32B-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-32B",
    "gguf": "https://huggingface.co/unsloth/Qwen3-32B-GGUF",
    "ollama": "https://ollama.com/library/qwen3"
   },
   "run": {
    "ollama": "ollama run qwen3:32b",
    "llamacpp": "llama-server -hf unsloth/Qwen3-32B-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "qwen3-30b-a3b",
   "family": "llm",
   "name": "Qwen3 30B-A3B (2507, MoE)",
   "repo_id": "Qwen/Qwen3-30B-A3B-Instruct-2507",
   "params_b": 30.53,
   "active_params_b": 3.0,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF",
   "ollama_tag": "qwen3:30b",
   "good_for": "Big-model quality that runs fast: only 3B of its 30B work per word, so it flies even part-offloaded to RAM.",
   "stale": false,
   "gated": false,
   "downloads_30d": 821913,
   "arch": {
    "n_layers": 48,
    "hidden": 2048,
    "n_heads": 32,
    "n_kv_heads": 4
   },
   "context_len": 262144,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 32.48,
     "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF",
     "filename": "Qwen3-30B-A3B-Instruct-2507-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 25.09,
     "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF",
     "filename": "Qwen3-30B-A3B-Instruct-2507-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 21.73,
     "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF",
     "filename": "Qwen3-30B-A3B-Instruct-2507-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 18.56,
     "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF",
     "filename": "Qwen3-30B-A3B-Instruct-2507-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 16.38,
     "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF",
     "filename": "Qwen3-30B-A3B-Instruct-2507-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 14.71,
     "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF",
     "filename": "Qwen3-30B-A3B-Instruct-2507-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 11.26,
     "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF",
     "filename": "Qwen3-30B-A3B-Instruct-2507-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-30B-A3B-Instruct-2507",
    "gguf": "https://huggingface.co/unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF",
    "ollama": "https://ollama.com/library/qwen3"
   },
   "run": {
    "ollama": "ollama run qwen3:30b",
    "llamacpp": "llama-server -hf unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "qwen3-coder-30b",
   "family": "llm",
   "name": "Qwen3 Coder 30B-A3B (MoE)",
   "repo_id": "Qwen/Qwen3-Coder-30B-A3B-Instruct",
   "params_b": 30.53,
   "active_params_b": 3.0,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF",
   "ollama_tag": "qwen3-coder:30b",
   "good_for": "The local coding specialist. Fast despite its size (3B active).",
   "stale": false,
   "gated": false,
   "downloads_30d": 1961682,
   "arch": {
    "n_layers": 48,
    "hidden": 2048,
    "n_heads": 32,
    "n_kv_heads": 4
   },
   "context_len": 262144,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 32.48,
     "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-Coder-30B-A3B-Instruct-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 25.09,
     "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-Coder-30B-A3B-Instruct-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 21.73,
     "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-Coder-30B-A3B-Instruct-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 18.56,
     "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 16.38,
     "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-Coder-30B-A3B-Instruct-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 14.71,
     "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-Coder-30B-A3B-Instruct-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 11.26,
     "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-Coder-30B-A3B-Instruct-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-Coder-30B-A3B-Instruct",
    "gguf": "https://huggingface.co/unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF",
    "ollama": "https://ollama.com/library/qwen3-coder"
   },
   "run": {
    "ollama": "ollama run qwen3-coder:30b",
    "llamacpp": "llama-server -hf unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "llama-3.2-1b",
   "family": "llm",
   "name": "Llama 3.2 1B",
   "repo_id": "meta-llama/Llama-3.2-1B-Instruct",
   "params_b": 1.24,
   "license": "llama3.2",
   "gguf_repo": "bartowski/Llama-3.2-1B-Instruct-GGUF",
   "ollama_tag": "llama3.2:1b",
   "good_for": "Quick simple chat from the Llama family. Runs on almost anything.",
   "stale": false,
   "gated": true,
   "downloads_30d": 7481230,
   "context_len": 131072,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 1.32,
     "source_repo": "bartowski/Llama-3.2-1B-Instruct-GGUF",
     "filename": "Llama-3.2-1B-Instruct-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 1.02,
     "source_repo": "bartowski/Llama-3.2-1B-Instruct-GGUF",
     "filename": "Llama-3.2-1B-Instruct-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 0.91,
     "source_repo": "bartowski/Llama-3.2-1B-Instruct-GGUF",
     "filename": "Llama-3.2-1B-Instruct-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 0.81,
     "source_repo": "bartowski/Llama-3.2-1B-Instruct-GGUF",
     "filename": "Llama-3.2-1B-Instruct-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 0.74,
     "source_repo": "bartowski/Llama-3.2-1B-Instruct-GGUF",
     "filename": "Llama-3.2-1B-Instruct-IQ4_XS.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct",
    "gguf": "https://huggingface.co/bartowski/Llama-3.2-1B-Instruct-GGUF",
    "ollama": "https://ollama.com/library/llama3.2"
   },
   "run": {
    "ollama": "ollama run llama3.2:1b",
    "llamacpp": "llama-server -hf bartowski/Llama-3.2-1B-Instruct-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "llama-3.2-3b",
   "family": "llm",
   "name": "Llama 3.2 3B",
   "repo_id": "meta-llama/Llama-3.2-3B-Instruct",
   "params_b": 3.21,
   "license": "llama3.2",
   "gguf_repo": "bartowski/Llama-3.2-3B-Instruct-GGUF",
   "ollama_tag": "llama3.2:3b",
   "good_for": "Capable small assistant with the huge Llama ecosystem behind it.",
   "stale": false,
   "gated": true,
   "downloads_30d": 1509782,
   "context_len": 131072,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 3.42,
     "source_repo": "bartowski/Llama-3.2-3B-Instruct-GGUF",
     "filename": "Llama-3.2-3B-Instruct-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 2.64,
     "source_repo": "bartowski/Llama-3.2-3B-Instruct-GGUF",
     "filename": "Llama-3.2-3B-Instruct-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 2.32,
     "source_repo": "bartowski/Llama-3.2-3B-Instruct-GGUF",
     "filename": "Llama-3.2-3B-Instruct-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 2.02,
     "source_repo": "bartowski/Llama-3.2-3B-Instruct-GGUF",
     "filename": "Llama-3.2-3B-Instruct-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 1.83,
     "source_repo": "bartowski/Llama-3.2-3B-Instruct-GGUF",
     "filename": "Llama-3.2-3B-Instruct-IQ4_XS.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/meta-llama/Llama-3.2-3B-Instruct",
    "gguf": "https://huggingface.co/bartowski/Llama-3.2-3B-Instruct-GGUF",
    "ollama": "https://ollama.com/library/llama3.2"
   },
   "run": {
    "ollama": "ollama run llama3.2:3b",
    "llamacpp": "llama-server -hf bartowski/Llama-3.2-3B-Instruct-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "llama-3.1-8b",
   "family": "llm",
   "name": "Llama 3.1 8B",
   "repo_id": "meta-llama/Llama-3.1-8B-Instruct",
   "params_b": 8.03,
   "license": "llama3.1",
   "gguf_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF",
   "ollama_tag": "llama3.1:8b",
   "good_for": "The classic dependable 8B: chat, coding help, tool use.",
   "stale": false,
   "gated": true,
   "downloads_30d": 10031112,
   "context_len": 131072,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 8.54,
     "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF",
     "filename": "Meta-Llama-3.1-8B-Instruct-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 6.6,
     "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF",
     "filename": "Meta-Llama-3.1-8B-Instruct-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 5.73,
     "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF",
     "filename": "Meta-Llama-3.1-8B-Instruct-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 4.92,
     "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF",
     "filename": "Meta-Llama-3.1-8B-Instruct-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 4.45,
     "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF",
     "filename": "Meta-Llama-3.1-8B-Instruct-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 4.02,
     "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF",
     "filename": "Meta-Llama-3.1-8B-Instruct-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 3.18,
     "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF",
     "filename": "Meta-Llama-3.1-8B-Instruct-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct",
    "gguf": "https://huggingface.co/bartowski/Meta-Llama-3.1-8B-Instruct-GGUF",
    "ollama": "https://ollama.com/library/llama3.1"
   },
   "run": {
    "ollama": "ollama run llama3.1:8b",
    "llamacpp": "llama-server -hf bartowski/Meta-Llama-3.1-8B-Instruct-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "llama-4-scout",
   "family": "llm",
   "name": "Llama 4 Scout (109B MoE)",
   "repo_id": "meta-llama/Llama-4-Scout-17B-16E-Instruct",
   "params_b": 108.64,
   "active_params_b": 17.0,
   "license": "other",
   "gguf_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF",
   "ollama_tag": "llama4:scout",
   "good_for": "Frontier-class open model. Workstation territory: it is honest to say most PCs cannot run this.",
   "stale": false,
   "gated": true,
   "downloads_30d": 421808,
   "context_len": 10485760,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 114.53,
     "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF",
     "filename": "Q8_0/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 88.43,
     "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF",
     "filename": "Q6_K/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 76.55,
     "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF",
     "filename": "Q5_K_M/Llama-4-Scout-17B-16E-Instruct-Q5_K_M-00001-of-00002.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 65.36,
     "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF",
     "filename": "Q4_K_M/Llama-4-Scout-17B-16E-Instruct-Q4_K_M-00001-of-00002.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 57.65,
     "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF",
     "filename": "IQ4_XS/Llama-4-Scout-17B-16E-Instruct-IQ4_XS-00001-of-00002.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 51.76,
     "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF",
     "filename": "Q3_K_M/Llama-4-Scout-17B-16E-Instruct-Q3_K_M-00001-of-00002.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 39.56,
     "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF",
     "filename": "Llama-4-Scout-17B-16E-Instruct-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/meta-llama/Llama-4-Scout-17B-16E-Instruct",
    "gguf": "https://huggingface.co/unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF",
    "ollama": "https://ollama.com/library/llama4"
   },
   "run": {
    "ollama": "ollama run llama4:scout",
    "llamacpp": "llama-server -hf unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "gemma-3-270m",
   "family": "llm",
   "name": "Gemma 3 270M",
   "repo_id": "google/gemma-3-270m-it",
   "params_b": 0.27,
   "license": "gemma",
   "gguf_repo": "unsloth/gemma-3-270m-it-GGUF",
   "ollama_tag": "gemma3:270m",
   "good_for": "Tiny and instant. Fine for simple completions, not real conversation.",
   "stale": false,
   "gated": true,
   "downloads_30d": 127163,
   "context_len": 32768,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 0.29,
     "source_repo": "unsloth/gemma-3-270m-it-GGUF",
     "filename": "gemma-3-270m-it-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 0.28,
     "source_repo": "unsloth/gemma-3-270m-it-GGUF",
     "filename": "gemma-3-270m-it-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 0.26,
     "source_repo": "unsloth/gemma-3-270m-it-GGUF",
     "filename": "gemma-3-270m-it-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 0.25,
     "source_repo": "unsloth/gemma-3-270m-it-GGUF",
     "filename": "gemma-3-270m-it-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 0.24,
     "source_repo": "unsloth/gemma-3-270m-it-GGUF",
     "filename": "gemma-3-270m-it-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 0.24,
     "source_repo": "unsloth/gemma-3-270m-it-GGUF",
     "filename": "gemma-3-270m-it-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 0.24,
     "source_repo": "unsloth/gemma-3-270m-it-GGUF",
     "filename": "gemma-3-270m-it-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/google/gemma-3-270m-it",
    "gguf": "https://huggingface.co/unsloth/gemma-3-270m-it-GGUF",
    "ollama": "https://ollama.com/library/gemma3"
   },
   "run": {
    "ollama": "ollama run gemma3:270m",
    "llamacpp": "llama-server -hf unsloth/gemma-3-270m-it-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "gemma-3-1b",
   "family": "llm",
   "name": "Gemma 3 1B",
   "repo_id": "google/gemma-3-1b-it",
   "params_b": 1.0,
   "license": "gemma",
   "gguf_repo": "unsloth/gemma-3-1b-it-GGUF",
   "ollama_tag": "gemma3:1b",
   "good_for": "Google's small chat model. Light and friendly on weak hardware.",
   "stale": false,
   "gated": true,
   "downloads_30d": 1658957,
   "context_len": 32768,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 1.07,
     "source_repo": "unsloth/gemma-3-1b-it-GGUF",
     "filename": "gemma-3-1b-it-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 1.01,
     "source_repo": "unsloth/gemma-3-1b-it-GGUF",
     "filename": "gemma-3-1b-it-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 0.85,
     "source_repo": "unsloth/gemma-3-1b-it-GGUF",
     "filename": "gemma-3-1b-it-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 0.81,
     "source_repo": "unsloth/gemma-3-1b-it-GGUF",
     "filename": "gemma-3-1b-it-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 0.71,
     "source_repo": "unsloth/gemma-3-1b-it-GGUF",
     "filename": "gemma-3-1b-it-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 0.72,
     "source_repo": "unsloth/gemma-3-1b-it-GGUF",
     "filename": "gemma-3-1b-it-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 0.69,
     "source_repo": "unsloth/gemma-3-1b-it-GGUF",
     "filename": "gemma-3-1b-it-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/google/gemma-3-1b-it",
    "gguf": "https://huggingface.co/unsloth/gemma-3-1b-it-GGUF",
    "ollama": "https://ollama.com/library/gemma3"
   },
   "run": {
    "ollama": "ollama run gemma3:1b",
    "llamacpp": "llama-server -hf unsloth/gemma-3-1b-it-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "gemma-3-4b",
   "family": "llm",
   "name": "Gemma 3 4B",
   "repo_id": "google/gemma-3-4b-it",
   "params_b": 4.3,
   "license": "gemma",
   "gguf_repo": "unsloth/gemma-3-4b-it-GGUF",
   "ollama_tag": "gemma3:4b",
   "good_for": "Warm-toned everyday assistant; can also look at images.",
   "stale": false,
   "gated": true,
   "downloads_30d": 1601809,
   "context_len": 131072,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 4.13,
     "source_repo": "unsloth/gemma-3-4b-it-GGUF",
     "filename": "gemma-3-4b-it-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 3.19,
     "source_repo": "unsloth/gemma-3-4b-it-GGUF",
     "filename": "gemma-3-4b-it-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 2.83,
     "source_repo": "unsloth/gemma-3-4b-it-GGUF",
     "filename": "gemma-3-4b-it-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 2.49,
     "source_repo": "unsloth/gemma-3-4b-it-GGUF",
     "filename": "gemma-3-4b-it-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 2.26,
     "source_repo": "unsloth/gemma-3-4b-it-GGUF",
     "filename": "gemma-3-4b-it-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 2.1,
     "source_repo": "unsloth/gemma-3-4b-it-GGUF",
     "filename": "gemma-3-4b-it-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 1.73,
     "source_repo": "unsloth/gemma-3-4b-it-GGUF",
     "filename": "gemma-3-4b-it-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/google/gemma-3-4b-it",
    "gguf": "https://huggingface.co/unsloth/gemma-3-4b-it-GGUF",
    "ollama": "https://ollama.com/library/gemma3"
   },
   "run": {
    "ollama": "ollama run gemma3:4b",
    "llamacpp": "llama-server -hf unsloth/gemma-3-4b-it-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "gemma-3-12b",
   "family": "llm",
   "name": "Gemma 3 12B",
   "repo_id": "google/gemma-3-12b-it",
   "params_b": 12.19,
   "license": "gemma",
   "gguf_repo": "unsloth/gemma-3-12b-it-GGUF",
   "ollama_tag": "gemma3:12b",
   "good_for": "Strong mid-size model with vision support.",
   "stale": false,
   "gated": true,
   "downloads_30d": 2810935,
   "context_len": 131072,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 12.51,
     "source_repo": "unsloth/gemma-3-12b-it-GGUF",
     "filename": "gemma-3-12b-it-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 9.66,
     "source_repo": "unsloth/gemma-3-12b-it-GGUF",
     "filename": "gemma-3-12b-it-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 8.45,
     "source_repo": "unsloth/gemma-3-12b-it-GGUF",
     "filename": "gemma-3-12b-it-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 7.3,
     "source_repo": "unsloth/gemma-3-12b-it-GGUF",
     "filename": "gemma-3-12b-it-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 6.55,
     "source_repo": "unsloth/gemma-3-12b-it-GGUF",
     "filename": "gemma-3-12b-it-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 6.01,
     "source_repo": "unsloth/gemma-3-12b-it-GGUF",
     "filename": "gemma-3-12b-it-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 4.77,
     "source_repo": "unsloth/gemma-3-12b-it-GGUF",
     "filename": "gemma-3-12b-it-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/google/gemma-3-12b-it",
    "gguf": "https://huggingface.co/unsloth/gemma-3-12b-it-GGUF",
    "ollama": "https://ollama.com/library/gemma3"
   },
   "run": {
    "ollama": "ollama run gemma3:12b",
    "llamacpp": "llama-server -hf unsloth/gemma-3-12b-it-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "gemma-3-27b",
   "family": "llm",
   "name": "Gemma 3 27B",
   "repo_id": "google/gemma-3-27b-it",
   "params_b": 27.43,
   "license": "gemma",
   "gguf_repo": "unsloth/gemma-3-27b-it-GGUF",
   "ollama_tag": "gemma3:27b",
   "good_for": "Google's big open model. Needs a serious GPU or lots of memory.",
   "stale": false,
   "gated": true,
   "downloads_30d": 1418920,
   "context_len": 131072,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 28.71,
     "source_repo": "unsloth/gemma-3-27b-it-GGUF",
     "filename": "gemma-3-27b-it-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 22.17,
     "source_repo": "unsloth/gemma-3-27b-it-GGUF",
     "filename": "gemma-3-27b-it-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 19.27,
     "source_repo": "unsloth/gemma-3-27b-it-GGUF",
     "filename": "gemma-3-27b-it-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 16.55,
     "source_repo": "unsloth/gemma-3-27b-it-GGUF",
     "filename": "gemma-3-27b-it-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 14.77,
     "source_repo": "unsloth/gemma-3-27b-it-GGUF",
     "filename": "gemma-3-27b-it-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 13.44,
     "source_repo": "unsloth/gemma-3-27b-it-GGUF",
     "filename": "gemma-3-27b-it-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 10.5,
     "source_repo": "unsloth/gemma-3-27b-it-GGUF",
     "filename": "gemma-3-27b-it-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/google/gemma-3-27b-it",
    "gguf": "https://huggingface.co/unsloth/gemma-3-27b-it-GGUF",
    "ollama": "https://ollama.com/library/gemma3"
   },
   "run": {
    "ollama": "ollama run gemma3:27b",
    "llamacpp": "llama-server -hf unsloth/gemma-3-27b-it-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "gemma-3n-e2b",
   "family": "llm",
   "name": "Gemma 3n E2B",
   "repo_id": "google/gemma-3n-E2B-it",
   "params_b": 5.44,
   "active_params_b": 2.0,
   "license": "gemma",
   "gguf_repo": "unsloth/gemma-3n-E2B-it-GGUF",
   "ollama_tag": "gemma3n:e2b",
   "good_for": "Phone-class design: feels like a 2B while knowing more.",
   "stale": false,
   "gated": true,
   "downloads_30d": 372825,
   "context_len": 32768,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 4.79,
     "source_repo": "unsloth/gemma-3n-E2B-it-GGUF",
     "filename": "gemma-3n-E2B-it-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 4.21,
     "source_repo": "unsloth/gemma-3n-E2B-it-GGUF",
     "filename": "gemma-3n-E2B-it-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 3.29,
     "source_repo": "unsloth/gemma-3n-E2B-it-GGUF",
     "filename": "gemma-3n-E2B-it-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 3.03,
     "source_repo": "unsloth/gemma-3n-E2B-it-GGUF",
     "filename": "gemma-3n-E2B-it-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 2.91,
     "source_repo": "unsloth/gemma-3n-E2B-it-GGUF",
     "filename": "gemma-3n-E2B-it-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 2.48,
     "source_repo": "unsloth/gemma-3n-E2B-it-GGUF",
     "filename": "gemma-3n-E2B-it-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 2.22,
     "source_repo": "unsloth/gemma-3n-E2B-it-GGUF",
     "filename": "gemma-3n-E2B-it-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/google/gemma-3n-E2B-it",
    "gguf": "https://huggingface.co/unsloth/gemma-3n-E2B-it-GGUF",
    "ollama": "https://ollama.com/library/gemma3n"
   },
   "run": {
    "ollama": "ollama run gemma3n:e2b",
    "llamacpp": "llama-server -hf unsloth/gemma-3n-E2B-it-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "gemma-3n-e4b",
   "family": "llm",
   "name": "Gemma 3n E4B",
   "repo_id": "google/gemma-3n-E4B-it",
   "params_b": 7.85,
   "active_params_b": 4.0,
   "license": "gemma",
   "gguf_repo": "unsloth/gemma-3n-E4B-it-GGUF",
   "ollama_tag": "gemma3n:e4b",
   "good_for": "Efficient on-device design with 4B-class speed.",
   "stale": false,
   "gated": true,
   "downloads_30d": 17622,
   "context_len": 32768,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 7.35,
     "source_repo": "unsloth/gemma-3n-E4B-it-GGUF",
     "filename": "gemma-3n-E4B-it-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 6.27,
     "source_repo": "unsloth/gemma-3n-E4B-it-GGUF",
     "filename": "gemma-3n-E4B-it-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 5.02,
     "source_repo": "unsloth/gemma-3n-E4B-it-GGUF",
     "filename": "gemma-3n-E4B-it-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 4.54,
     "source_repo": "unsloth/gemma-3n-E4B-it-GGUF",
     "filename": "gemma-3n-E4B-it-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 4.27,
     "source_repo": "unsloth/gemma-3n-E4B-it-GGUF",
     "filename": "gemma-3n-E4B-it-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 3.69,
     "source_repo": "unsloth/gemma-3n-E4B-it-GGUF",
     "filename": "gemma-3n-E4B-it-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 3.19,
     "source_repo": "unsloth/gemma-3n-E4B-it-GGUF",
     "filename": "gemma-3n-E4B-it-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/google/gemma-3n-E4B-it",
    "gguf": "https://huggingface.co/unsloth/gemma-3n-E4B-it-GGUF",
    "ollama": "https://ollama.com/library/gemma3n"
   },
   "run": {
    "ollama": "ollama run gemma3n:e4b",
    "llamacpp": "llama-server -hf unsloth/gemma-3n-E4B-it-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "mistral-7b",
   "family": "llm",
   "name": "Mistral 7B (v0.3)",
   "repo_id": "mistralai/Mistral-7B-Instruct-v0.3",
   "params_b": 7.25,
   "license": "apache-2.0",
   "gguf_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF",
   "ollama_tag": "mistral:7b",
   "good_for": "The classic open 7B. Still a solid, fast all-rounder.",
   "stale": false,
   "gated": false,
   "downloads_30d": 3392572,
   "arch": {
    "n_layers": 32,
    "hidden": 4096,
    "n_heads": 32,
    "n_kv_heads": 8
   },
   "context_len": 32768,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 7.7,
     "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF",
     "filename": "Mistral-7B-Instruct-v0.3-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 5.95,
     "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF",
     "filename": "Mistral-7B-Instruct-v0.3-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 5.14,
     "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF",
     "filename": "Mistral-7B-Instruct-v0.3-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 4.37,
     "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF",
     "filename": "Mistral-7B-Instruct-v0.3-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 3.91,
     "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF",
     "filename": "Mistral-7B-Instruct-v0.3-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 3.52,
     "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF",
     "filename": "Mistral-7B-Instruct-v0.3-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 2.72,
     "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF",
     "filename": "Mistral-7B-Instruct-v0.3-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.3",
    "gguf": "https://huggingface.co/bartowski/Mistral-7B-Instruct-v0.3-GGUF",
    "ollama": "https://ollama.com/library/mistral"
   },
   "run": {
    "ollama": "ollama run mistral:7b",
    "llamacpp": "llama-server -hf bartowski/Mistral-7B-Instruct-v0.3-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "mistral-small-3.2",
   "family": "llm",
   "name": "Mistral Small 3.2 (24B)",
   "repo_id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506",
   "params_b": 24.01,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF",
   "ollama_tag": "mistral-small3.2",
   "good_for": "Excellent quality-for-size; a favourite on 24 GB cards.",
   "stale": false,
   "gated": false,
   "downloads_30d": 537956,
   "arch": {
    "n_layers": 40,
    "hidden": 5120,
    "n_heads": 32,
    "n_kv_heads": 8
   },
   "context_len": 131072,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 25.05,
     "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF",
     "filename": "Mistral-Small-3.2-24B-Instruct-2506-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 19.35,
     "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF",
     "filename": "Mistral-Small-3.2-24B-Instruct-2506-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 16.76,
     "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF",
     "filename": "Mistral-Small-3.2-24B-Instruct-2506-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 14.33,
     "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF",
     "filename": "Mistral-Small-3.2-24B-Instruct-2506-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 12.78,
     "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF",
     "filename": "Mistral-Small-3.2-24B-Instruct-2506-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 11.47,
     "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF",
     "filename": "Mistral-Small-3.2-24B-Instruct-2506-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 8.89,
     "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF",
     "filename": "Mistral-Small-3.2-24B-Instruct-2506-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/mistralai/Mistral-Small-3.2-24B-Instruct-2506",
    "gguf": "https://huggingface.co/unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF",
    "ollama": "https://ollama.com/library/mistral-small3.2"
   },
   "run": {
    "ollama": "ollama run mistral-small3.2",
    "llamacpp": "llama-server -hf unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "devstral-small",
   "family": "llm",
   "name": "Devstral Small (24B, coding)",
   "repo_id": "mistralai/Devstral-Small-2507",
   "params_b": 23.57,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Devstral-Small-2507-GGUF",
   "ollama_tag": "devstral",
   "good_for": "Built for coding agents and repo-level work.",
   "stale": false,
   "gated": false,
   "downloads_30d": 24427,
   "arch": {
    "n_layers": 40,
    "hidden": 5120,
    "n_heads": 32,
    "n_kv_heads": 8
   },
   "context_len": 131072,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 25.05,
     "source_repo": "unsloth/Devstral-Small-2507-GGUF",
     "filename": "Devstral-Small-2507-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 19.35,
     "source_repo": "unsloth/Devstral-Small-2507-GGUF",
     "filename": "Devstral-Small-2507-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 16.76,
     "source_repo": "unsloth/Devstral-Small-2507-GGUF",
     "filename": "Devstral-Small-2507-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 14.33,
     "source_repo": "unsloth/Devstral-Small-2507-GGUF",
     "filename": "Devstral-Small-2507-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 12.78,
     "source_repo": "unsloth/Devstral-Small-2507-GGUF",
     "filename": "Devstral-Small-2507-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 11.47,
     "source_repo": "unsloth/Devstral-Small-2507-GGUF",
     "filename": "Devstral-Small-2507-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 8.89,
     "source_repo": "unsloth/Devstral-Small-2507-GGUF",
     "filename": "Devstral-Small-2507-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/mistralai/Devstral-Small-2507",
    "gguf": "https://huggingface.co/unsloth/Devstral-Small-2507-GGUF",
    "ollama": "https://ollama.com/library/devstral"
   },
   "run": {
    "ollama": "ollama run devstral",
    "llamacpp": "llama-server -hf unsloth/Devstral-Small-2507-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "phi-4",
   "family": "llm",
   "name": "Phi-4 (14B)",
   "repo_id": "microsoft/phi-4",
   "params_b": 14.66,
   "license": "mit",
   "gguf_repo": "unsloth/phi-4-GGUF",
   "ollama_tag": "phi4",
   "good_for": "Microsoft's strong 14B, great at reasoning and maths.",
   "stale": false,
   "gated": false,
   "downloads_30d": 809973,
   "arch": {
    "n_layers": 40,
    "hidden": 5120,
    "n_heads": 40,
    "n_kv_heads": 10
   },
   "context_len": 16384,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 15.58,
     "source_repo": "unsloth/phi-4-GGUF",
     "filename": "phi-4-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 12.03,
     "source_repo": "unsloth/phi-4-GGUF",
     "filename": "phi-4-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 10.41,
     "source_repo": "unsloth/phi-4-GGUF",
     "filename": "phi-4-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 8.89,
     "source_repo": "unsloth/phi-4-GGUF",
     "filename": "phi-4-Q4_K_M.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 7.19,
     "source_repo": "unsloth/phi-4-GGUF",
     "filename": "phi-4-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 5.61,
     "source_repo": "unsloth/phi-4-GGUF",
     "filename": "phi-4-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/microsoft/phi-4",
    "gguf": "https://huggingface.co/unsloth/phi-4-GGUF",
    "ollama": "https://ollama.com/library/phi4"
   },
   "run": {
    "ollama": "ollama run phi4",
    "llamacpp": "llama-server -hf unsloth/phi-4-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "phi-4-mini",
   "family": "llm",
   "name": "Phi-4 Mini (3.8B)",
   "repo_id": "microsoft/Phi-4-mini-instruct",
   "params_b": 3.84,
   "license": "mit",
   "gguf_repo": "unsloth/Phi-4-mini-instruct-GGUF",
   "ollama_tag": "phi4-mini",
   "good_for": "Small, MIT-licensed, punchy for its size.",
   "stale": false,
   "gated": false,
   "downloads_30d": 1221436,
   "arch": {
    "n_layers": 32,
    "hidden": 3072,
    "n_heads": 24,
    "n_kv_heads": 8
   },
   "context_len": 131072,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 4.08,
     "source_repo": "unsloth/Phi-4-mini-instruct-GGUF",
     "filename": "Phi-4-mini-instruct.Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 3.16,
     "source_repo": "unsloth/Phi-4-mini-instruct-GGUF",
     "filename": "Phi-4-mini-instruct-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 2.85,
     "source_repo": "unsloth/Phi-4-mini-instruct-GGUF",
     "filename": "Phi-4-mini-instruct-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 2.49,
     "source_repo": "unsloth/Phi-4-mini-instruct-GGUF",
     "filename": "Phi-4-mini-instruct-Q4_K_M.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 2.12,
     "source_repo": "unsloth/Phi-4-mini-instruct-GGUF",
     "filename": "Phi-4-mini-instruct-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 1.68,
     "source_repo": "unsloth/Phi-4-mini-instruct-GGUF",
     "filename": "Phi-4-mini-instruct-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/microsoft/Phi-4-mini-instruct",
    "gguf": "https://huggingface.co/unsloth/Phi-4-mini-instruct-GGUF",
    "ollama": "https://ollama.com/library/phi4-mini"
   },
   "run": {
    "ollama": "ollama run phi4-mini",
    "llamacpp": "llama-server -hf unsloth/Phi-4-mini-instruct-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "granite-4.0-1b",
   "family": "llm",
   "name": "Granite 4.0 1B",
   "repo_id": "ibm-granite/granite-4.0-1b",
   "params_b": 1.63,
   "license": "apache-2.0",
   "gguf_repo": "ibm-granite/granite-4.0-1b-GGUF",
   "good_for": "IBM's tiny enterprise-grade model; official GGUFs.",
   "stale": false,
   "gated": false,
   "downloads_30d": 4653,
   "arch": {
    "n_layers": 40,
    "hidden": 2048,
    "n_heads": 16,
    "n_kv_heads": 4
   },
   "context_len": 131072,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 1.74,
     "source_repo": "ibm-granite/granite-4.0-1b-GGUF",
     "filename": "granite-4.0-1b-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 1.34,
     "source_repo": "ibm-granite/granite-4.0-1b-GGUF",
     "filename": "granite-4.0-1b-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 1.18,
     "source_repo": "ibm-granite/granite-4.0-1b-GGUF",
     "filename": "granite-4.0-1b-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 1.02,
     "source_repo": "ibm-granite/granite-4.0-1b-GGUF",
     "filename": "granite-4.0-1b-Q4_K_M.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 0.86,
     "source_repo": "ibm-granite/granite-4.0-1b-GGUF",
     "filename": "granite-4.0-1b-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 0.7,
     "source_repo": "ibm-granite/granite-4.0-1b-GGUF",
     "filename": "granite-4.0-1b-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/ibm-granite/granite-4.0-1b",
    "gguf": "https://huggingface.co/ibm-granite/granite-4.0-1b-GGUF"
   },
   "run": {
    "ollama": "ollama run hf.co/ibm-granite/granite-4.0-1b-GGUF:Q4_K_M",
    "llamacpp": "llama-server -hf ibm-granite/granite-4.0-1b-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "granite-4.0-micro",
   "family": "llm",
   "name": "Granite 4.0 Micro (3B)",
   "repo_id": "ibm-granite/granite-4.0-micro",
   "params_b": 3.4,
   "license": "apache-2.0",
   "gguf_repo": "ibm-granite/granite-4.0-micro-GGUF",
   "ollama_tag": "granite4:micro",
   "good_for": "Grounded, RAG-friendly small model from IBM.",
   "stale": false,
   "gated": false,
   "downloads_30d": 129738,
   "arch": {
    "n_layers": 40,
    "hidden": 2560,
    "n_heads": 40,
    "n_kv_heads": 8
   },
   "context_len": 131072,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 3.62,
     "source_repo": "ibm-granite/granite-4.0-micro-GGUF",
     "filename": "granite-4.0-micro-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 2.8,
     "source_repo": "ibm-granite/granite-4.0-micro-GGUF",
     "filename": "granite-4.0-micro-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 2.44,
     "source_repo": "ibm-granite/granite-4.0-micro-GGUF",
     "filename": "granite-4.0-micro-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 2.1,
     "source_repo": "ibm-granite/granite-4.0-micro-GGUF",
     "filename": "granite-4.0-micro-Q4_K_M.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 1.73,
     "source_repo": "ibm-granite/granite-4.0-micro-GGUF",
     "filename": "granite-4.0-micro-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 1.37,
     "source_repo": "ibm-granite/granite-4.0-micro-GGUF",
     "filename": "granite-4.0-micro-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/ibm-granite/granite-4.0-micro",
    "gguf": "https://huggingface.co/ibm-granite/granite-4.0-micro-GGUF",
    "ollama": "https://ollama.com/library/granite4"
   },
   "run": {
    "ollama": "ollama run granite4:micro",
    "llamacpp": "llama-server -hf ibm-granite/granite-4.0-micro-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "granite-4.0-h-tiny",
   "family": "llm",
   "name": "Granite 4.0 H-Tiny (7B-A1B MoE)",
   "repo_id": "ibm-granite/granite-4.0-h-tiny",
   "params_b": 6.94,
   "active_params_b": 1.0,
   "license": "apache-2.0",
   "gguf_repo": "ibm-granite/granite-4.0-h-tiny-GGUF",
   "ollama_tag": "granite4:tiny-h",
   "good_for": "Hybrid design: 7B knowledge, 1B-speed replies.",
   "stale": false,
   "gated": false,
   "downloads_30d": 93730,
   "arch": {
    "n_layers": 40,
    "hidden": 1536,
    "n_heads": 12,
    "n_kv_heads": 4
   },
   "context_len": 1048576,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 7.39,
     "source_repo": "ibm-granite/granite-4.0-h-tiny-GGUF",
     "filename": "granite-4.0-h-tiny-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 5.71,
     "source_repo": "ibm-granite/granite-4.0-h-tiny-GGUF",
     "filename": "granite-4.0-h-tiny-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 4.95,
     "source_repo": "ibm-granite/granite-4.0-h-tiny-GGUF",
     "filename": "granite-4.0-h-tiny-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 4.23,
     "source_repo": "ibm-granite/granite-4.0-h-tiny-GGUF",
     "filename": "granite-4.0-h-tiny-Q4_K_M.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 3.35,
     "source_repo": "ibm-granite/granite-4.0-h-tiny-GGUF",
     "filename": "granite-4.0-h-tiny-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 2.59,
     "source_repo": "ibm-granite/granite-4.0-h-tiny-GGUF",
     "filename": "granite-4.0-h-tiny-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/ibm-granite/granite-4.0-h-tiny",
    "gguf": "https://huggingface.co/ibm-granite/granite-4.0-h-tiny-GGUF",
    "ollama": "https://ollama.com/library/granite4"
   },
   "run": {
    "ollama": "ollama run granite4:tiny-h",
    "llamacpp": "llama-server -hf ibm-granite/granite-4.0-h-tiny-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "granite-4.0-h-small",
   "family": "llm",
   "name": "Granite 4.0 H-Small (32B-A9B MoE)",
   "repo_id": "ibm-granite/granite-4.0-h-small",
   "params_b": 32.21,
   "active_params_b": 9.0,
   "license": "apache-2.0",
   "gguf_repo": "ibm-granite/granite-4.0-h-small-GGUF",
   "ollama_tag": "granite4:small-h",
   "good_for": "Big hybrid that stays responsive thanks to 9B active.",
   "stale": false,
   "gated": false,
   "downloads_30d": 569199,
   "arch": {
    "n_layers": 40,
    "hidden": 4096,
    "n_heads": 32,
    "n_kv_heads": 8
   },
   "context_len": 1048576,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 34.26,
     "source_repo": "ibm-granite/granite-4.0-h-small-GGUF",
     "filename": "granite-4.0-h-small-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 26.47,
     "source_repo": "ibm-granite/granite-4.0-h-small-GGUF",
     "filename": "granite-4.0-h-small-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 22.87,
     "source_repo": "ibm-granite/granite-4.0-h-small-GGUF",
     "filename": "granite-4.0-h-small-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 19.48,
     "source_repo": "ibm-granite/granite-4.0-h-small-GGUF",
     "filename": "granite-4.0-h-small-Q4_K_M.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 15.36,
     "source_repo": "ibm-granite/granite-4.0-h-small-GGUF",
     "filename": "granite-4.0-h-small-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 11.78,
     "source_repo": "ibm-granite/granite-4.0-h-small-GGUF",
     "filename": "granite-4.0-h-small-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/ibm-granite/granite-4.0-h-small",
    "gguf": "https://huggingface.co/ibm-granite/granite-4.0-h-small-GGUF",
    "ollama": "https://ollama.com/library/granite4"
   },
   "run": {
    "ollama": "ollama run granite4:small-h",
    "llamacpp": "llama-server -hf ibm-granite/granite-4.0-h-small-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "smollm3-3b",
   "family": "llm",
   "name": "SmolLM3 3B",
   "repo_id": "HuggingFaceTB/SmolLM3-3B",
   "params_b": 3.08,
   "license": "apache-2.0",
   "gguf_repo": "ggml-org/SmolLM3-3B-GGUF",
   "good_for": "Hugging Face's own fully-open small model, trained in public.",
   "stale": false,
   "gated": false,
   "downloads_30d": 519434,
   "arch": {
    "n_layers": 36,
    "hidden": 2048,
    "n_heads": 16,
    "n_kv_heads": 4
   },
   "context_len": 65536,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 3.28,
     "source_repo": "ggml-org/SmolLM3-3B-GGUF",
     "filename": "SmolLM3-Q8_0.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 1.92,
     "source_repo": "ggml-org/SmolLM3-3B-GGUF",
     "filename": "SmolLM3-Q4_K_M.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/HuggingFaceTB/SmolLM3-3B",
    "gguf": "https://huggingface.co/ggml-org/SmolLM3-3B-GGUF"
   },
   "run": {
    "ollama": "ollama run hf.co/ggml-org/SmolLM3-3B-GGUF:Q4_K_M",
    "llamacpp": "llama-server -hf ggml-org/SmolLM3-3B-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "minicpm-4.1-8b",
   "family": "llm",
   "name": "MiniCPM 4.1 8B",
   "repo_id": "openbmb/MiniCPM4.1-8B",
   "params_b": 8.19,
   "license": "apache-2.0",
   "gguf_repo": "openbmb/MiniCPM4.1-8B-GGUF",
   "good_for": "Tuned hard for running on ordinary devices; official GGUFs.",
   "stale": false,
   "gated": false,
   "downloads_30d": 50634,
   "arch": {
    "n_layers": 32,
    "hidden": 4096,
    "n_heads": 32,
    "n_kv_heads": 2
   },
   "context_len": 65536,
   "quants": [
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 4.97,
     "source_repo": "openbmb/MiniCPM4.1-8B-GGUF",
     "filename": "MiniCPM4.1-8B-Q4_K_M.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/openbmb/MiniCPM4.1-8B",
    "gguf": "https://huggingface.co/openbmb/MiniCPM4.1-8B-GGUF"
   },
   "run": {
    "ollama": "ollama run hf.co/openbmb/MiniCPM4.1-8B-GGUF:Q4_K_M",
    "llamacpp": "llama-server -hf openbmb/MiniCPM4.1-8B-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "nemotron-nano-9b",
   "family": "llm",
   "name": "NVIDIA Nemotron Nano 9B v2",
   "repo_id": "nvidia/NVIDIA-Nemotron-Nano-9B-v2",
   "params_b": 8.89,
   "license": "other",
   "gguf_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF",
   "good_for": "Hybrid Mamba design: strong reasoning with fast, steady output.",
   "stale": false,
   "gated": false,
   "downloads_30d": 545070,
   "arch": {
    "n_layers": 56,
    "hidden": 4480,
    "n_heads": 40,
    "n_kv_heads": 8
   },
   "context_len": 1048576,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 9.46,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 9.14,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 7.07,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 6.53,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 5.27,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 5.38,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 5.01,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/nvidia/NVIDIA-Nemotron-Nano-9B-v2",
    "gguf": "https://huggingface.co/bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF"
   },
   "run": {
    "ollama": "ollama run hf.co/bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF:Q4_K_M",
    "llamacpp": "llama-server -hf bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "nemotron-nano-12b",
   "family": "llm",
   "name": "NVIDIA Nemotron Nano 12B v2",
   "repo_id": "nvidia/NVIDIA-Nemotron-Nano-12B-v2",
   "params_b": 12.31,
   "license": "other",
   "gguf_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF",
   "good_for": "The bigger Nemotron Nano; reasoning-first hybrid.",
   "stale": false,
   "gated": false,
   "downloads_30d": 15998,
   "arch": {
    "n_layers": 62,
    "hidden": 5120,
    "n_heads": 40,
    "n_kv_heads": 8
   },
   "context_len": 1048576,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 13.09,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 10.11,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 8.76,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 7.49,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 6.75,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 6.02,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 4.7,
     "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF",
     "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/nvidia/NVIDIA-Nemotron-Nano-12B-v2",
    "gguf": "https://huggingface.co/bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF"
   },
   "run": {
    "ollama": "ollama run hf.co/bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF:Q4_K_M",
    "llamacpp": "llama-server -hf bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "qwen3-vl-2b",
   "family": "vlm",
   "name": "Qwen3-VL 2B",
   "repo_id": "Qwen/Qwen3-VL-2B-Instruct",
   "params_b": 2.13,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF",
   "ollama_tag": "qwen3-vl:2b",
   "good_for": "Chat about images on very light hardware.",
   "mem_note": "Vision models load an extra image encoder (~0.5 GB on top of the figures shown).",
   "stale": false,
   "gated": false,
   "downloads_30d": 1944930,
   "arch": {
    "n_layers": 28,
    "hidden": 2048,
    "n_heads": 16,
    "n_kv_heads": 8
   },
   "context_len": 262144,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 1.83,
     "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF",
     "filename": "Qwen3-VL-2B-Instruct-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 1.42,
     "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF",
     "filename": "Qwen3-VL-2B-Instruct-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 1.26,
     "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF",
     "filename": "Qwen3-VL-2B-Instruct-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 1.11,
     "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF",
     "filename": "Qwen3-VL-2B-Instruct-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 1.01,
     "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF",
     "filename": "Qwen3-VL-2B-Instruct-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 0.94,
     "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF",
     "filename": "Qwen3-VL-2B-Instruct-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 0.78,
     "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF",
     "filename": "Qwen3-VL-2B-Instruct-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-VL-2B-Instruct",
    "gguf": "https://huggingface.co/unsloth/Qwen3-VL-2B-Instruct-GGUF",
    "ollama": "https://ollama.com/library/qwen3-vl"
   },
   "run": {
    "ollama": "ollama run qwen3-vl:2b",
    "llamacpp": "llama-server -hf unsloth/Qwen3-VL-2B-Instruct-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "qwen3-vl-4b",
   "family": "vlm",
   "name": "Qwen3-VL 4B",
   "repo_id": "Qwen/Qwen3-VL-4B-Instruct",
   "params_b": 4.44,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF",
   "ollama_tag": "qwen3-vl:4b",
   "good_for": "The sweet spot for asking questions about images and screenshots.",
   "mem_note": "Vision models load an extra image encoder (~0.5 GB on top of the figures shown).",
   "stale": false,
   "gated": false,
   "downloads_30d": 3769866,
   "arch": {
    "n_layers": 36,
    "hidden": 2560,
    "n_heads": 32,
    "n_kv_heads": 8
   },
   "context_len": 262144,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 4.28,
     "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF",
     "filename": "Qwen3-VL-4B-Instruct-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 3.31,
     "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF",
     "filename": "Qwen3-VL-4B-Instruct-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 2.89,
     "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF",
     "filename": "Qwen3-VL-4B-Instruct-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 2.5,
     "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF",
     "filename": "Qwen3-VL-4B-Instruct-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 2.27,
     "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF",
     "filename": "Qwen3-VL-4B-Instruct-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 2.08,
     "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF",
     "filename": "Qwen3-VL-4B-Instruct-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 1.67,
     "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF",
     "filename": "Qwen3-VL-4B-Instruct-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-VL-4B-Instruct",
    "gguf": "https://huggingface.co/unsloth/Qwen3-VL-4B-Instruct-GGUF",
    "ollama": "https://ollama.com/library/qwen3-vl"
   },
   "run": {
    "ollama": "ollama run qwen3-vl:4b",
    "llamacpp": "llama-server -hf unsloth/Qwen3-VL-4B-Instruct-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "qwen3-vl-8b",
   "family": "vlm",
   "name": "Qwen3-VL 8B",
   "repo_id": "Qwen/Qwen3-VL-8B-Instruct",
   "params_b": 8.77,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF",
   "ollama_tag": "qwen3-vl:8b",
   "good_for": "Strong image understanding: documents, charts, photos.",
   "mem_note": "Vision models load an extra image encoder (~0.5 GB on top of the figures shown).",
   "stale": false,
   "gated": false,
   "downloads_30d": 7690985,
   "arch": {
    "n_layers": 36,
    "hidden": 4096,
    "n_heads": 32,
    "n_kv_heads": 8
   },
   "context_len": 262144,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 8.71,
     "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF",
     "filename": "Qwen3-VL-8B-Instruct-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 6.73,
     "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF",
     "filename": "Qwen3-VL-8B-Instruct-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 5.85,
     "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF",
     "filename": "Qwen3-VL-8B-Instruct-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 5.03,
     "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF",
     "filename": "Qwen3-VL-8B-Instruct-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 4.58,
     "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF",
     "filename": "Qwen3-VL-8B-Instruct-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 4.12,
     "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF",
     "filename": "Qwen3-VL-8B-Instruct-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 3.28,
     "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF",
     "filename": "Qwen3-VL-8B-Instruct-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-VL-8B-Instruct",
    "gguf": "https://huggingface.co/unsloth/Qwen3-VL-8B-Instruct-GGUF",
    "ollama": "https://ollama.com/library/qwen3-vl"
   },
   "run": {
    "ollama": "ollama run qwen3-vl:8b",
    "llamacpp": "llama-server -hf unsloth/Qwen3-VL-8B-Instruct-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "qwen3-vl-30b-a3b",
   "family": "vlm",
   "name": "Qwen3-VL 30B-A3B (MoE)",
   "repo_id": "Qwen/Qwen3-VL-30B-A3B-Instruct",
   "params_b": 31.07,
   "active_params_b": 3.0,
   "license": "apache-2.0",
   "gguf_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF",
   "ollama_tag": "qwen3-vl:30b",
   "good_for": "Top-tier local vision-language quality, fast thanks to 3B active.",
   "mem_note": "Vision models load an extra image encoder (~0.5 GB on top of the figures shown).",
   "stale": false,
   "gated": false,
   "downloads_30d": 783446,
   "arch": {
    "n_layers": 48,
    "hidden": 2048,
    "n_heads": 32,
    "n_kv_heads": 4
   },
   "context_len": 262144,
   "quants": [
    {
     "key": "Q8_0",
     "plain": "Near-full (8-bit)",
     "file_gb": 32.48,
     "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-VL-30B-A3B-Instruct-Q8_0.gguf"
    },
    {
     "key": "Q6_K",
     "plain": "High (6-bit)",
     "file_gb": 25.09,
     "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-VL-30B-A3B-Instruct-Q6_K.gguf"
    },
    {
     "key": "Q5_K_M",
     "plain": "Balanced+ (5-bit)",
     "file_gb": 21.73,
     "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-VL-30B-A3B-Instruct-Q5_K_M.gguf"
    },
    {
     "key": "Q4_K_M",
     "plain": "Balanced (4-bit)",
     "file_gb": 18.56,
     "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-VL-30B-A3B-Instruct-Q4_K_M.gguf"
    },
    {
     "key": "IQ4_XS",
     "plain": "Compact (4-bit)",
     "file_gb": 16.38,
     "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-VL-30B-A3B-Instruct-IQ4_XS.gguf"
    },
    {
     "key": "Q3_K_M",
     "plain": "Compact (3-bit)",
     "file_gb": 14.71,
     "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-VL-30B-A3B-Instruct-Q3_K_M.gguf"
    },
    {
     "key": "Q2_K",
     "plain": "Tiny (2-bit)",
     "file_gb": 11.26,
     "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF",
     "filename": "Qwen3-VL-30B-A3B-Instruct-Q2_K.gguf"
    }
   ],
   "provenance": "filesize",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-VL-30B-A3B-Instruct",
    "gguf": "https://huggingface.co/unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF",
    "ollama": "https://ollama.com/library/qwen3-vl"
   },
   "run": {
    "ollama": "ollama run qwen3-vl:30b",
    "llamacpp": "llama-server -hf unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF:Q4_K_M"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "smolvlm2-2.2b",
   "family": "vlm",
   "name": "SmolVLM2 2.2B",
   "repo_id": "HuggingFaceTB/SmolVLM2-2.2B-Instruct",
   "params_b": 2.25,
   "license": "apache-2.0",
   "mem_gb": 6.0,
   "mem_provenance": "estimated",
   "run_pip": "pip install transformers torch",
   "good_for": "Small open video+image understanding; also a common base for robot-policy finetunes.",
   "stale": false,
   "gated": false,
   "downloads_30d": 272382,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/HuggingFaceTB/SmolVLM2-2.2B-Instruct"
   },
   "run": {
    "pip": "pip install transformers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "moondream2",
   "family": "vlm",
   "name": "Moondream2",
   "repo_id": "vikhyatk/moondream2",
   "params_b": 1.93,
   "license": "apache-2.0",
   "ollama_tag": "moondream",
   "mem_gb": 4.5,
   "mem_provenance": "estimated",
   "run_pip": "pip install moondream",
   "good_for": "Tiny image-question model that runs almost anywhere.",
   "stale": false,
   "gated": false,
   "downloads_30d": 2074069,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/vikhyatk/moondream2",
    "ollama": "https://ollama.com/library/moondream"
   },
   "run": {
    "ollama": "ollama run moondream",
    "pip": "pip install moondream"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "yolo26-n",
   "family": "vision",
   "use_cases": [
    "detect",
    "classify",
    "pose",
    "train-vision"
   ],
   "name": "YOLO26 Nano",
   "repo_id": "Ultralytics/YOLO26",
   "params_b": 0.0026,
   "license": "agpl-3.0",
   "license_note": "AGPL-3.0: free for open-source use; commercial products need an Ultralytics license.",
   "mem_gb": 1.0,
   "mem_provenance": "estimated",
   "run_pip": "pip install ultralytics",
   "good_for": "Real-time detection even on weak hardware or a webcam.",
   "docs": "https://docs.ultralytics.com/models/yolo26",
   "stale": false,
   "gated": false,
   "downloads_30d": 7012,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/Ultralytics/YOLO26",
    "docs": "https://docs.ultralytics.com/models/yolo26"
   },
   "run": {
    "pip": "pip install ultralytics"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "yolo26-s",
   "family": "vision",
   "use_cases": [
    "detect",
    "classify",
    "pose",
    "train-vision"
   ],
   "name": "YOLO26 Small",
   "repo_id": "Ultralytics/YOLO26",
   "params_b": 0.0096,
   "license": "agpl-3.0",
   "license_note": "AGPL-3.0: free for open-source use; commercial products need an Ultralytics license.",
   "mem_gb": 1.2,
   "mem_provenance": "estimated",
   "run_pip": "pip install ultralytics",
   "good_for": "Fast and clearly more accurate than Nano.",
   "docs": "https://docs.ultralytics.com/models/yolo26",
   "stale": false,
   "gated": false,
   "downloads_30d": 7012,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/Ultralytics/YOLO26",
    "docs": "https://docs.ultralytics.com/models/yolo26"
   },
   "run": {
    "pip": "pip install ultralytics"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "yolo26-m",
   "family": "vision",
   "use_cases": [
    "detect",
    "classify",
    "pose",
    "train-vision"
   ],
   "name": "YOLO26 Medium",
   "repo_id": "Ultralytics/YOLO26",
   "params_b": 0.0202,
   "license": "agpl-3.0",
   "license_note": "AGPL-3.0: free for open-source use; commercial products need an Ultralytics license.",
   "mem_gb": 1.6,
   "mem_provenance": "estimated",
   "run_pip": "pip install ultralytics",
   "good_for": "Balanced accuracy and speed for real work.",
   "docs": "https://docs.ultralytics.com/models/yolo26",
   "stale": false,
   "gated": false,
   "downloads_30d": 7012,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/Ultralytics/YOLO26",
    "docs": "https://docs.ultralytics.com/models/yolo26"
   },
   "run": {
    "pip": "pip install ultralytics"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "yolo26-l",
   "family": "vision",
   "use_cases": [
    "detect",
    "classify",
    "pose",
    "train-vision"
   ],
   "name": "YOLO26 Large",
   "repo_id": "Ultralytics/YOLO26",
   "params_b": 0.0337,
   "license": "agpl-3.0",
   "license_note": "AGPL-3.0: free for open-source use; commercial products need an Ultralytics license.",
   "mem_gb": 2.0,
   "mem_provenance": "estimated",
   "run_pip": "pip install ultralytics",
   "good_for": "High accuracy when you have a real GPU.",
   "docs": "https://docs.ultralytics.com/models/yolo26",
   "stale": false,
   "gated": false,
   "downloads_30d": 7012,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/Ultralytics/YOLO26",
    "docs": "https://docs.ultralytics.com/models/yolo26"
   },
   "run": {
    "pip": "pip install ultralytics"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "yolo26-x",
   "family": "vision",
   "use_cases": [
    "detect",
    "classify",
    "pose",
    "train-vision"
   ],
   "name": "YOLO26 X-Large",
   "repo_id": "Ultralytics/YOLO26",
   "params_b": 0.0569,
   "license": "agpl-3.0",
   "license_note": "AGPL-3.0: free for open-source use; commercial products need an Ultralytics license.",
   "mem_gb": 2.5,
   "mem_provenance": "estimated",
   "run_pip": "pip install ultralytics",
   "good_for": "Highest accuracy in the family, slowest.",
   "docs": "https://docs.ultralytics.com/models/yolo26",
   "stale": false,
   "gated": false,
   "downloads_30d": 7012,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/Ultralytics/YOLO26",
    "docs": "https://docs.ultralytics.com/models/yolo26"
   },
   "run": {
    "pip": "pip install ultralytics"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "sam-2.1-tiny",
   "family": "vision",
   "use_cases": [
    "segment"
   ],
   "name": "SAM 2.1 Tiny",
   "repo_id": "facebook/sam2.1-hiera-tiny",
   "params_b": 0.04,
   "license": "apache-2.0",
   "mem_gb": 1.5,
   "mem_provenance": "community",
   "run_pip": "pip install sam2",
   "good_for": "Click-to-segment anything in images; light and quick.",
   "stale": false,
   "gated": false,
   "downloads_30d": 30268,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/facebook/sam2.1-hiera-tiny"
   },
   "run": {
    "pip": "pip install sam2"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "sam-2.1-small",
   "family": "vision",
   "use_cases": [
    "segment"
   ],
   "name": "SAM 2.1 Small",
   "repo_id": "facebook/sam2.1-hiera-small",
   "params_b": 0.05,
   "license": "apache-2.0",
   "mem_gb": 1.8,
   "mem_provenance": "community",
   "run_pip": "pip install sam2",
   "good_for": "Solid segmentation quality, still light.",
   "stale": false,
   "gated": false,
   "downloads_30d": 12700,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/facebook/sam2.1-hiera-small"
   },
   "run": {
    "pip": "pip install sam2"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "sam-2.1-large",
   "family": "vision",
   "use_cases": [
    "segment"
   ],
   "name": "SAM 2.1 Large",
   "repo_id": "facebook/sam2.1-hiera-large",
   "params_b": 0.22,
   "license": "apache-2.0",
   "mem_gb": 3.0,
   "mem_provenance": "community",
   "mem_note": "Image segmentation is light; tracking through video needs much more (community reports: 12 GB+).",
   "run_pip": "pip install sam2",
   "good_for": "Best SAM quality for images and video object tracking.",
   "stale": false,
   "gated": false,
   "downloads_30d": 70422,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/facebook/sam2.1-hiera-large"
   },
   "run": {
    "pip": "pip install sam2"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "sam-3",
   "family": "vision",
   "use_cases": [
    "segment"
   ],
   "name": "SAM 3",
   "repo_id": "facebook/sam3",
   "params_b": 0.86,
   "license": "other",
   "mem_gb": 4.0,
   "mem_provenance": "community",
   "run_pip": "pip install transformers torch",
   "good_for": "Segment things by describing them in words, not just clicks.",
   "stale": false,
   "gated": true,
   "downloads_30d": 1879279,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/facebook/sam3"
   },
   "run": {
    "pip": "pip install transformers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "da3-small",
   "family": "vision",
   "use_cases": [
    "depth"
   ],
   "name": "Depth Anything 3 Small",
   "repo_id": "depth-anything/DA3-SMALL",
   "params_b": 0.03,
   "license": "apache-2.0",
   "mem_gb": 1.2,
   "mem_provenance": "estimated",
   "run_pip": "pip install transformers torch",
   "good_for": "Depth maps from any photo, fast.",
   "stale": false,
   "gated": false,
   "downloads_30d": 23161,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/depth-anything/DA3-SMALL"
   },
   "run": {
    "pip": "pip install transformers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "da3-base",
   "family": "vision",
   "use_cases": [
    "depth"
   ],
   "name": "Depth Anything 3 Base",
   "repo_id": "depth-anything/DA3-BASE",
   "params_b": 0.14,
   "license": "apache-2.0",
   "mem_gb": 1.8,
   "mem_provenance": "estimated",
   "run_pip": "pip install transformers torch",
   "good_for": "Sharper depth, still light.",
   "stale": false,
   "gated": false,
   "downloads_30d": 50537,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/depth-anything/DA3-BASE"
   },
   "run": {
    "pip": "pip install transformers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "da3-large",
   "family": "vision",
   "use_cases": [
    "depth"
   ],
   "name": "Depth Anything 3 Large",
   "repo_id": "depth-anything/DA3-LARGE",
   "params_b": 0.41,
   "license": "cc-by-nc-4.0",
   "license_note": "Non-commercial licence.",
   "mem_gb": 3.0,
   "mem_provenance": "estimated",
   "run_pip": "pip install transformers torch",
   "good_for": "Best depth quality; research / personal use only.",
   "stale": false,
   "gated": false,
   "downloads_30d": 135024,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/depth-anything/DA3-LARGE"
   },
   "run": {
    "pip": "pip install transformers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "foundationpose",
   "family": "vision",
   "use_cases": [
    "pose"
   ],
   "name": "FoundationPose (6-DoF)",
   "repo_id": "NVlabs/FoundationPose",
   "repo_kind": "github",
   "params_b": 0.3,
   "license": "nvidia-source-code",
   "license_note": "Research-only licence; weights are downloaded from links in the GitHub README, not Hugging Face.",
   "mem_gb": 8.0,
   "mem_provenance": "community",
   "mem_note": "Community reports it running on a 12 GB RTX 3060. Needs CUDA and a custom build: advanced setup.",
   "docs": "https://github.com/NVlabs/FoundationPose",
   "good_for": "Full 6-DoF object pose (position + rotation) for robotics. The serious option.",
   "stale": false,
   "links": {
    "home": "https://github.com/NVlabs/FoundationPose",
    "docs": "https://github.com/NVlabs/FoundationPose"
   },
   "provenance": "community",
   "last_verified": "2026-06-09"
  },
  {
   "key": "paddleocr",
   "family": "vision",
   "use_cases": [
    "ocr"
   ],
   "name": "PaddleOCR (PP-OCRv5)",
   "repo_id": "PaddlePaddle/PP-OCRv5_server_rec",
   "params_b": 0.05,
   "license": "apache-2.0",
   "mem_gb": 1.0,
   "mem_provenance": "community",
   "run_pip": "pip install paddleocr",
   "good_for": "The classic text-from-images toolkit. Works fine on CPU.",
   "stale": false,
   "gated": false,
   "downloads_30d": 196930,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/PaddlePaddle/PP-OCRv5_server_rec"
   },
   "run": {
    "pip": "pip install paddleocr"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "deepseek-ocr",
   "family": "vision",
   "use_cases": [
    "ocr"
   ],
   "name": "DeepSeek-OCR",
   "repo_id": "deepseek-ai/DeepSeek-OCR",
   "params_b": 3.34,
   "license": "mit",
   "mem_gb": 8.0,
   "mem_provenance": "estimated",
   "ollama_tag": "deepseek-ocr",
   "run_pip": "pip install transformers torch",
   "good_for": "Turns whole documents into clean text/markdown, layout and all.",
   "stale": false,
   "gated": false,
   "downloads_30d": 2404442,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/deepseek-ai/DeepSeek-OCR",
    "ollama": "https://ollama.com/library/deepseek-ocr"
   },
   "run": {
    "ollama": "ollama run deepseek-ocr",
    "pip": "pip install transformers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "sdxl",
   "family": "imagegen",
   "use_cases": [
    "imagegen",
    "inpaint"
   ],
   "name": "Stable Diffusion XL",
   "repo_id": "stabilityai/stable-diffusion-xl-base-1.0",
   "params_b": 3.5,
   "license": "openrail++",
   "mem_gb": 8.0,
   "mem_provenance": "community",
   "run_pip": "pip install diffusers torch",
   "good_for": "Excellent 1024px images with a huge community of styles and add-ons.",
   "stale": false,
   "gated": false,
   "downloads_30d": 1436868,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0"
   },
   "run": {
    "pip": "pip install diffusers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "sd-3.5-medium",
   "family": "imagegen",
   "use_cases": [
    "imagegen",
    "inpaint"
   ],
   "name": "Stable Diffusion 3.5 Medium",
   "repo_id": "stabilityai/stable-diffusion-3.5-medium",
   "params_b": 2.5,
   "license": "other",
   "license_note": "Free for individuals and businesses under $1M revenue.",
   "mem_gb": 9.9,
   "mem_provenance": "vendor",
   "mem_note": "9.9 GB is Stability's own published figure (excluding text encoders).",
   "run_pip": "pip install diffusers torch",
   "good_for": "Modern image quality tuned to run on consumer cards.",
   "stale": false,
   "gated": true,
   "downloads_30d": 126738,
   "provenance": "vendor",
   "links": {
    "hf": "https://huggingface.co/stabilityai/stable-diffusion-3.5-medium"
   },
   "run": {
    "pip": "pip install diffusers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "sd-3.5-large",
   "family": "imagegen",
   "use_cases": [
    "imagegen",
    "inpaint"
   ],
   "name": "Stable Diffusion 3.5 Large",
   "repo_id": "stabilityai/stable-diffusion-3.5-large",
   "params_b": 8.0,
   "license": "other",
   "license_note": "Free for individuals and businesses under $1M revenue.",
   "mem_gb": 24.0,
   "mem_provenance": "vendor",
   "mem_note": "About 24 GB at full quality (vendor figure); quantized builds run in roughly half that.",
   "run_pip": "pip install diffusers torch",
   "good_for": "Stability's top open image model.",
   "stale": false,
   "gated": true,
   "downloads_30d": 22257,
   "provenance": "vendor",
   "links": {
    "hf": "https://huggingface.co/stabilityai/stable-diffusion-3.5-large"
   },
   "run": {
    "pip": "pip install diffusers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "flux1-schnell",
   "family": "imagegen",
   "use_cases": [
    "imagegen"
   ],
   "name": "FLUX.1 Schnell",
   "repo_id": "black-forest-labs/FLUX.1-schnell",
   "params_b": 12.0,
   "license": "apache-2.0",
   "mem_gb": 16.0,
   "mem_provenance": "community",
   "mem_note": "Roughly 16 GB at 8-bit, 24 GB at full quality. Community-reported figures.",
   "run_pip": "pip install diffusers torch",
   "good_for": "Near-top image quality in few steps, and Apache-licensed.",
   "stale": false,
   "gated": true,
   "downloads_30d": 337454,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/black-forest-labs/FLUX.1-schnell"
   },
   "run": {
    "pip": "pip install diffusers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "flux1-dev",
   "family": "imagegen",
   "use_cases": [
    "imagegen",
    "inpaint"
   ],
   "name": "FLUX.1 Dev",
   "repo_id": "black-forest-labs/FLUX.1-dev",
   "params_b": 12.0,
   "license": "other",
   "license_note": "Non-commercial licence; gated (accept terms on Hugging Face).",
   "mem_gb": 16.0,
   "mem_provenance": "community",
   "mem_note": "Roughly 16 GB at 8-bit, 24 GB at full quality. Community-reported figures.",
   "run_pip": "pip install diffusers torch",
   "good_for": "State-of-the-art open image quality (for non-commercial work).",
   "stale": false,
   "gated": true,
   "downloads_30d": 984011,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/black-forest-labs/FLUX.1-dev"
   },
   "run": {
    "pip": "pip install diffusers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "flux2-dev",
   "family": "imagegen",
   "use_cases": [
    "imagegen"
   ],
   "name": "FLUX.2 Dev (32B)",
   "repo_id": "black-forest-labs/FLUX.2-dev",
   "params_b": 32.0,
   "license": "other",
   "license_note": "Non-commercial licence; gated.",
   "mem_gb": 90.0,
   "mem_provenance": "community",
   "mem_note": "Around 90 GB at full quality; 4-bit with offloading is reported to fit a 24 GB card, slowly.",
   "run_pip": "pip install diffusers torch",
   "good_for": "The frontier of open image generation. Honest answer: workstation hardware.",
   "stale": false,
   "gated": true,
   "downloads_30d": 309301,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/black-forest-labs/FLUX.2-dev"
   },
   "run": {
    "pip": "pip install diffusers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "real-esrgan",
   "family": "imagegen",
   "use_cases": [
    "upscale"
   ],
   "name": "Real-ESRGAN",
   "repo_id": "ai-forever/Real-ESRGAN",
   "params_b": 0.017,
   "license": "bsd-3-clause",
   "mem_gb": 2.0,
   "mem_provenance": "community",
   "run_pip": "pip install realesrgan",
   "good_for": "The standard for upscaling and restoring photos.",
   "stale": false,
   "gated": false,
   "downloads_30d": 0,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/ai-forever/Real-ESRGAN"
   },
   "run": {
    "pip": "pip install realesrgan"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "birefnet",
   "family": "imagegen",
   "use_cases": [
    "bgremove"
   ],
   "name": "BiRefNet",
   "repo_id": "ZhengPeng7/BiRefNet",
   "params_b": 0.22,
   "license": "mit",
   "mem_gb": 3.0,
   "mem_provenance": "community",
   "run_pip": "pip install transformers torch",
   "good_for": "Crisp background removal, MIT-licensed.",
   "stale": false,
   "gated": false,
   "downloads_30d": 721429,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/ZhengPeng7/BiRefNet"
   },
   "run": {
    "pip": "pip install transformers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "rmbg-2.0",
   "family": "imagegen",
   "use_cases": [
    "bgremove"
   ],
   "name": "RMBG 2.0",
   "repo_id": "briaai/RMBG-2.0",
   "params_b": 0.22,
   "license": "other",
   "license_note": "Free for non-commercial use only.",
   "mem_gb": 3.0,
   "mem_provenance": "community",
   "run_pip": "pip install transformers torch",
   "good_for": "Very strong background removal (check the licence for products).",
   "stale": false,
   "gated": true,
   "downloads_30d": 620472,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/briaai/RMBG-2.0"
   },
   "run": {
    "pip": "pip install transformers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "ltx-video",
   "family": "imagegen",
   "use_cases": [
    "videogen"
   ],
   "name": "LTX-Video",
   "repo_id": "Lightricks/LTX-Video",
   "params_b": 2.0,
   "license": "other",
   "mem_gb": 12.0,
   "mem_provenance": "community",
   "run_pip": "pip install diffusers torch",
   "good_for": "Real-time-class local video generation on consumer cards.",
   "stale": false,
   "gated": false,
   "downloads_30d": 446216,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/Lightricks/LTX-Video"
   },
   "run": {
    "pip": "pip install diffusers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "wan-2.2-ti2v-5b",
   "family": "imagegen",
   "use_cases": [
    "videogen"
   ],
   "name": "Wan 2.2 TI2V 5B",
   "repo_id": "Wan-AI/Wan2.2-TI2V-5B",
   "params_b": 5.0,
   "license": "apache-2.0",
   "mem_gb": 16.0,
   "mem_provenance": "community",
   "run_pip": "pip install diffusers torch",
   "good_for": "Strong open text/image-to-video that fits prosumer cards.",
   "stale": false,
   "gated": false,
   "downloads_30d": 9456,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/Wan-AI/Wan2.2-TI2V-5B"
   },
   "run": {
    "pip": "pip install diffusers torch"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "whisper-base",
   "family": "audio",
   "use_cases": [
    "stt"
   ],
   "name": "Whisper Base",
   "repo_id": "openai/whisper-base",
   "params_b": 0.07,
   "license": "apache-2.0",
   "mem_gb": 1.0,
   "mem_provenance": "vendor",
   "mem_note": "OpenAI's own published VRAM figure.",
   "run_pip": "pip install faster-whisper",
   "good_for": "Quick rough transcription on any machine.",
   "stale": false,
   "gated": false,
   "downloads_30d": 4308029,
   "provenance": "vendor",
   "links": {
    "hf": "https://huggingface.co/openai/whisper-base"
   },
   "run": {
    "pip": "pip install faster-whisper"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "whisper-small",
   "family": "audio",
   "use_cases": [
    "stt"
   ],
   "name": "Whisper Small",
   "repo_id": "openai/whisper-small",
   "params_b": 0.24,
   "license": "apache-2.0",
   "mem_gb": 2.0,
   "mem_provenance": "vendor",
   "mem_note": "OpenAI's own published VRAM figure.",
   "run_pip": "pip install faster-whisper",
   "good_for": "Good accuracy on clear audio, still fast.",
   "stale": false,
   "gated": false,
   "downloads_30d": 2315618,
   "provenance": "vendor",
   "links": {
    "hf": "https://huggingface.co/openai/whisper-small"
   },
   "run": {
    "pip": "pip install faster-whisper"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "whisper-large-v3-turbo",
   "family": "audio",
   "use_cases": [
    "stt"
   ],
   "name": "Whisper Large v3 Turbo",
   "repo_id": "openai/whisper-large-v3-turbo",
   "params_b": 0.81,
   "license": "mit",
   "mem_gb": 6.0,
   "mem_provenance": "vendor",
   "mem_note": "OpenAI's own published VRAM figure. faster-whisper in 8-bit roughly halves it.",
   "run_pip": "pip install faster-whisper",
   "good_for": "Near-best accuracy at several times the speed of Large.",
   "stale": false,
   "gated": false,
   "downloads_30d": 7948390,
   "provenance": "vendor",
   "links": {
    "hf": "https://huggingface.co/openai/whisper-large-v3-turbo"
   },
   "run": {
    "pip": "pip install faster-whisper"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "whisper-large-v3",
   "family": "audio",
   "use_cases": [
    "stt"
   ],
   "name": "Whisper Large v3",
   "repo_id": "openai/whisper-large-v3",
   "params_b": 1.54,
   "license": "apache-2.0",
   "mem_gb": 10.0,
   "mem_provenance": "vendor",
   "mem_note": "OpenAI's own published VRAM figure. faster-whisper in 8-bit roughly halves it.",
   "run_pip": "pip install faster-whisper",
   "good_for": "The best open transcription accuracy, any language.",
   "stale": false,
   "gated": false,
   "downloads_30d": 5054098,
   "provenance": "vendor",
   "links": {
    "hf": "https://huggingface.co/openai/whisper-large-v3"
   },
   "run": {
    "pip": "pip install faster-whisper"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "kokoro-82m",
   "family": "audio",
   "use_cases": [
    "tts"
   ],
   "name": "Kokoro TTS (82M)",
   "repo_id": "hexgrad/Kokoro-82M",
   "params_b": 0.082,
   "license": "apache-2.0",
   "mem_gb": 1.5,
   "mem_provenance": "community",
   "run_pip": "pip install kokoro",
   "good_for": "Shockingly good small voice model; runs even on CPU.",
   "stale": false,
   "gated": false,
   "downloads_30d": 13198222,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/hexgrad/Kokoro-82M"
   },
   "run": {
    "pip": "pip install kokoro"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "chatterbox",
   "family": "audio",
   "use_cases": [
    "tts"
   ],
   "name": "Chatterbox TTS",
   "repo_id": "ResembleAI/chatterbox",
   "params_b": 0.5,
   "license": "mit",
   "mem_gb": 4.0,
   "mem_provenance": "community",
   "run_pip": "pip install chatterbox-tts",
   "good_for": "Production-grade voice cloning, MIT-licensed.",
   "stale": false,
   "gated": false,
   "downloads_30d": 1694198,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/ResembleAI/chatterbox"
   },
   "run": {
    "pip": "pip install chatterbox-tts"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "f5-tts",
   "family": "audio",
   "use_cases": [
    "tts"
   ],
   "name": "F5-TTS",
   "repo_id": "SWivid/F5-TTS",
   "params_b": 0.3,
   "license": "cc-by-nc-4.0",
   "license_note": "Non-commercial licence.",
   "mem_gb": 8.0,
   "mem_provenance": "community",
   "run_pip": "pip install f5-tts",
   "good_for": "High-quality voice cloning for personal projects.",
   "stale": false,
   "gated": false,
   "downloads_30d": 646717,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/SWivid/F5-TTS"
   },
   "run": {
    "pip": "pip install f5-tts"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "ace-step",
   "family": "audio",
   "use_cases": [
    "music"
   ],
   "name": "ACE-Step (3.5B)",
   "repo_id": "ACE-Step/ACE-Step-v1-3.5B",
   "params_b": 3.5,
   "license": "apache-2.0",
   "mem_gb": 10.0,
   "mem_provenance": "community",
   "run_pip": "pip install acestep",
   "good_for": "The best permissively-licensed local music generator.",
   "stale": false,
   "gated": false,
   "downloads_30d": 0,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/ACE-Step/ACE-Step-v1-3.5B"
   },
   "run": {
    "pip": "pip install acestep"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "musicgen-small",
   "family": "audio",
   "use_cases": [
    "music"
   ],
   "name": "MusicGen Small",
   "repo_id": "facebook/musicgen-small",
   "params_b": 0.59,
   "license": "cc-by-nc-4.0",
   "license_note": "Non-commercial licence.",
   "mem_gb": 6.0,
   "mem_provenance": "community",
   "run_pip": "pip install audiocraft",
   "good_for": "Quick music sketches on modest hardware.",
   "stale": false,
   "gated": false,
   "downloads_30d": 186078,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/facebook/musicgen-small"
   },
   "run": {
    "pip": "pip install audiocraft"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "musicgen-medium",
   "family": "audio",
   "use_cases": [
    "music"
   ],
   "name": "MusicGen Medium",
   "repo_id": "facebook/musicgen-medium",
   "params_b": 1.5,
   "license": "cc-by-nc-4.0",
   "license_note": "Non-commercial licence.",
   "mem_gb": 16.0,
   "mem_provenance": "vendor",
   "mem_note": "Meta's docs say a GPU with at least 16 GB for this size.",
   "run_pip": "pip install audiocraft",
   "good_for": "Meta's well-known music model (non-commercial).",
   "stale": false,
   "gated": false,
   "downloads_30d": 1443963,
   "provenance": "vendor",
   "links": {
    "hf": "https://huggingface.co/facebook/musicgen-medium"
   },
   "run": {
    "pip": "pip install audiocraft"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "all-minilm-l6-v2",
   "family": "embed",
   "use_cases": [
    "embed"
   ],
   "name": "all-MiniLM-L6-v2",
   "repo_id": "sentence-transformers/all-MiniLM-L6-v2",
   "params_b": 0.02,
   "license": "apache-2.0",
   "mem_gb": 0.5,
   "mem_provenance": "estimated",
   "ollama_tag": "all-minilm",
   "run_pip": "pip install sentence-transformers",
   "good_for": "The classic tiny embedder. Search your notes on any machine.",
   "stale": false,
   "gated": false,
   "downloads_30d": 230826064,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2",
    "ollama": "https://ollama.com/library/all-minilm"
   },
   "run": {
    "ollama": "ollama run all-minilm",
    "pip": "pip install sentence-transformers"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "nomic-embed-text-v1.5",
   "family": "embed",
   "use_cases": [
    "embed"
   ],
   "name": "Nomic Embed Text v1.5",
   "repo_id": "nomic-ai/nomic-embed-text-v1.5",
   "params_b": 0.14,
   "license": "apache-2.0",
   "mem_gb": 1.0,
   "mem_provenance": "estimated",
   "ollama_tag": "nomic-embed-text",
   "run_pip": "pip install sentence-transformers",
   "good_for": "Strong long-document search with adjustable size.",
   "stale": false,
   "gated": false,
   "downloads_30d": 17630308,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/nomic-ai/nomic-embed-text-v1.5",
    "ollama": "https://ollama.com/library/nomic-embed-text"
   },
   "run": {
    "ollama": "ollama run nomic-embed-text",
    "pip": "pip install sentence-transformers"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "embeddinggemma-300m",
   "family": "embed",
   "use_cases": [
    "embed"
   ],
   "name": "EmbeddingGemma 300M",
   "repo_id": "google/embeddinggemma-300m",
   "params_b": 0.3,
   "license": "gemma",
   "mem_gb": 1.2,
   "mem_provenance": "estimated",
   "ollama_tag": "embeddinggemma",
   "run_pip": "pip install sentence-transformers",
   "good_for": "Google's on-device embedder, great multilingual search.",
   "stale": false,
   "gated": true,
   "downloads_30d": 1701766,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/google/embeddinggemma-300m",
    "ollama": "https://ollama.com/library/embeddinggemma"
   },
   "run": {
    "ollama": "ollama run embeddinggemma",
    "pip": "pip install sentence-transformers"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "bge-m3",
   "family": "embed",
   "use_cases": [
    "embed"
   ],
   "name": "BGE-M3",
   "repo_id": "BAAI/bge-m3",
   "params_b": 0.57,
   "license": "mit",
   "mem_gb": 2.5,
   "mem_provenance": "estimated",
   "ollama_tag": "bge-m3",
   "run_pip": "pip install sentence-transformers",
   "good_for": "Heavyweight multilingual search quality.",
   "stale": false,
   "gated": false,
   "downloads_30d": 29227796,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/BAAI/bge-m3",
    "ollama": "https://ollama.com/library/bge-m3"
   },
   "run": {
    "ollama": "ollama run bge-m3",
    "pip": "pip install sentence-transformers"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "qwen3-embedding-0.6b",
   "family": "embed",
   "use_cases": [
    "embed"
   ],
   "name": "Qwen3 Embedding 0.6B",
   "repo_id": "Qwen/Qwen3-Embedding-0.6B",
   "params_b": 0.6,
   "license": "apache-2.0",
   "mem_gb": 1.5,
   "mem_provenance": "estimated",
   "ollama_tag": "qwen3-embedding",
   "run_pip": "pip install sentence-transformers",
   "good_for": "Modern top-ranked small embedder.",
   "stale": false,
   "gated": false,
   "downloads_30d": 8593433,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-Embedding-0.6B",
    "ollama": "https://ollama.com/library/qwen3-embedding"
   },
   "run": {
    "ollama": "ollama run qwen3-embedding",
    "pip": "pip install sentence-transformers"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "qwen3-embedding-4b",
   "family": "embed",
   "use_cases": [
    "embed"
   ],
   "name": "Qwen3 Embedding 4B",
   "repo_id": "Qwen/Qwen3-Embedding-4B",
   "params_b": 4.02,
   "license": "apache-2.0",
   "mem_gb": 6.0,
   "mem_provenance": "estimated",
   "run_pip": "pip install sentence-transformers",
   "good_for": "Best-in-class search relevance if you have the memory.",
   "stale": false,
   "gated": false,
   "downloads_30d": 2360699,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/Qwen/Qwen3-Embedding-4B"
   },
   "run": {
    "pip": "pip install sentence-transformers"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "chronos-bolt-small",
   "family": "data",
   "use_cases": [
    "forecast"
   ],
   "name": "Chronos-Bolt Small",
   "repo_id": "amazon/chronos-bolt-small",
   "params_b": 0.05,
   "license": "apache-2.0",
   "mem_gb": 0.5,
   "mem_provenance": "estimated",
   "run_pip": "pip install chronos-forecasting",
   "good_for": "Zero-shot time-series forecasting; runs on CPU.",
   "stale": false,
   "gated": false,
   "downloads_30d": 1461124,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/amazon/chronos-bolt-small"
   },
   "run": {
    "pip": "pip install chronos-forecasting"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "chronos-bolt-base",
   "family": "data",
   "use_cases": [
    "forecast"
   ],
   "name": "Chronos-Bolt Base",
   "repo_id": "amazon/chronos-bolt-base",
   "params_b": 0.21,
   "license": "apache-2.0",
   "mem_gb": 1.0,
   "mem_provenance": "estimated",
   "run_pip": "pip install chronos-forecasting",
   "good_for": "Stronger forecasts, still laptop-friendly.",
   "stale": false,
   "gated": false,
   "downloads_30d": 1253619,
   "provenance": "estimated",
   "links": {
    "hf": "https://huggingface.co/amazon/chronos-bolt-base"
   },
   "run": {
    "pip": "pip install chronos-forecasting"
   },
   "last_verified": "2026-06-09"
  },
  {
   "key": "tabpfn-v2",
   "family": "data",
   "use_cases": [
    "tabular"
   ],
   "name": "TabPFN v2",
   "repo_id": "Prior-Labs/TabPFN-v2-clf",
   "params_b": 0.011,
   "license": "other",
   "mem_gb": 2.0,
   "mem_provenance": "community",
   "run_pip": "pip install tabpfn",
   "good_for": "Spreadsheet predictions (classification) that beat tuned baselines on small data.",
   "stale": false,
   "gated": false,
   "downloads_30d": 34302,
   "provenance": "community",
   "links": {
    "hf": "https://huggingface.co/Prior-Labs/TabPFN-v2-clf"
   },
   "run": {
    "pip": "pip install tabpfn"
   },
   "last_verified": "2026-06-09"
  }
 ]
}