{ "version": 1, "generated_at": "2026-06-09T22:12:37+00:00", "count": 83, "entries": [ { "key": "qwen3-0.6b", "family": "llm", "name": "Qwen3 0.6B", "repo_id": "Qwen/Qwen3-0.6B", "params_b": 0.75, "license": "apache-2.0", "gguf_repo": "unsloth/Qwen3-0.6B-GGUF", "ollama_tag": "qwen3:0.6b", "good_for": "Quick simple chat and text tidy-up. Runs on almost anything.", "aliases": [ "Qwen/Qwen3-0.6B-Base" ], "stale": false, "gated": false, "downloads_30d": 21649861, "arch": { "n_layers": 28, "hidden": 1024, "n_heads": 16, "n_kv_heads": 8 }, "context_len": 40960, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 0.64, "source_repo": "unsloth/Qwen3-0.6B-GGUF", "filename": "Qwen3-0.6B-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 0.5, "source_repo": "unsloth/Qwen3-0.6B-GGUF", "filename": "Qwen3-0.6B-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 0.44, "source_repo": "unsloth/Qwen3-0.6B-GGUF", "filename": "Qwen3-0.6B-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 0.4, "source_repo": "unsloth/Qwen3-0.6B-GGUF", "filename": "Qwen3-0.6B-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 0.37, "source_repo": "unsloth/Qwen3-0.6B-GGUF", "filename": "Qwen3-0.6B-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 0.35, "source_repo": "unsloth/Qwen3-0.6B-GGUF", "filename": "Qwen3-0.6B-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 0.3, "source_repo": "unsloth/Qwen3-0.6B-GGUF", "filename": "Qwen3-0.6B-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-0.6B", "gguf": "https://huggingface.co/unsloth/Qwen3-0.6B-GGUF", "ollama": "https://ollama.com/library/qwen3" }, "run": { "ollama": "ollama run qwen3:0.6b", "llamacpp": "llama-server -hf unsloth/Qwen3-0.6B-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "qwen3-1.7b", "family": "llm", "name": "Qwen3 1.7B", "repo_id": "Qwen/Qwen3-1.7B", "params_b": 2.03, "license": "apache-2.0", "gguf_repo": "unsloth/Qwen3-1.7B-GGUF", "ollama_tag": "qwen3:1.7b", "good_for": "Light everyday chat and summarising on weak hardware.", "aliases": [ "Qwen/Qwen3-1.7B-Base" ], "stale": false, "gated": false, "downloads_30d": 4452758, "arch": { "n_layers": 28, "hidden": 2048, "n_heads": 16, "n_kv_heads": 8 }, "context_len": 40960, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 1.83, "source_repo": "unsloth/Qwen3-1.7B-GGUF", "filename": "Qwen3-1.7B-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 1.42, "source_repo": "unsloth/Qwen3-1.7B-GGUF", "filename": "Qwen3-1.7B-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 1.26, "source_repo": "unsloth/Qwen3-1.7B-GGUF", "filename": "Qwen3-1.7B-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 1.11, "source_repo": "unsloth/Qwen3-1.7B-GGUF", "filename": "Qwen3-1.7B-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 1.01, "source_repo": "unsloth/Qwen3-1.7B-GGUF", "filename": "Qwen3-1.7B-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 0.94, "source_repo": "unsloth/Qwen3-1.7B-GGUF", "filename": "Qwen3-1.7B-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 0.78, "source_repo": "unsloth/Qwen3-1.7B-GGUF", "filename": "Qwen3-1.7B-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-1.7B", "gguf": "https://huggingface.co/unsloth/Qwen3-1.7B-GGUF", "ollama": "https://ollama.com/library/qwen3" }, "run": { "ollama": "ollama run qwen3:1.7b", "llamacpp": "llama-server -hf unsloth/Qwen3-1.7B-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "qwen3-4b", "family": "llm", "name": "Qwen3 4B Instruct (2507)", "repo_id": "Qwen/Qwen3-4B-Instruct-2507", "params_b": 4.02, "license": "apache-2.0", "gguf_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF", "ollama_tag": "qwen3:4b", "good_for": "Surprisingly capable everyday assistant: chat, summarising, light coding.", "aliases": [ "Qwen/Qwen3-4B", "Qwen/Qwen3-4B-Base", "Qwen/Qwen3-4B-Thinking-2507" ], "stale": false, "gated": false, "downloads_30d": 4349929, "arch": { "n_layers": 36, "hidden": 2560, "n_heads": 32, "n_kv_heads": 8 }, "context_len": 262144, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 4.28, "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF", "filename": "Qwen3-4B-Instruct-2507-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 3.31, "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF", "filename": "Qwen3-4B-Instruct-2507-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 2.89, "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF", "filename": "Qwen3-4B-Instruct-2507-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 2.5, "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF", "filename": "Qwen3-4B-Instruct-2507-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 2.27, "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF", "filename": "Qwen3-4B-Instruct-2507-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 2.08, "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF", "filename": "Qwen3-4B-Instruct-2507-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 1.67, "source_repo": "unsloth/Qwen3-4B-Instruct-2507-GGUF", "filename": "Qwen3-4B-Instruct-2507-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-4B-Instruct-2507", "gguf": "https://huggingface.co/unsloth/Qwen3-4B-Instruct-2507-GGUF", "ollama": "https://ollama.com/library/qwen3" }, "run": { "ollama": "ollama run qwen3:4b", "llamacpp": "llama-server -hf unsloth/Qwen3-4B-Instruct-2507-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "qwen3-8b", "family": "llm", "name": "Qwen3 8B", "repo_id": "Qwen/Qwen3-8B", "params_b": 8.19, "license": "apache-2.0", "gguf_repo": "unsloth/Qwen3-8B-GGUF", "ollama_tag": "qwen3:8b", "good_for": "A solid all-rounder: good chat, real coding help, decent reasoning.", "aliases": [ "Qwen/Qwen3-8B-Base" ], "stale": false, "gated": false, "downloads_30d": 10950977, "arch": { "n_layers": 36, "hidden": 4096, "n_heads": 32, "n_kv_heads": 8 }, "context_len": 40960, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 8.71, "source_repo": "unsloth/Qwen3-8B-GGUF", "filename": "Qwen3-8B-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 6.73, "source_repo": "unsloth/Qwen3-8B-GGUF", "filename": "Qwen3-8B-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 5.85, "source_repo": "unsloth/Qwen3-8B-GGUF", "filename": "Qwen3-8B-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 5.03, "source_repo": "unsloth/Qwen3-8B-GGUF", "filename": "Qwen3-8B-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 4.58, "source_repo": "unsloth/Qwen3-8B-GGUF", "filename": "Qwen3-8B-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 4.12, "source_repo": "unsloth/Qwen3-8B-GGUF", "filename": "Qwen3-8B-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 3.28, "source_repo": "unsloth/Qwen3-8B-GGUF", "filename": "Qwen3-8B-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-8B", "gguf": "https://huggingface.co/unsloth/Qwen3-8B-GGUF", "ollama": "https://ollama.com/library/qwen3" }, "run": { "ollama": "ollama run qwen3:8b", "llamacpp": "llama-server -hf unsloth/Qwen3-8B-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "qwen3-14b", "family": "llm", "name": "Qwen3 14B", "repo_id": "Qwen/Qwen3-14B", "params_b": 14.77, "license": "apache-2.0", "gguf_repo": "unsloth/Qwen3-14B-GGUF", "ollama_tag": "qwen3:14b", "good_for": "Noticeably smarter and more reliable. Wants a real graphics card.", "aliases": [ "Qwen/Qwen3-14B-Base" ], "stale": false, "gated": false, "downloads_30d": 1640580, "arch": { "n_layers": 40, "hidden": 5120, "n_heads": 40, "n_kv_heads": 8 }, "context_len": 40960, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 15.7, "source_repo": "unsloth/Qwen3-14B-GGUF", "filename": "Qwen3-14B-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 12.12, "source_repo": "unsloth/Qwen3-14B-GGUF", "filename": "Qwen3-14B-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 10.51, "source_repo": "unsloth/Qwen3-14B-GGUF", "filename": "Qwen3-14B-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 9.0, "source_repo": "unsloth/Qwen3-14B-GGUF", "filename": "Qwen3-14B-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 8.14, "source_repo": "unsloth/Qwen3-14B-GGUF", "filename": "Qwen3-14B-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 7.32, "source_repo": "unsloth/Qwen3-14B-GGUF", "filename": "Qwen3-14B-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 5.75, "source_repo": "unsloth/Qwen3-14B-GGUF", "filename": "Qwen3-14B-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-14B", "gguf": "https://huggingface.co/unsloth/Qwen3-14B-GGUF", "ollama": "https://ollama.com/library/qwen3" }, "run": { "ollama": "ollama run qwen3:14b", "llamacpp": "llama-server -hf unsloth/Qwen3-14B-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "qwen3-32b", "family": "llm", "name": "Qwen3 32B", "repo_id": "Qwen/Qwen3-32B", "params_b": 32.76, "license": "apache-2.0", "gguf_repo": "unsloth/Qwen3-32B-GGUF", "ollama_tag": "qwen3:32b", "good_for": "Near-premium quality. Needs a strong GPU or a lot of memory.", "stale": false, "gated": false, "downloads_30d": 3167218, "arch": { "n_layers": 64, "hidden": 5120, "n_heads": 64, "n_kv_heads": 8 }, "context_len": 40960, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 34.82, "source_repo": "unsloth/Qwen3-32B-GGUF", "filename": "Qwen3-32B-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 26.88, "source_repo": "unsloth/Qwen3-32B-GGUF", "filename": "Qwen3-32B-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 23.21, "source_repo": "unsloth/Qwen3-32B-GGUF", "filename": "Qwen3-32B-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 19.76, "source_repo": "unsloth/Qwen3-32B-GGUF", "filename": "Qwen3-32B-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 17.71, "source_repo": "unsloth/Qwen3-32B-GGUF", "filename": "Qwen3-32B-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 15.97, "source_repo": "unsloth/Qwen3-32B-GGUF", "filename": "Qwen3-32B-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 12.34, "source_repo": "unsloth/Qwen3-32B-GGUF", "filename": "Qwen3-32B-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-32B", "gguf": "https://huggingface.co/unsloth/Qwen3-32B-GGUF", "ollama": "https://ollama.com/library/qwen3" }, "run": { "ollama": "ollama run qwen3:32b", "llamacpp": "llama-server -hf unsloth/Qwen3-32B-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "qwen3-30b-a3b", "family": "llm", "name": "Qwen3 30B-A3B (2507, MoE)", "repo_id": "Qwen/Qwen3-30B-A3B-Instruct-2507", "params_b": 30.53, "active_params_b": 3.0, "license": "apache-2.0", "gguf_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF", "ollama_tag": "qwen3:30b", "good_for": "Big-model quality that runs fast: only 3B of its 30B work per word, so it flies even part-offloaded to RAM.", "stale": false, "gated": false, "downloads_30d": 821913, "arch": { "n_layers": 48, "hidden": 2048, "n_heads": 32, "n_kv_heads": 4 }, "context_len": 262144, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 32.48, "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF", "filename": "Qwen3-30B-A3B-Instruct-2507-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 25.09, "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF", "filename": "Qwen3-30B-A3B-Instruct-2507-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 21.73, "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF", "filename": "Qwen3-30B-A3B-Instruct-2507-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 18.56, "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF", "filename": "Qwen3-30B-A3B-Instruct-2507-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 16.38, "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF", "filename": "Qwen3-30B-A3B-Instruct-2507-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 14.71, "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF", "filename": "Qwen3-30B-A3B-Instruct-2507-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 11.26, "source_repo": "unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF", "filename": "Qwen3-30B-A3B-Instruct-2507-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-30B-A3B-Instruct-2507", "gguf": "https://huggingface.co/unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF", "ollama": "https://ollama.com/library/qwen3" }, "run": { "ollama": "ollama run qwen3:30b", "llamacpp": "llama-server -hf unsloth/Qwen3-30B-A3B-Instruct-2507-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "qwen3-coder-30b", "family": "llm", "name": "Qwen3 Coder 30B-A3B (MoE)", "repo_id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", "params_b": 30.53, "active_params_b": 3.0, "license": "apache-2.0", "gguf_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF", "ollama_tag": "qwen3-coder:30b", "good_for": "The local coding specialist. Fast despite its size (3B active).", "stale": false, "gated": false, "downloads_30d": 1961682, "arch": { "n_layers": 48, "hidden": 2048, "n_heads": 32, "n_kv_heads": 4 }, "context_len": 262144, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 32.48, "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF", "filename": "Qwen3-Coder-30B-A3B-Instruct-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 25.09, "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF", "filename": "Qwen3-Coder-30B-A3B-Instruct-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 21.73, "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF", "filename": "Qwen3-Coder-30B-A3B-Instruct-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 18.56, "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF", "filename": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 16.38, "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF", "filename": "Qwen3-Coder-30B-A3B-Instruct-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 14.71, "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF", "filename": "Qwen3-Coder-30B-A3B-Instruct-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 11.26, "source_repo": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF", "filename": "Qwen3-Coder-30B-A3B-Instruct-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-Coder-30B-A3B-Instruct", "gguf": "https://huggingface.co/unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF", "ollama": "https://ollama.com/library/qwen3-coder" }, "run": { "ollama": "ollama run qwen3-coder:30b", "llamacpp": "llama-server -hf unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "llama-3.2-1b", "family": "llm", "name": "Llama 3.2 1B", "repo_id": "meta-llama/Llama-3.2-1B-Instruct", "params_b": 1.24, "license": "llama3.2", "gguf_repo": "bartowski/Llama-3.2-1B-Instruct-GGUF", "ollama_tag": "llama3.2:1b", "good_for": "Quick simple chat from the Llama family. Runs on almost anything.", "stale": false, "gated": true, "downloads_30d": 7481230, "context_len": 131072, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 1.32, "source_repo": "bartowski/Llama-3.2-1B-Instruct-GGUF", "filename": "Llama-3.2-1B-Instruct-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 1.02, "source_repo": "bartowski/Llama-3.2-1B-Instruct-GGUF", "filename": "Llama-3.2-1B-Instruct-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 0.91, "source_repo": "bartowski/Llama-3.2-1B-Instruct-GGUF", "filename": "Llama-3.2-1B-Instruct-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 0.81, "source_repo": "bartowski/Llama-3.2-1B-Instruct-GGUF", "filename": "Llama-3.2-1B-Instruct-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 0.74, "source_repo": "bartowski/Llama-3.2-1B-Instruct-GGUF", "filename": "Llama-3.2-1B-Instruct-IQ4_XS.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct", "gguf": "https://huggingface.co/bartowski/Llama-3.2-1B-Instruct-GGUF", "ollama": "https://ollama.com/library/llama3.2" }, "run": { "ollama": "ollama run llama3.2:1b", "llamacpp": "llama-server -hf bartowski/Llama-3.2-1B-Instruct-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "llama-3.2-3b", "family": "llm", "name": "Llama 3.2 3B", "repo_id": "meta-llama/Llama-3.2-3B-Instruct", "params_b": 3.21, "license": "llama3.2", "gguf_repo": "bartowski/Llama-3.2-3B-Instruct-GGUF", "ollama_tag": "llama3.2:3b", "good_for": "Capable small assistant with the huge Llama ecosystem behind it.", "stale": false, "gated": true, "downloads_30d": 1509782, "context_len": 131072, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 3.42, "source_repo": "bartowski/Llama-3.2-3B-Instruct-GGUF", "filename": "Llama-3.2-3B-Instruct-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 2.64, "source_repo": "bartowski/Llama-3.2-3B-Instruct-GGUF", "filename": "Llama-3.2-3B-Instruct-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 2.32, "source_repo": "bartowski/Llama-3.2-3B-Instruct-GGUF", "filename": "Llama-3.2-3B-Instruct-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 2.02, "source_repo": "bartowski/Llama-3.2-3B-Instruct-GGUF", "filename": "Llama-3.2-3B-Instruct-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 1.83, "source_repo": "bartowski/Llama-3.2-3B-Instruct-GGUF", "filename": "Llama-3.2-3B-Instruct-IQ4_XS.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/meta-llama/Llama-3.2-3B-Instruct", "gguf": "https://huggingface.co/bartowski/Llama-3.2-3B-Instruct-GGUF", "ollama": "https://ollama.com/library/llama3.2" }, "run": { "ollama": "ollama run llama3.2:3b", "llamacpp": "llama-server -hf bartowski/Llama-3.2-3B-Instruct-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "llama-3.1-8b", "family": "llm", "name": "Llama 3.1 8B", "repo_id": "meta-llama/Llama-3.1-8B-Instruct", "params_b": 8.03, "license": "llama3.1", "gguf_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF", "ollama_tag": "llama3.1:8b", "good_for": "The classic dependable 8B: chat, coding help, tool use.", "stale": false, "gated": true, "downloads_30d": 10031112, "context_len": 131072, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 8.54, "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF", "filename": "Meta-Llama-3.1-8B-Instruct-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 6.6, "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF", "filename": "Meta-Llama-3.1-8B-Instruct-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 5.73, "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF", "filename": "Meta-Llama-3.1-8B-Instruct-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 4.92, "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF", "filename": "Meta-Llama-3.1-8B-Instruct-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 4.45, "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF", "filename": "Meta-Llama-3.1-8B-Instruct-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 4.02, "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF", "filename": "Meta-Llama-3.1-8B-Instruct-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 3.18, "source_repo": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF", "filename": "Meta-Llama-3.1-8B-Instruct-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct", "gguf": "https://huggingface.co/bartowski/Meta-Llama-3.1-8B-Instruct-GGUF", "ollama": "https://ollama.com/library/llama3.1" }, "run": { "ollama": "ollama run llama3.1:8b", "llamacpp": "llama-server -hf bartowski/Meta-Llama-3.1-8B-Instruct-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "llama-4-scout", "family": "llm", "name": "Llama 4 Scout (109B MoE)", "repo_id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", "params_b": 108.64, "active_params_b": 17.0, "license": "other", "gguf_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF", "ollama_tag": "llama4:scout", "good_for": "Frontier-class open model. Workstation territory: it is honest to say most PCs cannot run this.", "stale": false, "gated": true, "downloads_30d": 421808, "context_len": 10485760, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 114.53, "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF", "filename": "Q8_0/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 88.43, "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF", "filename": "Q6_K/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 76.55, "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF", "filename": "Q5_K_M/Llama-4-Scout-17B-16E-Instruct-Q5_K_M-00001-of-00002.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 65.36, "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF", "filename": "Q4_K_M/Llama-4-Scout-17B-16E-Instruct-Q4_K_M-00001-of-00002.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 57.65, "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF", "filename": "IQ4_XS/Llama-4-Scout-17B-16E-Instruct-IQ4_XS-00001-of-00002.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 51.76, "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF", "filename": "Q3_K_M/Llama-4-Scout-17B-16E-Instruct-Q3_K_M-00001-of-00002.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 39.56, "source_repo": "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF", "filename": "Llama-4-Scout-17B-16E-Instruct-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/meta-llama/Llama-4-Scout-17B-16E-Instruct", "gguf": "https://huggingface.co/unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF", "ollama": "https://ollama.com/library/llama4" }, "run": { "ollama": "ollama run llama4:scout", "llamacpp": "llama-server -hf unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "gemma-3-270m", "family": "llm", "name": "Gemma 3 270M", "repo_id": "google/gemma-3-270m-it", "params_b": 0.27, "license": "gemma", "gguf_repo": "unsloth/gemma-3-270m-it-GGUF", "ollama_tag": "gemma3:270m", "good_for": "Tiny and instant. Fine for simple completions, not real conversation.", "stale": false, "gated": true, "downloads_30d": 127163, "context_len": 32768, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 0.29, "source_repo": "unsloth/gemma-3-270m-it-GGUF", "filename": "gemma-3-270m-it-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 0.28, "source_repo": "unsloth/gemma-3-270m-it-GGUF", "filename": "gemma-3-270m-it-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 0.26, "source_repo": "unsloth/gemma-3-270m-it-GGUF", "filename": "gemma-3-270m-it-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 0.25, "source_repo": "unsloth/gemma-3-270m-it-GGUF", "filename": "gemma-3-270m-it-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 0.24, "source_repo": "unsloth/gemma-3-270m-it-GGUF", "filename": "gemma-3-270m-it-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 0.24, "source_repo": "unsloth/gemma-3-270m-it-GGUF", "filename": "gemma-3-270m-it-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 0.24, "source_repo": "unsloth/gemma-3-270m-it-GGUF", "filename": "gemma-3-270m-it-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/google/gemma-3-270m-it", "gguf": "https://huggingface.co/unsloth/gemma-3-270m-it-GGUF", "ollama": "https://ollama.com/library/gemma3" }, "run": { "ollama": "ollama run gemma3:270m", "llamacpp": "llama-server -hf unsloth/gemma-3-270m-it-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "gemma-3-1b", "family": "llm", "name": "Gemma 3 1B", "repo_id": "google/gemma-3-1b-it", "params_b": 1.0, "license": "gemma", "gguf_repo": "unsloth/gemma-3-1b-it-GGUF", "ollama_tag": "gemma3:1b", "good_for": "Google's small chat model. Light and friendly on weak hardware.", "stale": false, "gated": true, "downloads_30d": 1658957, "context_len": 32768, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 1.07, "source_repo": "unsloth/gemma-3-1b-it-GGUF", "filename": "gemma-3-1b-it-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 1.01, "source_repo": "unsloth/gemma-3-1b-it-GGUF", "filename": "gemma-3-1b-it-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 0.85, "source_repo": "unsloth/gemma-3-1b-it-GGUF", "filename": "gemma-3-1b-it-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 0.81, "source_repo": "unsloth/gemma-3-1b-it-GGUF", "filename": "gemma-3-1b-it-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 0.71, "source_repo": "unsloth/gemma-3-1b-it-GGUF", "filename": "gemma-3-1b-it-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 0.72, "source_repo": "unsloth/gemma-3-1b-it-GGUF", "filename": "gemma-3-1b-it-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 0.69, "source_repo": "unsloth/gemma-3-1b-it-GGUF", "filename": "gemma-3-1b-it-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/google/gemma-3-1b-it", "gguf": "https://huggingface.co/unsloth/gemma-3-1b-it-GGUF", "ollama": "https://ollama.com/library/gemma3" }, "run": { "ollama": "ollama run gemma3:1b", "llamacpp": "llama-server -hf unsloth/gemma-3-1b-it-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "gemma-3-4b", "family": "llm", "name": "Gemma 3 4B", "repo_id": "google/gemma-3-4b-it", "params_b": 4.3, "license": "gemma", "gguf_repo": "unsloth/gemma-3-4b-it-GGUF", "ollama_tag": "gemma3:4b", "good_for": "Warm-toned everyday assistant; can also look at images.", "stale": false, "gated": true, "downloads_30d": 1601809, "context_len": 131072, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 4.13, "source_repo": "unsloth/gemma-3-4b-it-GGUF", "filename": "gemma-3-4b-it-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 3.19, "source_repo": "unsloth/gemma-3-4b-it-GGUF", "filename": "gemma-3-4b-it-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 2.83, "source_repo": "unsloth/gemma-3-4b-it-GGUF", "filename": "gemma-3-4b-it-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 2.49, "source_repo": "unsloth/gemma-3-4b-it-GGUF", "filename": "gemma-3-4b-it-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 2.26, "source_repo": "unsloth/gemma-3-4b-it-GGUF", "filename": "gemma-3-4b-it-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 2.1, "source_repo": "unsloth/gemma-3-4b-it-GGUF", "filename": "gemma-3-4b-it-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 1.73, "source_repo": "unsloth/gemma-3-4b-it-GGUF", "filename": "gemma-3-4b-it-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/google/gemma-3-4b-it", "gguf": "https://huggingface.co/unsloth/gemma-3-4b-it-GGUF", "ollama": "https://ollama.com/library/gemma3" }, "run": { "ollama": "ollama run gemma3:4b", "llamacpp": "llama-server -hf unsloth/gemma-3-4b-it-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "gemma-3-12b", "family": "llm", "name": "Gemma 3 12B", "repo_id": "google/gemma-3-12b-it", "params_b": 12.19, "license": "gemma", "gguf_repo": "unsloth/gemma-3-12b-it-GGUF", "ollama_tag": "gemma3:12b", "good_for": "Strong mid-size model with vision support.", "stale": false, "gated": true, "downloads_30d": 2810935, "context_len": 131072, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 12.51, "source_repo": "unsloth/gemma-3-12b-it-GGUF", "filename": "gemma-3-12b-it-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 9.66, "source_repo": "unsloth/gemma-3-12b-it-GGUF", "filename": "gemma-3-12b-it-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 8.45, "source_repo": "unsloth/gemma-3-12b-it-GGUF", "filename": "gemma-3-12b-it-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 7.3, "source_repo": "unsloth/gemma-3-12b-it-GGUF", "filename": "gemma-3-12b-it-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 6.55, "source_repo": "unsloth/gemma-3-12b-it-GGUF", "filename": "gemma-3-12b-it-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 6.01, "source_repo": "unsloth/gemma-3-12b-it-GGUF", "filename": "gemma-3-12b-it-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 4.77, "source_repo": "unsloth/gemma-3-12b-it-GGUF", "filename": "gemma-3-12b-it-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/google/gemma-3-12b-it", "gguf": "https://huggingface.co/unsloth/gemma-3-12b-it-GGUF", "ollama": "https://ollama.com/library/gemma3" }, "run": { "ollama": "ollama run gemma3:12b", "llamacpp": "llama-server -hf unsloth/gemma-3-12b-it-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "gemma-3-27b", "family": "llm", "name": "Gemma 3 27B", "repo_id": "google/gemma-3-27b-it", "params_b": 27.43, "license": "gemma", "gguf_repo": "unsloth/gemma-3-27b-it-GGUF", "ollama_tag": "gemma3:27b", "good_for": "Google's big open model. Needs a serious GPU or lots of memory.", "stale": false, "gated": true, "downloads_30d": 1418920, "context_len": 131072, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 28.71, "source_repo": "unsloth/gemma-3-27b-it-GGUF", "filename": "gemma-3-27b-it-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 22.17, "source_repo": "unsloth/gemma-3-27b-it-GGUF", "filename": "gemma-3-27b-it-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 19.27, "source_repo": "unsloth/gemma-3-27b-it-GGUF", "filename": "gemma-3-27b-it-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 16.55, "source_repo": "unsloth/gemma-3-27b-it-GGUF", "filename": "gemma-3-27b-it-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 14.77, "source_repo": "unsloth/gemma-3-27b-it-GGUF", "filename": "gemma-3-27b-it-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 13.44, "source_repo": "unsloth/gemma-3-27b-it-GGUF", "filename": "gemma-3-27b-it-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 10.5, "source_repo": "unsloth/gemma-3-27b-it-GGUF", "filename": "gemma-3-27b-it-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/google/gemma-3-27b-it", "gguf": "https://huggingface.co/unsloth/gemma-3-27b-it-GGUF", "ollama": "https://ollama.com/library/gemma3" }, "run": { "ollama": "ollama run gemma3:27b", "llamacpp": "llama-server -hf unsloth/gemma-3-27b-it-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "gemma-3n-e2b", "family": "llm", "name": "Gemma 3n E2B", "repo_id": "google/gemma-3n-E2B-it", "params_b": 5.44, "active_params_b": 2.0, "license": "gemma", "gguf_repo": "unsloth/gemma-3n-E2B-it-GGUF", "ollama_tag": "gemma3n:e2b", "good_for": "Phone-class design: feels like a 2B while knowing more.", "stale": false, "gated": true, "downloads_30d": 372825, "context_len": 32768, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 4.79, "source_repo": "unsloth/gemma-3n-E2B-it-GGUF", "filename": "gemma-3n-E2B-it-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 4.21, "source_repo": "unsloth/gemma-3n-E2B-it-GGUF", "filename": "gemma-3n-E2B-it-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 3.29, "source_repo": "unsloth/gemma-3n-E2B-it-GGUF", "filename": "gemma-3n-E2B-it-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 3.03, "source_repo": "unsloth/gemma-3n-E2B-it-GGUF", "filename": "gemma-3n-E2B-it-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 2.91, "source_repo": "unsloth/gemma-3n-E2B-it-GGUF", "filename": "gemma-3n-E2B-it-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 2.48, "source_repo": "unsloth/gemma-3n-E2B-it-GGUF", "filename": "gemma-3n-E2B-it-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 2.22, "source_repo": "unsloth/gemma-3n-E2B-it-GGUF", "filename": "gemma-3n-E2B-it-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/google/gemma-3n-E2B-it", "gguf": "https://huggingface.co/unsloth/gemma-3n-E2B-it-GGUF", "ollama": "https://ollama.com/library/gemma3n" }, "run": { "ollama": "ollama run gemma3n:e2b", "llamacpp": "llama-server -hf unsloth/gemma-3n-E2B-it-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "gemma-3n-e4b", "family": "llm", "name": "Gemma 3n E4B", "repo_id": "google/gemma-3n-E4B-it", "params_b": 7.85, "active_params_b": 4.0, "license": "gemma", "gguf_repo": "unsloth/gemma-3n-E4B-it-GGUF", "ollama_tag": "gemma3n:e4b", "good_for": "Efficient on-device design with 4B-class speed.", "stale": false, "gated": true, "downloads_30d": 17622, "context_len": 32768, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 7.35, "source_repo": "unsloth/gemma-3n-E4B-it-GGUF", "filename": "gemma-3n-E4B-it-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 6.27, "source_repo": "unsloth/gemma-3n-E4B-it-GGUF", "filename": "gemma-3n-E4B-it-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 5.02, "source_repo": "unsloth/gemma-3n-E4B-it-GGUF", "filename": "gemma-3n-E4B-it-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 4.54, "source_repo": "unsloth/gemma-3n-E4B-it-GGUF", "filename": "gemma-3n-E4B-it-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 4.27, "source_repo": "unsloth/gemma-3n-E4B-it-GGUF", "filename": "gemma-3n-E4B-it-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 3.69, "source_repo": "unsloth/gemma-3n-E4B-it-GGUF", "filename": "gemma-3n-E4B-it-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 3.19, "source_repo": "unsloth/gemma-3n-E4B-it-GGUF", "filename": "gemma-3n-E4B-it-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/google/gemma-3n-E4B-it", "gguf": "https://huggingface.co/unsloth/gemma-3n-E4B-it-GGUF", "ollama": "https://ollama.com/library/gemma3n" }, "run": { "ollama": "ollama run gemma3n:e4b", "llamacpp": "llama-server -hf unsloth/gemma-3n-E4B-it-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "mistral-7b", "family": "llm", "name": "Mistral 7B (v0.3)", "repo_id": "mistralai/Mistral-7B-Instruct-v0.3", "params_b": 7.25, "license": "apache-2.0", "gguf_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF", "ollama_tag": "mistral:7b", "good_for": "The classic open 7B. Still a solid, fast all-rounder.", "stale": false, "gated": false, "downloads_30d": 3392572, "arch": { "n_layers": 32, "hidden": 4096, "n_heads": 32, "n_kv_heads": 8 }, "context_len": 32768, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 7.7, "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF", "filename": "Mistral-7B-Instruct-v0.3-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 5.95, "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF", "filename": "Mistral-7B-Instruct-v0.3-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 5.14, "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF", "filename": "Mistral-7B-Instruct-v0.3-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 4.37, "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF", "filename": "Mistral-7B-Instruct-v0.3-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 3.91, "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF", "filename": "Mistral-7B-Instruct-v0.3-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 3.52, "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF", "filename": "Mistral-7B-Instruct-v0.3-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 2.72, "source_repo": "bartowski/Mistral-7B-Instruct-v0.3-GGUF", "filename": "Mistral-7B-Instruct-v0.3-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.3", "gguf": "https://huggingface.co/bartowski/Mistral-7B-Instruct-v0.3-GGUF", "ollama": "https://ollama.com/library/mistral" }, "run": { "ollama": "ollama run mistral:7b", "llamacpp": "llama-server -hf bartowski/Mistral-7B-Instruct-v0.3-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "mistral-small-3.2", "family": "llm", "name": "Mistral Small 3.2 (24B)", "repo_id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", "params_b": 24.01, "license": "apache-2.0", "gguf_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF", "ollama_tag": "mistral-small3.2", "good_for": "Excellent quality-for-size; a favourite on 24 GB cards.", "stale": false, "gated": false, "downloads_30d": 537956, "arch": { "n_layers": 40, "hidden": 5120, "n_heads": 32, "n_kv_heads": 8 }, "context_len": 131072, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 25.05, "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF", "filename": "Mistral-Small-3.2-24B-Instruct-2506-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 19.35, "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF", "filename": "Mistral-Small-3.2-24B-Instruct-2506-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 16.76, "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF", "filename": "Mistral-Small-3.2-24B-Instruct-2506-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 14.33, "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF", "filename": "Mistral-Small-3.2-24B-Instruct-2506-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 12.78, "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF", "filename": "Mistral-Small-3.2-24B-Instruct-2506-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 11.47, "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF", "filename": "Mistral-Small-3.2-24B-Instruct-2506-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 8.89, "source_repo": "unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF", "filename": "Mistral-Small-3.2-24B-Instruct-2506-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/mistralai/Mistral-Small-3.2-24B-Instruct-2506", "gguf": "https://huggingface.co/unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF", "ollama": "https://ollama.com/library/mistral-small3.2" }, "run": { "ollama": "ollama run mistral-small3.2", "llamacpp": "llama-server -hf unsloth/Mistral-Small-3.2-24B-Instruct-2506-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "devstral-small", "family": "llm", "name": "Devstral Small (24B, coding)", "repo_id": "mistralai/Devstral-Small-2507", "params_b": 23.57, "license": "apache-2.0", "gguf_repo": "unsloth/Devstral-Small-2507-GGUF", "ollama_tag": "devstral", "good_for": "Built for coding agents and repo-level work.", "stale": false, "gated": false, "downloads_30d": 24427, "arch": { "n_layers": 40, "hidden": 5120, "n_heads": 32, "n_kv_heads": 8 }, "context_len": 131072, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 25.05, "source_repo": "unsloth/Devstral-Small-2507-GGUF", "filename": "Devstral-Small-2507-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 19.35, "source_repo": "unsloth/Devstral-Small-2507-GGUF", "filename": "Devstral-Small-2507-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 16.76, "source_repo": "unsloth/Devstral-Small-2507-GGUF", "filename": "Devstral-Small-2507-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 14.33, "source_repo": "unsloth/Devstral-Small-2507-GGUF", "filename": "Devstral-Small-2507-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 12.78, "source_repo": "unsloth/Devstral-Small-2507-GGUF", "filename": "Devstral-Small-2507-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 11.47, "source_repo": "unsloth/Devstral-Small-2507-GGUF", "filename": "Devstral-Small-2507-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 8.89, "source_repo": "unsloth/Devstral-Small-2507-GGUF", "filename": "Devstral-Small-2507-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/mistralai/Devstral-Small-2507", "gguf": "https://huggingface.co/unsloth/Devstral-Small-2507-GGUF", "ollama": "https://ollama.com/library/devstral" }, "run": { "ollama": "ollama run devstral", "llamacpp": "llama-server -hf unsloth/Devstral-Small-2507-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "phi-4", "family": "llm", "name": "Phi-4 (14B)", "repo_id": "microsoft/phi-4", "params_b": 14.66, "license": "mit", "gguf_repo": "unsloth/phi-4-GGUF", "ollama_tag": "phi4", "good_for": "Microsoft's strong 14B, great at reasoning and maths.", "stale": false, "gated": false, "downloads_30d": 809973, "arch": { "n_layers": 40, "hidden": 5120, "n_heads": 40, "n_kv_heads": 10 }, "context_len": 16384, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 15.58, "source_repo": "unsloth/phi-4-GGUF", "filename": "phi-4-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 12.03, "source_repo": "unsloth/phi-4-GGUF", "filename": "phi-4-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 10.41, "source_repo": "unsloth/phi-4-GGUF", "filename": "phi-4-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 8.89, "source_repo": "unsloth/phi-4-GGUF", "filename": "phi-4-Q4_K_M.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 7.19, "source_repo": "unsloth/phi-4-GGUF", "filename": "phi-4-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 5.61, "source_repo": "unsloth/phi-4-GGUF", "filename": "phi-4-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/microsoft/phi-4", "gguf": "https://huggingface.co/unsloth/phi-4-GGUF", "ollama": "https://ollama.com/library/phi4" }, "run": { "ollama": "ollama run phi4", "llamacpp": "llama-server -hf unsloth/phi-4-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "phi-4-mini", "family": "llm", "name": "Phi-4 Mini (3.8B)", "repo_id": "microsoft/Phi-4-mini-instruct", "params_b": 3.84, "license": "mit", "gguf_repo": "unsloth/Phi-4-mini-instruct-GGUF", "ollama_tag": "phi4-mini", "good_for": "Small, MIT-licensed, punchy for its size.", "stale": false, "gated": false, "downloads_30d": 1221436, "arch": { "n_layers": 32, "hidden": 3072, "n_heads": 24, "n_kv_heads": 8 }, "context_len": 131072, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 4.08, "source_repo": "unsloth/Phi-4-mini-instruct-GGUF", "filename": "Phi-4-mini-instruct.Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 3.16, "source_repo": "unsloth/Phi-4-mini-instruct-GGUF", "filename": "Phi-4-mini-instruct-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 2.85, "source_repo": "unsloth/Phi-4-mini-instruct-GGUF", "filename": "Phi-4-mini-instruct-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 2.49, "source_repo": "unsloth/Phi-4-mini-instruct-GGUF", "filename": "Phi-4-mini-instruct-Q4_K_M.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 2.12, "source_repo": "unsloth/Phi-4-mini-instruct-GGUF", "filename": "Phi-4-mini-instruct-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 1.68, "source_repo": "unsloth/Phi-4-mini-instruct-GGUF", "filename": "Phi-4-mini-instruct-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/microsoft/Phi-4-mini-instruct", "gguf": "https://huggingface.co/unsloth/Phi-4-mini-instruct-GGUF", "ollama": "https://ollama.com/library/phi4-mini" }, "run": { "ollama": "ollama run phi4-mini", "llamacpp": "llama-server -hf unsloth/Phi-4-mini-instruct-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "granite-4.0-1b", "family": "llm", "name": "Granite 4.0 1B", "repo_id": "ibm-granite/granite-4.0-1b", "params_b": 1.63, "license": "apache-2.0", "gguf_repo": "ibm-granite/granite-4.0-1b-GGUF", "good_for": "IBM's tiny enterprise-grade model; official GGUFs.", "stale": false, "gated": false, "downloads_30d": 4653, "arch": { "n_layers": 40, "hidden": 2048, "n_heads": 16, "n_kv_heads": 4 }, "context_len": 131072, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 1.74, "source_repo": "ibm-granite/granite-4.0-1b-GGUF", "filename": "granite-4.0-1b-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 1.34, "source_repo": "ibm-granite/granite-4.0-1b-GGUF", "filename": "granite-4.0-1b-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 1.18, "source_repo": "ibm-granite/granite-4.0-1b-GGUF", "filename": "granite-4.0-1b-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 1.02, "source_repo": "ibm-granite/granite-4.0-1b-GGUF", "filename": "granite-4.0-1b-Q4_K_M.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 0.86, "source_repo": "ibm-granite/granite-4.0-1b-GGUF", "filename": "granite-4.0-1b-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 0.7, "source_repo": "ibm-granite/granite-4.0-1b-GGUF", "filename": "granite-4.0-1b-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/ibm-granite/granite-4.0-1b", "gguf": "https://huggingface.co/ibm-granite/granite-4.0-1b-GGUF" }, "run": { "ollama": "ollama run hf.co/ibm-granite/granite-4.0-1b-GGUF:Q4_K_M", "llamacpp": "llama-server -hf ibm-granite/granite-4.0-1b-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "granite-4.0-micro", "family": "llm", "name": "Granite 4.0 Micro (3B)", "repo_id": "ibm-granite/granite-4.0-micro", "params_b": 3.4, "license": "apache-2.0", "gguf_repo": "ibm-granite/granite-4.0-micro-GGUF", "ollama_tag": "granite4:micro", "good_for": "Grounded, RAG-friendly small model from IBM.", "stale": false, "gated": false, "downloads_30d": 129738, "arch": { "n_layers": 40, "hidden": 2560, "n_heads": 40, "n_kv_heads": 8 }, "context_len": 131072, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 3.62, "source_repo": "ibm-granite/granite-4.0-micro-GGUF", "filename": "granite-4.0-micro-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 2.8, "source_repo": "ibm-granite/granite-4.0-micro-GGUF", "filename": "granite-4.0-micro-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 2.44, "source_repo": "ibm-granite/granite-4.0-micro-GGUF", "filename": "granite-4.0-micro-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 2.1, "source_repo": "ibm-granite/granite-4.0-micro-GGUF", "filename": "granite-4.0-micro-Q4_K_M.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 1.73, "source_repo": "ibm-granite/granite-4.0-micro-GGUF", "filename": "granite-4.0-micro-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 1.37, "source_repo": "ibm-granite/granite-4.0-micro-GGUF", "filename": "granite-4.0-micro-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/ibm-granite/granite-4.0-micro", "gguf": "https://huggingface.co/ibm-granite/granite-4.0-micro-GGUF", "ollama": "https://ollama.com/library/granite4" }, "run": { "ollama": "ollama run granite4:micro", "llamacpp": "llama-server -hf ibm-granite/granite-4.0-micro-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "granite-4.0-h-tiny", "family": "llm", "name": "Granite 4.0 H-Tiny (7B-A1B MoE)", "repo_id": "ibm-granite/granite-4.0-h-tiny", "params_b": 6.94, "active_params_b": 1.0, "license": "apache-2.0", "gguf_repo": "ibm-granite/granite-4.0-h-tiny-GGUF", "ollama_tag": "granite4:tiny-h", "good_for": "Hybrid design: 7B knowledge, 1B-speed replies.", "stale": false, "gated": false, "downloads_30d": 93730, "arch": { "n_layers": 40, "hidden": 1536, "n_heads": 12, "n_kv_heads": 4 }, "context_len": 1048576, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 7.39, "source_repo": "ibm-granite/granite-4.0-h-tiny-GGUF", "filename": "granite-4.0-h-tiny-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 5.71, "source_repo": "ibm-granite/granite-4.0-h-tiny-GGUF", "filename": "granite-4.0-h-tiny-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 4.95, "source_repo": "ibm-granite/granite-4.0-h-tiny-GGUF", "filename": "granite-4.0-h-tiny-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 4.23, "source_repo": "ibm-granite/granite-4.0-h-tiny-GGUF", "filename": "granite-4.0-h-tiny-Q4_K_M.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 3.35, "source_repo": "ibm-granite/granite-4.0-h-tiny-GGUF", "filename": "granite-4.0-h-tiny-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 2.59, "source_repo": "ibm-granite/granite-4.0-h-tiny-GGUF", "filename": "granite-4.0-h-tiny-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/ibm-granite/granite-4.0-h-tiny", "gguf": "https://huggingface.co/ibm-granite/granite-4.0-h-tiny-GGUF", "ollama": "https://ollama.com/library/granite4" }, "run": { "ollama": "ollama run granite4:tiny-h", "llamacpp": "llama-server -hf ibm-granite/granite-4.0-h-tiny-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "granite-4.0-h-small", "family": "llm", "name": "Granite 4.0 H-Small (32B-A9B MoE)", "repo_id": "ibm-granite/granite-4.0-h-small", "params_b": 32.21, "active_params_b": 9.0, "license": "apache-2.0", "gguf_repo": "ibm-granite/granite-4.0-h-small-GGUF", "ollama_tag": "granite4:small-h", "good_for": "Big hybrid that stays responsive thanks to 9B active.", "stale": false, "gated": false, "downloads_30d": 569199, "arch": { "n_layers": 40, "hidden": 4096, "n_heads": 32, "n_kv_heads": 8 }, "context_len": 1048576, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 34.26, "source_repo": "ibm-granite/granite-4.0-h-small-GGUF", "filename": "granite-4.0-h-small-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 26.47, "source_repo": "ibm-granite/granite-4.0-h-small-GGUF", "filename": "granite-4.0-h-small-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 22.87, "source_repo": "ibm-granite/granite-4.0-h-small-GGUF", "filename": "granite-4.0-h-small-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 19.48, "source_repo": "ibm-granite/granite-4.0-h-small-GGUF", "filename": "granite-4.0-h-small-Q4_K_M.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 15.36, "source_repo": "ibm-granite/granite-4.0-h-small-GGUF", "filename": "granite-4.0-h-small-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 11.78, "source_repo": "ibm-granite/granite-4.0-h-small-GGUF", "filename": "granite-4.0-h-small-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/ibm-granite/granite-4.0-h-small", "gguf": "https://huggingface.co/ibm-granite/granite-4.0-h-small-GGUF", "ollama": "https://ollama.com/library/granite4" }, "run": { "ollama": "ollama run granite4:small-h", "llamacpp": "llama-server -hf ibm-granite/granite-4.0-h-small-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "smollm3-3b", "family": "llm", "name": "SmolLM3 3B", "repo_id": "HuggingFaceTB/SmolLM3-3B", "params_b": 3.08, "license": "apache-2.0", "gguf_repo": "ggml-org/SmolLM3-3B-GGUF", "good_for": "Hugging Face's own fully-open small model, trained in public.", "stale": false, "gated": false, "downloads_30d": 519434, "arch": { "n_layers": 36, "hidden": 2048, "n_heads": 16, "n_kv_heads": 4 }, "context_len": 65536, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 3.28, "source_repo": "ggml-org/SmolLM3-3B-GGUF", "filename": "SmolLM3-Q8_0.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 1.92, "source_repo": "ggml-org/SmolLM3-3B-GGUF", "filename": "SmolLM3-Q4_K_M.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/HuggingFaceTB/SmolLM3-3B", "gguf": "https://huggingface.co/ggml-org/SmolLM3-3B-GGUF" }, "run": { "ollama": "ollama run hf.co/ggml-org/SmolLM3-3B-GGUF:Q4_K_M", "llamacpp": "llama-server -hf ggml-org/SmolLM3-3B-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "minicpm-4.1-8b", "family": "llm", "name": "MiniCPM 4.1 8B", "repo_id": "openbmb/MiniCPM4.1-8B", "params_b": 8.19, "license": "apache-2.0", "gguf_repo": "openbmb/MiniCPM4.1-8B-GGUF", "good_for": "Tuned hard for running on ordinary devices; official GGUFs.", "stale": false, "gated": false, "downloads_30d": 50634, "arch": { "n_layers": 32, "hidden": 4096, "n_heads": 32, "n_kv_heads": 2 }, "context_len": 65536, "quants": [ { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 4.97, "source_repo": "openbmb/MiniCPM4.1-8B-GGUF", "filename": "MiniCPM4.1-8B-Q4_K_M.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/openbmb/MiniCPM4.1-8B", "gguf": "https://huggingface.co/openbmb/MiniCPM4.1-8B-GGUF" }, "run": { "ollama": "ollama run hf.co/openbmb/MiniCPM4.1-8B-GGUF:Q4_K_M", "llamacpp": "llama-server -hf openbmb/MiniCPM4.1-8B-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "nemotron-nano-9b", "family": "llm", "name": "NVIDIA Nemotron Nano 9B v2", "repo_id": "nvidia/NVIDIA-Nemotron-Nano-9B-v2", "params_b": 8.89, "license": "other", "gguf_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF", "good_for": "Hybrid Mamba design: strong reasoning with fast, steady output.", "stale": false, "gated": false, "downloads_30d": 545070, "arch": { "n_layers": 56, "hidden": 4480, "n_heads": 40, "n_kv_heads": 8 }, "context_len": 1048576, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 9.46, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 9.14, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 7.07, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 6.53, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 5.27, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 5.38, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 5.01, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-9B-v2-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/nvidia/NVIDIA-Nemotron-Nano-9B-v2", "gguf": "https://huggingface.co/bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF" }, "run": { "ollama": "ollama run hf.co/bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF:Q4_K_M", "llamacpp": "llama-server -hf bartowski/nvidia_NVIDIA-Nemotron-Nano-9B-v2-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "nemotron-nano-12b", "family": "llm", "name": "NVIDIA Nemotron Nano 12B v2", "repo_id": "nvidia/NVIDIA-Nemotron-Nano-12B-v2", "params_b": 12.31, "license": "other", "gguf_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF", "good_for": "The bigger Nemotron Nano; reasoning-first hybrid.", "stale": false, "gated": false, "downloads_30d": 15998, "arch": { "n_layers": 62, "hidden": 5120, "n_heads": 40, "n_kv_heads": 8 }, "context_len": 1048576, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 13.09, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 10.11, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 8.76, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 7.49, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 6.75, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 6.02, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 4.7, "source_repo": "bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF", "filename": "nvidia_NVIDIA-Nemotron-Nano-12B-v2-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/nvidia/NVIDIA-Nemotron-Nano-12B-v2", "gguf": "https://huggingface.co/bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF" }, "run": { "ollama": "ollama run hf.co/bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF:Q4_K_M", "llamacpp": "llama-server -hf bartowski/nvidia_NVIDIA-Nemotron-Nano-12B-v2-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "qwen3-vl-2b", "family": "vlm", "name": "Qwen3-VL 2B", "repo_id": "Qwen/Qwen3-VL-2B-Instruct", "params_b": 2.13, "license": "apache-2.0", "gguf_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF", "ollama_tag": "qwen3-vl:2b", "good_for": "Chat about images on very light hardware.", "mem_note": "Vision models load an extra image encoder (~0.5 GB on top of the figures shown).", "stale": false, "gated": false, "downloads_30d": 1944930, "arch": { "n_layers": 28, "hidden": 2048, "n_heads": 16, "n_kv_heads": 8 }, "context_len": 262144, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 1.83, "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF", "filename": "Qwen3-VL-2B-Instruct-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 1.42, "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF", "filename": "Qwen3-VL-2B-Instruct-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 1.26, "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF", "filename": "Qwen3-VL-2B-Instruct-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 1.11, "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF", "filename": "Qwen3-VL-2B-Instruct-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 1.01, "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF", "filename": "Qwen3-VL-2B-Instruct-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 0.94, "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF", "filename": "Qwen3-VL-2B-Instruct-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 0.78, "source_repo": "unsloth/Qwen3-VL-2B-Instruct-GGUF", "filename": "Qwen3-VL-2B-Instruct-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-VL-2B-Instruct", "gguf": "https://huggingface.co/unsloth/Qwen3-VL-2B-Instruct-GGUF", "ollama": "https://ollama.com/library/qwen3-vl" }, "run": { "ollama": "ollama run qwen3-vl:2b", "llamacpp": "llama-server -hf unsloth/Qwen3-VL-2B-Instruct-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "qwen3-vl-4b", "family": "vlm", "name": "Qwen3-VL 4B", "repo_id": "Qwen/Qwen3-VL-4B-Instruct", "params_b": 4.44, "license": "apache-2.0", "gguf_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF", "ollama_tag": "qwen3-vl:4b", "good_for": "The sweet spot for asking questions about images and screenshots.", "mem_note": "Vision models load an extra image encoder (~0.5 GB on top of the figures shown).", "stale": false, "gated": false, "downloads_30d": 3769866, "arch": { "n_layers": 36, "hidden": 2560, "n_heads": 32, "n_kv_heads": 8 }, "context_len": 262144, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 4.28, "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF", "filename": "Qwen3-VL-4B-Instruct-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 3.31, "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF", "filename": "Qwen3-VL-4B-Instruct-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 2.89, "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF", "filename": "Qwen3-VL-4B-Instruct-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 2.5, "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF", "filename": "Qwen3-VL-4B-Instruct-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 2.27, "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF", "filename": "Qwen3-VL-4B-Instruct-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 2.08, "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF", "filename": "Qwen3-VL-4B-Instruct-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 1.67, "source_repo": "unsloth/Qwen3-VL-4B-Instruct-GGUF", "filename": "Qwen3-VL-4B-Instruct-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-VL-4B-Instruct", "gguf": "https://huggingface.co/unsloth/Qwen3-VL-4B-Instruct-GGUF", "ollama": "https://ollama.com/library/qwen3-vl" }, "run": { "ollama": "ollama run qwen3-vl:4b", "llamacpp": "llama-server -hf unsloth/Qwen3-VL-4B-Instruct-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "qwen3-vl-8b", "family": "vlm", "name": "Qwen3-VL 8B", "repo_id": "Qwen/Qwen3-VL-8B-Instruct", "params_b": 8.77, "license": "apache-2.0", "gguf_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF", "ollama_tag": "qwen3-vl:8b", "good_for": "Strong image understanding: documents, charts, photos.", "mem_note": "Vision models load an extra image encoder (~0.5 GB on top of the figures shown).", "stale": false, "gated": false, "downloads_30d": 7690985, "arch": { "n_layers": 36, "hidden": 4096, "n_heads": 32, "n_kv_heads": 8 }, "context_len": 262144, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 8.71, "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF", "filename": "Qwen3-VL-8B-Instruct-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 6.73, "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF", "filename": "Qwen3-VL-8B-Instruct-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 5.85, "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF", "filename": "Qwen3-VL-8B-Instruct-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 5.03, "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF", "filename": "Qwen3-VL-8B-Instruct-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 4.58, "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF", "filename": "Qwen3-VL-8B-Instruct-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 4.12, "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF", "filename": "Qwen3-VL-8B-Instruct-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 3.28, "source_repo": "unsloth/Qwen3-VL-8B-Instruct-GGUF", "filename": "Qwen3-VL-8B-Instruct-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-VL-8B-Instruct", "gguf": "https://huggingface.co/unsloth/Qwen3-VL-8B-Instruct-GGUF", "ollama": "https://ollama.com/library/qwen3-vl" }, "run": { "ollama": "ollama run qwen3-vl:8b", "llamacpp": "llama-server -hf unsloth/Qwen3-VL-8B-Instruct-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "qwen3-vl-30b-a3b", "family": "vlm", "name": "Qwen3-VL 30B-A3B (MoE)", "repo_id": "Qwen/Qwen3-VL-30B-A3B-Instruct", "params_b": 31.07, "active_params_b": 3.0, "license": "apache-2.0", "gguf_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF", "ollama_tag": "qwen3-vl:30b", "good_for": "Top-tier local vision-language quality, fast thanks to 3B active.", "mem_note": "Vision models load an extra image encoder (~0.5 GB on top of the figures shown).", "stale": false, "gated": false, "downloads_30d": 783446, "arch": { "n_layers": 48, "hidden": 2048, "n_heads": 32, "n_kv_heads": 4 }, "context_len": 262144, "quants": [ { "key": "Q8_0", "plain": "Near-full (8-bit)", "file_gb": 32.48, "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF", "filename": "Qwen3-VL-30B-A3B-Instruct-Q8_0.gguf" }, { "key": "Q6_K", "plain": "High (6-bit)", "file_gb": 25.09, "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF", "filename": "Qwen3-VL-30B-A3B-Instruct-Q6_K.gguf" }, { "key": "Q5_K_M", "plain": "Balanced+ (5-bit)", "file_gb": 21.73, "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF", "filename": "Qwen3-VL-30B-A3B-Instruct-Q5_K_M.gguf" }, { "key": "Q4_K_M", "plain": "Balanced (4-bit)", "file_gb": 18.56, "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF", "filename": "Qwen3-VL-30B-A3B-Instruct-Q4_K_M.gguf" }, { "key": "IQ4_XS", "plain": "Compact (4-bit)", "file_gb": 16.38, "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF", "filename": "Qwen3-VL-30B-A3B-Instruct-IQ4_XS.gguf" }, { "key": "Q3_K_M", "plain": "Compact (3-bit)", "file_gb": 14.71, "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF", "filename": "Qwen3-VL-30B-A3B-Instruct-Q3_K_M.gguf" }, { "key": "Q2_K", "plain": "Tiny (2-bit)", "file_gb": 11.26, "source_repo": "unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF", "filename": "Qwen3-VL-30B-A3B-Instruct-Q2_K.gguf" } ], "provenance": "filesize", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-VL-30B-A3B-Instruct", "gguf": "https://huggingface.co/unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF", "ollama": "https://ollama.com/library/qwen3-vl" }, "run": { "ollama": "ollama run qwen3-vl:30b", "llamacpp": "llama-server -hf unsloth/Qwen3-VL-30B-A3B-Instruct-GGUF:Q4_K_M" }, "last_verified": "2026-06-09" }, { "key": "smolvlm2-2.2b", "family": "vlm", "name": "SmolVLM2 2.2B", "repo_id": "HuggingFaceTB/SmolVLM2-2.2B-Instruct", "params_b": 2.25, "license": "apache-2.0", "mem_gb": 6.0, "mem_provenance": "estimated", "run_pip": "pip install transformers torch", "good_for": "Small open video+image understanding; also a common base for robot-policy finetunes.", "stale": false, "gated": false, "downloads_30d": 272382, "provenance": "estimated", "links": { "hf": "https://huggingface.co/HuggingFaceTB/SmolVLM2-2.2B-Instruct" }, "run": { "pip": "pip install transformers torch" }, "last_verified": "2026-06-09" }, { "key": "moondream2", "family": "vlm", "name": "Moondream2", "repo_id": "vikhyatk/moondream2", "params_b": 1.93, "license": "apache-2.0", "ollama_tag": "moondream", "mem_gb": 4.5, "mem_provenance": "estimated", "run_pip": "pip install moondream", "good_for": "Tiny image-question model that runs almost anywhere.", "stale": false, "gated": false, "downloads_30d": 2074069, "provenance": "estimated", "links": { "hf": "https://huggingface.co/vikhyatk/moondream2", "ollama": "https://ollama.com/library/moondream" }, "run": { "ollama": "ollama run moondream", "pip": "pip install moondream" }, "last_verified": "2026-06-09" }, { "key": "yolo26-n", "family": "vision", "use_cases": [ "detect", "classify", "pose", "train-vision" ], "name": "YOLO26 Nano", "repo_id": "Ultralytics/YOLO26", "params_b": 0.0026, "license": "agpl-3.0", "license_note": "AGPL-3.0: free for open-source use; commercial products need an Ultralytics license.", "mem_gb": 1.0, "mem_provenance": "estimated", "run_pip": "pip install ultralytics", "good_for": "Real-time detection even on weak hardware or a webcam.", "docs": "https://docs.ultralytics.com/models/yolo26", "stale": false, "gated": false, "downloads_30d": 7012, "provenance": "estimated", "links": { "hf": "https://huggingface.co/Ultralytics/YOLO26", "docs": "https://docs.ultralytics.com/models/yolo26" }, "run": { "pip": "pip install ultralytics" }, "last_verified": "2026-06-09" }, { "key": "yolo26-s", "family": "vision", "use_cases": [ "detect", "classify", "pose", "train-vision" ], "name": "YOLO26 Small", "repo_id": "Ultralytics/YOLO26", "params_b": 0.0096, "license": "agpl-3.0", "license_note": "AGPL-3.0: free for open-source use; commercial products need an Ultralytics license.", "mem_gb": 1.2, "mem_provenance": "estimated", "run_pip": "pip install ultralytics", "good_for": "Fast and clearly more accurate than Nano.", "docs": "https://docs.ultralytics.com/models/yolo26", "stale": false, "gated": false, "downloads_30d": 7012, "provenance": "estimated", "links": { "hf": "https://huggingface.co/Ultralytics/YOLO26", "docs": "https://docs.ultralytics.com/models/yolo26" }, "run": { "pip": "pip install ultralytics" }, "last_verified": "2026-06-09" }, { "key": "yolo26-m", "family": "vision", "use_cases": [ "detect", "classify", "pose", "train-vision" ], "name": "YOLO26 Medium", "repo_id": "Ultralytics/YOLO26", "params_b": 0.0202, "license": "agpl-3.0", "license_note": "AGPL-3.0: free for open-source use; commercial products need an Ultralytics license.", "mem_gb": 1.6, "mem_provenance": "estimated", "run_pip": "pip install ultralytics", "good_for": "Balanced accuracy and speed for real work.", "docs": "https://docs.ultralytics.com/models/yolo26", "stale": false, "gated": false, "downloads_30d": 7012, "provenance": "estimated", "links": { "hf": "https://huggingface.co/Ultralytics/YOLO26", "docs": "https://docs.ultralytics.com/models/yolo26" }, "run": { "pip": "pip install ultralytics" }, "last_verified": "2026-06-09" }, { "key": "yolo26-l", "family": "vision", "use_cases": [ "detect", "classify", "pose", "train-vision" ], "name": "YOLO26 Large", "repo_id": "Ultralytics/YOLO26", "params_b": 0.0337, "license": "agpl-3.0", "license_note": "AGPL-3.0: free for open-source use; commercial products need an Ultralytics license.", "mem_gb": 2.0, "mem_provenance": "estimated", "run_pip": "pip install ultralytics", "good_for": "High accuracy when you have a real GPU.", "docs": "https://docs.ultralytics.com/models/yolo26", "stale": false, "gated": false, "downloads_30d": 7012, "provenance": "estimated", "links": { "hf": "https://huggingface.co/Ultralytics/YOLO26", "docs": "https://docs.ultralytics.com/models/yolo26" }, "run": { "pip": "pip install ultralytics" }, "last_verified": "2026-06-09" }, { "key": "yolo26-x", "family": "vision", "use_cases": [ "detect", "classify", "pose", "train-vision" ], "name": "YOLO26 X-Large", "repo_id": "Ultralytics/YOLO26", "params_b": 0.0569, "license": "agpl-3.0", "license_note": "AGPL-3.0: free for open-source use; commercial products need an Ultralytics license.", "mem_gb": 2.5, "mem_provenance": "estimated", "run_pip": "pip install ultralytics", "good_for": "Highest accuracy in the family, slowest.", "docs": "https://docs.ultralytics.com/models/yolo26", "stale": false, "gated": false, "downloads_30d": 7012, "provenance": "estimated", "links": { "hf": "https://huggingface.co/Ultralytics/YOLO26", "docs": "https://docs.ultralytics.com/models/yolo26" }, "run": { "pip": "pip install ultralytics" }, "last_verified": "2026-06-09" }, { "key": "sam-2.1-tiny", "family": "vision", "use_cases": [ "segment" ], "name": "SAM 2.1 Tiny", "repo_id": "facebook/sam2.1-hiera-tiny", "params_b": 0.04, "license": "apache-2.0", "mem_gb": 1.5, "mem_provenance": "community", "run_pip": "pip install sam2", "good_for": "Click-to-segment anything in images; light and quick.", "stale": false, "gated": false, "downloads_30d": 30268, "provenance": "community", "links": { "hf": "https://huggingface.co/facebook/sam2.1-hiera-tiny" }, "run": { "pip": "pip install sam2" }, "last_verified": "2026-06-09" }, { "key": "sam-2.1-small", "family": "vision", "use_cases": [ "segment" ], "name": "SAM 2.1 Small", "repo_id": "facebook/sam2.1-hiera-small", "params_b": 0.05, "license": "apache-2.0", "mem_gb": 1.8, "mem_provenance": "community", "run_pip": "pip install sam2", "good_for": "Solid segmentation quality, still light.", "stale": false, "gated": false, "downloads_30d": 12700, "provenance": "community", "links": { "hf": "https://huggingface.co/facebook/sam2.1-hiera-small" }, "run": { "pip": "pip install sam2" }, "last_verified": "2026-06-09" }, { "key": "sam-2.1-large", "family": "vision", "use_cases": [ "segment" ], "name": "SAM 2.1 Large", "repo_id": "facebook/sam2.1-hiera-large", "params_b": 0.22, "license": "apache-2.0", "mem_gb": 3.0, "mem_provenance": "community", "mem_note": "Image segmentation is light; tracking through video needs much more (community reports: 12 GB+).", "run_pip": "pip install sam2", "good_for": "Best SAM quality for images and video object tracking.", "stale": false, "gated": false, "downloads_30d": 70422, "provenance": "community", "links": { "hf": "https://huggingface.co/facebook/sam2.1-hiera-large" }, "run": { "pip": "pip install sam2" }, "last_verified": "2026-06-09" }, { "key": "sam-3", "family": "vision", "use_cases": [ "segment" ], "name": "SAM 3", "repo_id": "facebook/sam3", "params_b": 0.86, "license": "other", "mem_gb": 4.0, "mem_provenance": "community", "run_pip": "pip install transformers torch", "good_for": "Segment things by describing them in words, not just clicks.", "stale": false, "gated": true, "downloads_30d": 1879279, "provenance": "community", "links": { "hf": "https://huggingface.co/facebook/sam3" }, "run": { "pip": "pip install transformers torch" }, "last_verified": "2026-06-09" }, { "key": "da3-small", "family": "vision", "use_cases": [ "depth" ], "name": "Depth Anything 3 Small", "repo_id": "depth-anything/DA3-SMALL", "params_b": 0.03, "license": "apache-2.0", "mem_gb": 1.2, "mem_provenance": "estimated", "run_pip": "pip install transformers torch", "good_for": "Depth maps from any photo, fast.", "stale": false, "gated": false, "downloads_30d": 23161, "provenance": "estimated", "links": { "hf": "https://huggingface.co/depth-anything/DA3-SMALL" }, "run": { "pip": "pip install transformers torch" }, "last_verified": "2026-06-09" }, { "key": "da3-base", "family": "vision", "use_cases": [ "depth" ], "name": "Depth Anything 3 Base", "repo_id": "depth-anything/DA3-BASE", "params_b": 0.14, "license": "apache-2.0", "mem_gb": 1.8, "mem_provenance": "estimated", "run_pip": "pip install transformers torch", "good_for": "Sharper depth, still light.", "stale": false, "gated": false, "downloads_30d": 50537, "provenance": "estimated", "links": { "hf": "https://huggingface.co/depth-anything/DA3-BASE" }, "run": { "pip": "pip install transformers torch" }, "last_verified": "2026-06-09" }, { "key": "da3-large", "family": "vision", "use_cases": [ "depth" ], "name": "Depth Anything 3 Large", "repo_id": "depth-anything/DA3-LARGE", "params_b": 0.41, "license": "cc-by-nc-4.0", "license_note": "Non-commercial licence.", "mem_gb": 3.0, "mem_provenance": "estimated", "run_pip": "pip install transformers torch", "good_for": "Best depth quality; research / personal use only.", "stale": false, "gated": false, "downloads_30d": 135024, "provenance": "estimated", "links": { "hf": "https://huggingface.co/depth-anything/DA3-LARGE" }, "run": { "pip": "pip install transformers torch" }, "last_verified": "2026-06-09" }, { "key": "foundationpose", "family": "vision", "use_cases": [ "pose" ], "name": "FoundationPose (6-DoF)", "repo_id": "NVlabs/FoundationPose", "repo_kind": "github", "params_b": 0.3, "license": "nvidia-source-code", "license_note": "Research-only licence; weights are downloaded from links in the GitHub README, not Hugging Face.", "mem_gb": 8.0, "mem_provenance": "community", "mem_note": "Community reports it running on a 12 GB RTX 3060. Needs CUDA and a custom build: advanced setup.", "docs": "https://github.com/NVlabs/FoundationPose", "good_for": "Full 6-DoF object pose (position + rotation) for robotics. The serious option.", "stale": false, "links": { "home": "https://github.com/NVlabs/FoundationPose", "docs": "https://github.com/NVlabs/FoundationPose" }, "provenance": "community", "last_verified": "2026-06-09" }, { "key": "paddleocr", "family": "vision", "use_cases": [ "ocr" ], "name": "PaddleOCR (PP-OCRv5)", "repo_id": "PaddlePaddle/PP-OCRv5_server_rec", "params_b": 0.05, "license": "apache-2.0", "mem_gb": 1.0, "mem_provenance": "community", "run_pip": "pip install paddleocr", "good_for": "The classic text-from-images toolkit. Works fine on CPU.", "stale": false, "gated": false, "downloads_30d": 196930, "provenance": "community", "links": { "hf": "https://huggingface.co/PaddlePaddle/PP-OCRv5_server_rec" }, "run": { "pip": "pip install paddleocr" }, "last_verified": "2026-06-09" }, { "key": "deepseek-ocr", "family": "vision", "use_cases": [ "ocr" ], "name": "DeepSeek-OCR", "repo_id": "deepseek-ai/DeepSeek-OCR", "params_b": 3.34, "license": "mit", "mem_gb": 8.0, "mem_provenance": "estimated", "ollama_tag": "deepseek-ocr", "run_pip": "pip install transformers torch", "good_for": "Turns whole documents into clean text/markdown, layout and all.", "stale": false, "gated": false, "downloads_30d": 2404442, "provenance": "estimated", "links": { "hf": "https://huggingface.co/deepseek-ai/DeepSeek-OCR", "ollama": "https://ollama.com/library/deepseek-ocr" }, "run": { "ollama": "ollama run deepseek-ocr", "pip": "pip install transformers torch" }, "last_verified": "2026-06-09" }, { "key": "sdxl", "family": "imagegen", "use_cases": [ "imagegen", "inpaint" ], "name": "Stable Diffusion XL", "repo_id": "stabilityai/stable-diffusion-xl-base-1.0", "params_b": 3.5, "license": "openrail++", "mem_gb": 8.0, "mem_provenance": "community", "run_pip": "pip install diffusers torch", "good_for": "Excellent 1024px images with a huge community of styles and add-ons.", "stale": false, "gated": false, "downloads_30d": 1436868, "provenance": "community", "links": { "hf": "https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0" }, "run": { "pip": "pip install diffusers torch" }, "last_verified": "2026-06-09" }, { "key": "sd-3.5-medium", "family": "imagegen", "use_cases": [ "imagegen", "inpaint" ], "name": "Stable Diffusion 3.5 Medium", "repo_id": "stabilityai/stable-diffusion-3.5-medium", "params_b": 2.5, "license": "other", "license_note": "Free for individuals and businesses under $1M revenue.", "mem_gb": 9.9, "mem_provenance": "vendor", "mem_note": "9.9 GB is Stability's own published figure (excluding text encoders).", "run_pip": "pip install diffusers torch", "good_for": "Modern image quality tuned to run on consumer cards.", "stale": false, "gated": true, "downloads_30d": 126738, "provenance": "vendor", "links": { "hf": "https://huggingface.co/stabilityai/stable-diffusion-3.5-medium" }, "run": { "pip": "pip install diffusers torch" }, "last_verified": "2026-06-09" }, { "key": "sd-3.5-large", "family": "imagegen", "use_cases": [ "imagegen", "inpaint" ], "name": "Stable Diffusion 3.5 Large", "repo_id": "stabilityai/stable-diffusion-3.5-large", "params_b": 8.0, "license": "other", "license_note": "Free for individuals and businesses under $1M revenue.", "mem_gb": 24.0, "mem_provenance": "vendor", "mem_note": "About 24 GB at full quality (vendor figure); quantized builds run in roughly half that.", "run_pip": "pip install diffusers torch", "good_for": "Stability's top open image model.", "stale": false, "gated": true, "downloads_30d": 22257, "provenance": "vendor", "links": { "hf": "https://huggingface.co/stabilityai/stable-diffusion-3.5-large" }, "run": { "pip": "pip install diffusers torch" }, "last_verified": "2026-06-09" }, { "key": "flux1-schnell", "family": "imagegen", "use_cases": [ "imagegen" ], "name": "FLUX.1 Schnell", "repo_id": "black-forest-labs/FLUX.1-schnell", "params_b": 12.0, "license": "apache-2.0", "mem_gb": 16.0, "mem_provenance": "community", "mem_note": "Roughly 16 GB at 8-bit, 24 GB at full quality. Community-reported figures.", "run_pip": "pip install diffusers torch", "good_for": "Near-top image quality in few steps, and Apache-licensed.", "stale": false, "gated": true, "downloads_30d": 337454, "provenance": "community", "links": { "hf": "https://huggingface.co/black-forest-labs/FLUX.1-schnell" }, "run": { "pip": "pip install diffusers torch" }, "last_verified": "2026-06-09" }, { "key": "flux1-dev", "family": "imagegen", "use_cases": [ "imagegen", "inpaint" ], "name": "FLUX.1 Dev", "repo_id": "black-forest-labs/FLUX.1-dev", "params_b": 12.0, "license": "other", "license_note": "Non-commercial licence; gated (accept terms on Hugging Face).", "mem_gb": 16.0, "mem_provenance": "community", "mem_note": "Roughly 16 GB at 8-bit, 24 GB at full quality. Community-reported figures.", "run_pip": "pip install diffusers torch", "good_for": "State-of-the-art open image quality (for non-commercial work).", "stale": false, "gated": true, "downloads_30d": 984011, "provenance": "community", "links": { "hf": "https://huggingface.co/black-forest-labs/FLUX.1-dev" }, "run": { "pip": "pip install diffusers torch" }, "last_verified": "2026-06-09" }, { "key": "flux2-dev", "family": "imagegen", "use_cases": [ "imagegen" ], "name": "FLUX.2 Dev (32B)", "repo_id": "black-forest-labs/FLUX.2-dev", "params_b": 32.0, "license": "other", "license_note": "Non-commercial licence; gated.", "mem_gb": 90.0, "mem_provenance": "community", "mem_note": "Around 90 GB at full quality; 4-bit with offloading is reported to fit a 24 GB card, slowly.", "run_pip": "pip install diffusers torch", "good_for": "The frontier of open image generation. Honest answer: workstation hardware.", "stale": false, "gated": true, "downloads_30d": 309301, "provenance": "community", "links": { "hf": "https://huggingface.co/black-forest-labs/FLUX.2-dev" }, "run": { "pip": "pip install diffusers torch" }, "last_verified": "2026-06-09" }, { "key": "real-esrgan", "family": "imagegen", "use_cases": [ "upscale" ], "name": "Real-ESRGAN", "repo_id": "ai-forever/Real-ESRGAN", "params_b": 0.017, "license": "bsd-3-clause", "mem_gb": 2.0, "mem_provenance": "community", "run_pip": "pip install realesrgan", "good_for": "The standard for upscaling and restoring photos.", "stale": false, "gated": false, "downloads_30d": 0, "provenance": "community", "links": { "hf": "https://huggingface.co/ai-forever/Real-ESRGAN" }, "run": { "pip": "pip install realesrgan" }, "last_verified": "2026-06-09" }, { "key": "birefnet", "family": "imagegen", "use_cases": [ "bgremove" ], "name": "BiRefNet", "repo_id": "ZhengPeng7/BiRefNet", "params_b": 0.22, "license": "mit", "mem_gb": 3.0, "mem_provenance": "community", "run_pip": "pip install transformers torch", "good_for": "Crisp background removal, MIT-licensed.", "stale": false, "gated": false, "downloads_30d": 721429, "provenance": "community", "links": { "hf": "https://huggingface.co/ZhengPeng7/BiRefNet" }, "run": { "pip": "pip install transformers torch" }, "last_verified": "2026-06-09" }, { "key": "rmbg-2.0", "family": "imagegen", "use_cases": [ "bgremove" ], "name": "RMBG 2.0", "repo_id": "briaai/RMBG-2.0", "params_b": 0.22, "license": "other", "license_note": "Free for non-commercial use only.", "mem_gb": 3.0, "mem_provenance": "community", "run_pip": "pip install transformers torch", "good_for": "Very strong background removal (check the licence for products).", "stale": false, "gated": true, "downloads_30d": 620472, "provenance": "community", "links": { "hf": "https://huggingface.co/briaai/RMBG-2.0" }, "run": { "pip": "pip install transformers torch" }, "last_verified": "2026-06-09" }, { "key": "ltx-video", "family": "imagegen", "use_cases": [ "videogen" ], "name": "LTX-Video", "repo_id": "Lightricks/LTX-Video", "params_b": 2.0, "license": "other", "mem_gb": 12.0, "mem_provenance": "community", "run_pip": "pip install diffusers torch", "good_for": "Real-time-class local video generation on consumer cards.", "stale": false, "gated": false, "downloads_30d": 446216, "provenance": "community", "links": { "hf": "https://huggingface.co/Lightricks/LTX-Video" }, "run": { "pip": "pip install diffusers torch" }, "last_verified": "2026-06-09" }, { "key": "wan-2.2-ti2v-5b", "family": "imagegen", "use_cases": [ "videogen" ], "name": "Wan 2.2 TI2V 5B", "repo_id": "Wan-AI/Wan2.2-TI2V-5B", "params_b": 5.0, "license": "apache-2.0", "mem_gb": 16.0, "mem_provenance": "community", "run_pip": "pip install diffusers torch", "good_for": "Strong open text/image-to-video that fits prosumer cards.", "stale": false, "gated": false, "downloads_30d": 9456, "provenance": "community", "links": { "hf": "https://huggingface.co/Wan-AI/Wan2.2-TI2V-5B" }, "run": { "pip": "pip install diffusers torch" }, "last_verified": "2026-06-09" }, { "key": "whisper-base", "family": "audio", "use_cases": [ "stt" ], "name": "Whisper Base", "repo_id": "openai/whisper-base", "params_b": 0.07, "license": "apache-2.0", "mem_gb": 1.0, "mem_provenance": "vendor", "mem_note": "OpenAI's own published VRAM figure.", "run_pip": "pip install faster-whisper", "good_for": "Quick rough transcription on any machine.", "stale": false, "gated": false, "downloads_30d": 4308029, "provenance": "vendor", "links": { "hf": "https://huggingface.co/openai/whisper-base" }, "run": { "pip": "pip install faster-whisper" }, "last_verified": "2026-06-09" }, { "key": "whisper-small", "family": "audio", "use_cases": [ "stt" ], "name": "Whisper Small", "repo_id": "openai/whisper-small", "params_b": 0.24, "license": "apache-2.0", "mem_gb": 2.0, "mem_provenance": "vendor", "mem_note": "OpenAI's own published VRAM figure.", "run_pip": "pip install faster-whisper", "good_for": "Good accuracy on clear audio, still fast.", "stale": false, "gated": false, "downloads_30d": 2315618, "provenance": "vendor", "links": { "hf": "https://huggingface.co/openai/whisper-small" }, "run": { "pip": "pip install faster-whisper" }, "last_verified": "2026-06-09" }, { "key": "whisper-large-v3-turbo", "family": "audio", "use_cases": [ "stt" ], "name": "Whisper Large v3 Turbo", "repo_id": "openai/whisper-large-v3-turbo", "params_b": 0.81, "license": "mit", "mem_gb": 6.0, "mem_provenance": "vendor", "mem_note": "OpenAI's own published VRAM figure. faster-whisper in 8-bit roughly halves it.", "run_pip": "pip install faster-whisper", "good_for": "Near-best accuracy at several times the speed of Large.", "stale": false, "gated": false, "downloads_30d": 7948390, "provenance": "vendor", "links": { "hf": "https://huggingface.co/openai/whisper-large-v3-turbo" }, "run": { "pip": "pip install faster-whisper" }, "last_verified": "2026-06-09" }, { "key": "whisper-large-v3", "family": "audio", "use_cases": [ "stt" ], "name": "Whisper Large v3", "repo_id": "openai/whisper-large-v3", "params_b": 1.54, "license": "apache-2.0", "mem_gb": 10.0, "mem_provenance": "vendor", "mem_note": "OpenAI's own published VRAM figure. faster-whisper in 8-bit roughly halves it.", "run_pip": "pip install faster-whisper", "good_for": "The best open transcription accuracy, any language.", "stale": false, "gated": false, "downloads_30d": 5054098, "provenance": "vendor", "links": { "hf": "https://huggingface.co/openai/whisper-large-v3" }, "run": { "pip": "pip install faster-whisper" }, "last_verified": "2026-06-09" }, { "key": "kokoro-82m", "family": "audio", "use_cases": [ "tts" ], "name": "Kokoro TTS (82M)", "repo_id": "hexgrad/Kokoro-82M", "params_b": 0.082, "license": "apache-2.0", "mem_gb": 1.5, "mem_provenance": "community", "run_pip": "pip install kokoro", "good_for": "Shockingly good small voice model; runs even on CPU.", "stale": false, "gated": false, "downloads_30d": 13198222, "provenance": "community", "links": { "hf": "https://huggingface.co/hexgrad/Kokoro-82M" }, "run": { "pip": "pip install kokoro" }, "last_verified": "2026-06-09" }, { "key": "chatterbox", "family": "audio", "use_cases": [ "tts" ], "name": "Chatterbox TTS", "repo_id": "ResembleAI/chatterbox", "params_b": 0.5, "license": "mit", "mem_gb": 4.0, "mem_provenance": "community", "run_pip": "pip install chatterbox-tts", "good_for": "Production-grade voice cloning, MIT-licensed.", "stale": false, "gated": false, "downloads_30d": 1694198, "provenance": "community", "links": { "hf": "https://huggingface.co/ResembleAI/chatterbox" }, "run": { "pip": "pip install chatterbox-tts" }, "last_verified": "2026-06-09" }, { "key": "f5-tts", "family": "audio", "use_cases": [ "tts" ], "name": "F5-TTS", "repo_id": "SWivid/F5-TTS", "params_b": 0.3, "license": "cc-by-nc-4.0", "license_note": "Non-commercial licence.", "mem_gb": 8.0, "mem_provenance": "community", "run_pip": "pip install f5-tts", "good_for": "High-quality voice cloning for personal projects.", "stale": false, "gated": false, "downloads_30d": 646717, "provenance": "community", "links": { "hf": "https://huggingface.co/SWivid/F5-TTS" }, "run": { "pip": "pip install f5-tts" }, "last_verified": "2026-06-09" }, { "key": "ace-step", "family": "audio", "use_cases": [ "music" ], "name": "ACE-Step (3.5B)", "repo_id": "ACE-Step/ACE-Step-v1-3.5B", "params_b": 3.5, "license": "apache-2.0", "mem_gb": 10.0, "mem_provenance": "community", "run_pip": "pip install acestep", "good_for": "The best permissively-licensed local music generator.", "stale": false, "gated": false, "downloads_30d": 0, "provenance": "community", "links": { "hf": "https://huggingface.co/ACE-Step/ACE-Step-v1-3.5B" }, "run": { "pip": "pip install acestep" }, "last_verified": "2026-06-09" }, { "key": "musicgen-small", "family": "audio", "use_cases": [ "music" ], "name": "MusicGen Small", "repo_id": "facebook/musicgen-small", "params_b": 0.59, "license": "cc-by-nc-4.0", "license_note": "Non-commercial licence.", "mem_gb": 6.0, "mem_provenance": "community", "run_pip": "pip install audiocraft", "good_for": "Quick music sketches on modest hardware.", "stale": false, "gated": false, "downloads_30d": 186078, "provenance": "community", "links": { "hf": "https://huggingface.co/facebook/musicgen-small" }, "run": { "pip": "pip install audiocraft" }, "last_verified": "2026-06-09" }, { "key": "musicgen-medium", "family": "audio", "use_cases": [ "music" ], "name": "MusicGen Medium", "repo_id": "facebook/musicgen-medium", "params_b": 1.5, "license": "cc-by-nc-4.0", "license_note": "Non-commercial licence.", "mem_gb": 16.0, "mem_provenance": "vendor", "mem_note": "Meta's docs say a GPU with at least 16 GB for this size.", "run_pip": "pip install audiocraft", "good_for": "Meta's well-known music model (non-commercial).", "stale": false, "gated": false, "downloads_30d": 1443963, "provenance": "vendor", "links": { "hf": "https://huggingface.co/facebook/musicgen-medium" }, "run": { "pip": "pip install audiocraft" }, "last_verified": "2026-06-09" }, { "key": "all-minilm-l6-v2", "family": "embed", "use_cases": [ "embed" ], "name": "all-MiniLM-L6-v2", "repo_id": "sentence-transformers/all-MiniLM-L6-v2", "params_b": 0.02, "license": "apache-2.0", "mem_gb": 0.5, "mem_provenance": "estimated", "ollama_tag": "all-minilm", "run_pip": "pip install sentence-transformers", "good_for": "The classic tiny embedder. Search your notes on any machine.", "stale": false, "gated": false, "downloads_30d": 230826064, "provenance": "estimated", "links": { "hf": "https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2", "ollama": "https://ollama.com/library/all-minilm" }, "run": { "ollama": "ollama run all-minilm", "pip": "pip install sentence-transformers" }, "last_verified": "2026-06-09" }, { "key": "nomic-embed-text-v1.5", "family": "embed", "use_cases": [ "embed" ], "name": "Nomic Embed Text v1.5", "repo_id": "nomic-ai/nomic-embed-text-v1.5", "params_b": 0.14, "license": "apache-2.0", "mem_gb": 1.0, "mem_provenance": "estimated", "ollama_tag": "nomic-embed-text", "run_pip": "pip install sentence-transformers", "good_for": "Strong long-document search with adjustable size.", "stale": false, "gated": false, "downloads_30d": 17630308, "provenance": "estimated", "links": { "hf": "https://huggingface.co/nomic-ai/nomic-embed-text-v1.5", "ollama": "https://ollama.com/library/nomic-embed-text" }, "run": { "ollama": "ollama run nomic-embed-text", "pip": "pip install sentence-transformers" }, "last_verified": "2026-06-09" }, { "key": "embeddinggemma-300m", "family": "embed", "use_cases": [ "embed" ], "name": "EmbeddingGemma 300M", "repo_id": "google/embeddinggemma-300m", "params_b": 0.3, "license": "gemma", "mem_gb": 1.2, "mem_provenance": "estimated", "ollama_tag": "embeddinggemma", "run_pip": "pip install sentence-transformers", "good_for": "Google's on-device embedder, great multilingual search.", "stale": false, "gated": true, "downloads_30d": 1701766, "provenance": "estimated", "links": { "hf": "https://huggingface.co/google/embeddinggemma-300m", "ollama": "https://ollama.com/library/embeddinggemma" }, "run": { "ollama": "ollama run embeddinggemma", "pip": "pip install sentence-transformers" }, "last_verified": "2026-06-09" }, { "key": "bge-m3", "family": "embed", "use_cases": [ "embed" ], "name": "BGE-M3", "repo_id": "BAAI/bge-m3", "params_b": 0.57, "license": "mit", "mem_gb": 2.5, "mem_provenance": "estimated", "ollama_tag": "bge-m3", "run_pip": "pip install sentence-transformers", "good_for": "Heavyweight multilingual search quality.", "stale": false, "gated": false, "downloads_30d": 29227796, "provenance": "estimated", "links": { "hf": "https://huggingface.co/BAAI/bge-m3", "ollama": "https://ollama.com/library/bge-m3" }, "run": { "ollama": "ollama run bge-m3", "pip": "pip install sentence-transformers" }, "last_verified": "2026-06-09" }, { "key": "qwen3-embedding-0.6b", "family": "embed", "use_cases": [ "embed" ], "name": "Qwen3 Embedding 0.6B", "repo_id": "Qwen/Qwen3-Embedding-0.6B", "params_b": 0.6, "license": "apache-2.0", "mem_gb": 1.5, "mem_provenance": "estimated", "ollama_tag": "qwen3-embedding", "run_pip": "pip install sentence-transformers", "good_for": "Modern top-ranked small embedder.", "stale": false, "gated": false, "downloads_30d": 8593433, "provenance": "estimated", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-Embedding-0.6B", "ollama": "https://ollama.com/library/qwen3-embedding" }, "run": { "ollama": "ollama run qwen3-embedding", "pip": "pip install sentence-transformers" }, "last_verified": "2026-06-09" }, { "key": "qwen3-embedding-4b", "family": "embed", "use_cases": [ "embed" ], "name": "Qwen3 Embedding 4B", "repo_id": "Qwen/Qwen3-Embedding-4B", "params_b": 4.02, "license": "apache-2.0", "mem_gb": 6.0, "mem_provenance": "estimated", "run_pip": "pip install sentence-transformers", "good_for": "Best-in-class search relevance if you have the memory.", "stale": false, "gated": false, "downloads_30d": 2360699, "provenance": "estimated", "links": { "hf": "https://huggingface.co/Qwen/Qwen3-Embedding-4B" }, "run": { "pip": "pip install sentence-transformers" }, "last_verified": "2026-06-09" }, { "key": "chronos-bolt-small", "family": "data", "use_cases": [ "forecast" ], "name": "Chronos-Bolt Small", "repo_id": "amazon/chronos-bolt-small", "params_b": 0.05, "license": "apache-2.0", "mem_gb": 0.5, "mem_provenance": "estimated", "run_pip": "pip install chronos-forecasting", "good_for": "Zero-shot time-series forecasting; runs on CPU.", "stale": false, "gated": false, "downloads_30d": 1461124, "provenance": "estimated", "links": { "hf": "https://huggingface.co/amazon/chronos-bolt-small" }, "run": { "pip": "pip install chronos-forecasting" }, "last_verified": "2026-06-09" }, { "key": "chronos-bolt-base", "family": "data", "use_cases": [ "forecast" ], "name": "Chronos-Bolt Base", "repo_id": "amazon/chronos-bolt-base", "params_b": 0.21, "license": "apache-2.0", "mem_gb": 1.0, "mem_provenance": "estimated", "run_pip": "pip install chronos-forecasting", "good_for": "Stronger forecasts, still laptop-friendly.", "stale": false, "gated": false, "downloads_30d": 1253619, "provenance": "estimated", "links": { "hf": "https://huggingface.co/amazon/chronos-bolt-base" }, "run": { "pip": "pip install chronos-forecasting" }, "last_verified": "2026-06-09" }, { "key": "tabpfn-v2", "family": "data", "use_cases": [ "tabular" ], "name": "TabPFN v2", "repo_id": "Prior-Labs/TabPFN-v2-clf", "params_b": 0.011, "license": "other", "mem_gb": 2.0, "mem_provenance": "community", "run_pip": "pip install tabpfn", "good_for": "Spreadsheet predictions (classification) that beat tuned baselines on small data.", "stale": false, "gated": false, "downloads_30d": 34302, "provenance": "community", "links": { "hf": "https://huggingface.co/Prior-Labs/TabPFN-v2-clf" }, "run": { "pip": "pip install tabpfn" }, "last_verified": "2026-06-09" } ] }