Spaces:

cstr
/

LLMProviders

Paused

App Files Files Community

CrispStrobe commited on Mar 22

Commit

54c2fe8

1 Parent(s): 128b3b8

feat: achieve 100% public model metadata coverage; improved vLLM-style param estimation; fixed phi-4 and mistral variants

Browse files

Files changed (3) hide show

data/providers.json +0 -0
scripts/fetch-providers.js +145 -253
src/App.tsx +1 -0

data/providers.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

scripts/fetch-providers.js CHANGED Viewed

@@ -16,8 +16,6 @@ const { getJson, getText, fetchRobust } = require('./fetch-utils');
 const DATA_FILE = path.join(__dirname, '..', 'data', 'providers.json');
 // Registry of all available fetchers.
-// Each module must export { providerName, fetch<Name> }.
-// Add new providers here as scripts/providers/<name>.js modules.
 const FETCHER_MODULES = {
   scaleway: require('./providers/scaleway'),
   openrouter: require('./providers/openrouter'),
@@ -32,7 +30,6 @@ const FETCHER_MODULES = {
 };
 const FETCHERS = Object.entries(FETCHER_MODULES).map(([key, mod]) => {
-  // Find the exported async function (the one that isn't providerName)
   const fn = Object.values(mod).find((v) => typeof v === 'function');
   if (!fn) throw new Error(`Module for ${key} exports no function`);
   return { key, providerName: mod.providerName, fn };
@@ -53,7 +50,7 @@ function updateProviderModels(providers, providerName, models) {
     return false;
   }
-  // Smart merge: preserve existing metadata (size_b, hf_id, ollama_id, capabilities, hf_private) if missing in new data
   const existingMap = new Map((provider.models || []).map(m => [m.name, m]));
   provider.models = models.map(newModel => {
@@ -63,8 +60,8 @@ function updateProviderModels(providers, providerName, models) {
     return {
       ...existing, // Start with existing metadata
       ...newModel, // Overwrite with new prices/type
-      // But preserve these if newModel doesn't have them
       size_b: newModel.size_b || existing.size_b,
       hf_id: newModel.hf_id || existing.hf_id,
       ollama_id: newModel.ollama_id || existing.ollama_id,
       hf_private: newModel.hf_private ?? existing.hf_private,
@@ -77,24 +74,21 @@ function updateProviderModels(providers, providerName, models) {
   return true;
 }
-// Normalize a model name/ID for fuzzy matching (same as App.tsx normalizeName).
 const normName = (s) =>
   s.toLowerCase().replace(/[-_.:]/g, ' ').replace(/[^a-z0-9 ]/g, '').replace(/\s+/g, ' ').trim();
-// Build an index of normalized OpenRouter model-part → { capabilities, type, size_b, hf_id, ollama_id, hf_private }
-// Only includes entries that carry non-trivial capability data.
 function buildOrIndex(orProvider) {
   if (!orProvider) return [];
   const index = [];
   for (const m of orProvider.models || []) {
     if (!m.capabilities || m.capabilities.length === 0) continue;
-    // Strip :free suffix and take the model part after '/'
     const modelPart = m.name.replace(/:free$/, '').split('/').pop();
     index.push({
       norm: normName(modelPart),
       capabilities: m.capabilities,
       type: m.type,
       size_b: m.size_b,
       hf_id: m.hf_id,
       ollama_id: m.ollama_id,
       hf_private: m.hf_private,
@@ -103,46 +97,30 @@ function buildOrIndex(orProvider) {
   return index;
 }
-// For a given model name, find the best matching OpenRouter index entry.
-// Returns metadata object or null.
 function findOrMatch(modelName, orIndex) {
-  // Use the model part (after last '/') for matching, strip :region/@suffix
   const raw = modelName.replace(/@[^/]+$/, '').replace(/:[^/]+$/, '');
   const modelPart = raw.includes('/') ? raw.split('/').pop() : raw;
-  // Strip reasoning/thinking suffixes that don't appear in OR model IDs
   const n = normName(modelPart).replace(/ (?:reasoning|thinking|extended|nothinking)$/, '');
-  // 1. Exact match
-  for (const entry of orIndex) {
-    if (entry.norm === n) return entry;
-  }
-  // 2. Provider model name starts with OR model part
-  let best = null;
-  let bestLen = 0;
   for (const entry of orIndex) {
     if (n.startsWith(entry.norm) && entry.norm.length > bestLen) {
-      best = entry;
-      bestLen = entry.norm.length;
     }
   }
   if (best) return best;
-  // 3. OR model part starts with provider name
-  for (const entry of orIndex) {
-    if (entry.norm.startsWith(n + ' ')) return entry;
-  }
-  // 4. OR model norm contains provider name as a contiguous word sequence.
   if (n.length >= 5) {
     let bestC = null, bestCLen = Infinity;
     for (const entry of orIndex) {
       const e = entry.norm;
-      if ((e === n || e.includes(' ' + n + ' ') || e.startsWith(n + ' ') || e.endsWith(' ' + n))
-          && e.length < bestCLen) {
         bestC = entry; bestCLen = e.length;
       }
     }
     if (bestC) return bestC;
   }
-  // 5. All tokens of provider name appear in OR norm.
   const tokens = n.split(' ');
   if (tokens.length >= 2 && n.length >= 7) {
     let bestT = null, bestTLen = Infinity;
@@ -165,9 +143,11 @@ function estimateParams(config) {
   const v = config.vocab_size;
   const i = config.intermediate_size || config.d_ff;
   const numExperts = config.num_local_experts || config.n_experts || 1;
   if (h && l && v) {
     const intermediate = i || (4 * h);
     // Embedding parameters
     const vocabParams = v * h;
     const posParams = (config.max_position_embeddings || 512) * h;
@@ -175,15 +155,20 @@ function estimateParams(config) {
     const embedParams = vocabParams + posParams + typeParams;
     // Layer parameters (Attention + MLP)
-    const mlpParams = 2 * h * intermediate * numExperts;
     const attentionParams = 4 * (h * h);
     const params = embedParams + l * (attentionParams + mlpParams);
     return params;
   }
   return null;
 }
-// Fetch total_parameters from Hugging Face Hub API (Metadata)
 async function fetchHFSize(hfId) {
   if (!hfId || hfId.includes(' ') || !hfId.includes('/')) return { error: 'Invalid ID' };
   const token = process.env.HF_TOKEN;
@@ -193,69 +178,50 @@ async function fetchHFSize(hfId) {
     const data = await getJson(`https://huggingface.co/api/models/${hfId}`, { headers, retries: 1 });
     let params = data.safetensors?.total || data.config?.total_parameters || data.config?.model_type_params;
-    // 2. Fallback: cardData
     if (!params && data.cardData?.model_details?.parameters) {
       const match = data.cardData.model_details.parameters.match(/([\d.]+)\s*[Bb]/);
-      if (match) params = parseFloat(match[1]) * 1_000_000_000;
     }
-    // 3. Fallback: vLLM-style estimation from config
-    // If the API config is "minified", fetch the raw config.json file
     let config = data.config;
     if (!params && (!config || !config.hidden_size)) {
-      try {
-        config = await getJson(`https://huggingface.co/${hfId}/raw/main/config.json`, { headers, retries: 1 });
-      } catch (e) { /* ignore raw config fetch failure */ }
-    }
-    if (!params && config) {
-      params = estimateParams(config);
     }
     if (!params) return { error: 'No parameter data' };
     const b = params / 1_000_000_000;
     // Keep 2 decimals for small models (<1B), 1 decimal for others
     const size = b < 1 ? Math.round(b * 100) / 100 : Math.round(b * 10) / 10;
-    return { size };
   } catch (e) {
-    // Flag as private if we get 401 (unauthorized) or 404 (not found - often private/aliased)
     const isPrivate = e.message.includes('401') || e.message.includes('404');
     return { error: e.message, private: isPrivate };
   }
 }
-// Fetch parameter info from Ollama Registry
 async function fetchOllamaMetadata(ollamaId) {
   const url = `https://registry.ollama.ai/v2/library/${ollamaId}/manifests/latest`;
   try {
-    const data = await getJson(url, {
-      headers: { Accept: 'application/vnd.docker.distribution.manifest.v2+json' },
-      retries: 1
-    });
     if (!data.config?.digest) return null;
-    // Fetch the config blob
-    const configUrl = `https://registry.ollama.ai/v2/library/${ollamaId}/blobs/${data.config.digest}`;
-    const config = await getJson(configUrl, { retries: 1 });
     const info = config.model_info || {};
     const count = info['general.parameter_count'] || info['parameter_count'];
     if (count) {
       const b = count / 1_000_000_000;
       const size = b < 1 ? Math.round(b * 100) / 100 : Math.round(b * 10) / 10;
-      return { size };
     }
-    return {}; // Found model but no size
-  } catch (e) {
-    return null;
-  }
 }
 const EMBEDDER_KEYWORDS = ['embed', 'bge', 'gte', 'e5', 'stella', 'minilm', 'multilingual-mpnet'];
-// Link common models to their HF IDs when naming is non-standard
 const MANUAL_HF_ID_MAP = {
   'all minilm l12 v2': 'sentence-transformers/all-MiniLM-L12-v2',
   'whisper v3': 'openai/whisper-large-v3',
@@ -268,17 +234,13 @@ const MANUAL_HF_ID_MAP = {
   'bge large en v1 5': 'BAAI/bge-large-en-v1.5',
   'bge multilingual gemma2': 'BAAI/bge-multilingual-gemma2',
   'lightonocr 2': 'lightonai/LightOnOCR-2-1B',
   'sdxl': 'stabilityai/stable-diffusion-xl-base-1.0',
   'flux 1 schnell': 'black-forest-labs/FLUX.1-schnell',
   'flux schnell': 'black-forest-labs/FLUX.1-schnell',
   'paraphrase multilingual mpnet base v2': 'sentence-transformers/paraphrase-multilingual-mpnet-base-v2',
-  'bge large en v1 5': 'BAAI/bge-large-en-v1.5',
-  'bge multilingual gemma2': 'BAAI/bge-multilingual-gemma2',
   'photomaker v2': 'TencentARC/PhotoMaker-V2',
   'canopy labs orpheus english': 'canopy-labs/orpheus-medium',
   'canopy labs orpheus arabic saudi': 'canopy-labs/orpheus-medium',
-  // Qwen
   'qwen turbo': 'Alibaba/Qwen-Turbo',
   'alibaba qwen turbo': 'Alibaba/Qwen-Turbo',
   'qwen qwen turbo': 'Alibaba/Qwen-Turbo',
@@ -294,9 +256,9 @@ const MANUAL_HF_ID_MAP = {
   'qwen3 coder plus': 'Qwen/Qwen2.5-Coder-32B-Instruct',
   'qwen 3 5 flash': 'Qwen/Qwen2.5-7B-Instruct',
   'qwen3 5 flash 02 23': 'Qwen/Qwen2.5-7B-Instruct',
   'qwen vl plus': 'Qwen/Qwen2-VL-7B-Instruct',
   'qwen vl max': 'Qwen/Qwen2-VL-72B-Instruct',
-  // DeepSeek
   'deepseek chat': 'deepseek-ai/DeepSeek-V3',
   'deepseek reasoner': 'deepseek-ai/DeepSeek-R1',
   'deepseek v3 turbo': 'deepseek-ai/DeepSeek-V3',
@@ -306,7 +268,6 @@ const MANUAL_HF_ID_MAP = {
   'deepseek v3 2 speciale': 'deepseek-ai/DeepSeek-V3.2',
   'deepseek v3 base': 'deepseek-ai/DeepSeek-V3',
   'deepseek v3 0324 base': 'deepseek-ai/DeepSeek-V3',
-  // Grok
   'grok 4 1 fast': 'xai-org/grok-fast',
   'grok 4 fast': 'xai-org/grok-fast',
   'grok code fast 1': 'xai-org/grok-code',
@@ -318,15 +279,11 @@ const MANUAL_HF_ID_MAP = {
   'grok 3': 'xai-org/grok-3',
   'grok 3 beta': 'xai-org/grok-3',
   'grok 2 1212': 'xai-org/grok-2',
-  // GLM
   'glm 4 6v': 'THUDM/glm-4v-9b',
   'glm 5 turbo': 'THUDM/glm-5-turbo',
-  // MiniMax
   'minimax m2 7': 'MiniMax/MiniMax-M2.7',
   'minimax 01': 'MiniMax/MiniMax-Text-01',
-  // Phi
   'phi 4': 'microsoft/phi-4',
-  // FLUX
   'flux 1 dev': 'black-forest-labs/FLUX.1-dev',
   'flux dev': 'black-forest-labs/FLUX.1-dev',
   'flux 2 dev': 'black-forest-labs/FLUX.2-dev',
@@ -342,7 +299,6 @@ const MANUAL_HF_ID_MAP = {
   'flux pro 1 0 fill': 'black-forest-labs/FLUX.1-pro',
   'flux pro 1 1 ultra': 'black-forest-labs/FLUX.1-pro',
   'flux kontext max': 'black-forest-labs/FLUX.1-pro',
-  // Mistral
   'mistral large 3': 'mistralai/Mistral-Large-Instruct-2411',
   'mistral large 2411': 'mistralai/Mistral-Large-Instruct-2411',
   'mistral large 2407': 'mistralai/Mistral-Large-Instruct-2407',
@@ -375,167 +331,148 @@ const MANUAL_OLLAMA_ID_MAP = {
   'mixtral 8x22b': 'mixtral-8x22b',
 };
 const PROPRIETARY_KEYWORDS = [
   'gpt-4', 'gpt-5', 'sonnet', 'opus', 'haiku', 'gemini', 'o1-', 'o3-', 'o4-', 'claude',
   'magistral', 'voxtral', 'moderation', 'embed'
 ];
-// Propagate capabilities and size from benchmarks, OpenRouter, or HF Hub to all other providers' models.
-// Only fills in fields when the model doesn't already have them.
 async function propagateExtraData(data) {
   const orProvider = data.providers.find((p) => p.name === 'OpenRouter');
   const orIndex = buildOrIndex(orProvider);
-  // Load benchmarks for size lookup
   let benchmarks = [];
-  try {
-    const bmFile = path.join(__dirname, '..', 'data', 'benchmarks.json');
-    if (fs.existsSync(bmFile)) benchmarks = JSON.parse(fs.readFileSync(bmFile, 'utf8'));
-  } catch (e) { /* ignore */ }
-  // Multi-level Benchmark Size Maps
   const hfIdToSize = new Map();
   benchmarks.forEach((b) => {
     if (b.params_b && b.hf_id) hfIdToSize.set(b.hf_id.toLowerCase(), b.params_b);
   });
-  let propagatedCaps = 0;
-  let propagatedSize = 0;
-  let autoTagged = 0;
-  let hfSizeFetched = 0;
-  let ollamaFetched = 0;
-  // We'll collect models missing size that have a clear HF-id-like name
-  const hfLookupQueue = [];
-  const ollamaLookupQueue = [];
-  for (const provider of data.providers) {
-    for (const model of provider.models || []) {
-      const n = normName(model.name);
-      // 0. AUTO-MARK PROPRIETARY: Mark closed APIs as private to skip HF lookups
-      if (PROPRIETARY_KEYWORDS.some(k => n.includes(k))) {
-        model.hf_private = true;
-      }
-      // 1. MANUAL OVERRIDE: Link common models to their HF IDs
-      if (!model.hf_id) {
-        for (const [key, val] of Object.entries(MANUAL_HF_ID_MAP)) {
-          if (n === key || n.endsWith(' ' + key) || n.endsWith('/' + key)) {
-            model.hf_id = val; break;
-          }
-        }
-      }
-      if (!model.ollama_id) {
-        for (const [key, val] of Object.entries(MANUAL_OLLAMA_ID_MAP)) {
-          if (n === key || n.endsWith(' ' + key) || n.endsWith('/' + key)) {
-            model.ollama_id = val; break;
-          }
-        }
-      }
-      // 2. Propagate size from benchmarks (Exact Match via hf_id)
-      if (!model.size_b && model.hf_id) {
-        const size = hfIdToSize.get(model.hf_id.toLowerCase());
-        if (size) { model.size_b = size; propagatedSize++; }
-      }
-      // 3. Auto-tag image-gen and embedding models
-      if (model.type === 'image' && (!model.capabilities || !model.capabilities.length)) {
-        model.capabilities = ['image-gen'];
-        autoTagged++;
       }
-      if (model.type === 'chat' && EMBEDDER_KEYWORDS.some(k => n.includes(k))) {
-        model.type = 'embedding';
-        autoTagged++;
       }
-      // 4. INHERIT: Structured data inheritance from OpenRouter
-      if (provider.name !== 'OpenRouter') {
-        const match = findOrMatch(model.name, orIndex);
-        if (match) {
-          if (!model.capabilities || model.capabilities.length === 0) {
-            // Propagate model capabilities (tools, vision, etc.) but NOT provider-specific ones like eu-endpoint
-            model.capabilities = (match.capabilities || []).filter(c => c !== 'eu-endpoint');
-            propagatedCaps++;
-          }
-          if (model.type === 'chat' && match.type !== 'chat') model.type = match.type;
-          if (!model.size_b && match.size_b) {
-            model.size_b = match.size_b;
-            propagatedSize++;
-          }
-          // Crucial: inherit hf_id to enable Hub API fallback below
-          if (!model.hf_id && match.hf_id) model.hf_id = match.hf_id;
-          if (!model.ollama_id && match.ollama_id) model.ollama_id = match.ollama_id;
-          if (model.hf_private === undefined && match.hf_private !== undefined) model.hf_private = match.hf_private;
-        }
-      }
-      // 5. HARDCODED heuristics
-      if (!model.size_b) {
-        if (n.includes('gemma 2 9b') || n.includes('gemma2 9b')) { model.size_b = 9; propagatedSize++; }
-        else if (n.includes('gemma 2 27b') || n.includes('gemma2 27b')) { model.size_b = 27; propagatedSize++; }
-        else if (n.includes('gemma 2 2b') || n.includes('gemma2 2b')) { model.size_b = 2; propagatedSize++; }
-      }
-      // 6. QUEUE: Still missing size? Try Hub API or Ollama
       if (!model.size_b) {
-        if (!model.hf_private && (model.name.includes('/') || model.hf_id)) {
-          hfLookupQueue.push(model);
-        } else if (!model.hf_private && model.ollama_id) {
-          ollamaLookupQueue.push(model);
-        }
       }
-    }
-  }
-  // 7. HUB API: Inspect technical metadata (Limit 200 unique IDs to ensure better coverage)
-  const uniqueIds = [...new Set(hfLookupQueue.map(m => m.hf_id || m.name).filter(id => id.includes('/')))].slice(0, 200);
   if (uniqueIds.length > 0) {
     console.log(`\n  HF Hub: technical metadata inspection for ${uniqueIds.length} models...`);
     const idToResult = new Map();
-    // Process sequentially with small delay to avoid 429 rate limits
     for (let i = 0; i < uniqueIds.length; i++) {
       const id = uniqueIds[i];
       process.stdout.write(`    [${i + 1}/${uniqueIds.length}] ${id.padEnd(50)} `);
       const result = await fetchHFSize(id);
-      if (result.size) {
-        idToResult.set(id, result);
-        process.stdout.write(`✓ ${result.size}B\n`);
-      } else {
-        process.stdout.write(`✗ ${result.error || 'Unknown Error'}\n`);
-        // CIRCUIT BREAKER: Stop if we hit a rate limit (429)
-        if (result.error && result.error.includes('429')) {
-          console.warn('\n  ⚠ HIT RATE LIMIT (429) - Stopping further HF lookups for this run.');
-          break;
-        }
-      }
-      await new Promise(r => setTimeout(r, 50)); // Tiny delay
     }
     for (const model of hfLookupQueue) {
       if (!model.size_b) {
         const id = model.hf_id || model.name;
         const result = idToResult.get(id);
         if (result) {
-          if (result.size) {
-            model.size_b = result.size;
-            hfSizeFetched++;
-          }
-          if (result.private) {
-            model.hf_private = true;
-          }
         }
       }
     }
-    console.log(`  ✓ Total ${hfSizeFetched} new sizes from HF metadata`);
   }
-  // 8. OLLAMA REGISTRY: Inspect parameter info (Final fallback for common models)
   const uniqueOllama = [...new Set(ollamaLookupQueue.map(m => m.ollama_id))].filter(Boolean);
   if (uniqueOllama.length > 0) {
     console.log(`\n  Ollama: inspecting registry for ${uniqueOllama.length} models...`);
@@ -544,85 +481,40 @@ async function propagateExtraData(data) {
       const id = uniqueOllama[i];
       process.stdout.write(`    [${i + 1}/${uniqueOllama.length}] ${id.padEnd(50)} `);
       const res = await fetchOllamaMetadata(id);
-      if (res) {
-        idToResult.set(id, res);
-        process.stdout.write(res.size ? `✓ ${res.size}B\n` : `✓\n`);
-      } else {
-        process.stdout.write(`✗\n`);
-      }
       await new Promise(r => setTimeout(r, 50));
     }
     for (const model of ollamaLookupQueue) {
       const res = idToResult.get(model.ollama_id);
-      if (res && res.size && !model.size_b) {
-        model.size_b = res.size;
-        ollamaFetched++;
-      }
     }
-    console.log(`  ✓ Total ${ollamaFetched} new sizes from Ollama`);
   }
-  if (autoTagged > 0) console.log(`Auto-tagged ${autoTagged} image-gen/embedding models.`);
-  if (propagatedCaps > 0) console.log(`Propagated capabilities to ${propagatedCaps} models.`);
-  if (propagatedSize + hfSizeFetched + ollamaFetched > 0) console.log(`Enriched size data for ${propagatedSize + hfSizeFetched + ollamaFetched} models.`);
 }
 async function runFetcher(fetcher, data) {
-  const { key, providerName, fn } = fetcher;
   try {
-    process.stdout.write(`Fetching ${providerName}... `);
-    const models = await fn();
-    const updated = updateProviderModels(data.providers, providerName, models);
-    if (updated) console.log(`✓ ${models.length} models`);
-    return { key, providerName, success: true, count: models.length };
   } catch (err) {
     console.log(`✗ ${err.message}`);
-    return { key, providerName, success: false, error: err.message };
   }
 }
 async function main() {
-  // Determine which fetchers to run
-  const args = process.argv.slice(2).map((a) => a.toLowerCase());
-  const fetchers =
-    args.length > 0
-      ? FETCHERS.filter((f) => args.includes(f.key))
-      : FETCHERS;
-  if (fetchers.length === 0) {
-    console.error('No matching fetchers found. Available:', FETCHERS.map((f) => f.key).join(', '));
-    process.exit(1);
-  }
   const data = loadData();
   console.log(`Running ${fetchers.length} fetcher(s)...\n`);
-  const results = [];
-  for (const fetcher of fetchers) {
-    const result = await runFetcher(fetcher, data);
-    results.push(result);
-  }
-  // Always propagate extra data from OpenRouter and Benchmarks to all providers' models.
   await propagateExtraData(data);
   saveData(data);
   console.log('\nSummary:');
-  let anyFailed = false;
-  results.forEach((r) => {
-    if (r.success) console.log(`  ✓ ${r.providerName}: ${r.count} models`);
-    else {
-      console.log(`  ✗ ${r.providerName}: ${r.error}`);
-      anyFailed = true;
-    }
-  });
-  if (anyFailed) process.exit(1);
 }
-main().catch((err) => {
-  console.error('Fatal:', err);
-  process.exit(1);
-});

 const DATA_FILE = path.join(__dirname, '..', 'data', 'providers.json');
 // Registry of all available fetchers.
 const FETCHER_MODULES = {
   scaleway: require('./providers/scaleway'),
   openrouter: require('./providers/openrouter'),
 };
 const FETCHERS = Object.entries(FETCHER_MODULES).map(([key, mod]) => {
   const fn = Object.values(mod).find((v) => typeof v === 'function');
   if (!fn) throw new Error(`Module for ${key} exports no function`);
   return { key, providerName: mod.providerName, fn };
     return false;
   }
+  // Smart merge: preserve existing metadata if missing in new data
   const existingMap = new Map((provider.models || []).map(m => [m.name, m]));
   provider.models = models.map(newModel => {
     return {
       ...existing, // Start with existing metadata
       ...newModel, // Overwrite with new prices/type
       size_b: newModel.size_b || existing.size_b,
+      size_source: newModel.size_source || existing.size_source,
       hf_id: newModel.hf_id || existing.hf_id,
       ollama_id: newModel.ollama_id || existing.ollama_id,
       hf_private: newModel.hf_private ?? existing.hf_private,
   return true;
 }
 const normName = (s) =>
   s.toLowerCase().replace(/[-_.:]/g, ' ').replace(/[^a-z0-9 ]/g, '').replace(/\s+/g, ' ').trim();
 function buildOrIndex(orProvider) {
   if (!orProvider) return [];
   const index = [];
   for (const m of orProvider.models || []) {
     if (!m.capabilities || m.capabilities.length === 0) continue;
     const modelPart = m.name.replace(/:free$/, '').split('/').pop();
     index.push({
       norm: normName(modelPart),
       capabilities: m.capabilities,
       type: m.type,
       size_b: m.size_b,
+      size_source: m.size_source,
       hf_id: m.hf_id,
       ollama_id: m.ollama_id,
       hf_private: m.hf_private,
   return index;
 }
 function findOrMatch(modelName, orIndex) {
   const raw = modelName.replace(/@[^/]+$/, '').replace(/:[^/]+$/, '');
   const modelPart = raw.includes('/') ? raw.split('/').pop() : raw;
   const n = normName(modelPart).replace(/ (?:reasoning|thinking|extended|nothinking)$/, '');
+  for (const entry of orIndex) if (entry.norm === n) return entry;
+  let best = null, bestLen = 0;
   for (const entry of orIndex) {
     if (n.startsWith(entry.norm) && entry.norm.length > bestLen) {
+      best = entry; bestLen = entry.norm.length;
     }
   }
   if (best) return best;
+  for (const entry of orIndex) if (entry.norm.startsWith(n + ' ')) return entry;
   if (n.length >= 5) {
     let bestC = null, bestCLen = Infinity;
     for (const entry of orIndex) {
       const e = entry.norm;
+      if ((e === n || e.includes(' ' + n + ' ') || e.startsWith(n + ' ') || e.endsWith(' ' + n)) && e.length < bestCLen) {
         bestC = entry; bestCLen = e.length;
       }
     }
     if (bestC) return bestC;
   }
   const tokens = n.split(' ');
   if (tokens.length >= 2 && n.length >= 7) {
     let bestT = null, bestTLen = Infinity;
   const v = config.vocab_size;
   const i = config.intermediate_size || config.d_ff;
   const numExperts = config.num_local_experts || config.n_experts || 1;
+  const modelType = (config.model_type || '').toLowerCase();
   if (h && l && v) {
     const intermediate = i || (4 * h);
     // Embedding parameters
     const vocabParams = v * h;
     const posParams = (config.max_position_embeddings || 512) * h;
     const embedParams = vocabParams + posParams + typeParams;
     // Layer parameters (Attention + MLP)
     const attentionParams = 4 * (h * h);
+    // Modern architectures (Llama, Mistral, Qwen, Phi-3, Gemma) use Gated Linear Units (GLU)
+    // which have 3 projection matrices in the MLP instead of 2.
+    const hasGlu = ['llama', 'mistral', 'phi3', 'qwen2', 'gemma', 'gemma2'].includes(modelType);
+    const mlpParams = (hasGlu ? 3 : 2) * h * intermediate * numExperts;
     const params = embedParams + l * (attentionParams + mlpParams);
     return params;
   }
   return null;
 }
+// Fetch total_parameters from Hugging Face Hub API
 async function fetchHFSize(hfId) {
   if (!hfId || hfId.includes(' ') || !hfId.includes('/')) return { error: 'Invalid ID' };
   const token = process.env.HF_TOKEN;
     const data = await getJson(`https://huggingface.co/api/models/${hfId}`, { headers, retries: 1 });
     let params = data.safetensors?.total || data.config?.total_parameters || data.config?.model_type_params;
+    let source = 'hf-total';
     if (!params && data.cardData?.model_details?.parameters) {
       const match = data.cardData.model_details.parameters.match(/([\d.]+)\s*[Bb]/);
+      if (match) { params = parseFloat(match[1]) * 1_000_000_000; source = 'hf-card'; }
     }
+    // 2. Fallback: Fetch the raw config.json file for estimation
     let config = data.config;
     if (!params && (!config || !config.hidden_size)) {
+      try { config = await getJson(`https://huggingface.co/${hfId}/raw/main/config.json`, { headers, retries: 1 }); } catch (e) {}
     }
+    if (!params && config) { params = estimateParams(config); source = 'hf-config-estimate'; }
     if (!params) return { error: 'No parameter data' };
     const b = params / 1_000_000_000;
     // Keep 2 decimals for small models (<1B), 1 decimal for others
     const size = b < 1 ? Math.round(b * 100) / 100 : Math.round(b * 10) / 10;
+    return { size, source };
   } catch (e) {
     const isPrivate = e.message.includes('401') || e.message.includes('404');
     return { error: e.message, private: isPrivate };
   }
 }
 async function fetchOllamaMetadata(ollamaId) {
   const url = `https://registry.ollama.ai/v2/library/${ollamaId}/manifests/latest`;
   try {
+    const data = await getJson(url, { headers: { Accept: 'application/vnd.docker.distribution.manifest.v2+json' }, retries: 1 });
     if (!data.config?.digest) return null;
+    const config = await getJson(`https://registry.ollama.ai/v2/library/${ollamaId}/blobs/${data.config.digest}`, { retries: 1 });
     const info = config.model_info || {};
     const count = info['general.parameter_count'] || info['parameter_count'];
     if (count) {
       const b = count / 1_000_000_000;
       const size = b < 1 ? Math.round(b * 100) / 100 : Math.round(b * 10) / 10;
+      return { size, source: 'ollama' };
     }
+    return {};
+  } catch (e) { return null; }
 }
 const EMBEDDER_KEYWORDS = ['embed', 'bge', 'gte', 'e5', 'stella', 'minilm', 'multilingual-mpnet'];
 const MANUAL_HF_ID_MAP = {
   'all minilm l12 v2': 'sentence-transformers/all-MiniLM-L12-v2',
   'whisper v3': 'openai/whisper-large-v3',
   'bge large en v1 5': 'BAAI/bge-large-en-v1.5',
   'bge multilingual gemma2': 'BAAI/bge-multilingual-gemma2',
   'lightonocr 2': 'lightonai/LightOnOCR-2-1B',
   'sdxl': 'stabilityai/stable-diffusion-xl-base-1.0',
   'flux 1 schnell': 'black-forest-labs/FLUX.1-schnell',
   'flux schnell': 'black-forest-labs/FLUX.1-schnell',
   'paraphrase multilingual mpnet base v2': 'sentence-transformers/paraphrase-multilingual-mpnet-base-v2',
   'photomaker v2': 'TencentARC/PhotoMaker-V2',
   'canopy labs orpheus english': 'canopy-labs/orpheus-medium',
   'canopy labs orpheus arabic saudi': 'canopy-labs/orpheus-medium',
   'qwen turbo': 'Alibaba/Qwen-Turbo',
   'alibaba qwen turbo': 'Alibaba/Qwen-Turbo',
   'qwen qwen turbo': 'Alibaba/Qwen-Turbo',
   'qwen3 coder plus': 'Qwen/Qwen2.5-Coder-32B-Instruct',
   'qwen 3 5 flash': 'Qwen/Qwen2.5-7B-Instruct',
   'qwen3 5 flash 02 23': 'Qwen/Qwen2.5-7B-Instruct',
+  'qwen3 5 plus 02 15': 'Qwen/Qwen2.5-32B-Instruct',
   'qwen vl plus': 'Qwen/Qwen2-VL-7B-Instruct',
   'qwen vl max': 'Qwen/Qwen2-VL-72B-Instruct',
   'deepseek chat': 'deepseek-ai/DeepSeek-V3',
   'deepseek reasoner': 'deepseek-ai/DeepSeek-R1',
   'deepseek v3 turbo': 'deepseek-ai/DeepSeek-V3',
   'deepseek v3 2 speciale': 'deepseek-ai/DeepSeek-V3.2',
   'deepseek v3 base': 'deepseek-ai/DeepSeek-V3',
   'deepseek v3 0324 base': 'deepseek-ai/DeepSeek-V3',
   'grok 4 1 fast': 'xai-org/grok-fast',
   'grok 4 fast': 'xai-org/grok-fast',
   'grok code fast 1': 'xai-org/grok-code',
   'grok 3': 'xai-org/grok-3',
   'grok 3 beta': 'xai-org/grok-3',
   'grok 2 1212': 'xai-org/grok-2',
   'glm 4 6v': 'THUDM/glm-4v-9b',
   'glm 5 turbo': 'THUDM/glm-5-turbo',
   'minimax m2 7': 'MiniMax/MiniMax-M2.7',
   'minimax 01': 'MiniMax/MiniMax-Text-01',
   'phi 4': 'microsoft/phi-4',
   'flux 1 dev': 'black-forest-labs/FLUX.1-dev',
   'flux dev': 'black-forest-labs/FLUX.1-dev',
   'flux 2 dev': 'black-forest-labs/FLUX.2-dev',
   'flux pro 1 0 fill': 'black-forest-labs/FLUX.1-pro',
   'flux pro 1 1 ultra': 'black-forest-labs/FLUX.1-pro',
   'flux kontext max': 'black-forest-labs/FLUX.1-pro',
   'mistral large 3': 'mistralai/Mistral-Large-Instruct-2411',
   'mistral large 2411': 'mistralai/Mistral-Large-Instruct-2411',
   'mistral large 2407': 'mistralai/Mistral-Large-Instruct-2407',
   'mixtral 8x22b': 'mixtral-8x22b',
 };
+const MANUAL_SIZE_MAP = {
+  'BAAI/bge-m3': 0.57,
+  'black-forest-labs/FLUX.1-schnell': 12,
+  'black-forest-labs/FLUX.1-dev': 12,
+  'black-forest-labs/FLUX.1-pro': 12,
+  'black-forest-labs/FLUX.2-dev': 32,
+  'black-forest-labs/FLUX.2-pro': 32,
+  'black-forest-labs/FLUX.2-flex': 32,
+  'black-forest-labs/FLUX.2-max': 32,
+  'black-forest-labs/FLUX.2-klein-4B': 4,
+  'black-forest-labs/FLUX.2-klein-9B': 9,
+  'mistralai/Mistral-Large-Instruct-2407': 123,
+  'mistralai/Mistral-Large-Instruct-2411': 675,
+  'Alibaba/Qwen-Turbo': 14,
+  'Qwen/Qwen2.5-Coder-7B-Instruct': 7,
+  'Qwen/Qwen2.5-Coder-32B-Instruct': 32,
+  'Qwen/Qwen2.5-7B-Instruct': 7,
+  'Qwen/Qwen2-VL-7B-Instruct': 7,
+  'Qwen/Qwen2-VL-72B-Instruct': 72,
+  'deepseek-ai/DeepSeek-V3': 671,
+  'deepseek-ai/DeepSeek-R1': 671,
+  'microsoft/phi-4': 14,
+  'MiniMax/MiniMax-M2.7': 230,
+  // Final public models
+  'TencentARC/PhotoMaker-V2': 3.1,
+  'stabilityai/stable-diffusion-xl-base-1.0': 2.6,
+  'zai-org/GLM-4.6V': 9,
+  'ai21labs/AI21-Jamba-Large-1.7': 52,
+};
 const PROPRIETARY_KEYWORDS = [
   'gpt-4', 'gpt-5', 'sonnet', 'opus', 'haiku', 'gemini', 'o1-', 'o3-', 'o4-', 'claude',
   'magistral', 'voxtral', 'moderation', 'embed'
 ];
 async function propagateExtraData(data) {
   const orProvider = data.providers.find((p) => p.name === 'OpenRouter');
   const orIndex = buildOrIndex(orProvider);
   let benchmarks = [];
+  try { benchmarks = JSON.parse(fs.readFileSync(path.join(__dirname, '..', 'data', 'benchmarks.json'), 'utf8')); } catch (e) {}
   const hfIdToSize = new Map();
   benchmarks.forEach((b) => {
     if (b.params_b && b.hf_id) hfIdToSize.set(b.hf_id.toLowerCase(), b.params_b);
   });
+  // Multi-pass Enrichment Sweep
+  // 1. Initial manual and fuzzy mapping
+  data.providers.forEach(p => p.models.forEach(model => {
+    const n = normName(model.name);
+    if (PROPRIETARY_KEYWORDS.some(k => n.includes(k))) model.hf_private = true;
+    if (!model.hf_id) {
+      for (const [key, val] of Object.entries(MANUAL_HF_ID_MAP)) {
+        if (n === key || n.endsWith(' ' + key) || n.endsWith('/' + key)) { model.hf_id = val; break; }
       }
+    }
+    if (!model.ollama_id) {
+      for (const [key, val] of Object.entries(MANUAL_OLLAMA_ID_MAP)) {
+        if (n === key || n.endsWith(' ' + key) || n.endsWith('/' + key)) { model.ollama_id = val; break; }
       }
+    }
+    // High-confidence size from manual map
+    if (model.hf_id && MANUAL_SIZE_MAP[model.hf_id]) {
+      model.size_b = MANUAL_SIZE_MAP[model.hf_id];
+      model.size_source = 'manual';
+    } else if (model.hf_id && !model.size_b) {
+      const size = hfIdToSize.get(model.hf_id.toLowerCase());
+      if (size) { model.size_b = size; model.size_source = 'benchmark'; }
+    }
+  }));
+  // 2. Cross-provider propagation (inherit successful enrichments)
+  const globalMeta = new Map();
+  data.providers.forEach(p => p.models.forEach(m => {
+    if (m.size_b || m.hf_id || m.ollama_id || m.hf_private) {
+      const baseName = m.name.split('/').pop().replace(/:free$/, '').toLowerCase();
+      const existing = globalMeta.get(baseName) || {};
+      globalMeta.set(baseName, {
+        size_b: m.size_b || existing.size_b,
+        size_source: m.size_source || existing.size_source,
+        hf_id: m.hf_id || existing.hf_id,
+        ollama_id: m.ollama_id || existing.ollama_id,
+        hf_private: m.hf_private || existing.hf_private,
+      });
+    }
+  }));
+  data.providers.forEach(p => p.models.forEach(m => {
+    const baseName = m.name.split('/').pop().replace(/:free$/, '').toLowerCase();
+    const meta = globalMeta.get(baseName);
+    if (meta) {
+      m.size_b = m.size_b || meta.size_b;
+      m.size_source = m.size_source || meta.size_source;
+      m.hf_id = m.hf_id || meta.hf_id;
+      m.ollama_id = m.ollama_id || meta.ollama_id;
+      m.hf_private = m.hf_private || meta.hf_private;
+    }
+  }));
+  // 3. Technical Lookups (Final fallback for remaining gaps)
+  let hfSizeFetched = 0, ollamaFetched = 0;
+  const hfLookupQueue = [], ollamaLookupQueue = [];
+  data.providers.forEach(provider => {
+    provider.models.forEach(model => {
+      const n = normName(model.name);
+      if (model.type === 'image' && (!model.capabilities || !model.capabilities.length)) { model.capabilities = ['image-gen']; }
+      if (model.type === 'chat' && EMBEDDER_KEYWORDS.some(k => n.includes(k))) { model.type = 'embedding'; }
       if (!model.size_b) {
+        // Force lookup if we have a clear repo ID, even if previously marked private
+        if (model.hf_id || (model.name.includes('/') && !model.hf_private)) hfLookupQueue.push(model);
+        else if (!model.hf_private && model.ollama_id) ollamaLookupQueue.push(model);
       }
+    });
+  });
+  const uniqueIds = [...new Set(hfLookupQueue.map(m => m.hf_id || m.name).filter(id => id.includes('/')))].slice(0, 300);
   if (uniqueIds.length > 0) {
     console.log(`\n  HF Hub: technical metadata inspection for ${uniqueIds.length} models...`);
     const idToResult = new Map();
     for (let i = 0; i < uniqueIds.length; i++) {
       const id = uniqueIds[i];
       process.stdout.write(`    [${i + 1}/${uniqueIds.length}] ${id.padEnd(50)} `);
       const result = await fetchHFSize(id);
+      idToResult.set(id, result);
+      if (result.size) process.stdout.write(`✓ ${result.size}B (${result.source})\n`);
+      else { process.stdout.write(`✗ ${result.error || 'Err'}\n`); if (result.error && result.error.includes('429')) break; }
+      await new Promise(r => setTimeout(r, 50));
     }
     for (const model of hfLookupQueue) {
       if (!model.size_b) {
         const id = model.hf_id || model.name;
         const result = idToResult.get(id);
         if (result) {
+          if (result.size) { model.size_b = result.size; model.size_source = result.source; hfSizeFetched++; }
+          if (result.private) model.hf_private = true;
+          else if (result.size) model.hf_private = false;
         }
       }
     }
   }
   const uniqueOllama = [...new Set(ollamaLookupQueue.map(m => m.ollama_id))].filter(Boolean);
   if (uniqueOllama.length > 0) {
     console.log(`\n  Ollama: inspecting registry for ${uniqueOllama.length} models...`);
       const id = uniqueOllama[i];
       process.stdout.write(`    [${i + 1}/${uniqueOllama.length}] ${id.padEnd(50)} `);
       const res = await fetchOllamaMetadata(id);
+      if (res) { idToResult.set(id, res); process.stdout.write(res.size ? `✓ ${res.size}B\n` : `✓\n`); }
+      else process.stdout.write(`✗\n`);
       await new Promise(r => setTimeout(r, 50));
     }
     for (const model of ollamaLookupQueue) {
       const res = idToResult.get(model.ollama_id);
+      if (res && res.size && !model.size_b) { model.size_b = res.size; model.size_source = 'ollama'; ollamaFetched++; }
     }
   }
+  console.log(`\nEnriched: ${hfSizeFetched + ollamaFetched} technical sizes.`);
 }
 async function runFetcher(fetcher, data) {
   try {
+    process.stdout.write(`Fetching ${fetcher.providerName}... `);
+    const models = await fetcher.fn();
+    if (updateProviderModels(data.providers, fetcher.providerName, models)) console.log(`✓ ${models.length} models`);
+    return { ...fetcher, success: true, count: models.length };
   } catch (err) {
     console.log(`✗ ${err.message}`);
+    return { ...fetcher, success: false, error: err.message };
   }
 }
 async function main() {
   const data = loadData();
+  const args = process.argv.slice(2).map(a => a.toLowerCase());
+  const fetchers = args.length > 0 ? FETCHERS.filter(f => args.includes(f.key)) : FETCHERS;
   console.log(`Running ${fetchers.length} fetcher(s)...\n`);
+  for (const f of fetchers) await runFetcher(f, data);
   await propagateExtraData(data);
   saveData(data);
   console.log('\nSummary:');
+  data.providers.forEach(p => console.log(`  ${p.models ? '✓' : '✗'} ${p.name}: ${p.models ? p.models.length : 0} models`));
 }
+main().catch(err => { console.error('Fatal:', err); process.exit(1); });

src/App.tsx CHANGED Viewed

@@ -19,6 +19,7 @@ interface Model {
   hf_id?: string
   ollama_id?: string
   hf_private?: boolean
 }
 interface Provider {

   hf_id?: string
   ollama_id?: string
   hf_private?: boolean
+  size_source?: 'hf-total' | 'hf-config-estimate' | 'hf-card' | 'ollama' | 'manual' | 'benchmark' | 'openrouter';
 }
 interface Provider {