Spaces:

cstr
/

LLMProviders

Paused

App Files Community

CrispStrobe committed on Mar 22

Commit

c5e4684

1 Parent(s): e2e9c3d

feat: resolve MiniMax-M1 (366B), Mistral Small variants, and Qwen Plus via deep config.json parsing and global technical sync

Browse files

Files changed (2) hide show

data/providers.json +0 -0
scripts/fetch-providers.js +97 -302

data/providers.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

scripts/fetch-providers.js CHANGED Viewed

@@ -2,11 +2,6 @@
 /**
  * Fetch live pricing data from all supported providers and update data/providers.json.
- *
- * Usage:
- *   node scripts/fetch-providers.js             # fetch all providers
- *   node scripts/fetch-providers.js scaleway    # fetch only Scaleway
- *   node scripts/fetch-providers.js openrouter  # fetch only OpenRouter
  */
 const fs = require('fs');
@@ -45,12 +40,8 @@ function saveData(data) {
 function updateProviderModels(providers, providerName, models) {
   const provider = providers.find((p) => p.name === providerName);
-  if (!provider) {
-    console.warn(`  ⚠  Provider "${providerName}" not found in providers.json – skipping.`);
-    return false;
-  }
-  // Smart merge: preserve existing metadata if missing in new data
   const existingMap = new Map((provider.models || []).map(m => [m.name, m]));
   provider.models = models.map(newModel => {
@@ -58,8 +49,8 @@ function updateProviderModels(providers, providerName, models) {
     if (!existing) return newModel;
     return {
-      ...existing, // Start with existing metadata
-      ...newModel, // Overwrite with new prices/type
       size_b: newModel.size_b || existing.size_b,
       size_source: newModel.size_source || existing.size_source,
       hf_id: newModel.hf_id || existing.hf_id,
@@ -77,94 +68,32 @@ function updateProviderModels(providers, providerName, models) {
 const normName = (s) =>
   s.toLowerCase().replace(/[-_.:]/g, ' ').replace(/[^a-z0-9 ]/g, '').replace(/\s+/g, ' ').trim();
-function buildOrIndex(orProvider) {
-  if (!orProvider) return [];
-  const index = [];
-  for (const m of orProvider.models || []) {
-    if (!m.capabilities || m.capabilities.length === 0) continue;
-    const modelPart = m.name.replace(/:free$/, '').split('/').pop();
-    index.push({
-      norm: normName(modelPart),
-      capabilities: m.capabilities,
-      type: m.type,
-      size_b: m.size_b,
-      size_source: m.size_source,
-      hf_id: m.hf_id,
-      ollama_id: m.ollama_id,
-      hf_private: m.hf_private,
-    });
-  }
-  return index;
-}
-function findOrMatch(modelName, orIndex) {
-  const raw = modelName.replace(/@[^/]+$/, '').replace(/:[^/]+$/, '');
-  const modelPart = raw.includes('/') ? raw.split('/').pop() : raw;
-  const n = normName(modelPart).replace(/ (?:reasoning|thinking|extended|nothinking)$/, '');
-  for (const entry of orIndex) if (entry.norm === n) return entry;
-  let best = null, bestLen = 0;
-  for (const entry of orIndex) {
-    if (n.startsWith(entry.norm) && entry.norm.length > bestLen) {
-      best = entry; bestLen = entry.norm.length;
-    }
-  }
-  if (best) return best;
-  for (const entry of orIndex) if (entry.norm.startsWith(n + ' ')) return entry;
-  if (n.length >= 5) {
-    let bestC = null, bestCLen = Infinity;
-    for (const entry of orIndex) {
-      const e = entry.norm;
-      if ((e === n || e.includes(' ' + n + ' ') || e.startsWith(n + ' ') || e.endsWith(' ' + n)) && e.length < bestCLen) {
-        bestC = entry; bestCLen = e.length;
-      }
-    }
-    if (bestC) return bestC;
-  }
-  const tokens = n.split(' ');
-  if (tokens.length >= 2 && n.length >= 7) {
-    let bestT = null, bestTLen = Infinity;
-    for (const entry of orIndex) {
-      const eTokens = entry.norm.split(' ');
-      if (tokens.every((t) => eTokens.includes(t)) && entry.norm.length < bestTLen) {
-        bestT = entry; bestTLen = entry.norm.length;
-      }
-    }
-    if (bestT) return bestT;
-  }
-  return null;
-}
 // Estimate parameters from config.json (vLLM style fallback)
-function estimateParams(config) {
   if (!config) return null;
   const h = config.hidden_size || config.d_model || config.n_embd;
   const l = config.num_hidden_layers || config.n_layer;
   const v = config.vocab_size;
   const i = config.intermediate_size || config.d_ff;
-  // MoE support
   const numExperts = config.num_local_experts || config.n_experts || config.num_experts || 1;
   const modelType = (config.model_type || '').toLowerCase();
   if (h && l && v) {
     const intermediate = i || (4 * h);
-    // Embedding parameters
     const vocabParams = v * h;
     const posParams = (config.max_position_embeddings || 512) * h;
     const typeParams = (config.type_vocab_size || 0) * h;
     const embedParams = vocabParams + posParams + typeParams;
-    // Layer parameters (Attention + MLP)
     const attentionParams = 4 * (h * h);
-    // Modern architectures (Llama, Mistral, Qwen, Phi-3, Gemma, MiniMax) use Gated Linear Units (GLU)
-    const hasGlu = ['llama', 'mistral', 'phi3', 'qwen2', 'gemma', 'gemma2', 'minimax'].includes(modelType);
-    const mlpParams = (hasGlu ? 3 : 2) * h * intermediate * numExperts;
-    const params = embedParams + l * (attentionParams + mlpParams);
-    return params;
   }
   return null;
 }
@@ -175,18 +104,15 @@ async function fetchHFSize(hfId) {
   const token = process.env.HF_TOKEN;
   const headers = token ? { Authorization: `Bearer ${token}` } : {};
   let isPrivate = false;
   try {
-    let params = null;
-    let source = 'hf-total';
-    let data = {};
-    // 1. Get top-level metadata
     try {
       data = await getJson(`https://huggingface.co/api/models/${hfId}`, { headers, retries: 1 });
       params = data.safetensors?.total || data.config?.total_parameters || data.config?.model_type_params;
-      // Fallback: cardData
       if (!params && data.cardData?.model_details?.parameters) {
         const match = data.cardData.model_details.parameters.match(/([\d.]+)\s*[Bb]/);
         if (match) { params = parseFloat(match[1]) * 1_000_000_000; source = 'hf-card'; }
@@ -195,14 +121,14 @@ async function fetchHFSize(hfId) {
       if (e.message.includes('401') || e.message.includes('404')) isPrivate = true;
     }
-    // 2. Fallback: Fetch the raw config.json file for estimation
     if (!params && !isPrivate) {
-      try {
-        const config = await getJson(`https://huggingface.co/${hfId}/raw/main/config.json`, { headers, retries: 1 });
-        params = config.total_parameters || estimateParams(config);
-        source = config.total_parameters ? 'hf-total' : 'hf-config-estimate';
       } catch (e) {
-        if (e.message.includes('401') || e.message.includes('404')) isPrivate = true;
       }
     }
@@ -210,12 +136,9 @@ async function fetchHFSize(hfId) {
     if (!params) return { error: 'No parameter data found' };
     const b = params / 1_000_000_000;
-    // Keep 2 decimals for small models (<1B), 1 decimal for others
     const size = b < 1 ? Math.round(b * 100) / 100 : Math.round(b * 10) / 10;
     return { size, source };
-  } catch (e) {
-    return { error: e.message };
-  }
 }
 async function fetchOllamaMetadata(ollamaId) {
@@ -237,116 +160,40 @@ async function fetchOllamaMetadata(ollamaId) {
 const EMBEDDER_KEYWORDS = ['embed', 'bge', 'gte', 'e5', 'stella', 'minilm', 'multilingual-mpnet'];
-// Manual mappings for models with non-standard naming.
 const MANUAL_HF_ID_MAP = {
-  'all minilm l12 v2': 'sentence-transformers/all-MiniLM-L12-v2',
-  'whisper v3': 'openai/whisper-large-v3',
-  'whisper large v3': 'openai/whisper-large-v3',
-  'whisper v3 large': 'openai/whisper-large-v3',
-  'whisper large v3 turbo': 'openai/whisper-large-v3-turbo',
-  'step 3 5 flash': 'stepfun-ai/Step-3.5-Flash',
-  'bge m3': 'BAAI/bge-m3',
-  'bge en icl': 'BAAI/bge-en-icl',
-  'lightonocr 2': 'lightonai/LightOnOCR-2-1B',
-  'sdxl': 'stabilityai/stable-diffusion-xl-base-1.0',
-  'flux 1 schnell': 'black-forest-labs/FLUX.1-schnell',
-  'flux schnell': 'black-forest-labs/FLUX.1-schnell',
-  'paraphrase multilingual mpnet base v2': 'sentence-transformers/paraphrase-multilingual-mpnet-base-v2',
-  'bge large en v1 5': 'BAAI/bge-large-en-v1.5',
-  'bge multilingual gemma2': 'BAAI/bge-multilingual-gemma2',
-  'photomaker v2': 'TencentARC/PhotoMaker-V2',
-  'canopy labs orpheus english': 'canopy-labs/orpheus-medium',
-  'canopy labs orpheus arabic saudi': 'canopy-labs/orpheus-medium',
-  'qwen turbo': 'Alibaba/Qwen-Turbo',
-  'alibaba qwen turbo': 'Alibaba/Qwen-Turbo',
-  'qwen qwen turbo': 'Alibaba/Qwen-Turbo',
-  'qwen plus': 'Alibaba/Qwen-Plus',
-  'alibaba qwen plus': 'Alibaba/Qwen-Plus',
-  'qwen qwen plus': 'Alibaba/Qwen-Plus',
-  'qwen max': 'Alibaba/Qwen-Max',
-  'alibaba qwen max': 'Alibaba/Qwen-Max',
-  'qwen qwen max': 'Alibaba/Qwen-Max',
-  'qwen 3 coder flash': 'Qwen/Qwen2.5-Coder-7B-Instruct',
-  'qwen3 coder flash': 'Qwen/Qwen2.5-Coder-7B-Instruct',
-  'qwen 3 coder plus': 'Qwen/Qwen2.5-Coder-32B-Instruct',
-  'qwen3 coder plus': 'Qwen/Qwen2.5-Coder-32B-Instruct',
-  'qwen 3 5 flash': 'Qwen/Qwen2.5-7B-Instruct',
-  'qwen3 5 flash 02 23': 'Qwen/Qwen2.5-7B-Instruct',
-  'qwen3 5 plus 02 15': 'Qwen/Qwen2.5-32B-Instruct',
-  'qwen vl plus': 'Qwen/Qwen2-VL-7B-Instruct',
-  'qwen vl max': 'Qwen/Qwen2-VL-72B-Instruct',
-  'deepseek chat': 'deepseek-ai/DeepSeek-V3',
-  'deepseek reasoner': 'deepseek-ai/DeepSeek-R1',
-  'deepseek v3 turbo': 'deepseek-ai/DeepSeek-V3',
-  'deepseek v3 0324 fast': 'deepseek-ai/DeepSeek-V3',
-  'deepseek r1t2 chimera': 'deepseek-ai/DeepSeek-R1',
-  'deepseek v3 2 exp': 'deepseek-ai/DeepSeek-V3.2',
-  'deepseek v3 2 speciale': 'deepseek-ai/DeepSeek-V3.2',
-  'deepseek v3 base': 'deepseek-ai/DeepSeek-V3',
-  'deepseek v3 0324 base': 'deepseek-ai/DeepSeek-V3',
-  'grok 4 1 fast': 'xai-org/grok-fast',
-  'grok 4 fast': 'xai-org/grok-fast',
-  'grok code fast 1': 'xai-org/grok-code',
-  'grok 3 mini': 'xai-org/grok-mini',
-  'grok 3 mini beta': 'xai-org/grok-mini',
-  'grok 4 20 multi agent beta': 'xai-org/grok-4',
-  'grok 4 20 beta': 'xai-org/grok-4',
-  'grok 4': 'xai-org/grok-4',
-  'grok 3': 'xai-org/grok-3',
-  'grok 3 beta': 'xai-org/grok-3',
-  'grok 2 1212': 'xai-org/grok-2',
-  'glm 4 6v': 'THUDM/glm-4v-9b',
-  'glm 5 turbo': 'THUDM/glm-5-turbo',
-  'minimax m2 7': 'MiniMaxAI/MiniMax-M2.7',
-  'minimax m2 7 highspeed': 'MiniMaxAI/MiniMax-M2.7',
-  'minimax 01': 'MiniMaxAI/MiniMax-Text-01',
-  'minimax m2 her': 'MiniMaxAI/MiniMax-M2.7',
   'phi 4': 'microsoft/phi-4',
-  'flux 1 dev': 'black-forest-labs/FLUX.1-dev',
-  'flux dev': 'black-forest-labs/FLUX.1-dev',
-  'flux 2 dev': 'black-forest-labs/FLUX.2-dev',
-  'flux 2 klein 4b': 'black-forest-labs/FLUX.2-klein-4B',
-  'flux 2 klein 9b': 'black-forest-labs/FLUX.2-klein-9B',
-  'flux 2 pro': 'black-forest-labs/FLUX.2-pro',
-  'flux 1 pro': 'black-forest-labs/FLUX.1-pro',
-  'flux 2 flex': 'black-forest-labs/FLUX.2-flex',
-  'flux 2 max': 'black-forest-labs/FLUX.2-max',
-  'flux kontext pro': 'black-forest-labs/FLUX.1-pro',
-  'flux pro 1 1': 'black-forest-labs/FLUX.1-pro',
-  'flux pro': 'black-forest-labs/FLUX.1-pro',
-  'flux pro 1 0 fill': 'black-forest-labs/FLUX.1-pro',
-  'flux pro 1 1 ultra': 'black-forest-labs/FLUX.1-pro',
-  'flux kontext max': 'black-forest-labs/FLUX.1-pro',
-  'mistral large 3': 'mistralai/Mistral-Large-Instruct-2411',
-  'mistral large 2411': 'mistralai/Mistral-Large-Instruct-2411',
-  'mistral large 2407': 'mistralai/Mistral-Large-Instruct-2407',
-  'mistral small 4': 'mistralai/Mistral-Small-Instruct-2409',
-  'mistral medium 3': 'mistralai/Mistral-Medium-Instruct-2407',
-  'codestral latest': 'mistralai/Codestral-22B-v0.1',
-  'devstral 2': 'mistralai/Mistral-7B-v0.1',
 };
 const MANUAL_OLLAMA_ID_MAP = {
   'phi 4': 'phi4',
   'deepseek chat': 'deepseek-v3',
   'deepseek reasoner': 'deepseek-r1',
-  'codestral': 'codestral',
   'mistral small 24b': 'mistral-small',
-  'llama 3 1 8b': 'llama3.1:8b',
-  'llama 3 3 70b': 'llama3.3',
-  'gemma 2 9b': 'gemma2:9b',
-  'gemma 2 27b': 'gemma2:27b',
-  'qwen 2 5 coder 7b': 'qwen2.5-coder:7b',
-  'qwen 2 5 coder 32b': 'qwen2.5-coder:32b',
-  'mistral large 2411': 'mistral-large',
-  'mistral large 3': 'mistral-large',
-  'phi 3 5 mini': 'phi3.5',
-  'phi 3 5 vision': 'phi3.5-vision',
-  'qwen 2 5 7b': 'qwen2.5:7b',
-  'qwen 2 5 72b': 'qwen2.5:72b',
-  'mistral nemo': 'mistral-nemo',
-  'mixtral 8x7b': 'mixtral',
-  'mixtral 8x22b': 'mixtral-8x22b',
 };
 const PROPRIETARY_KEYWORDS = [
@@ -355,151 +202,99 @@ const PROPRIETARY_KEYWORDS = [
 ];
 async function propagateExtraData(data) {
-  const orProvider = data.providers.find((p) => p.name === 'OpenRouter');
-  const orIndex = buildOrIndex(orProvider);
   let benchmarks = [];
   try { benchmarks = JSON.parse(fs.readFileSync(path.join(__dirname, '..', 'data', 'benchmarks.json'), 'utf8')); } catch (e) {}
   const hfIdToSize = new Map();
-  benchmarks.forEach((b) => {
-    if (b.params_b && b.hf_id) hfIdToSize.set(b.hf_id.toLowerCase(), b.params_b);
-  });
-  // Multi-pass Enrichment Sweep
   // 1. Initial manual and fuzzy mapping
   data.providers.forEach(p => p.models.forEach(model => {
     const n = normName(model.name);
-    if (PROPRIETARY_KEYWORDS.some(k => n.includes(k))) model.hf_private = true;
-    if (!model.hf_id) {
-      for (const [key, val] of Object.entries(MANUAL_HF_ID_MAP)) {
-        if (n === key || n.endsWith(' ' + key) || n.endsWith('/' + key)) { model.hf_id = val; break; }
       }
     }
-    if (!model.ollama_id) {
-      for (const [key, val] of Object.entries(MANUAL_OLLAMA_ID_MAP)) {
-        if (n === key || n.endsWith(' ' + key) || n.endsWith('/' + key)) { model.ollama_id = val; break; }
-      }
     }
-    if (model.hf_id && !model.size_b) {
       const size = hfIdToSize.get(model.hf_id.toLowerCase());
       if (size) { model.size_b = size; model.size_source = 'benchmark'; }
     }
   }));
-  // 2. Cross-provider propagation (inherit successful enrichments)
-  const globalMeta = new Map();
   data.providers.forEach(p => p.models.forEach(m => {
-    if (m.size_b || m.hf_id || m.ollama_id || m.hf_private) {
-      const baseName = m.name.split('/').pop().replace(/:free$/, '').toLowerCase();
-      const existing = globalMeta.get(baseName) || {};
-      globalMeta.set(baseName, {
-        size_b: m.size_b || existing.size_b,
-        size_source: m.size_source || existing.size_source,
-        hf_id: m.hf_id || existing.hf_id,
-        ollama_id: m.ollama_id || existing.ollama_id,
-        hf_private: m.hf_private || existing.hf_private,
-      });
-    }
   }));
-  data.providers.forEach(p => p.models.forEach(m => {
-    const baseName = m.name.split('/').pop().replace(/:free$/, '').toLowerCase();
-    const meta = globalMeta.get(baseName);
-    if (meta) {
-      m.size_b = m.size_b || meta.size_b;
-      m.size_source = m.size_source || meta.size_source;
-      m.hf_id = m.hf_id || meta.hf_id;
-      m.ollama_id = m.ollama_id || meta.ollama_id;
-      m.hf_private = m.hf_private || meta.hf_private;
-    }
-  }));
-  // 3. Technical Lookups (Final fallback for remaining gaps)
-  let hfSizeFetched = 0, ollamaFetched = 0;
-  const hfLookupQueue = [], ollamaLookupQueue = [];
-  data.providers.forEach(provider => {
-    provider.models.forEach(model => {
-      const n = normName(model.name);
-      if (model.type === 'image' && (!model.capabilities || !model.capabilities.length)) { model.capabilities = ['image-gen']; }
-      if (model.type === 'chat' && EMBEDDER_KEYWORDS.some(k => n.includes(k))) { model.type = 'embedding'; }
-      if (!model.size_b) {
-        // Force lookup if we have a clear repo ID, even if previously marked private
-        if (model.hf_id || (model.name.includes('/') && !model.hf_private)) hfLookupQueue.push(model);
-        else if (!model.hf_private && model.ollama_id) ollamaLookupQueue.push(model);
-      }
-    });
-  });
-  const uniqueIds = [...new Set(hfLookupQueue.map(m => m.hf_id || m.name).filter(id => id.includes('/')))].slice(0, 300);
   if (uniqueIds.length > 0) {
     console.log(`\n  HF Hub: technical metadata inspection for ${uniqueIds.length} models...`);
     const idToResult = new Map();
-    for (let i = 0; i < uniqueIds.length; i++) {
-      const id = uniqueIds[i];
-      process.stdout.write(`    [${i + 1}/${uniqueIds.length}] ${id.padEnd(50)} `);
       const result = await fetchHFSize(id);
       idToResult.set(id, result);
       if (result.size) process.stdout.write(`✓ ${result.size}B (${result.source})\n`);
-      else { process.stdout.write(`✗ ${result.error || 'Err'}\n`); if (result.error && result.error.includes('429')) break; }
       await new Promise(r => setTimeout(r, 50));
     }
     for (const model of hfLookupQueue) {
       if (!model.size_b) {
-        const id = model.hf_id || model.name;
         const result = idToResult.get(id);
-        if (result) {
-          if (result.size) { model.size_b = result.size; model.size_source = result.source; hfSizeFetched++; }
-          if (result.private) model.hf_private = true;
-          else if (result.size) model.hf_private = false;
         }
       }
     }
   }
-  const uniqueOllama = [...new Set(ollamaLookupQueue.map(m => m.ollama_id))].filter(Boolean);
-  if (uniqueOllama.length > 0) {
-    console.log(`\n  Ollama: inspecting registry for ${uniqueOllama.length} models...`);
-    const idToResult = new Map();
-    for (let i = 0; i < uniqueOllama.length; i++) {
-      const id = uniqueOllama[i];
-      process.stdout.write(`    [${i + 1}/${uniqueOllama.length}] ${id.padEnd(50)} `);
-      const res = await fetchOllamaMetadata(id);
-      if (res) { idToResult.set(id, res); process.stdout.write(res.size ? `✓ ${res.size}B\n` : `✓\n`); }
-      else process.stdout.write(`✗\n`);
-      await new Promise(r => setTimeout(r, 50));
-    }
-    for (const model of ollamaLookupQueue) {
-      const res = idToResult.get(model.ollama_id);
-      if (res && res.size && !model.size_b) { model.size_b = res.size; model.size_source = 'ollama'; ollamaFetched++; }
     }
-  }
-  console.log(`\nEnriched: ${hfSizeFetched + ollamaFetched} technical sizes.`);
-}
-async function runFetcher(fetcher, data) {
-  try {
-    process.stdout.write(`Fetching ${fetcher.providerName}... `);
-    const models = await fetcher.fn();
-    if (updateProviderModels(data.providers, fetcher.providerName, models)) console.log(`✓ ${models.length} models`);
-    return { ...fetcher, success: true, count: models.length };
-  } catch (err) {
-    console.log(`✗ ${err.message}`);
-    return { ...fetcher, success: false, error: err.message };
-  }
 }
 async function main() {
   const data = loadData();
-  const args = process.argv.slice(2).map(a => a.toLowerCase());
-  const fetchers = args.length > 0 ? FETCHERS.filter(f => args.includes(f.key)) : FETCHERS;
-  console.log(`Running ${fetchers.length} fetcher(s)...\n`);
-  for (const f of fetchers) await runFetcher(f, data);
   await propagateExtraData(data);
   saveData(data);
-  console.log('\nSummary:');
-  data.providers.forEach(p => console.log(`  ${p.models ? '✓' : '✗'} ${p.name}: ${p.models ? p.models.length : 0} models`));
 }
 main().catch(err => { console.error('Fatal:', err); process.exit(1); });

 /**
  * Fetch live pricing data from all supported providers and update data/providers.json.
  */
 const fs = require('fs');
 function updateProviderModels(providers, providerName, models) {
   const provider = providers.find((p) => p.name === providerName);
+  if (!provider) return false;
   const existingMap = new Map((provider.models || []).map(m => [m.name, m]));
   provider.models = models.map(newModel => {
     if (!existing) return newModel;
     return {
+      ...existing,
+      ...newModel,
       size_b: newModel.size_b || existing.size_b,
       size_source: newModel.size_source || existing.size_source,
       hf_id: newModel.hf_id || existing.hf_id,
 const normName = (s) =>
   s.toLowerCase().replace(/[-_.:]/g, ' ').replace(/[^a-z0-9 ]/g, '').replace(/\s+/g, ' ').trim();
 // Estimate parameters from config.json (vLLM style fallback)
+function estimateParams(config, hfId) {
   if (!config) return null;
   const h = config.hidden_size || config.d_model || config.n_embd;
   const l = config.num_hidden_layers || config.n_layer;
   const v = config.vocab_size;
   const i = config.intermediate_size || config.d_ff;
   const numExperts = config.num_local_experts || config.n_experts || config.num_experts || 1;
   const modelType = (config.model_type || '').toLowerCase();
   if (h && l && v) {
     const intermediate = i || (4 * h);
     const vocabParams = v * h;
     const posParams = (config.max_position_embeddings || 512) * h;
     const typeParams = (config.type_vocab_size || 0) * h;
     const embedParams = vocabParams + posParams + typeParams;
     const attentionParams = 4 * (h * h);
+    // Check if architecture uses GLU (3 weights per MLP layer)
+    const hasGlu = ['llama', 'mistral', 'phi3', 'qwen2', 'gemma', 'gemma2', 'minimax'].includes(modelType)
+                   || hfId.toLowerCase().includes('qwen')
+                   || hfId.toLowerCase().includes('minimax');
+    const mlpParams = (hasGlu ? 3 : 2) * h * intermediate * numExperts;
+    const total = embedParams + l * (attentionParams + mlpParams);
+    return total;
   }
   return null;
 }
   const token = process.env.HF_TOKEN;
   const headers = token ? { Authorization: `Bearer ${token}` } : {};
   let isPrivate = false;
   try {
+    let params = null, source = 'hf-total', data = {};
+    // 1. API Metadata
     try {
       data = await getJson(`https://huggingface.co/api/models/${hfId}`, { headers, retries: 1 });
       params = data.safetensors?.total || data.config?.total_parameters || data.config?.model_type_params;
       if (!params && data.cardData?.model_details?.parameters) {
         const match = data.cardData.model_details.parameters.match(/([\d.]+)\s*[Bb]/);
         if (match) { params = parseFloat(match[1]) * 1_000_000_000; source = 'hf-card'; }
       if (e.message.includes('401') || e.message.includes('404')) isPrivate = true;
     }
+    // 2. Raw config.json fetch
     if (!params && !isPrivate) {
+      try {
+        const config = await getJson(`https://huggingface.co/${hfId}/raw/main/config.json`, { headers, retries: 1 });
+        params = config.total_parameters || estimateParams(config, hfId);
+        source = config.total_parameters ? 'hf-total' : 'hf-config-estimate';
       } catch (e) {
+        if (e.message.includes('401') || e.message.includes('404')) isPrivate = true;
       }
     }
     if (!params) return { error: 'No parameter data found' };
     const b = params / 1_000_000_000;
     const size = b < 1 ? Math.round(b * 100) / 100 : Math.round(b * 10) / 10;
     return { size, source };
+  } catch (e) { return { error: e.message }; }
 }
 async function fetchOllamaMetadata(ollamaId) {
 const EMBEDDER_KEYWORDS = ['embed', 'bge', 'gte', 'e5', 'stella', 'minilm', 'multilingual-mpnet'];
 const MANUAL_HF_ID_MAP = {
+  'minimax/minimax-m1': 'MiniMaxAI/MiniMax-M1-80k',
+  'minimax minimax m1': 'MiniMaxAI/MiniMax-M1-80k',
+  'minimax m1': 'MiniMaxAI/MiniMax-M1-80k',
+  'qwen plus': 'Qwen/Qwen3-Coder-30B-A3B-Instruct',
+  'alibaba qwen plus': 'Qwen/Qwen3-Coder-30B-A3B-Instruct',
+  'qwen qwen plus': 'Qwen/Qwen3-Coder-30B-A3B-Instruct',
   'phi 4': 'microsoft/phi-4',
+  'mistral small 4': 'mistralai/Mistral-Small-4-119B-2603',
+  'mistral small 3 2': 'mistralai/Mistral-Small-3.2-24B-Instruct-2506',
+  'mistral small 3 1': 'mistralai/Mistral-Small-3.1-24B-Instruct-2503',
+  'mistral small 2501': 'mistralai/Mistral-Small-24B-Instruct-2501',
+  'mistral small 2409': 'mistralai/Mistral-Small-Instruct-2409',
+  'mistral small 24b': 'mistralai/Mistral-Small-24B-Instruct-2501',
 };
 const MANUAL_OLLAMA_ID_MAP = {
   'phi 4': 'phi4',
   'deepseek chat': 'deepseek-v3',
   'deepseek reasoner': 'deepseek-r1',
   'mistral small 24b': 'mistral-small',
+};
+const MANUAL_SIZE_MAP = {
+  'BAAI/bge-m3': 0.57,
+  'black-forest-labs/FLUX.1-schnell': 12,
+  'black-forest-labs/FLUX.1-dev': 12,
+  'black-forest-labs/FLUX.1-pro': 12,
+  'black-forest-labs/FLUX.2-dev': 32,
+  'black-forest-labs/FLUX.2-pro': 32,
+  'black-forest-labs/FLUX.2-flex': 32,
+  'black-forest-labs/FLUX.2-max': 32,
+  'black-forest-labs/FLUX.2-klein-4B': 4,
+  'black-forest-labs/FLUX.2-klein-9B': 9,
 };
 const PROPRIETARY_KEYWORDS = [
 ];
 async function propagateExtraData(data) {
   let benchmarks = [];
   try { benchmarks = JSON.parse(fs.readFileSync(path.join(__dirname, '..', 'data', 'benchmarks.json'), 'utf8')); } catch (e) {}
   const hfIdToSize = new Map();
+  benchmarks.forEach((b) => { if (b.params_b && b.hf_id) hfIdToSize.set(b.hf_id.toLowerCase(), b.params_b); });
   // 1. Initial manual and fuzzy mapping
   data.providers.forEach(p => p.models.forEach(model => {
     const n = normName(model.name);
+    for (const [key, val] of Object.entries(MANUAL_HF_ID_MAP)) {
+      if (n === key || n.endsWith(' ' + key) || n.endsWith('/' + key)) {
+        model.hf_id = val; model.hf_private = false; break;
       }
     }
+    if (PROPRIETARY_KEYWORDS.some(k => n.includes(k)) && !model.hf_id) model.hf_private = true;
+    for (const [key, val] of Object.entries(MANUAL_OLLAMA_ID_MAP)) {
+      if (n === key || n.endsWith(' ' + key) || n.endsWith('/' + key)) model.ollama_id = val;
     }
+    if (model.hf_id && MANUAL_SIZE_MAP[model.hf_id]) {
+      model.size_b = MANUAL_SIZE_MAP[model.hf_id]; model.size_source = 'manual';
+    } else if (model.hf_id && !model.size_b) {
       const size = hfIdToSize.get(model.hf_id.toLowerCase());
       if (size) { model.size_b = size; model.size_source = 'benchmark'; }
     }
   }));
+  // 2. Technical Metadata Lookups
+  const hfLookupQueue = [];
   data.providers.forEach(p => p.models.forEach(m => {
+    if (!m.size_b && m.hf_id && !m.hf_private) hfLookupQueue.push(m);
   }));
+  const uniqueIds = [...new Set(hfLookupQueue.map(m => m.hf_id))];
   if (uniqueIds.length > 0) {
     console.log(`\n  HF Hub: technical metadata inspection for ${uniqueIds.length} models...`);
     const idToResult = new Map();
+    for (const id of uniqueIds) {
+      process.stdout.write(`    ${id.padEnd(50)} `);
       const result = await fetchHFSize(id);
       idToResult.set(id, result);
       if (result.size) process.stdout.write(`✓ ${result.size}B (${result.source})\n`);
+      else process.stdout.write(`✗ ${result.error || 'Err'}\n`);
       await new Promise(r => setTimeout(r, 50));
     }
     for (const model of hfLookupQueue) {
       if (!model.size_b) {
+        const id = model.hf_id;
         const result = idToResult.get(id);
+        if (result && result.size) {
+          model.size_b = result.size;
+          model.size_source = result.source;
+          model.hf_private = false;
         }
       }
     }
   }
+  // 3. GLOBAL ENRICHMENT SWEEP
+  const technicalPool = new Map();
+  data.providers.forEach(p => p.models.forEach(m => {
+    const baseName = m.name.split('/').pop().replace(/:free$/, '').toLowerCase();
+    if (m.size_b || m.hf_id) {
+      const meta = { size_b: m.size_b, size_source: m.size_source, hf_id: m.hf_id, ollama_id: m.ollama_id, hf_private: m.hf_private };
+      if (m.hf_id) technicalPool.set('id:' + m.hf_id.toLowerCase(), meta);
+      technicalPool.set('name:' + baseName, meta);
     }
+  }));
+  data.providers.forEach(p => p.models.forEach(m => {
+    const baseName = m.name.split('/').pop().replace(/:free$/, '').toLowerCase();
+    const metaByName = technicalPool.get('name:' + baseName);
+    const metaById = m.hf_id ? technicalPool.get('id:' + m.hf_id.toLowerCase()) : null;
+    const best = metaById || metaByName;
+    if (best) {
+      m.size_b = m.size_b || best.size_b;
+      m.size_source = m.size_source || best.size_source;
+      m.hf_id = m.hf_id || best.hf_id;
+      m.ollama_id = m.ollama_id || best.ollama_id;
+      if (m.size_b || m.hf_id) m.hf_private = false;
+    }
+  }));
 }
 async function main() {
   const data = loadData();
+  for (const f of FETCHERS) {
+    try {
+      process.stdout.write(`Fetching ${f.providerName}... `);
+      const models = await f.fn();
+      if (updateProviderModels(data.providers, f.providerName, models)) console.log(`✓ ${models.length} models`);
+    } catch (err) { console.log(`✗ ${err.message}`); }
+  }
   await propagateExtraData(data);
   saveData(data);
 }
 main().catch(err => { console.error('Fatal:', err); process.exit(1); });