Spaces:

gopikrishnait
/

RGBMetrics

Sleeping

RGB Evaluation committed on Jan 9

Commit

1b8d19d

1 Parent(s): ca5ddcb

feat: Add Moonshot Kimi K2 Instruct model to DEFAULT_MODELS

- Added moonshotai/kimi-k2-instruct to primary evaluation models
- Now evaluating with 5 models total
- Kimi K2 provides multi-lingual capabilities and strong reasoning
- Maintains all existing models in list

Files changed (1) hide show

src/config.py +2 -1

src/config.py CHANGED Viewed

@@ -26,12 +26,13 @@ DATASET_URLS = {
     "en_fact.json": "https://raw.githubusercontent.com/chen700564/RGB/main/data/en_fact.json",
 }
-# Default models to evaluate (first 4 as primary)
 DEFAULT_MODELS: List[str] = [
     "meta-llama/llama-4-maverick-17b-128e-instruct",  # Llama 4 Maverick 17B
     "meta-llama/llama-prompt-guard-2-86m",            # Llama Prompt Guard 2 86M
     "llama-3.1-8b-instant",                           # Llama 3.1 8B - Fast
     "openai/gpt-oss-120b",                            # GPT OSS 120B
 ]
 # Additional available models

     "en_fact.json": "https://raw.githubusercontent.com/chen700564/RGB/main/data/en_fact.json",
 }
+# Default models to evaluate (first 5 as primary)
 DEFAULT_MODELS: List[str] = [
     "meta-llama/llama-4-maverick-17b-128e-instruct",  # Llama 4 Maverick 17B
     "meta-llama/llama-prompt-guard-2-86m",            # Llama Prompt Guard 2 86M
     "llama-3.1-8b-instant",                           # Llama 3.1 8B - Fast
     "openai/gpt-oss-120b",                            # GPT OSS 120B
+    "moonshotai/kimi-k2-instruct",                    # Moonshot Kimi K2 Instruct
 ]
 # Additional available models