akhaliq HF Staff committed on
Commit
564ef48
·
1 Parent(s): fa45e57
Files changed (1) hide show
  1. app.py +5 -5
app.py CHANGED
@@ -2428,11 +2428,8 @@ def get_inference_client(model_id, provider="auto"):
2428
  base_url="https://api.moonshot.ai/v1",
2429
  )
2430
  elif model_id == "kimi-k2-thinking":
2431
- # Use Moonshot AI (OpenAI-compatible) client for Kimi K2 Thinking
2432
- return OpenAI(
2433
- api_key=os.getenv("MOONSHOT_API_KEY"),
2434
- base_url="https://api.moonshot.ai/v1",
2435
- )
2436
  elif model_id == "stealth-model-1":
2437
  # Use stealth model with generic configuration
2438
  api_key = os.getenv("STEALTH_MODEL_1_API_KEY")
@@ -2475,6 +2472,9 @@ def get_real_model_id(model_id: str) -> str:
2475
  raise ValueError("STEALTH_MODEL_1_ID environment variable is required for Carrot model")
2476
 
2477
  return real_model_id
 
 
 
2478
  return model_id
2479
 
2480
  # Type definitions
 
2428
  base_url="https://api.moonshot.ai/v1",
2429
  )
2430
  elif model_id == "kimi-k2-thinking":
2431
+ # Use HuggingFace InferenceClient with Novita provider for Kimi K2 Thinking
2432
+ provider = "novita"
 
 
 
2433
  elif model_id == "stealth-model-1":
2434
  # Use stealth model with generic configuration
2435
  api_key = os.getenv("STEALTH_MODEL_1_API_KEY")
 
2472
  raise ValueError("STEALTH_MODEL_1_ID environment variable is required for Carrot model")
2473
 
2474
  return real_model_id
2475
+ elif model_id == "kimi-k2-thinking":
2476
+ # Return the full model name with provider tag for Kimi K2 Thinking
2477
+ return "moonshotai/Kimi-K2-Thinking:novita"
2478
  return model_id
2479
 
2480
  # Type definitions