api1

Sleeping

Reality123b committed on Aug 9, 2025

Commit

9172b86

verified ·

1 Parent(s): 1e49580

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,14 +5,14 @@ import torch
 class ModelInput(BaseModel):
     prompt: str
-    max_new_tokens: int = 64000
 app = FastAPI()
 # Initialize text generation pipeline
 generator = pipeline(
     "text-generation",
-    model="deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",
     device="cpu"  # Use CPU (change to device=0 for GPU)
 )

 class ModelInput(BaseModel):
     prompt: str
+    max_new_tokens: int = 128000
 app = FastAPI()
 # Initialize text generation pipeline
 generator = pipeline(
     "text-generation",
+    model="Qwen/Qwen3-4B-Thinking-2507",
     device="cpu"  # Use CPU (change to device=0 for GPU)
 )