Update app.py
Browse files
app.py
CHANGED
|
@@ -333,7 +333,7 @@ app.add_middleware(
|
|
| 333 |
class PromptRequest(BaseModel):
|
| 334 |
text: str = Field(..., max_length=2000, description="Texto de entrada")
|
| 335 |
max_tokens: int = Field(default=150, ge=10, le=300, description="Tokens máximos a generar")
|
| 336 |
-
temperature: float = Field(default=0.
|
| 337 |
top_k: int = Field(default=50, ge=1, le=100, description="Top-k sampling")
|
| 338 |
top_p: float = Field(default=0.9, ge=0.1, le=1.0, description="Top-p (nucleus) sampling")
|
| 339 |
repetition_penalty: float = Field(default=1.1, ge=1.0, le=2.0, description="Penalización por repetición")
|
|
@@ -393,8 +393,8 @@ async def generate(req: PromptRequest):
|
|
| 393 |
|
| 394 |
# Si es saludo, usar menos tokens y temperatura más alta para respuestas creativas
|
| 395 |
if is_greeting:
|
| 396 |
-
max_tokens =
|
| 397 |
-
temperature = 0.
|
| 398 |
else:
|
| 399 |
max_tokens = req.max_tokens
|
| 400 |
temperature = req.temperature
|
|
|
|
| 333 |
class PromptRequest(BaseModel):
|
| 334 |
text: str = Field(..., max_length=2000, description="Texto de entrada")
|
| 335 |
max_tokens: int = Field(default=150, ge=10, le=300, description="Tokens máximos a generar")
|
| 336 |
+
temperature: float = Field(default=0.6, ge=0.1, le=2.0, description="Temperatura de muestreo")
|
| 337 |
top_k: int = Field(default=50, ge=1, le=100, description="Top-k sampling")
|
| 338 |
top_p: float = Field(default=0.9, ge=0.1, le=1.0, description="Top-p (nucleus) sampling")
|
| 339 |
repetition_penalty: float = Field(default=1.1, ge=1.0, le=2.0, description="Penalización por repetición")
|
|
|
|
| 393 |
|
| 394 |
# Si es saludo, usar menos tokens y temperatura más alta para respuestas creativas
|
| 395 |
if is_greeting:
|
| 396 |
+
max_tokens = 40
|
| 397 |
+
temperature = 0.7
|
| 398 |
else:
|
| 399 |
max_tokens = req.max_tokens
|
| 400 |
temperature = req.temperature
|