Spaces:

therandomuser03
/

psypredict-backend

Running

App Files Files Community

psypredict-backend / app /config.py

therandomuser03

feat: replace Ollama with Groq API (llama-3.3-70b-versatile)

befb434 6 days ago

raw

history blame contribute delete

2.68 kB

	"""
	config.py — PsyPredict Production Configuration
	All settings loaded from environment variables via Pydantic Settings.
	"""
	from pydantic_settings import BaseSettings, SettingsConfigDict
	from functools import lru_cache


	class Settings(BaseSettings):
	# ── Groq API (replaces Ollama) ────────────────────────────────────────────
	GROQ_API_KEY: str = ""
	GROQ_MODEL: str = "llama-3.3-70b-versatile"

	# ── Kept for backwards compatibility (health endpoint reads these) ─────────
	OLLAMA_BASE_URL: str = "http://127.0.0.1:11434"
	OLLAMA_MODEL: str = "llama-3.3-70b-versatile"
	OLLAMA_TIMEOUT_S: int = 30
	OLLAMA_RETRIES: int = 3
	OLLAMA_RETRY_DELAY_S: float = 2.0

	# ── DistilBERT Text Emotion ───────────────────────────────────────────────
	DISTILBERT_MODEL: str = "bhadresh-savani/distilbert-base-uncased-emotion"

	# ── Crisis Detection ──────────────────────────────────────────────────────
	CRISIS_THRESHOLD: float = 0.65

	# ── Multimodal Fusion Weights (must sum to ~1.0) ──────────────────────────
	TEXT_WEIGHT: float = 0.65
	FACE_WEIGHT: float = 0.35

	# ── Context Window ────────────────────────────────────────────────────────
	MAX_CONTEXT_TURNS: int = 10

	# ── Logging ───────────────────────────────────────────────────────────────
	LOG_LEVEL: str = "INFO"

	# ── Rate Limiting ─────────────────────────────────────────────────────────
	RATE_LIMIT: str = "30/minute"

	# ── Input Sanitization ───────────────────────────────────────────────────
	MAX_INPUT_CHARS: int = 2000

	model_config = SettingsConfigDict(
	env_file=".env",
	env_file_encoding="utf-8",
	extra="ignore",
	)


	@lru_cache(maxsize=1)
	def get_settings() -> Settings:
	"""Returns a cached singleton Settings instance."""
	return Settings()