Spaces:

chotam
/

fraud-detector-api

Running

File size: 1,293 Bytes

a783939

APP_ENV=dev
DB_URL=sqlite:///./fraud.db

# Primary whisper model — handles Russian audio and auto-detection.
# Default 'small' is vanilla openai/whisper-small, no build-time conversion
# needed. Other values:
#   - tiny / base   — lower-resource alternatives
#   - medium        — better accuracy, ~1.5 GB RAM
WHISPER_MODEL=small

# Optional Kazakh-specialised model.
#
# The Dockerfile converter stage pre-builds a CTranslate2-formatted
# fine-tune from the HF model named by the build arg WHISPER_KK_FINETUNE
# (default akuzdeuov/whisper-base.kk — 15.36% WER on KSC2, 1000h of
# Kazakh audio). On a successful build the converted weights live at
# /app/models/whisper-kk/kk inside the container. The runtime loads them
# from there and routes Kazakh audio through this model.
#
# If the build-time conversion fails (ctranslate2 / transformers version
# drift, network, etc.), the directory is empty and the runtime quietly
# uses the primary model for Kazakh too.
#
# Set to empty string to disable KK routing entirely:
#   WHISPER_KK_MODEL=
WHISPER_KK_MODEL=/app/models/whisper-kk/kk

WHISPER_DEVICE=cpu
WHISPER_COMPUTE_TYPE=int8
WHISPER_BEAM_SIZE=5
WHISPER_CPU_THREADS=4

CLF_PATH=models/clf.pkl

MAX_AUDIO_MB=10
RISK_LOW_THRESHOLD=0.40
RISK_HIGH_THRESHOLD=0.60

APP_VERSION=1.0.0