fraud-detector-api / .env.example
chotam's picture
Deploy fraud detector API
a783939
APP_ENV=dev
DB_URL=sqlite:///./fraud.db
# Primary whisper model — handles Russian audio and auto-detection.
# Default 'small' is vanilla openai/whisper-small, no build-time conversion
# needed. Other values:
# - tiny / base — lower-resource alternatives
# - medium — better accuracy, ~1.5 GB RAM
WHISPER_MODEL=small
# Optional Kazakh-specialised model.
#
# The Dockerfile converter stage pre-builds a CTranslate2-formatted
# fine-tune from the HF model named by the build arg WHISPER_KK_FINETUNE
# (default akuzdeuov/whisper-base.kk — 15.36% WER on KSC2, 1000h of
# Kazakh audio). On a successful build the converted weights live at
# /app/models/whisper-kk/kk inside the container. The runtime loads them
# from there and routes Kazakh audio through this model.
#
# If the build-time conversion fails (ctranslate2 / transformers version
# drift, network, etc.), the directory is empty and the runtime quietly
# uses the primary model for Kazakh too.
#
# Set to empty string to disable KK routing entirely:
# WHISPER_KK_MODEL=
WHISPER_KK_MODEL=/app/models/whisper-kk/kk
WHISPER_DEVICE=cpu
WHISPER_COMPUTE_TYPE=int8
WHISPER_BEAM_SIZE=5
WHISPER_CPU_THREADS=4
CLF_PATH=models/clf.pkl
MAX_AUDIO_MB=10
RISK_LOW_THRESHOLD=0.40
RISK_HIGH_THRESHOLD=0.60
APP_VERSION=1.0.0