Spaces:

Divs0910
/

Digi-Biz

Paused

Digi-Biz / .env.example

Deployment Bot

Automated deployment to Hugging Face

255cbd1 about 1 month ago

2.52 kB

	# ===========================================
	# Environment Configuration for Digi-Biz
	# ===========================================
	# Copy this file to .env and fill in your values

	# ===========================================
	# Groq API (for text AND vision LLM tasks)
	# Get key from: https://console.groq.com
	# ===========================================
	GROQ_API_KEY=gsk_your_api_key_here

	# Model for text tasks (schema mapping, classification).
	# Groq lists this model under the provider-prefixed ID "openai/gpt-oss-120b";
	# the bare name "gpt-oss-120b" is not a Groq model ID.
	GROQ_MODEL=openai/gpt-oss-120b

	# Model for vision tasks (image analysis)
	# Current model: meta-llama/llama-4-scout-17b-16e-instruct
	GROQ_VISION_MODEL=meta-llama/llama-4-scout-17b-16e-instruct

	# ===========================================
	# Ollama Configuration (local vision model)
	# ===========================================
	# Local Ollama host (default is fine for local setup)
	OLLAMA_HOST=http://localhost:11434

	# Vision model for image analysis
	OLLAMA_VISION_MODEL=qwen3.5:0.8b

	# ===========================================
	# Application Settings
	# ===========================================
	# Application environment (development, production)
	APP_ENV=development

	# Log level (DEBUG, INFO, WARNING, ERROR, CRITICAL)
	LOG_LEVEL=INFO

	# Maximum file size for ZIP uploads (in bytes)
	# Default: 500 MiB (500 * 1024 * 1024 = 524288000 bytes)
	MAX_FILE_SIZE=524288000

	# Maximum files per ZIP
	MAX_FILES_PER_ZIP=100

	# ===========================================
	# Storage Configuration
	# ===========================================
	# Base directory for all storage
	STORAGE_BASE=./storage

	# Subdirectories (relative to STORAGE_BASE)
	UPLOADS_DIR=uploads
	EXTRACTED_DIR=extracted
	PROFILES_DIR=profiles
	INDEX_DIR=index
	TEMP_DIR=temp

	# ===========================================
	# Processing Settings
	# ===========================================
	# Number of concurrent document parsing tasks
	MAX_CONCURRENT_PARSING=5

	# Number of concurrent image analysis tasks
	MAX_CONCURRENT_VISION=3

	# Timeout for document parsing (seconds)
	PARSING_TIMEOUT=300

	# Timeout for LLM requests (seconds)
	LLM_TIMEOUT=60

	# ===========================================
	# Optional: OCR Settings (for scanned PDFs)
	# ===========================================
	# Enable OCR fallback for scanned PDFs
	ENABLE_OCR_FALLBACK=true

	# Tesseract executable path (leave empty for default)
	TESSERACT_PATH=

	# ===========================================
	# Optional: Rate Limiting
	# ===========================================
	# Groq API requests per minute
	GROQ_RATE_LIMIT=30

	# Ollama requests per minute (Ollama runs locally, but throttling keeps concurrent load manageable)
	OLLAMA_RATE_LIMIT=20