# zen-translator / Makefile
# Provenance: uploaded to the Hugging Face Hub via huggingface_hub (revision f0b1626, verified).
# Zen Translator Makefile
# Real-time multimodal translation with voice cloning and lip sync

# bash is required: recipes use bash-compatible quoting and `source`.
SHELL := /bin/bash
PYTHON := python3
UV := uv
VENV := .venv
MODEL_DIR := ./models

# Delete a half-written target when its recipe fails so a truncated file
# is never mistaken for an up-to-date build product.
.DELETE_ON_ERROR:

# Every command-style target must be declared phony; otherwise a file or
# directory with the same name (e.g. `touch clean`) silently disables it.
.PHONY: all install dev venv clean clean-models clean-all \
        test lint format typecheck serve serve-dev translate \
        train train-identity train-anchor dataset-build dataset-list swift-train \
        download download-qwen3-omni download-cosyvoice download-wav2lip download-quantized \
        docker-build docker-run help

# `all` performs a full setup: install the package, then fetch all models.
all: install download
## Installation

# Install the package in editable mode into the uv-managed environment.
install: venv ## Install production dependencies
	$(UV) pip install -e .

# Dev setup: editable install with all optional extras, plus transformers
# from git HEAD (presumably for model support not yet released — TODO confirm).
dev: venv ## Install development dependencies
	$(UV) pip install -e ".[all]"
	$(UV) pip install git+https://github.com/huggingface/transformers

# NOTE(review): `venv` is a phony-style target, not the .venv directory
# itself, so this recipe re-runs (and re-creates the venv) on every
# `make install` / `make dev` invocation.
venv: ## Create virtual environment
	$(UV) venv $(VENV)
	@echo "Virtual environment created at $(VENV)"
	@echo "Activate with: source $(VENV)/bin/activate"
## Model Downloads

# Aggregate target: fetch every model the full pipeline needs.
# Each sub-target stores its model under $(MODEL_DIR)/<name>.
download: download-qwen3-omni download-cosyvoice download-wav2lip ## Download all models

# Translation/understanding backbone (full-precision, ~30B parameters).
download-qwen3-omni: ## Download Qwen3-Omni (30B)
	@echo "Downloading Qwen3-Omni-30B-A3B-Instruct..."
	$(UV) run hf download Qwen/Qwen3-Omni-30B-A3B-Instruct --local-dir $(MODEL_DIR)/qwen3-omni

# Voice-cloning TTS model.
download-cosyvoice: ## Download CosyVoice 2.0
	@echo "Downloading CosyVoice 2.0..."
	$(UV) run hf download FunAudioLLM/CosyVoice2-0.5B --local-dir $(MODEL_DIR)/cosyvoice

# Lip-sync model.
download-wav2lip: ## Download Wav2Lip
	@echo "Downloading Wav2Lip..."
	$(UV) run hf download numz/wav2lip_studio --local-dir $(MODEL_DIR)/wav2lip

# Optional 4-bit AWQ variant of the backbone for smaller deployments.
# Not part of `download`; fetch explicitly when needed.
download-quantized: ## Download quantized models (smaller)
	@echo "Downloading quantized Qwen3-Omni AWQ..."
	$(UV) run hf download cpatonn/Qwen3-Omni-30B-A3B-Instruct-AWQ-4bit --local-dir $(MODEL_DIR)/qwen3-omni-4bit
## Running

# Start the translation server on all interfaces, port 8000.
serve: ## Start the translation server
	$(UV) run zen-serve --host 0.0.0.0 --port 8000

# Same as `serve` but with auto-reload for local development.
serve-dev: ## Start server with auto-reload
	$(UV) run zen-serve --host 0.0.0.0 --port 8000 --reload
# Translate a single media file.
# FILE is required; OUT is optional and defaults to output.mp4 (backward
# compatible with the previous hard-coded output name).
# Usage: make translate FILE=input.mp4 [OUT=result.mp4]
translate: ## Translate a file (use: make translate FILE=input.mp4)
	@$(if $(strip $(FILE)),,$(error FILE is required, e.g. make translate FILE=input.mp4))
	$(UV) run zen-translate $(FILE) -o $(or $(OUT),output.mp4)
## Training

# Train the Zen identity adaptation; artifacts go to ./outputs/identity.
train-identity: ## Train Zen identity
	$(UV) run zen-translate train --type identity --output ./outputs/identity

# Train the news-anchor adaptation; artifacts go to ./outputs/anchor.
train-anchor: ## Train news anchor adaptation
	$(UV) run zen-translate train --type anchor --output ./outputs/anchor

# Build the news-anchor dataset from the listed channels.
dataset-build: ## Build news anchor training dataset
	$(UV) run zen-translate dataset build --output ./data/news_anchors --channels cnn,bbc,nhk,dw

dataset-list: ## List available news channels
	$(UV) run zen-translate dataset list

# Runs ms-swift SFT using the config emitted by `train-identity`;
# run `make train-identity` first or this config file will not exist.
swift-train: ## Run ms-swift training (after train-identity generates config)
	swift sft --config ./outputs/identity/train_config.yaml
## Development

# Run the test suite with verbose output and coverage for zen_translator.
test: ## Run tests
	$(UV) run pytest tests/ -v --cov=zen_translator

lint: ## Run linter
	$(UV) run ruff check src/ tests/

format: ## Format code
	$(UV) run ruff format src/ tests/

typecheck: ## Run type checker
	$(UV) run mypy src/
## Docker

docker-build: ## Build Docker image
	docker build -t zenlm/zen-translator:latest .

# Exposes the server port and passes through all host GPUs
# (requires the NVIDIA Container Toolkit on the host).
docker-run: ## Run Docker container
	docker run -p 8000:8000 --gpus all zenlm/zen-translator:latest
## Cleanup

# Remove Python build artifacts and bytecode caches. Only touches files
# this project generates; models and the venv are handled separately.
clean: ## Clean build artifacts
	rm -rf build/ dist/ *.egg-info
	find . -type d -name __pycache__ -exec rm -rf {} +
	find . -type f -name "*.pyc" -delete

# Guarded: if MODEL_DIR were overridden to empty on the command line,
# the unguarded recipe would expand to `rm -rf /*`.
clean-models: ## Remove downloaded models
	@$(if $(strip $(MODEL_DIR)),,$(error MODEL_DIR is empty; refusing to run rm -rf))
	rm -rf $(MODEL_DIR)/*

# Guarded for the same reason: an empty VENV would expand to bare `rm -rf`.
clean-all: clean clean-models ## Clean everything
	@$(if $(strip $(VENV)),,$(error VENV is empty; refusing to run rm -rf))
	rm -rf $(VENV)
## Help

# Self-documenting help: scans every parsed makefile for `target: ## text`
# lines and prints the target name (cyan) alongside its description.
help: ## Show this help
	@grep -E '^[a-zA-Z_-]+:.*?## .*$$' $(MAKEFILE_LIST) | sort | awk 'BEGIN {FS = ":.*?## "}; {printf "\033[36m%-20s\033[0m %s\n", $$1, $$2}'

# Bare `make` prints the help text rather than running `all`.
.DEFAULT_GOAL := help