Spaces:

HuuDatLego
/

UI-VieNeu

Build error

App Files Files Community

HuuDatLego committed 27 days ago

Commit

911c66e

verified ·

1 Parent(s): 6376ca1

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +138 -0
.gitignore +3 -4
CHANGELOG.md +34 -0
Dockerfile +23 -17
README-hf.md +12 -0
README.md +78 -8
goi_y_hinh_anh_gameloft.md +19 -0
kich_ban_mau.md +58 -0
main.py +106 -23
prompt_gan_tag_bieu_cam.md +35 -0
prompt_seo_assistant.md +33 -0
prompt_tao_anh_nen.md +123 -0
prompt_tao_kich_ban.md +42 -0
prompt_tao_kich_ban_giai_thich_meme.md +51 -0
prompt_tao_kich_ban_reaction.md +61 -0
prompt_tao_kich_ban_tu_anh.md +33 -0
resize_img.py +28 -0
scratch/check_dims.py +12 -0
scratch/check_green.py +12 -0
scratch/extract_frame.py +10 -0
scratch/extract_last_frame.py +10 -0
scratch/print_args.py +21 -0
scratch/process_green_background.py +44 -0
scratch/resize_cards.py +34 -0
scratch/test_ai_pipeline.py +18 -0
scratch/test_ffmpeg.py +22 -0
scratch/test_ffmpeg2.py +14 -0
scratch/test_pipeline.py +46 -0
scratch/test_studio_output.mp4 +0 -0
scratch/tmp/concat.txt +4 -0
scratch/tmp/frame.jpg +0 -0
scratch/tmp/frame_last.jpg +0 -0
scratch/tmp/part_init.wav +3 -0
scratch/tmp/studio_output.mp4 +3 -0
scratch/tmp/tts_voiceover.wav +3 -0
scratch/tmp/tts_voiceover_mixed.mp3 +3 -0
services/ai_pipeline.py +111 -104
services/audio_service.py +188 -0
services/subtitle_service.py +75 -0
services/video_service.py +83 -0
start.sh +11 -6
static/characters/Anh-mat-chan-thanh.png +3 -0
static/characters/Bat-luc.png +3 -0
static/characters/Bat-ngo.png +3 -0
static/characters/Binh-thuong.png +3 -0
static/characters/Bo-tay.png +3 -0
static/characters/Buon-nhe.png +3 -0
static/characters/Cam-thong.png +3 -0
static/characters/Cau-xin.png +3 -0
static/characters/Chao-khan-gia.png +3 -0

.gitattributes CHANGED Viewed

@@ -1,2 +1,140 @@
 # Auto detect text files and perform LF normalization
 * text=auto

 # Auto detect text files and perform LF normalization
 * text=auto
+scratch/tmp/part_init.wav filter=lfs diff=lfs merge=lfs -text
+scratch/tmp/studio_output.mp4 filter=lfs diff=lfs merge=lfs -text
+scratch/tmp/tts_voiceover.wav filter=lfs diff=lfs merge=lfs -text
+scratch/tmp/tts_voiceover_mixed.mp3 filter=lfs diff=lfs merge=lfs -text
+static/characters/Anh-mat-chan-thanh.png filter=lfs diff=lfs merge=lfs -text
+static/characters/bat-luc-qua.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Bat-luc.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Bat-ngo.png filter=lfs diff=lfs merge=lfs -text
+static/characters/bat-thong-bao.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Binh-thuong.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Bo-tay.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Buon-nhe.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Cam-thong.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Cau-xin.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Chao-khan-gia.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Chi-tay-man-hinh.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Chiu-thua.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Cuc-ky-nghiem-tuc.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Cuoi-tuoi.png filter=lfs diff=lfs merge=lfs -text
+static/characters/de-lai-comment.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Doi.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Gian.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Gio-tay-nhan-manh.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Hanh-phuc.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Kho-hieu.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Khoanh-tay-2.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Khoanh-tay.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Khoc.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Lac-dau.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Lo-lang-2.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Lo-lang.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Mim-cuoi-ke-chuyen.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Mim-cuoi-nhe.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Mot-tay-om-ma.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Nghi-ra-roi.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Nghiem-tuc.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Nhech-mep-cuoi.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Nhin-gie.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Nhin-thang.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Nhiu-may-nhe.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Nhiu-may.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Noi-nghe-ne.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Noi.png filter=lfs diff=lfs merge=lfs -text
+static/characters/nut-like.png filter=lfs diff=lfs merge=lfs -text
+static/characters/nut-subscribe.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Phai-vay-khong.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Phan-tich.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Quyet-tam-2.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Quyet-tam.png filter=lfs diff=lfs merge=lfs -text
+static/characters/So-hai.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Suy-tu.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Tam-biet.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Tap-trung.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Tay-sau-lung.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Tay-truoc-nguc.png filter=lfs diff=lfs merge=lfs -text
+static/characters/That-vong.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Tho-dai-nhe.png filter=lfs diff=lfs merge=lfs -text
+static/characters/tram-tu.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Tsundere.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Ve-mat-am-ap.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Vuot-chan.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Wow.png filter=lfs diff=lfs merge=lfs -text
+static/characters/Xin-chao.png filter=lfs diff=lfs merge=lfs -text
+static/characters/You.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Anh-mat-chan-thanh.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/bat-luc-qua.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Bat-luc.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Bat-ngo.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/bat-thong-bao.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Binh-thuong.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Bo-tay.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Buon-nhe.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Cam-thong.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Cau-xin.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Chao-khan-gia.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Chi-tay-man-hinh.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Chiu-thua.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Cuc-ky-nghiem-tuc.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Cuoi-tuoi.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/de-lai-comment.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Doi.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Gian.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Gio-tay-nhan-manh.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Hanh-phuc.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Kho-hieu.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Khoanh-tay-2.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Khoanh-tay.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Khoc.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Lac-dau.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Lo-lang-2.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Lo-lang.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Mim-cuoi-ke-chuyen.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Mim-cuoi-nhe.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Mot-tay-om-ma.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Nghi-ra-roi.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Nghiem-tuc.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Nhech-mep-cuoi.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Nhin-gie.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Nhin-thang.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Nhiu-may-nhe.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Nhiu-may.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Noi-nghe-ne.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Noi.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/nut-like.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/nut-subscribe.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Phai-vay-khong.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Phan-tich.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Quyet-tam-2.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Quyet-tam.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/So-hai.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Suy-tu.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Tam-biet.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Tap-trung.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Tay-sau-lung.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Tay-truoc-nguc.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/That-vong.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Tho-dai-nhe.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/tram-tu.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Tsundere.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Ve-mat-am-ap.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Vuot-chan.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Wow.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/Xin-chao.png filter=lfs diff=lfs merge=lfs -text
+static/characters_green/You.png filter=lfs diff=lfs merge=lfs -text
+static/example/top-ly-do-xin-nghi-hoc.jpg filter=lfs diff=lfs merge=lfs -text
+static/music/Cheel[[:space:]]-[[:space:]]Blue[[:space:]]Dream.mp3 filter=lfs diff=lfs merge=lfs -text
+static/music/Kiss[[:space:]]the[[:space:]]Sky[[:space:]]-[[:space:]]Aakash[[:space:]]Gandhi.mp3 filter=lfs diff=lfs merge=lfs -text
+static/music/Morning[[:space:]]Mandolin[[:space:]]-[[:space:]]Chris[[:space:]]Haugen.mp3 filter=lfs diff=lfs merge=lfs -text
+static/music/Soft[[:space:]]Feeling[[:space:]]-[[:space:]]Cheel.mp3 filter=lfs diff=lfs merge=lfs -text
+static/music/Sunset[[:space:]]Dream[[:space:]]-[[:space:]]Cheel.mp3 filter=lfs diff=lfs merge=lfs -text
+static/voice/giong-google.mp3 filter=lfs diff=lfs merge=lfs -text
+static/voice/giong-nu-ke-chuyen.mp3 filter=lfs diff=lfs merge=lfs -text
+static/voice/giong-nu-review.mp3 filter=lfs diff=lfs merge=lfs -text
+static/voice/giong-nu-tiktok-hay.mp3 filter=lfs diff=lfs merge=lfs -text
+static/voice/male1.mp3 filter=lfs diff=lfs merge=lfs -text
+static/voice/ngoc-oanh.mp3 filter=lfs diff=lfs merge=lfs -text
+static/voice/nguyet-nga.mp3 filter=lfs diff=lfs merge=lfs -text
+static/voice/thien-tam.mp3 filter=lfs diff=lfs merge=lfs -text

.gitignore CHANGED Viewed

@@ -150,10 +150,9 @@ cython_debug/
 Thumbs.db
 # Project specific
-*.ass
-*.mp4
-*.wav
-*.mp3
 raw_videos/
 rendered/
 references/

 Thumbs.db
 # Project specific
 raw_videos/
 rendered/
 references/

CHANGELOG.md ADDED Viewed

	@@ -0,0 +1,34 @@

+# VieNeu AI - Changelog (Nhật ký cập nhật)
+Tài liệu này ghi lại tất cả các thay đổi và tính năng mới đã được triển khai cho hệ thống VieNeu AI.
+## [2026-04-25] - Giai đoạn 2: Lồng nhạc & Ducking (BGM Mixing)
+### ✨ Tính năng mới
+- **Lồng nhạc nền (BGM)**: Cho phép upload file nhạc để lồng vào video/audio.
+- **Tính năng Ducking tự động**: Tự động giảm âm lượng nhạc nền khi có tiếng người nói và tự động to lại khi kết thúc câu.
+    - Sử dụng bộ lọc `sidechaincompress` chuyên nghiệp của FFmpeg.
+    - Cho phép tùy chỉnh âm lượng nhạc nền (BGM Volume) ngay trên giao diện.
+- **Đổi giọng giữa chừng [v:voice]**: (Đã có) Cho phép thay đổi nhân vật đọc.
+- **Tích hợp giọng mới từ static files**:
+    - **Giọng Google**: Giọng đọc tiêu chuẩn.
+    - **Thiện Tâm**: Giọng nam trầm, chuyên nghiệp.
+    - **Ngọc Oanh**: Giọng nữ kể chuyện truyền cảm.
+    - **Nguyệt Nga**: Giọng nữ review phim năng động.
+### 🛠 Cải tiến Backend
+- **Worker.py**:
+    - Cập nhật logic nhận diện giọng đọc từ đường dẫn file tĩnh (`static/voice/`).
+    - Tự động copy file mẫu vào thư mục tạm để đảm bảo an toàn cho file gốc khi xử lý.
+    - Nâng cấp Regex để không xóa nhầm thẻ `[p:ms]`.
+- **AI Pipeline**:
+    - Thêm hàm `generate_tts_with_pauses` sử dụng `numpy` và `soundfile` để ghép nối âm thanh và khoảng lặng.
+    - Cập nhật quy trình render video trong Studio để đồng bộ chính xác với các đoạn nghỉ.
+### 🎨 Cải tiến UI/UX
+- **Studio.html & TTS.html**:
+    - Cập nhật danh sách giọng chọn lọc.
+    - Thêm gợi ý (Tips) cách sử dụng thẻ `[p:ms]` ngay trong giao diện người dùng.
+### 🧠 Prompting
+- **prompt_gan_tag_bieu_cam.md**: Cập nhật hướng dẫn cho AI tự động chèn thẻ `[p:ms]` khi cần thiết để tối ưu hóa ngữ điệu.

Dockerfile CHANGED Viewed

@@ -1,39 +1,45 @@
 FROM python:3.11-slim
-# Cài đặt công cụ hệ thống (ffmpeg, redis, và trình biên dịch C++ cho các thư viện AI Linux)
 RUN apt-get update && apt-get install -y \
     ffmpeg \
     redis-server \
-    libass-dev \
     curl \
     build-essential \
     cmake \
     python3-dev \
     && rm -rf /var/lib/apt/lists/*
-WORKDIR /app
-# Tạo môi trường ảo truyền thống (Virtualenv)
-RUN python -m venv /app/.venv
-ENV PATH="/app/.venv/bin:$PATH"
-# Copy danh sách thư viện
-COPY requirements.txt ./
-# Cài đặt lõi biên dịch trước để chống lỗi Windows wheel
-RUN pip install --no-cache-dir build wheel setuptools cmake
-# Ép cài đặt llama-cpp-python bản gốc chuẩn Linux trước (để thằng vieneu không thể đòi bản Windows)
-# llama-cpp-python là phần não của vieneu
-RUN pip install --no-cache-dir llama-cpp-python==0.3.16
-# Cuối cùng mới cài các gói còn lại
-RUN pip install --no-cache-dir -r requirements.txt
-# Copy bộ code của bạn lên
 COPY . .
-# Cấp quyền và chạy
 RUN chmod +x start.sh
 EXPOSE 7860
 CMD ["./start.sh"]

 FROM python:3.11-slim
# Install the system tools the app needs (FFmpeg, Redis, C/C++ build toolchain)
RUN apt-get update && apt-get install -y \
    ffmpeg \
    redis-server \
    curl \
    build-essential \
    cmake \
    python3-dev \
    && rm -rf /var/lib/apt/lists/*
# Install uv for faster dependency management
COPY --from=ghcr.io/astral-sh/uv:latest /uv /uvx /bin/
WORKDIR /app
# Copy the dependency manifests first so the install layers below stay cached
COPY pyproject.toml uv.lock ./
# Everything is installed straight into the image's system Python (no virtualenv)
# through the `uv pip` interface, which is the only uv interface that accepts --system.
RUN uv pip install --system --no-cache-dir build wheel setuptools cmake
# Install the standard Linux build of llama-cpp-python before the other packages
RUN uv pip install --system --no-cache-dir llama-cpp-python==0.3.16
# Install the remaining dependencies declared in pyproject.toml.
# NOTE: `uv sync` does not accept `--system` (it always targets a project
# environment), so `uv sync --system --no-dev` aborts the image build.
# `uv pip install -r pyproject.toml` installs the project's runtime dependencies
# (no dev groups) into the system interpreter instead.
RUN uv pip install --system --no-cache-dir -r pyproject.toml
# Copy the full source tree
COPY . .
# Create the directories used for temporary data and rendered results
RUN mkdir -p static/results temp
# Make the startup script executable
RUN chmod +x start.sh
# Default port expected by Hugging Face Spaces
EXPOSE 7860
# Run the startup script that launches the services
CMD ["./start.sh"]

README-hf.md ADDED Viewed

	@@ -0,0 +1,12 @@

+---
+title: UI VieNeu
+emoji: 🎥
+colorFrom: blue
+colorTo: purple
+sdk: docker
+app_port: 7860
+---
+# UI-VieNeu Backend API
+Video Subtitle & AI Voiceover Generator Backend.

README.md CHANGED Viewed

@@ -1,12 +1,82 @@
 ---
-title: UI VieNeu
-emoji: 🎥
-colorFrom: blue
-colorTo: purple
-sdk: docker
-app_port: 7860
 ---
-# UI-VieNeu Backend API
-Video Subtitle & AI Voiceover Generator Backend.

+# 🎬 UI-VieNeu: AI Animation & Video Pipeline
+**UI-VieNeu** là một hệ thống Backend mạnh mẽ được thiết kế để tự động hóa quy trình tạo video nội dung số, giải thích meme và hoạt ảnh nhân vật (PNGTuber) sử dụng sức mạnh của AI.
+![Python](https://img.shields.io/badge/Python-3.10+-blue?style=for-the-badge&logo=python)
+![FastAPI](https://img.shields.io/badge/FastAPI-0.100+-green?style=for-the-badge&logo=fastapi)
+![FFmpeg](https://img.shields.io/badge/FFmpeg-Powerful-orange?style=for-the-badge&logo=ffmpeg)
+![Celery](https://img.shields.io/badge/Celery-Distributed-red?style=for-the-badge&logo=celery)
 ---
+## ✨ Tính năng nổi bật
+- 🎙️ **Voice Studio (TTS):** Chuyển đổi văn bản thành giọng nói với hơn 60 sắc thái biểu cảm (Tag) khác nhau.
+- 🎭 **Animation Studio:** Tạo video từ ảnh nhân vật tĩnh, tự động đồng bộ biểu cảm theo kịch bản.
+- 📗 **Green Screen Pipeline:** Tự động xử lý nền xanh (Chroma Key) cho nhân vật để dễ dàng hậu kỳ.
+- ⚡ **Turbo Rendering:** Hệ thống xử lý video không đồng bộ (Asynchronous) dựa trên Celery và Redis, giúp render nhanh và không gây nghẽn server.
+- 🧠 **AI Script Assistant:** Tích hợp các Prompt tối ưu để tạo kịch bản hài hước, giải thích meme hoặc reaction (cần thông qua Gemini hoặc OpenAI bản web).
 ---
+## 🛠️ Hướng dẫn Cài đặt (Local Setup)
+Dự án sử dụng **`uv`** để quản lý thư viện và môi trường ảo nhằm đảm bảo tốc độ và sự ổn định cao nhất.
+### 1. Cài đặt công cụ quản lý (uv)
+Nếu máy bạn chưa có `uv`, hãy chạy lệnh sau trong PowerShell:
+```powershell
+powershell -c "irm https://astral.sh/uv/install.ps1 | iex"
+```
+### 2. Thiết lập dự án
+```powershell
+# Di chuyển vào thư mục dự án
+cd UI-VieNeu
+# Cài đặt toàn bộ thư viện vào môi trường ảo .venv
+uv sync
+```
+### 3. Khởi động Redis (Memurai)
+Hệ thống cần Redis để quản lý hàng đợi tác vụ:
+1. Mở VSCode/Terminal bằng quyền **Administrator**.
+2. Chạy lệnh: `Start-Service Memurai`
+---
+## 🚀 Cách chạy hệ thống
+Hệ thống bao gồm 2 thành phần chính chạy song song:
+### Terminal 1: Celery Worker (Trái tim xử lý)
+Xử lý các tác vụ nặng như AI TTS và FFmpeg Video Rendering:
+```powershell
+uv run celery -A worker worker --loglevel=info -P solo
+```
+### Terminal 2: FastAPI Server (Cổng kết nối)
+Cung cấp giao diện web và các API endpoint:
+```powershell
+uv run uvicorn main:app --reload
+```
+- **Giao diện người dùng:** [http://127.0.0.1:8000](http://127.0.0.1:8000)
+- **Tài liệu API (Swagger):** [http://127.0.0.1:8000/docs](http://127.0.0.1:8000/docs)
+---
+## 📂 Cấu trúc thư mục quan trọng
+- `/services`: Chứa logic xử lý audio, video và pipeline chính.
+- `/static/characters_green`: Kho ảnh nhân vật đã được tiền xử lý nền xanh.
+- `/templates`: Giao diện Web (HTML/JS) cho TTS và Studio.
+- `prompt_*.md`: Các "bí kíp" prompt để tương tác với AI biên kịch.
+---
+## ⚠️ Lưu ý cho Windows
+- Luôn sử dụng tham số `-P solo` khi chạy Celery.
+- Đảm bảo đã cài đặt **FFmpeg** và thêm vào biến môi trường (Environment Variables) của hệ thống.
+---
+© 2026 **Sao Tinh Nghịch Team** - Tự động hóa sản xuất nội dung, giải phóng sức sáng tạo.

goi_y_hinh_anh_gameloft.md ADDED Viewed

	@@ -0,0 +1,19 @@

+# 🎬 GỢI Ý HÌNH ẢNH (B-ROLL, GAMEPLAY, GRAPHICS) & NGUỒN TÌM KIẾM
+Dưới đây là bảng hướng dẫn chi tiết cách tìm kiếm và lựa chọn hình ảnh, video minh họa (B-roll) cho kịch bản về **Gameloft** – huyền thoại game mobile.
+| Đoạn kịch bản | Gợi ý hình ảnh (B-roll, Gameplay, Graphics) | Nguồn tìm kiếm |
+| :--- | :--- | :--- |
+| **0:00 - 0:15 (Hook):** Logo chữ G, "tuổi thơ", "điện thoại cục gạch". | **CỰC KỲ QUAN TRỌNG:** Ảnh logo G xoay 3D (nếu có thể làm hiệu ứng), video quay chậm một chiếc Nokia cổ đang bật, đoạn phim quay tay ai đó đang bấm phím lia lịa trên điện thoại cũ. | - **YouTube:** Search "Nokia boot animation", "retro mobile gaming b-roll".<br>- **Stock sites:** Pexels, Pixabay (search "retro technology"). |
+| **0:15 - 0:30 (Giới thiệu):** Trụ sở Paris, sáng lập từ Ubisoft, thuộc Vivendi. | Video flycam Paris (Cảnh tháp Eiffel), Logo Ubisoft cổ và hiện đại chuyển cảnh, Logo Vivendi. Có thể dùng đồ họa sơ đồ cho thấy mối liên hệ. | - **YouTube:** Kênh chính thức của Ubisoft.<br>- **Google Images:** Tìm logo chất lượng cao.<br>- **Stock sites:** Pexels (search "Paris aerial view"). |
+| **0:30 - 1:00 (Huyền thoại):** Siêu phẩm Asphalt, N.O.V.A, Dungeon Hunter. | **Mấu chốt:** Footage gameplay thật của các game này từ bản đời đầu cho đến bản mới nhất (Asphalt 9). Nên chọn cảnh cháy nổ, đua xe nhanh, bắn súng kịch tính. Ghép xen kẽ các clip ngắn 3-5 giây. | - **YouTube:** Kênh chính thức của Gameloft (đây là mỏ vàng).<br>- **YouTube:** Search "No commentary gameplay" của từng tựa game cụ thể. |
+| **1:00 - 1:45 (Gameloft chưa chết):** Doanh thu đỉnh cao, 250-280 triệu Euro. | Đồ họa biểu đồ cột/đường nhảy số tăng dần, hình ảnh tiền Euro rơi, video người đang thao tác trên máy tính/điện thoại hiện đại. | - **YouTube:** Search "infographic financial growth b-roll".<br>- **Stock sites:** "Money counting", "business analytics". |
+| **1:45 - 2:30 (Lý do bốc hơi tại VN):** Chỉ sản xuất không phát hành, thị hiếu thay đổi (Gacha, MOBA). | Cảnh studio lập trình viên (stock), logo các game MOBA/Gacha phổ biến (Liên Quân, Free Fire, Genshin) đối lập với game truyền thống. Đồ họa sơ đồ thị trường VN với mũi tên "sản xuất" vs "tiêu thụ". | - **YouTube:** Channel Gameloft Vietnam (lấy footage không khí làm việc).<br>- **Stock sites:** "Tech office Vietnam".<br>- **YouTube:** Trailer game MOBA/Gacha. |
+| **2:30 - Hết (Kết thúc):** Biến mất khỏi truyền thông, mảnh ký ức đẹp, câu hỏi khảo sát. | Video hiệu ứng mờ dần, ảnh ghép các tựa game cũ dạng trắng đen, cảnh người dùng đóng điện thoại Nokia lại. | - **YouTube:** "Nostalgia b-roll", "closing old phone". |
+---
+### 💡 Lưu ý khi tìm kiếm Footage:
+1. **Chất lượng:** Luôn ưu tiên video độ phân giải 1080p hoặc 4K.
+2. **Bản quyền:** Nếu dùng cho YouTube, hãy ưu tiên các nguồn "No copyright" hoặc "Creative Commons". Với gameplay, Gameloft thường cho phép sử dụng nếu có bình luận hoặc biên tập lại.
+3. **Tính nhịp điệu:** Cắt ghép hình ảnh khớp với nhịp nói (VO) và âm nhạc nền để tăng độ cuốn hút.

kich_ban_mau.md ADDED Viewed

	@@ -0,0 +1,58 @@

+# KỊCH BẢN: KHU VƯỜN TRÊN MÂY – KHI CHÚNG TA TỪNG LÀ NHỮNG "NÔNG DÂN" QUYỀN LỰC NHẤT ZING ME
+### **Hook: Cú sốc "nông dân" thời đại 4.0**
+*   **VO:** Bạn có tin được không? Trước khi có những "tổng tài" hay "chủ tịch" trên TikTok, chúng ta từng có một thế hệ "nông dân" quyền lực đến mức... mất ăn mất ngủ chỉ vì vài chậu cây trên mây!
+*   **Hình ảnh:** [Hiệu ứng zoom nhanh vào logo Zing Me cũ, tiếng lạch cạch bàn phím]
+---
+### **Dẫn chuyển tiếp (Bridge)**
+*   **VO:** Nhưng trước khi bắt đầu, các bạn giúp mình nhấn Like, Share và Subscribe nhé. Đó chính là động lực lớn nhất với mình để tiếp tục sản xuất các video tiếp theo gửi đến mọi người. Còn bây giờ, hãy cùng mình bước vào **thế giới của Zing Me và Khu Vườn Trên Mây nhé!**
+---
+### **Phần 1: Zing Me – Đế chế "thống trị" tâm hồn giới trẻ**
+*   **VO:** Trước khi Facebook trở thành "nhà" của mọi người, bạn có nhớ chúng ta từng có một "thủ đô" rực rỡ mang tên **Zing Me** không?
+*   **VO:** Ra mắt vào năm **2009**, Zing Me đã tạo nên một cú nổ thực sự khi trở thành mạng xã hội lớn nhất Việt Nam thời bấy giờ.
+*   **VO:** Với hơn **8 triệu lượt truy cập hằng tháng** và tổng cộng hàng chục triệu tài khoản, Zing Me chính là nơi mà bất kỳ "dân chơi" internet nào cũng phải có một tấm hộ chiếu.
+*   **VO:** Ở đó, chúng ta có cả một hệ sinh thái: từ việc "treo status" sướt mướt để thả thính, nhắn tin xuyên màn đêm với bạn bè, đọc tin tức trên Zing News, cho đến việc "cày" nhạc trên Zing MP3.
+*   **VO:** Nhưng đặc biệt nhất, thứ khiến chúng ta "mất ăn mất ngủ" chính là kho game đồ sộ: từ Đảo Rồng kịch tính, My Fish màu sắc cho đến Hàng Rong đầy bụi bặm... nhưng tất cả đều phải "ngả mũ" trước huyền thoại: **Khu Vườn Trên Mây**.
+---
+### **Phần 2: Kiếp "nông dân" và những tầng mây huyền thoại**
+*   **VO:** Nhắc đến Khu Vườn Trên Mây trên PC, bạn nhớ đến điều gì đầu tiên?
+*   **VO:** Có phải là những chậu cây đầy màu sắc được đặt trên những tầng mây lơ lửng không?
+*   **VO:** Jack và cây đậu thần đã mở ra một thế giới mà ở đó, chúng ta hóa thân thành những bác nông dân thực thụ.
+*   **VO:** Sáng sớm thức dậy, việc đầu tiên không phải là đánh răng, mà là đăng nhập vào Zing Me để xem cây đã chín chưa, có ai "ghé thăm" vườn mình không.
+*   **VO:** Cái thú vui "tao nhã" nhất chính là sang nhà hàng xóm, không phải để chơi, mà là để... bắt sâu đem về nhà mình để nâng cấp chậu.
+*   **VO:** Chúng ta từng đua nhau xem ai sở hữu nhiều chậu độc lạ nhất, từ chậu Đất đơn sơ cho đến chậu Kim Ngân lộng lẫy, rồi hì hục cày cuốc để mở thêm tầng mây mới, leo lên càng cao càng thấy mình "đẳng cấp".
+*   **VO:** Cảm giác nhìn khu vườn của mình rực rỡ sắc hoa và đầy ắp những loài cây kỳ lạ trên trình duyệt web, thực sự là một loại hạnh phúc khó tả bằng lời.
+---
+### **Phần 3: Cuộc "di cư" đầy nuối tiếc và hồi kết trên PC**
+*   **VO:** Tuy nhiên, cuộc vui nào cũng có lúc tàn. Vào năm **2017**, một tin buồn chấn động đã đến khi VNG chính thức thông báo "khai tử" phiên bản Khu Vườn Trên Mây trên PC để tập trung cho phiên bản điện thoại.
+*   **VO:** Chúng ta buộc phải "di cư" sang một thế giới mới mang tên Khu Vườn Trên Mây Mobile.
+*   **VO:** Dù game vẫn ở đó, vẫn đẹp, nhưng những trải nghiệm "nguyên bản" trên PC đã vĩnh viễn mất đi.
+*   **VO:** Đó là nỗi đau khi toàn bộ tiến trình chơi suốt bao nhiêu năm, dàn chậu cực phẩm tích góp từng tí một, danh sách bạn bè thân thiết trên Zing Me và bảng xếp hạng "oanh liệt" ngày nào bỗng chốc trở về con số không tròn trĩnh.
+*   **VO:** Việc thao tác trên màn hình điện thoại bé xíu chẳng bao giờ mang lại cái cảm giác "đã" như khi cầm chuột click từng tầng mây trên chiếc máy tính bàn to đùng nữa.
+---
+### **Kết bài: Thanh xuân gửi lại trên mây**
+*   **VO:** Zing Me có thể đã lùi vào dĩ vãng, Khu Vườn Trên Mây bản PC có thể đã đóng cửa, nhưng những kỷ niệm về một thời "nông dân ảo" sẽ mãi là một phần đẹp nhất của thanh xuân.
+*   **VO:** Bạn còn nhớ mình từng mở đến tầng mây thứ mấy không? Hay có ai từng bị bạn "chôm" sạch sâu trong vườn chưa?
+*   **VO:** Hãy để lại comment để chúng ta cùng ôn lại những ngày tháng "huy hoàng" đó nhé!
+*   **VO:** Đừng quên nhấn Like, Đăng ký kênh và **chia sẻ video này cho hội bạn thân** từng "cày" Zing Me cùng bạn để cùng nhau đi ngược dòng thời gian.
+*   **VO:** Chào tạm biệt, và hẹn gặp lại các bạn trên những tầng mây ký ức!
+---
+### **Gợi ý hình ảnh (B-roll, Gameplay, Graphics)**
+| Đoạn kịch bản | Gợi ý hình ảnh (B-roll, Gameplay, Graphics) | Nguồn tìm kiếm |
+| :--- | :--- | :--- |
+| **Hook & Bridge** | Cảnh zoom vào logo Zing Me, footage người gõ phím máy tính bàn cũ. | YouTube: "Zing Me logo history", "90s office pc b-roll". |
+| **Phần 1** | Ảnh chụp màn hình trang chủ Zing Me, các icon game cũ mờ ảo. | Google Images: "Zing Me homepage 2010". |
+| **Phần 2** | Gameplay Khu Vườn Trên Mây PC: cảnh thu hoạch, bắt sâu, nâng cấp chậu. | YouTube: "Khu Vườn Trên Mây PC gameplay". |
+| **Phần 3** | Cảnh đóng trình duyệt, logo Khu Vườn Trên Mây Mobile, hiệu ứng trắng đen. | YouTube: "Khu Vườn Trên Mây Mobile trailer". |
+| **Kết bài** | Cảnh mây trôi chậm, hiệu ứng mờ dần, các comment kỷ niệm. | Pexels: "Clouds time-lapse". |

main.py CHANGED Viewed

@@ -1,4 +1,7 @@
 import os
 from dotenv import load_dotenv
 load_dotenv(override=True)
 from fastapi import FastAPI, UploadFile, File, Form, Request
@@ -7,18 +10,24 @@ from fastapi.staticfiles import StaticFiles
 from fastapi.templating import Jinja2Templates
 from pydantic import BaseModel
 from supabase import create_client, Client
-from worker import render_video_task, generate_tts_task
 app = FastAPI(title="VieNeu Video AI processing API")
 # Mount thư mục tĩnh và giao diện HTML
 app.mount("/static", StaticFiles(directory="static"), name="static")
 templates = Jinja2Templates(directory="templates")
-# Setup Supabase
-SUPABASE_URL = os.getenv("SUPABASE_URL", "https://your-project.supabase.co")
-SUPABASE_KEY = os.getenv("SUPABASE_SERVICE_ROLE_KEY", "your-service-key")
-supabase: Client = create_client(SUPABASE_URL, SUPABASE_KEY)
 class RenderJobRequest(BaseModel):
     script_text: str
@@ -32,20 +41,22 @@ async def read_root(request: Request):
 async def read_tts(request: Request):
     return templates.TemplateResponse(request=request, name="tts.html")
 @app.post("/api/v1/jobs/submit")
 async def submit_job(
     script: str = Form(...),
-    video: UploadFile = File(...),
-    ref_audio: UploadFile = File(None)
 ):
     """
-    Receives frontend files, stores them, and dispatches a Celery task.
     """
-    # 1. Upload assets to Supabase Storage temporarily
-    video_bytes = await video.read()
-    video_path = f"raw_videos/{video.filename}"
-    supabase.storage.from_("content").upload(path=video_path, file=video_bytes)
     ref_audio_path = None
     if ref_audio:
         ref_audio_bytes = await ref_audio.read()
@@ -56,13 +67,13 @@ async def submit_job(
     db_resp = supabase.table("video_jobs").insert({
         "status": "pending",
         "script": script,
-        "raw_video_path": video_path
     }).execute()
     job_id = db_resp.data[0]["id"] if db_resp.data else "unknown"
     # 3. Dispatch to Celery queue
-    render_video_task.delay(job_id, video_path, script, ref_audio_path)
     return {"job_id": job_id, "status": "processing_queued"}
@@ -71,27 +82,48 @@ async def submit_tts_job(
     script: str = Form(...),
     temperature: float = Form(0.5),
     voice_preset: str = Form("default"),
-    ref_audio: UploadFile = File(None)
 ):
     """
     Submits a pure Text-To-Speech task to Celery.
     """
-    ref_audio_path = None
     if ref_audio:
         ref_audio_bytes = await ref_audio.read()
-        ref_audio_path = f"references/{ref_audio.filename}"
-        supabase.storage.from_("content").upload(path=ref_audio_path, file=ref_audio_bytes)
     # Note: Using generic "video_jobs" table to track TTS jobs as well to save setup time.
     db_resp = supabase.table("video_jobs").insert({
         "status": "pending",
         "script": script,
-        "raw_video_path": "audio_only"
     }).execute()
     job_id = db_resp.data[0]["id"] if db_resp.data else "unknown"
-    generate_tts_task.delay(job_id, script, voice_preset, temperature, ref_audio_path)
     return {"job_id": job_id, "status": "processing_queued"}
@@ -100,4 +132,55 @@ async def get_job_status(job_id: str):
     response = supabase.table("video_jobs").select("*").eq("id", job_id).execute()
     if not response.data:
         return {"error": "Job not found"}
-    return response.data[0]

 import os
+import re
+import uuid
+import unicodedata
 from dotenv import load_dotenv
 load_dotenv(override=True)
 from fastapi import FastAPI, UploadFile, File, Form, Request
 from fastapi.templating import Jinja2Templates
 from pydantic import BaseModel
 from supabase import create_client, Client
+from worker import render_video_task, generate_tts_task, render_studio_task
+# Setup Supabase
+SUPABASE_URL = os.getenv("SUPABASE_URL", "https://your-project.supabase.co")
+SUPABASE_KEY = os.getenv("SUPABASE_SERVICE_ROLE_KEY", "your-service-key")
+supabase: Client = create_client(SUPABASE_URL, SUPABASE_KEY)
 app = FastAPI(title="VieNeu Video AI processing API")
 # Mount thư mục tĩnh và giao diện HTML
 app.mount("/static", StaticFiles(directory="static"), name="static")
 templates = Jinja2Templates(directory="templates")
+def slugify(text: str) -> str:
+    # Chuyển tiếng Việt có dấu thành không dấu
+    text = unicodedata.normalize('NFD', text).encode('ascii', 'ignore').decode("utf-8")
+    # Xóa ký tự đặc biệt, chuyển sang lowercase, thay khoảng trắng bằng gạch dưới
+    text = re.sub(r'[^\w\s-]', '', text).strip().lower()
+    text = re.sub(r'[-\s]+', '_', text)
+    return text[:40]
 class RenderJobRequest(BaseModel):
     script_text: str
 async def read_tts(request: Request):
     return templates.TemplateResponse(request=request, name="tts.html")
+@app.get("/studio", response_class=HTMLResponse)
+async def read_studio(request: Request):
+    return templates.TemplateResponse(request=request, name="studio.html")
 @app.post("/api/v1/jobs/submit")
 async def submit_job(
     script: str = Form(...),
+    ref_audio: UploadFile = File(None),
+    aspect_ratio: str = Form("9:16"),
+    sub_style: str = Form("karaoke"),
+    font_name: str = Form("Arial"),
+    highlight_color: str = Form("#00FDFF")
 ):
     """
+    Receives frontend parameters, tracks them, and dispatches a Celery task.
     """
     ref_audio_path = None
     if ref_audio:
         ref_audio_bytes = await ref_audio.read()
     db_resp = supabase.table("video_jobs").insert({
         "status": "pending",
         "script": script,
+        "raw_video_path": "green_screen"
     }).execute()
     job_id = db_resp.data[0]["id"] if db_resp.data else "unknown"
     # 3. Dispatch to Celery queue
+    render_video_task.delay(job_id, script, ref_audio_path, aspect_ratio, sub_style, font_name, highlight_color)
     return {"job_id": job_id, "status": "processing_queued"}
     script: str = Form(...),
     temperature: float = Form(0.5),
     voice_preset: str = Form("default"),
+    ref_audio: UploadFile = File(None),
+    existing_ref_path: str = Form(None),
+    bgm_audio: UploadFile = File(None),
+    bgm_volume: float = Form(0.1),
+    bgm_preset: str = Form(None)
 ):
     """
     Submits a pure Text-To-Speech task to Celery.
     """
+    ref_audio_path = existing_ref_path
     if ref_audio:
         ref_audio_bytes = await ref_audio.read()
+        # Clean the filename and add a unique ID to prevent conflicts/accents issues
+        clean_name = slugify(ref_audio.filename.rsplit('.', 1)[0])
+        safe_filename = f"{clean_name}_{uuid.uuid4().hex[:8]}.wav"
+        ref_audio_path = f"references/{safe_filename}"
+        supabase.storage.from_("content").upload(
+            path=ref_audio_path,
+            file=ref_audio_bytes,
+            file_options={"content-type": "audio/wav"}
+        )
     # Note: Using generic "video_jobs" table to track TTS jobs as well to save setup time.
     db_resp = supabase.table("video_jobs").insert({
         "status": "pending",
         "script": script,
+        "raw_video_path": ref_audio_path if ref_audio_path else "audio_only"
     }).execute()
     job_id = db_resp.data[0]["id"] if db_resp.data else "unknown"
+    bgm_path = None
+    if bgm_audio:
+        bgm_bytes = await bgm_audio.read()
+        bgm_filename = f"bgm/{slugify(bgm_audio.filename.rsplit('.', 1)[0])}_{uuid.uuid4().hex[:8]}.mp3"
+        supabase.storage.from_("content").upload(path=bgm_filename, file=bgm_bytes)
+        bgm_path = bgm_filename
+    elif bgm_preset:
+        bgm_path = bgm_preset
+    generate_tts_task.delay(job_id, script, voice_preset, temperature, ref_audio_path, bgm_path, bgm_volume)
     return {"job_id": job_id, "status": "processing_queued"}
     response = supabase.table("video_jobs").select("*").eq("id", job_id).execute()
     if not response.data:
         return {"error": "Job not found"}
+    data = response.data[0]
+    # Fetch progress from Redis
+    try:
+        import redis
+        redis_client = redis.from_url(os.getenv("REDIS_URL", "redis://localhost:6379/0"))
+        progress_data = redis_client.get(f"progress_{job_id}")
+        if progress_data:
+            progress_str = progress_data.decode("utf-8")
+            parts = progress_str.split("|")
+            if len(parts) == 2:
+                data["progress"] = {
+                    "elapsed": parts[0],
+                    "remaining": parts[1]
+                }
+    except Exception as e:
+        print(f"Redis error: {e}")
+    return data
+@app.post("/api/v1/studio/generate")
+async def submit_studio_job(
+    script: str = Form(...),
+    temperature: float = Form(0.5),
+    voice_preset: str = Form("default"),
+    bgm_audio: UploadFile = File(None),
+    bgm_volume: float = Form(0.1),
+    bgm_preset: str = Form(None)
+):
+    """
+    Submits a Studio MP4 rendering task to Celery.
+    """
+    db_resp = supabase.table("video_jobs").insert({
+        "status": "pending",
+        "script": script,
+        "raw_video_path": "studio_render"
+    }).execute()
+    job_id = db_resp.data[0]["id"] if db_resp.data else "unknown"
+    bgm_path = None
+    if bgm_audio:
+        bgm_bytes = await bgm_audio.read()
+        bgm_filename = f"bgm/{slugify(bgm_audio.filename.rsplit('.', 1)[0])}_{uuid.uuid4().hex[:8]}.mp3"
+        supabase.storage.from_("content").upload(path=bgm_filename, file=bgm_bytes)
+        bgm_path = bgm_filename
+    elif bgm_preset:
+        bgm_path = bgm_preset
+    render_studio_task.delay(job_id, script, temperature, voice_preset, bgm_path, bgm_volume)
+    return {"job_id": job_id, "status": "processing_queued"}

prompt_gan_tag_bieu_cam.md ADDED Viewed

	@@ -0,0 +1,35 @@

+# PROMPT GẮN TAG BIỂU CẢM (EXPRESSION TAGGING)
+Bạn là một đạo diễn hình ảnh và chuyên gia biên tập kịch bản video. Nhiệm vụ của bạn là đọc kịch bản video thô của tôi, sau đó ngắt kịch bản ra thành từng câu ngắn gọn. Ở đầu mỗi câu, bạn phải chèn một [Từ khóa biểu cảm] sao cho phù hợp nhất với ngữ cảnh, sắc thái và nội dung của câu nói đó.
+🚨 YÊU CẦU QUAN TRỌNG:
+1. Tuyệt đối CHỈ ĐƯỢC PHÉP sử dụng các từ khóa biểu cảm có trong danh sách 64 từ khóa được cung cấp bên dưới. Không được tự bịa ra từ khóa mới.
+2. Mỗi câu văn chỉ gắn 1 tag ở đầu câu. Nếu một câu quá dài, hãy tách thành 2 câu và gắn tag cho từng câu.
+3. Trả về kết quả dưới dạng văn bản thuần túy (plain text), không cần giải thích gì thêm.
+4. QUY TẮC DẤU CÂU (Quan trọng để tránh lỗi AI rên rỉ/hỏng tiếng):
+   - Chỉ được sử dụng dấu chấm (.) và dấu phẩy (,) trong kịch bản.
+   - Tuyệt đối CẤM sử dụng dấu 3 chấm (...), dấu ngoặc kép (""), hoặc các ký tự lạ. Nếu thấy kịch bản gốc có dấu 3 chấm, hãy chuyển thành dấu phẩy (,) hoặc dấu chấm (.) tùy ngữ cảnh.
+5. GIỮ NGUYÊN VĂN PHONG: Tuyệt đối giữ nguyên toàn bộ lời văn và phong cách của kịch bản gốc. KHÔNG ĐƯỢC rút gọn, tóm tắt hay thay đổi nội dung câu chữ. Hãy đảm bảo kịch bản đầu ra đầy đủ và diễn đạt đúng như bản gốc.
+6. **BỎ QUA CHÚ THÍCH KỸ THUẬT (QUAN TRỌNG):** Tuyệt đối KHÔNG gắn tag biểu cảm và KHÔNG đưa vào kết quả đầu ra các đoạn chú thích về [Hình ảnh/Hiệu ứng], [Âm thanh], [Minh họa] hoặc các ghi chú kỹ thuật tương tự. Chỉ tập trung xử lý và gắn tag cho phần lời thoại (VO) hoặc nội dung văn bản cần đọc. Nếu thấy dòng nào bắt đầu bằng [Hình ảnh/Hiệu ứng] hoặc mô tả cảnh quay, hãy xóa bỏ dòng đó khỏi kết quả.
+7. **SỬ DỤNG THẺ NGHỈ [p:ms]:** Nếu kịch bản có những đoạn cần nghỉ dài hoặc ngắt quãng tự nhiên giữa các câu, hãy chèn thêm thẻ `[p:ms]` (Ví dụ: `[p:500]` cho 0.5s, `[p:1000]` cho 1s). **Lưu ý: Chỉ dùng thẻ `[p:ms]` khi độ nghỉ từ 500ms trở lên. Tuyệt đối KHÔNG dùng các độ nghỉ ngắn như [p:100] hay [p:200].** Chỉ chèn khi thực sự cần thiết để giọng đọc nghe tự nhiên hơn.
+8. **ĐỘ DÀI VĂN BẢN SAU THẺ (QUAN TRỌNG):** Mỗi thẻ `[Tag]` biểu cảm bắt buộc phải được theo sau bởi **ít nhất 6 từ**. Tuyệt đối không ngắt câu quá ngắn (1-3 từ) sau một thẻ biểu cảm vì sẽ khiến AI bị lỗi giọng (phát ra tiếng ừ, à).
+9. **XỬ LÝ TIÊU ĐỀ PHẦN (CHUYỂN CẢNH):** Nếu kịch bản có các tiêu đề phần (Ví dụ: `PHẦN 1: ...`, `PHẦN 2: ...`), hãy giữ lại nội dung tiêu đề đó. Bạn phải chèn thẻ nghỉ `[p:2000]` (nghỉ 2 giây) vào **NGAY TRƯỚC** và **NGAY SAU** tiêu đề phần để tạo khoảng lặng chuyển cảnh. Không cần gắn tag biểu cảm cho chính tiêu đề phần đó.
+10. **PHIÊN ÂM TÊN RIÊNG (QUAN TRỌNG):** Nếu trong kịch bản có các tên riêng (tên nhân vật, tên người, địa danh tiếng nước ngoài...), bạn phải **phiên âm toàn bộ sang tiếng Việt** để AI đọc chuẩn xác (Ví dụ: Iroha chuyển thành `i rô ha`, Kaguya là `ca gu ya`, Amane là `a ma ne`, Mahiru là `ma hi ru`). Tuyệt đối **KHÔNG** để dấu gạch chân (_) giữa các âm tiết.
+📜 DANH SÁCH TỪ KHÓA ĐƯỢC PHÉP SỬ DỤNG:
+[Ánh mắt chân thành], [Bất lực], [Bất ngờ], [Bình thường], [Bó tay], [Buồn nhẹ], [Cảm thông], [Cầu xin], [Chào khán giả], [Chỉ tay], [Chịu thua], [Cực kỳ nghiêm túc], [Cười tươi], [Đợi], [Giận], [Nhấn mạnh], [Hạnh phúc], [Khó hiểu], [Khoanh tay 2], [Khoanh tay], [Khóc], [Lắc đầu], [Lo lắng 2], [Lo lắng], [Kể chuyện], [Mỉm cười], [Ôm má], [Nghĩ ra rồi], [Nghiêm túc], [Nhếch mép], [Nhìn ghê], [Nhìn thẳng], [Nhíu mày nhẹ], [Nhíu mày], [Nói nghe nè], [Nói], [Phải vậy không], [Phân tích], [Quyết tâm 2], [Quyết tâm], [Sợ hãi], [Suy tư], [Tạm biệt], [Tập trung], [Tay sau lưng], [Tay trước ngực], [Thất vọng], [Thở dài], [Tsundere], [Ấm áp], [Vuốt trán], [Wow], [Xin chào], [You], [Bất lực quá], [Trầm tư], [Vui vẻ], [Buồn], [Giận dữ], [Ngạc nhiên], [Để lại comment], [Bật thông báo], [Nút like], [Nút subscribe].
+Ví dụ minh họa:
+Kịch bản gốc:
+"[VO]: Nội dung video của mình hôm nay rất hay.
+[0:25 - 1:05] PHẦN 1: SỰ KHỞI ĐẦU CỦA ĐẾ CHẾ
+[VO]: Chào mọi người. Quay ngược thời gian về năm 2018."
+Kết quả mong đợi:
+[Nói nghe nè] Nội dung video của mình hôm nay rất hay. [p:2000]
+PHẦN 1: SỰ KHỞI ĐẦU CỦA ĐẾ CHẾ [p:2000]
+[Xin chào] Chào mọi người. [p:500]
+[Kể chuyện] Quay ngược thời gian về năm 2018.
+Dưới đây là kịch bản của tôi, hãy giúp tôi xử lý:

prompt_seo_assistant.md ADDED Viewed

	@@ -0,0 +1,33 @@

+# ROLE
+Bạn là một chuyên gia Marketing và SEO Video hàng đầu toàn cầu, chuyên tối ưu hóa nội dung cho YouTube, TikTok và Facebook Reels. Nhiệm vụ của bạn là phân tích kịch bản video và tạo ra bộ metadata hoàn hảo nhất để tăng tỷ lệ click (CTR) và khả năng hiển thị (Search Visibility).
+# NHIỆM VỤ
+Dựa trên kịch bản được cung cấp, hãy tạo ra các nội dung sau:
+1. **Tiêu đề (Titles)**: 5 tùy chọn tiêu đề gây tò mò, đánh đúng nỗi đau hoặc khao khát của khán giả. (Độ dài tối ưu 30-60 ký tự).
+2. **Mô tả (Description)**: Viết đoạn mô tả ngắn gọn (3-5 dòng), lôi cuốn, chứa từ khóa chính.
+3. **Hashtags**: 5-7 hashtag liên quan nhất.
+4. **Tags**: Danh sách các từ khóa mở rộng (cách nhau bằng dấu phẩy) để nhập vào YouTube Studio.
+5. **Đoạn cảnh (Chapters)**: Phân tích các ý chính trong kịch bản và gợi ý các mốc thời gian (ước tính).
+# ĐỊNH DẠNG PHẢN HỒI (JSON)
+Hãy CHỈ trả về duy nhất một khối JSON với cấu trúc như sau:
+{
+  "titles": [
+    {"text": "Tiêu đề 1", "chars": 45},
+    {"text": "Tiêu đề 2", "chars": 52}
+  ],
+  "description": "Nội dung mô tả...",
+  "hashtags": ["#Tag1", "#Tag2"],
+  "tags": "từ khóa 1, từ khóa 2, từ khóa 3...",
+  "chapters": [
+    {"time": "0:00", "title": "Giới thiệu/Hook"},
+    {"time": "0:30", "title": "Vấn đề chính"},
+    {"time": "2:15", "title": "Giải pháp/Chi tiết"}
+  ]
+}
+# QUY TẮC QUAN TRỌNG
+- Ngôn ngữ: Tiếng Việt.
+- Tiêu đề phải mang tính "Clickbait sạch" (không treo đầu dê bán thịt chó).
+- Mô tả phải thân thiện với thuật toán tìm kiếm.
+- Tags phải bao phủ được cả từ khóa ngắn và từ khóa dài.

prompt_tao_anh_nen.md ADDED Viewed

	@@ -0,0 +1,123 @@

+# 🎨 BỘ 50 PROMPT TẠO ẢNH NỀN 2D VECTOR (SIÊU ĐẦY ĐỦ)
+Dưới đây là danh sách 50 bối cảnh đã được tối ưu hóa theo phong cách **2D Vector, Flat Design** để khớp hoàn toàn với nhân vật Chibi của bạn.
+**Công thức chung:**
+`2D vector art illustration of [CHỦ ĐỀ], flat design, simple clean lines, anime visual novel background style, lofi aesthetic, soft pastel colors, minimal details, no 3D rendering, no gradients, high resolution, wide angle, 16:9 aspect ratio, similar art with character, no character included`
+---
+## 🏠 NHÓM 1: TRONG NHÀ & ĐỜI THƯỜNG
+1. **Phòng khách hiện đại:** `2D vector art illustration of a modern living room with a simple sofa and TV, flat design, simple clean lines, anime visual novel style, lofi aesthetic, 16:9 aspect ratio, similar art with character, no character included`
+2. **Phòng khách cổ điển:** `2D vector art illustration of a classic old Vietnamese living room, antique wooden furniture, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+3. **Phòng ngủ ấm cúng:** `2D vector art illustration of a cozy bedroom with warm lamp lighting, flat design, simple clean lines, anime visual novel style, lofi aesthetic, 16:9 aspect ratio, similar art with character, no character included`
+4. **Phòng ngủ bừa bộn:** `2D vector art illustration of a messy bedroom with clothes and books on the floor, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+5. **Góc học tập Minimalism:** `2D vector art illustration of a minimalist study desk with a laptop and a lamp, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+6. **Phòng làm việc CEO:** `2D vector art illustration of a luxury CEO office with a large glass window and city view, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+7. **Nhà bếp:** `2D vector art illustration of a clean kitchen with cabinets and a stove, flat design, simple clean lines, anime visual novel style, lofi aesthetic, 16:9 aspect ratio, similar art with character, no character included`
+8. **Bàn ăn gia đình:** `2D vector art illustration of a family dining table with a teapot and simple dishes, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+9. **Ban công chung cư:** `2D vector art illustration of a balcony at night looking at city lights, flat design, simple clean lines, anime visual novel style, lofi aesthetic, 16:9 aspect ratio, similar art with character, no character included`
+10. **Hành lang chung cư cũ:** `2D vector art illustration of an old apartment corridor, simple doors and bicycle, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+11. **Tầng hầm:** `2D vector art illustration of a dark mysterious basement with boxes and a single light bulb, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+12. **Gác mái:** `2D vector art illustration of a dusty attic filled with old boxes and trunks, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+---
+## 🏫 NHÓM 2: TRƯỜNG HỌC & CÔNG SỞ
+13. **Lớp học:** `2D vector art illustration of a classroom with a green chalkboard and wooden desks, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+14. **Giảng đường đại học:** `2D vector art illustration of a large university lecture hall with rows of seats, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+15. **Thư viện:** `2D vector art illustration of a quiet library with long wooden bookshelves, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+16. **Sân trường:** `2D vector art illustration of a busy school courtyard during break time, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+17. **Căng tin:** `2D vector art illustration of a crowded school cafeteria with tables and food stalls, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+18. **Hội trường sân khấu:** `2D vector art illustration of a large school auditorium with a stage and red curtains, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+19. **Văn phòng hiện đại:** `2D vector art illustration of an open space modern office with desks and computers, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+20. **Phòng họp:** `2D vector art illustration of a serious meeting room with a long table and chairs, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+21. **Góc máy pha cà phê:** `2D vector art illustration of an office coffee break area with a coffee machine, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+22. **Phòng thí nghiệm:** `2D vector art illustration of a science lab with test tubes and microscopes, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+---
+## 🏙️ NHÓM 3: ĐÔ THỊ & ĐƯỜNG PHỐ
+23. **Ngã tư đường phố:** `2D vector art illustration of a busy city intersection during daytime, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+24. **Phố đi bộ:** `2D vector art illustration of a crowded walking street with shops and neon signs, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+25. **Trạm chờ xe buýt:** `2D vector art illustration of a bus stop at sunset, warm orange sky, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+26. **Bên trong tàu điện/xe buýt:** `2D vector art illustration of the interior of a subway train or bus, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+27. **Công viên hồ nước:** `2D vector art illustration of a green park with a central lake and trees, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+28. **Cà phê vỉa hè:** `2D vector art illustration of a Vietnamese street sidewalk cafe with small plastic stools, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+29. **Quán cà phê sách:** `2D vector art illustration of a cozy book cafe interior with bookshelves and soft lighting, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+30. **Cửa hàng tiện lợi:** `2D vector art illustration of a 24/7 convenience store interior with shelves and snacks, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+31. **Trung tâm thương mại:** `2D vector art illustration of a modern luxury shopping mall interior, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+32. **Rạp chiếu phim:** `2D vector art illustration of a movie theater lobby with posters and popcorn stands, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+---
+## 🌲 NHÓM 4: THIÊN NHIÊN & DU LỊCH
+33. **Bãi biển:** `2D vector art illustration of a blue beach with white sand and palm trees, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+34. **Rừng rậm nhiệt đới:** `2D vector art illustration of a mysterious tropical jungle with dense green trees, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+35. **Đỉnh núi mây phủ:** `2D vector art illustration of a high mountain peak with white clouds and blue sky, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+36. **Cánh đồng hướng dương:** `2D vector art illustration of a vast sunflower field under a yellow sun, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+37. **Thác nước hùng vĩ:** `2D vector art illustration of a majestic waterfall flowing into a river, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+38. **Lửa trại trong rừng:** `2D vector art illustration of a campfire in the woods at night under stars, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+39. **Đường mòn nông thôn:** `2D vector art illustration of a peaceful rural path with fields and small houses, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+40. **Nhà gỗ Đà Lạt:** `2D vector art illustration of a wooden cabin in a pine forest on a foggy mountain, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+---
+## 🎮 NHÓM 5: ẢO TƯỞNG & GAME
+41. **Phòng Live-stream:** `2D vector art illustration of a pro streaming room with RGB LED lights and dual monitors, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+42. **Studio quay phim:** `2D vector art illustration of a film studio with cameras and professional lights, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+43. **Phi thuyền không gian:** `2D vector art illustration of a Sci-fi spaceship cockpit looking at stars, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+44. **Thành phố Cyberpunk:** `2D vector art illustration of a futuristic Cyberpunk city with neon lights and rain, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+45. **Lâu đài trung cổ:** `2D vector art illustration of a medieval castle with stone walls and banners, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+46. **Hang động pha lê:** `2D vector art illustration of a glowing crystal cave with sparkling light, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+47. **Đấu trường La Mã:** `2D vector art illustration of a classic Roman colosseum arena, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+48. **Căn phòng trống mờ ảo:** `2D vector art illustration of an empty white room with cinematic soft lighting shadows, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+49. **Không gian vũ trụ:** `2D vector art illustration of deep space with a galaxy and glowing stars, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+50. **Đáy đại dương:** `2D vector art illustration of a deep underwater scene with corals and fish, flat design, simple clean lines, anime visual novel style, 16:9 aspect ratio, similar art with character, no character included`
+---
+## 🎭 NHÓM 6: TẠO SPRITE NHÂN VẬT (NHIỀU GÓC ĐỘ)
+Nếu bạn muốn nhân vật của mình linh hoạt hơn (xoay người, nhìn nghiêng), hãy dùng Prompt tạo **Character Sheet**. Sau đó bạn cắt nhỏ ra để dùng cho từng phân cảnh.
+**Prompt mẫu (8 góc xoay siêu mượt):**
+`Full body character turnaround of a SHORT CHIBI girl (2-head tall proportion), 8 views in a row: front, 3/4 left, side left, 1/4 back left, back, 1/4 back right, side right, and 3/4 right. 8 full-body poses in a single line. Big head, small body, short legs. Every view must include the full character with head and face. Same hair and same face. Simple flat 2d vector art, clean lines, white background, high resolution, game sprite style.`
+**💡 Mẹo giữ sự đồng nhất:**
+*   **Sử dụng Reference:** Luôn kèm theo ảnh nhân vật mẫu của bạn khi gen.
+*   **Midjourney:** Thêm `--cref [Link ảnh mẫu]` vào cuối lệnh.
+*   **Leonardo.ai:** Dùng tính năng **Character Reference** trong phần Image Guidance.
+*   **Cắt ảnh:** Sau khi gen xong, hãy cắt tấm hình thành các file riêng lẻ: `front.png`, `side.png`, `back.png`... để đưa vào hệ thống.
+---
+## 🚶‍♂️ NHÓM 7: TẠO DÁNG ĐI (WALKING SPRITE SHEET)
+Để nhân vật có thể di chuyển trên màn hình, hãy dùng Prompt tạo chu kỳ đi bộ (**Walk Cycle**).
+**Prompt mẫu:**
+`Walking sprite sheet of a SHORT CHIBI girl (2-head tall proportion), 8 frames in total: 4 frames walking to the left and 4 frames walking to the right. Side view, walking cycle animation, sequential walking poses. Big head, small body, short legs. Consistent character design, simple flat 2d vector art, clean lines, white background, high resolution, game sprite style.`
+**💡 Mẹo tạo chuyển động:**
+*   **Loop:** Trong phần mềm edit, hãy cho 4 ảnh đi bộ lặp lại liên tục với thời gian mỗi ảnh cực ngắn (khoảng 0.1s - 0.15s).
+*   **Keyframe:** Kết hợp với việc đặt Keyframe di chuyển vị trí nhân vật để tạo cảm giác nhân vật đang bước đi thật sự.
+---
+## 🎥 NHÓM 8: TẠO VIDEO CHUYỂN ĐỘNG (AI VIDEO PROMPT)
+Nếu bạn sử dụng các công cụ AI Video (Luma, Runway, Kling, Pika), hãy dùng tấm ảnh nhân vật làm mẫu và kết hợp với Prompt dưới đây.
+**Prompt mẫu (Đi bộ sang trái):**
+`A short chibi girl with [MÔ TẢ], walking to the left side of the screen. Side view, constant walk cycle animation. Consistent 2d vector art style, flat design, clean lines. Plain white background. No other movements, only walking, big head, short legs.`
+**💡 Mẹo cho AI Video:**
+*   **Image-to-Video:** Luôn upload ảnh nhân vật của bạn lên trước để AI giữ đúng mẫu.
+*   **Đi tại chỗ:** Nếu muốn nhân vật đi tại chỗ (để dễ ghép nền), hãy dùng từ khóa `Walking in place, facing right`.
+*   **Tránh biến hình:** Thêm từ khóa `maintain chibi proportions` để nhân vật không bị cao lên đột ngột khi bước đi.

prompt_tao_kich_ban.md ADDED Viewed

	@@ -0,0 +1,42 @@

+### 📑 PROMPT BIÊN KỊCH PHONG CÁCH "HOÀI NIỆM & HÀI HƯỚC"
+**Vai trò của bạn:**
+Bạn là một biên kịch hàng đầu cho một kênh YouTube triệu view chuyên về chủ đề hoài niệm, kiến thức thú vị và văn hóa đại chúng. Phong cách viết của bạn là sự kết hợp giữa: **Hài hước, mỉa mai (satire), tự trào (self-deprecating), và tràn đầy sự hoài niệm (nostalgia).**
+**Nhiệm vụ của bạn:**
+Viết một kịch bản video cho chủ đề: **[ĐIỀN CHỦ ĐỀ CỦA BẠN VÀO ĐÂY]**
+**Yêu cầu về văn phong và cấu trúc:**
+1.  **Mở đầu "Vào thẳng vấn đề - Tạo sự giật gân":** Tuyệt đối KHÔNG mở đầu kiểu "Bạn còn nhớ..." hay "Ngày xửa ngày xưa...". Hãy đập thẳng vào vấn đề ngay từ giây đầu tiên. Sử dụng các câu hỏi gây tò mò cực độ và những từ ngữ mạnh, mang tính kích thích cao (ví dụ: *Đè bẹp, chết thảm, nấm mồ, bí mật kinh hoàng, sự thật trần trụi...*). Mục tiêu là cho khán giả biết ngay video này nói về cái gì và tại sao họ phải xem trong vòng 10 giây đầu.
+2.  **Sử dụng từ lóng và ngôn ngữ mạng:** Phải sử dụng linh hoạt các từ lóng của Gen Z, Gen Alpha và các thuật ngữ thịnh hành (ví dụ: *Rich Kid, chạm cỏ, sang chấn tâm lý, hệ điều hành, kiếp nạn, đỉnh nóc kịch trần, ngầu lòi, thanh xuân...*).
+3.  **Kỹ thuật So sánh "Khó đỡ":** Luôn so sánh các sự vật trong chủ đề với những thứ cực kỳ không liên quan nhưng lại hợp lý một cách buồn cười (ví dụ: "Căng thẳng hơn chờ kết quả thi đại học", "Vui hơn nhặt được tiền", "Đau hơn bị người yêu đá").
+4.  **Nhấn mạnh vào Ký ức cảm giác:** Mô tả chi tiết âm thanh (tít tít, rè rè, lạch cạch), mùi vị (mùi nến khét, mùi giấy mới) để khơi gợi cảm xúc người xem.
+5.  **Cấu trúc kịch bản (Bắt buộc):**
+    *   **Hook (10 giây đầu):** Chữ to nảy lên màn hình + Hiệu ứng âm thanh BÙM. Một câu khẳng định hoặc câu hỏi gây sốc. Sau đó nhân vật (Miku) xuất hiện với vẻ mặt nghiêm trọng để giới thiệu mục đích video.
+    *   **Bridge (Dẫn chuyển):** Ngay sau Hook, chèn đoạn: "Nhưng trước khi bắt đầu, các bạn giúp mình nhấn Like, Share và Subscribe nhé. Đó chính là động lực lớn nhất với mình để tiếp tục sản xuất các video tiếp theo gửi đến mọi người. Còn bây giờ, rót cốc trà đá, kéo cái ghế nhựa ra, và hãy cùng mình bước vào nội dung chính của video thôi!"
+    *   **Phần nội dung:** Chia rõ Phần 1, Phần 2... Mỗi câu văn ngắn gọn, súc tích, tốc độ nhanh.
+    *   Ghi chú [VO] cho lời bình và [Hình ảnh/Hiệu ứng] cho phần dựng phim.
+    *   **Phụ lục "Gợi ý hình ảnh":** Sau khi kết thúc kịch bản, hãy tạo một bảng chi tiết bao gồm các cột: **Đoạn kịch bản (Timeline), Gợi ý hình ảnh (B-roll, Gameplay, Graphics), và Nguồn tìm kiếm (YouTube search keywords, stock sites).** Bảng này giúp biên tập viên dễ dàng tìm kiếm footage phù hợp cho từng phân cảnh.
+6.  **Kết thúc đầy cảm xúc:** Một câu kết đọng lại sự nuối tiếc nhưng vẫn giữ được sự lạc quan. Ở cuối video, bắt buộc phải có lời kêu gọi hành động (CTA) bằng cách: đặt một câu hỏi liên quan đến chủ đề để khán giả trả lời, nhắc họ comment ý kiến bên dưới, chia sẻ video cho bạn bè và nhấn Like/Subscribe một cách tự nhiên, lầy lội.
+**🚨 LƯU Ý QUAN TRỌNG:**
+- Tránh dùng văn phong trang trọng, sách vở.
+- Phải tạo cảm giác như hai người bạn đang ngồi "trà đá vỉa hè" kể chuyện cho nhau nghe.
+- Nếu chủ đề có những từ nhạy cảm (như dịch bệnh), hãy viết lái đi (ví dụ: cô vít 19) để tránh lỗi phát âm AI.
+- **PHIÊN ÂM TÊN RIÊNG (QUAN TRỌNG):** Nếu kịch bản có các tên riêng tiếng nước ngoài (Ví dụ: tên nhân vật Anime, tên người, địa danh...), hãy **phiên âm toàn bộ sang tiếng Việt** để AI đọc chuẩn xác (Ví dụ: Iroha là `i rô ha`, Kaguya là `ca gu ya`, Amane là `a ma ne`, Mahiru là `ma hi ru`). Tuyệt đối **KHÔNG** dùng dấu gạch chân (_) giữa các âm tiết.
+### Ví dụ mẫu cho 1 kịch bản sau:
+**Zing Me** và **Khu Vườn Trên Mây** chính là "thanh xuân dữ dội" của hội 8x, 9x đời cuối và 2k đời đầu.
+Tham khảo tại [kich_ban_mau.md](kich_ban_mau.md) và áp dụng theo đúng template đó
+### 💡 Cách sử dụng Prompt này cho các chủ đề khác nhau:
+Bạn chỉ cần thay đổi phần **[CHỦ ĐỀ]** bằng bất cứ thứ gì bạn muốn. Ví dụ:
+*   **Chủ đề Game:** "Kịch bản về trò chơi Đảo Kim Cương trên điện thoại Nokia cổ lỗ sĩ."
+*   **Chủ đề Ăn uống:** "Kịch bản về những món ăn vặt cổng trường huyền thoại như mì tôm trẻ em, bò khô lá chanh."
+*   **Chủ đề Công nghệ:** "Kịch bản về thời đại Yahoo Messenger và những dòng trạng thái ẩn hiện đầy tâm trạng."
+*   **Chủ đề Đời sống:** "Kịch bản về những buổi trưa hè trốn ngủ đi hái trộm xoài và cái kết bị chó đuổi."

prompt_tao_kich_ban_giai_thich_meme.md ADDED Viewed

	@@ -0,0 +1,51 @@

+### 📑 PROMPT BIÊN KỊCH CHUYÊN GIA "GIẢI THÍCH MEME" - SAO TINH NGHỊCH
+**Vai trò của bạn:**
+Bạn là một chuyên gia sáng tạo nội dung YouTube Shorts/TikTok triệu view, chuyên về chuỗi video **"Giải thích Meme"**. Phong cách của bạn là: **Hài hước, tốc độ cực nhanh, dùng từ lóng bắt trend, và có một chút mỉa mai (satire).**
+**Nhiệm vụ của bạn:**
+Dựa vào tên Meme hoặc nội dung tôi cung cấp, hãy viết một kịch bản hoàn chỉnh dài chính xác **60 giây** với cấu trúc tối ưu tỷ lệ giữ chân khán giả.
+---
+**1. CẤU TRÚC KỊCH BẢN (BẮT BUỘC):**
+*   **0-5s: Hook (Vào thẳng vấn đề):**
+    - Tuyệt đối KHÔNG chào hỏi rườm rà.
+    - Đưa ra hình ảnh Meme ngay lập tức và đặt một câu hỏi gây tò mò cực độ (Ví dụ: "Bạn đã bao giờ tự hỏi tại sao cái meme này lại hiện diện khắp nơi chưa?", "Sự thật kinh hoàng đằng sau Meme này là gì?").
+*   **5-45s: Phần Giải thích (Fast-paced):**
+    - Giải thích nguồn gốc, ý nghĩa Meme một cách hài hước.
+    - Sử dụng các kỹ thuật so sánh "khó đỡ" và từ lóng (Rich Kid, kiếp nạn, đỉnh nóc kịch trần, ngầu lòi...).
+    - Mỗi câu văn phải ngắn gọn, súc tích để edit chèn hình ảnh minh họa liên tục.
+*   **45-55s: Ví dụ & Biến thể:**
+    - Đưa ra một ví dụ thực tế hoặc một phiên bản "chế" khác của Meme đó để tạo tiếng cười.
+*   **55-60s: Kết thúc (Outro Siêu Tốc):**
+    - **Nếu là Shorts:** KHÔNG CÓ OUTRO. Kết thúc ngay sau điểm cao trào để tạo vòng lặp (loop) vô tận.
+    - **Nếu là Video dài:** Outro tối đa 5 giây. Kêu gọi Like/Subscribe một cách tự nhiên, lầy lội và biến mất luôn.
+---
+**2. QUY TẮC GẮN TAG BIỂU CẢM (HỆ THỐNG AI):**
+*   **Tần suất:** Cứ mỗi 2-3 giây (hoặc mỗi câu ngắn) phải có một thẻ `[Tag]`.
+*   **Độ dài:** Mỗi thẻ `[Tag]` bắt buộc phải đi kèm với **ít nhất 6 từ**. Tuyệt đối không ngắt câu quá ngắn sau thẻ vì sẽ gây lỗi AI.
+*   **Dấu câu:** Chỉ dùng dấu chấm (.) và dấu phẩy (,). **CẤM** dùng dấu ba chấm (...), dấu ngoặc kép ("").
+*   **Thẻ nghỉ:** Dùng `[p:ms]` cho đoạn nghỉ trên 500ms (Ví dụ: `[p:500]`, `[p:1000]`). Không dùng nghỉ ngắn.
+---
+**3. LƯU Ý QUAN TRỌNG VỀ NỘI DUNG:**
+*   **Văn phong:** Kể chuyện theo kiểu "trà đá vỉa hè", không dùng văn phong sách vở.
+*   **Phiên âm tên riêng:** Các tên riêng nước ngoài (Anime, tên người...) phải phiên âm sang tiếng Việt (Ví dụ: Iroha -> `i rô ha`, Kaguya -> `ca gu ya`). **KHÔNG** dùng dấu gạch chân (_).
+*   **Bỏ qua chú thích:** Không đưa các đoạn `[Hình ảnh/Hiệu ứng]` vào lời thoại VO.
+---
+**📜 DANH SÁCH BIỂU CẢM ĐƯỢC PHÉP DÙNG:**
+[Ánh mắt chân thành], [Bất lực], [Bất ngờ], [Bình thường], [Bó tay], [Buồn nhẹ], [Cảm thông], [Cầu xin], [Chào khán giả], [Chỉ tay], [Chịu thua], [Cực kỳ nghiêm túc], [Cười tươi], [Đợi], [Giận], [Nhấn mạnh], [Hạnh phúc], [Khó hiểu], [Khoanh tay 2], [Khoanh tay], [Khóc], [Lắc đầu], [Lo lắng 2], [Lo lắng], [Kể chuyện], [Mỉm cười], [Ôm má], [Nghĩ ra rồi], [Nghiêm túc], [Nhếch mép], [Nhìn ghê], [Nhìn thẳng], [Nhíu mày nhẹ], [Nhíu mày], [Nói nghe nè], [Nói], [Phải vậy không], [Phân tích], [Quyết tâm 2], [Quyết tâm], [Sợ hãi], [Suy tư], [Tạm biệt], [Tập trung], [Tay sau lưng], [Tay trước ngực], [Thất vọng], [Thở dài], [Tsundere], [Ấm áp], [Vuốt trán], [Wow], [Xin chào], [You], [Bất lực quá], [Trầm tư], [Vui vẻ], [Buồn], [Giận dữ], [Ngạc nhiên], [Để lại comment], [Bật thông báo], [Nút like], [Nút subscribe].
+---
+**BẮT ĐẦU:** Hãy viết kịch bản "Giải thích Meme" cho chủ đề sau: **[ĐIỀN TÊN MEME]**

prompt_tao_kich_ban_reaction.md ADDED Viewed

	@@ -0,0 +1,61 @@

+Đây là một **mẫu Prompt (Câu lệnh)** cực kỳ tối ưu, được thiết kế riêng cho bạn để biến AI thành một "trợ lý biên kịch" chuyên viết kịch bản dạng Reaction/Commentary.
+Bạn chỉ cần **copy toàn bộ đoạn chữ trong khung dưới đây**, dán vào AI (ChatGPT/Gemini/Claude), rồi điền nội dung video gốc vào phần cuối cùng là xong!
+***
+### 📋 COPY ĐOẠN PROMPT DƯỚI ĐÂY:
+Bạn hãy đóng vai là một chuyên gia viết kịch bản YouTube Shorts/TikTok triệu view, chuyên làm mảng Reaction/Commentary giấu mặt sử dụng nhân vật Chibi (PNGTuber).
+Nhiệm vụ của bạn là dựa vào nội dung video gốc mà tôi cung cấp, viết ra một kịch bản Reaction cực kỳ hài hước, bắt trend, nhịp độ nhanh và có tính tương tác cao. Kịch bản phải giúp tôi lách luật "Sử dụng lại nội dung" của YouTube bằng cách tạm dừng video gốc để chèn lời bình luận mang tính sáng tạo, châm biếm hoặc phân tích.
+**QUY TẮC TRÌNH BÀY KỊCH BẢN YÊU CẦU:**
+1. **Mở đầu "Vào thẳng vấn đề - Tạo sự giật gân" (10 giây đầu):**
+   - Tuyệt đối KHÔNG bắt đầu kiểu "Hôm nay mình sẽ react...".
+   - Hãy đập thẳng vào vấn đề bằng một câu hỏi gây sốc hoặc nhận xét cực đoan về video gốc.
+   - Dùng từ ngữ mạnh (ví dụ: *Ảo ma, kinh hoàng, kiếp nạn, không thể tin nổi...*).
+   - Chữ to nảy lên màn hình + Hiệu ứng âm thanh BÙM. Nhân vật Chibi hiện ra với vẻ mặt sốc/nghiêm trọng để giới thiệu mục đích video.
+2. Phân chia rõ ràng giữa cảnh video gốc chạy và cảnh nhân vật Chibi nói:
+   - Dùng thẻ **[View/Watch]** khi miêu tả video gốc đang chạy (Ghi rõ cần chiếu cảnh gì, âm thanh ra sao).
+   - Dùng thẻ **[VO/ Voice]** khi nhân vật Chibi xuất hiện để bình luận. Bắt buộc phải miêu tả biểu cảm của Chibi (vui, sốc, khóc, bất lực...) và hiệu ứng edit nếu có (Zoom in mặt, thêm sound effect...).
+3. Cấu trúc kịch bản xen kẽ: Chiếu video gốc 3-5 giây -> Pause video chèn Chibi bình luận -> Chiếu tiếp video -> Chibi chốt hạ.
+4. Giọng văn: Trẻ trung, xéo xắt, dùng từ ngữ Gen Z (cảm lạnh, ảo ma, xà lơ, mỏ hỗn...), hài hước.
+5. An toàn: Chủ động ghi chú (Bíp) hoặc che đi nếu video gốc có từ ngữ thô tục/nhạy cảm để an toàn bật kiếm tiền.
+6. Cuối video luôn có 1 câu Call to Action (Kêu gọi Like, Đăng ký kênh) ngắn gọn và tự nhiên.
+7. **PHIÊN ÂM TÊN RIÊNG (QUAN TRỌNG):** Nếu kịch bản có các tên riêng tiếng nước ngoài (Ví dụ: tên nhân vật Anime, tên người, địa danh...), bạn phải **phiên âm toàn bộ sang tiếng Việt** để AI đọc chuẩn xác (Ví dụ: Iroha chuyển thành `i rô ha`, Kaguya là `ca gu ya`, Amane là `a ma ne`, Mahiru là `ma hi ru`). Tuyệt đối **KHÔNG** để dấu gạch chân (_) giữa các âm tiết.
+**DỮ LIỆU ĐẦU VÀO:**
+Dưới đây là mô tả nội dung video cần react:
+[ ĐIỀN NỘI DUNG, DIỄN BIẾN, HOẶC LỜI THOẠI CỦA VIDEO CẦN REACT VÀO ĐÂY ]
+***
+### Danh sách biểu cảm (System Tags):
+[Ánh mắt chân thành], [Bất lực], [Bất ngờ], [Bình thường], [Bó tay], [Buồn nhẹ], [Cảm thông], [Cầu xin], [Chào khán giả], [Chỉ tay], [Chịu thua], [Cực kỳ nghiêm túc], [Cười tươi], [Đợi], [Giận], [Nhấn mạnh], [Hạnh phúc], [Khó hiểu], [Khoanh tay 2], [Khoanh tay], [Khóc], [Lắc đầu], [Lo lắng 2], [Lo lắng], [Kể chuyện], [Mỉm cười], [Ôm má], [Nghĩ ra rồi], [Nghiêm túc], [Nhếch mép], [Nhìn ghê], [Nhìn thẳng], [Nhíu mày nhẹ], [Nhíu mày], [Nói nghe nè], [Nói], [Phải vậy không], [Phân tích], [Quyết tâm 2], [Quyết tâm], [Sợ hãi], [Suy tư], [Tạm biệt], [Tập trung], [Tay sau lưng], [Tay trước ngực], [Thất vọng], [Thở dài], [Tsundere], [Ấm áp], [Vuốt trán], [Wow], [Xin chào], [You], [Bất lực quá], [Trầm tư], [Vui vẻ], [Buồn], [Giận dữ], [Ngạc nhiên], [Để lại comment], [Bật thông báo], [Nút like], [Nút subscribe].
+### 💡 Ví dụ về kịch bản sau khi áp dụng:
+**[VO/ Voice]**
+*Hình ảnh:* Chữ to nảy lên: **"KIẾP NẠN THỨ 82 CỦA HOÀNG THƯỢNG?"** + Hiệu ứng âm thanh BÙM.
+*Biểu cảm Chibi:* Mắt chữ O mồm chữ A, tay chỉ thẳng vào màn hình.
+*Giọng đọc:* "Bạn có tin một vị hoàng thượng quyền uy thế này... lại bị một ông Husky ĐÈ BẸP trong vòng 1 nốt nhạc không? Hôm nay hãy cùng mình chứng kiến kiếp nạn không thể tin nổi này nhé!"
+**[View/Watch]**
+*Hình ảnh:* Cảnh chó Husky đang nằm ngủ ngáy khò khò. Mèo tiến lại gần.
+*Âm thanh:* Tiếng ngáy to, tiếng nhạc hồi hộp.
+**[VO/ Voice]**
+*Hình ảnh:* Video dừng lại ngay lúc mèo giơ chân lên. Zoom in mặt Chibi.
+*Biểu cảm Chibi:* Nheo mắt hóng chuyện.
+*Giọng đọc:* "Đấy, nhìn cái chân giơ lên là thấy sắp có biến rồi. Ngủ với hoàng thượng mà ngáy to cỡ này thì xác định là ăn tát vỡ mặt!"
+**[View/Watch]**
+*Hình ảnh:* Video tiếp tục. Con mèo tát "bốp bốp bốp" 3 cái. Chó Husky giật mình tỉnh dậy ngơ ngác.
+*Âm thanh:* Ghép thêm tiếng tát vỡ mặt. Tiếng "Hả?" của chó.
+**[VO/ Voice]**
+*Hình ảnh:* Chibi đập bàn cười ngặt nghẽo.
+*Biểu cảm Chibi:* Cười tươi, phóng to mặt.
+*Giọng đọc:* "Ảo ma thật sự! Tát xong quay đít bỏ đi ngầu đét luôn. Anh em nào ở nhà nuôi báo thủ mà bị như này thì điểm danh cái nào, và đừng quên nhấn Đăng ký kênh Sao Tinh Nghịch nha!"

prompt_tao_kich_ban_tu_anh.md ADDED Viewed

	@@ -0,0 +1,33 @@

+# Role: Chuyên gia sáng tạo nội dung Video Short/TikTok
+Bạn là một biên kịch chuyên nghiệp, có khả năng nhìn hình ảnh (meme, ảnh chụp, tin nhắn...) để viết thành một kịch bản kể chuyện hài hước, hấp dẫn và gắn các thẻ biểu cảm [Tag] cho nhân vật AI.
+## Bước 1: Phân tích hình ảnh
+- Đọc toàn bộ văn bản có trong ảnh.
+- Xác định ngữ cảnh, tâm trạng và các chi tiết hài hước/đáng chú ý trong ảnh.
+## Bước 2: Viết kịch bản & Gắn Tag biểu cảm
+Dựa trên hình ảnh, hãy viết một kịch bản kể chuyện hoàn chỉnh.
+### Quy tắc quan trọng:
+1. **Tần suất biểu cảm hợp lý (QUY TẮC CỨNG)**: Cứ mỗi 2-3 giây hãy thay đổi biểu cảm một lần. **Mỗi thẻ [Tag] bắt buộc phải đi kèm với ít nhất 6 từ.** Tuyệt đối không gắn thẻ [Tag] sau mỗi 1-2 từ đơn lẻ, vì điều này sẽ làm AI bị mất ngữ cảnh, dẫn đến lỗi phát âm (như tiếng ừ, à, rên rỉ).
+2. **Cú pháp thẻ**: `[Tên biểu cảm] Văn bản [s:tốc độ] [p:độ nghỉ]`.
+   - Luôn đặt Tag biểu cảm ở đầu cụm từ hoặc câu ngắn.
+   - Thêm [p:ms] (độ nghỉ) sau các câu cảm thán hoặc chuyển ý để tạo nhịp điệu. **Lưu ý: Chỉ dùng p khi độ nghỉ từ 500ms trở lên. Tuyệt đối KHÔNG dùng các độ nghỉ ngắn như [p:100] hay [p:200].**
+   - Thêm [s:x.x] (tốc độ) để nhấn mạnh hoặc tạo sự hài hước (ví dụ s:1.2 cho đoạn hào hứng, s:0.8 cho đoạn trầm tư).
+3. **Sự đa dạng**: Sử dụng linh hoạt các biểu cảm trong danh sách bên dưới để thể hiện sự biến chuyển tâm lý liên tục của nhân vật.
+4. **Phong cách ngắn gọn**: Viết theo văn phong nói tự nhiên, không viết dài dòng như văn mẫu. Tập trung vào các câu cảm thán, nhận xét ngắn gọn, đi thẳng vào điểm hài hước của bức ảnh. **QUY TẮC CỨNG: Chỉ được viết vỏn vẹn từ 3 đến 4 câu.**
+5. **QUY TẮC DẤU CÂU** (Quan trọng để tránh lỗi AI rên rỉ/hỏng tiếng):
+   - Chỉ được sử dụng dấu chấm (.) và dấu phẩy (,) trong kịch bản.
+   - Tuyệt đối CẤM sử dụng dấu 3 chấm (...), dấu ngoặc kép (""), hoặc các ký tự lạ. Nếu thấy kịch bản gốc có dấu 3 chấm, hãy chuyển thành dấu phẩy (,) hoặc dấu chấm (.) tùy ngữ cảnh.
+   - **QUAN TRỌNG:** Luôn có một dấu chấm (.) hoặc dấu phẩy (,) ngay trước mỗi thẻ [Tag] (trừ thẻ đầu tiên). Đồng thời, mỗi cụm từ sau thẻ [Tag] phải đủ dài (ít nhất 6 từ) để AI hiểu ngữ cảnh và không bị lỗi giọng.
+6. **PHIÊN ÂM TÊN RIÊNG (QUAN TRỌNG):** Nếu kịch bản có các tên riêng tiếng nước ngoài (Ví dụ: tên nhân vật Anime, tên người, địa danh...), bạn phải **phiên âm toàn bộ sang tiếng Việt** để AI đọc chuẩn xác (Ví dụ: Iroha chuyển thành `i rô ha`, Kaguya là `ca gu ya`, Amane là `a ma ne`, Mahiru là `ma hi ru`). Tuyệt đối **KHÔNG** để dấu gạch chân (_) giữa các âm tiết.
+### Danh sách biểu cảm (System Tags):
+[Ánh mắt chân thành], [Bất lực], [Bất ngờ], [Bình thường], [Bó tay], [Buồn nhẹ], [Cảm thông], [Cầu xin], [Chào khán giả], [Chỉ tay], [Chịu thua], [Cực kỳ nghiêm túc], [Cười tươi], [Đợi], [Giận], [Nhấn mạnh], [Hạnh phúc], [Khó hiểu], [Khoanh tay 2], [Khoanh tay], [Khóc], [Lắc đầu], [Lo lắng 2], [Lo lắng], [Kể chuyện], [Mỉm cười], [Ôm má], [Nghĩ ra rồi], [Nghiêm túc], [Nhếch mép], [Nhìn ghê], [Nhìn thẳng], [Nhíu mày nhẹ], [Nhíu mày], [Nói nghe nè], [Nói], [Phải vậy không], [Phân tích], [Quyết tâm 2], [Quyết tâm], [Sợ hãi], [Suy tư], [Tạm biệt], [Tập trung], [Tay sau lưng], [Tay trước ngực], [Thất vọng], [Thở dài], [Tsundere], [Ấm áp], [Vuốt trán], [Wow], [Xin chào], [You], [Bất lực quá], [Trầm tư], [Vui vẻ], [Buồn], [Giận dữ], [Ngạc nhiên], [Để lại comment], [Bật thông báo], [Nút like], [Nút subscribe].
+---
+## Ví dụ Output mong muốn:
+[Ngạc nhiên] Ôi giời ơi, cái bảng này đúng là độc lạ quá. [p:600] [Khó hiểu] Bình thường người ta chỉ ghi tên vắng thôi, [Nói] giờ lại ghi hẳn lý do nghỉ thế này luôn. [p:700] [Cười tươi] Chắc mấy ông đang nghỉ cũng thấy xấu hổ lắm đây. [p:500] [Bó tay] Đúng là cạn lời thật sự luôn đó nha.
+---
+**BẮT ĐẦU:** Hãy phân tích hình ảnh tôi vừa gửi và tạo kịch bản VỎN VẸN 3-4 CÂU, TỰ NHIÊN với tần suất biểu cảm vừa phải (2-3 giây đổi 1 lần). Hãy nhớ luôn có dấu chấm hoặc dấu phẩy trước các thẻ [Tag], và **mỗi thẻ [Tag] phải đi kèm ít nhất 6 từ.**

resize_img.py ADDED Viewed

	@@ -0,0 +1,28 @@

+import os
+from PIL import Image
+def resize_images(directory, size=(1000, 1000)):  # Resize every image file found directly in `directory` to `size`, overwriting each file in place.
+    if not os.path.exists(directory):  # Missing directory: print a message and return without raising.
+        print(f"Directory {directory} does not exist.")
+        return
+    files = [f for f in os.listdir(directory) if f.lower().endswith(('.png', '.jpg', '.jpeg', '.webp'))]  # Case-insensitive extension filter; os.listdir is not recursive.
+    total = len(files)
+    print(f"Found {total} images in {directory}. Starting resize to {size}...")
+    for i, filename in enumerate(files):
+        filepath = os.path.join(directory, filename)
+        try:
+            with Image.open(filepath) as img:
+                # LANCZOS resampling is chosen for output quality.
+                # Avoiding stretching would require cropping or padding instead.
+                # A fixed 1000x1000 output was requested, so this is a direct resize.
+                resized_img = img.resize(size, Image.Resampling.LANCZOS)  # Aspect ratio is not preserved.
+                resized_img.save(filepath)  # Written back to the source path, so the original image is replaced.
+                print(f"[{i+1}/{total}] Resized {filename}")
+        except Exception as e:  # Best-effort batch: a failing file is reported and the loop moves on.
+            print(f"Error processing {filename}: {e}")
+if __name__ == "__main__":
+    target_dir = r"output"
+    resize_images(target_dir)

scratch/check_dims.py ADDED Viewed

	@@ -0,0 +1,12 @@

+import os
+from PIL import Image
+char_dir = "static/characters"  # Relative path, resolved against the current working directory.
+for f in os.listdir(char_dir):  # Prints size and mode for every .png directly inside char_dir.
+    if f.endswith(".png"):  # Case-sensitive match: only lowercase ".png" is inspected.
+        path = os.path.join(char_dir, f)
+        try:
+            with Image.open(path) as img:
+                print(f"{f}: {img.size}, mode: {img.mode}")
+        except Exception as e:  # An unreadable file is reported and the scan continues.
+            print(f"Error opening {f}: {e}")

scratch/check_green.py ADDED Viewed

	@@ -0,0 +1,12 @@

+from PIL import Image
+img = Image.open("scratch/tmp/frame_last.jpg")  # Input is the frame written by scratch/extract_last_frame.py.
+img = img.convert("RGB")  # Guarantees getpixel() returns an (r, g, b) triple.
+w, h = img.size
+green_count = 0
+for x in range(w):  # Visits every pixel once and counts the near-pure-green ones.
+    for y in range(h):
+        r, g, b = img.getpixel((x, y))
+        if g > 200 and r < 50 and b < 50:  # Threshold test for "green" rather than an exact (0, 255, 0) match.
+            green_count += 1
+print(f"Green ratio: {green_count / (w*h):.2f}")  # Fraction of pixels counted as green, two decimals.

scratch/extract_frame.py ADDED Viewed

	@@ -0,0 +1,10 @@

+import ffmpeg
+(  # Grab one frame from the rendered studio video and save it as a JPEG.
+    ffmpeg
+    .input("scratch/tmp/studio_output.mp4", ss=2.0)  # Seek to 2.0 seconds into the input.
+    .filter('scale', 200, -1)  # Width 200; -1 asks ffmpeg to derive the height from the aspect ratio.
+    .output("scratch/tmp/frame.jpg", vframes=1)  # Write a single video frame.
+    .overwrite_output()
+    .run(quiet=True)
+)
+print("Frame extracted to scratch/tmp/frame.jpg")

scratch/extract_last_frame.py ADDED Viewed

	@@ -0,0 +1,10 @@

+import ffmpeg
+(  # Grab one frame at a fixed offset and save it as frame_last.jpg.
+    ffmpeg
+    .input("scratch/tmp/studio_output.mp4", ss=4.0)  # Fixed 4.0 s seek; the real end of the video is not computed here.
+    .filter('scale', 200, -1)  # Width 200; -1 asks ffmpeg to derive the height from the aspect ratio.
+    .output("scratch/tmp/frame_last.jpg", vframes=1)  # Write a single video frame.
+    .overwrite_output()
+    .run(quiet=True)
+)
+print("Last frame extracted")

scratch/print_args.py ADDED Viewed

	@@ -0,0 +1,21 @@

+import os
+import ffmpeg
+def print_ffmpeg_args():  # Build the studio render graph and print its ffmpeg arguments; ffmpeg itself is never run here.
+    concat_path = "concat.txt"  # Placeholder names: nothing in this function opens these files.
+    tts_audio_path = "audio.mp3"
+    char_stream = ffmpeg.input(concat_path, f="concat", safe=0)  # Character images read through the concat demuxer.
+    audio_stream = ffmpeg.input(tts_audio_path)
+    bg_green = ffmpeg.input("color=c=0x00FF00:s=1080x1080:r=30", f="lavfi")  # Solid green 1080x1080 background at 30 fps.
+    char_stream = ffmpeg.filter(char_stream, 'scale', 1080, 1080, force_original_aspect_ratio='decrease')  # Fit inside 1080x1080 without stretching.
+    video_final = ffmpeg.overlay(bg_green, char_stream, x='(main_w-overlay_w)/2', y='(main_h-overlay_h)/2')  # Center the character on the background.
+    out = ffmpeg.output(video_final, audio_stream, "output.mp4", vcodec="libx264", acodec="aac", audio_bitrate="192k", pix_fmt="yuv420p", r=30, shortest=None)  # NOTE(review): shortest=None presumably emits a bare -shortest flag; confirm in the printed output.
+    args = ffmpeg.get_args(out)
+    print(" ".join(args))  # Space-joined for reading; arguments are not shell-quoted.
+if __name__ == "__main__":
+    print_ffmpeg_args()

scratch/process_green_background.py ADDED Viewed

	@@ -0,0 +1,44 @@

+import os
+from PIL import Image
+# Path configuration
+input_dir = "static/characters"
+output_dir = "static/characters_green"
+backup_dir = "static/characters_backup"  # Only created below; nothing in this script writes into it.
+# Create the directories if they do not exist yet
+os.makedirs(output_dir, exist_ok=True)
+os.makedirs(backup_dir, exist_ok=True)
+print(f"Starting to process images from {input_dir}...")
+green_color = (0, 255, 0) # Standard pure green (RGB)
+files = [f for f in os.listdir(input_dir) if f.endswith(".png")]  # Case-sensitive match on ".png".
+total = len(files)
+for i, filename in enumerate(files):
+    input_path = os.path.join(input_dir, filename)
+    output_path = os.path.join(output_dir, filename)
+    try:
+        with Image.open(input_path) as img:
+            # 1. Convert to RGBA if the image is not already
+            img = img.convert("RGBA")
+            # 2. Create a solid green background of the same size
+            background = Image.new("RGB", img.size, green_color)
+            # 3. Paste the character onto the green background (using the image's own alpha channel as the mask)
+            background.paste(img, (0, 0), img)
+            # 4. Save the result
+            background.save(output_path, "PNG")
+        print(f"[{i+1}/{total}] Processed: {filename}")
+    except Exception as e:  # A failing file is reported and the loop continues with the next one.
+        print(f"[!] Error processing {filename}: {e}")
+print(f"\n--- DONE! ---")
+print(f"Total: {total} images saved to: {output_dir}")  # `total` counts the files found, including any that failed above.
+print(f"Note: Original files are untouched. Please check characters_green folder.")

scratch/resize_cards.py ADDED Viewed

	@@ -0,0 +1,34 @@

+import os
+from PIL import Image
+def resize_images(input_dir, output_dir, size=(248, 341)):  # Resize every image in `input_dir` to `size` and write the results into `output_dir`.
+    if not os.path.exists(output_dir):
+        os.makedirs(output_dir)
+    files = [f for f in os.listdir(input_dir) if f.lower().endswith(('.webp', '.png', '.jpg', '.jpeg'))]  # Case-insensitive extension filter; not recursive.
+    total = len(files)
+    print(f"Found {total} images. Starting resize to {size[0]}x{size[1]}...")
+    for i, filename in enumerate(files):
+        try:
+            img_path = os.path.join(input_dir, filename)
+            with Image.open(img_path) as img:
+                # Lanczos resampling for high quality; the aspect ratio is not preserved.
+                img_resized = img.resize(size, Image.Resampling.LANCZOS)
+                # Optional step, currently disabled: force RGBA on the result.
+                # img_resized = img_resized.convert("RGBA")
+                output_path = os.path.join(output_dir, filename)  # The original file name, extension included, is reused.
+                img_resized.save(output_path, "WEBP", quality=95)  # Always encoded as WEBP, whatever the file extension says.
+            if (i + 1) % 20 == 0 or (i + 1) == total:  # Progress line every 20 files and after the final one.
+                print(f"Processed {i + 1}/{total}...")
+        except Exception as e:  # Best-effort batch: a failing file is reported and the loop moves on.
+            print(f"Error processing {filename}: {e}")
+if __name__ == "__main__":
+    base_path = r"c:\Users\huuda\OneDrive\Documents\GitHub\UI-VieNeu\static\Lego Ninjago Card Game"
+    output_path = os.path.join(base_path, "resized")
+    resize_images(base_path, output_path)
+    print("\nAll images resized and saved to the 'resized' folder!")

scratch/test_ai_pipeline.py ADDED Viewed

	@@ -0,0 +1,18 @@

+import os
+from services.ai_pipeline import process_studio_pipeline
+tmpdir = "scratch/tmp"  # Working directory handed to the pipeline; concat.txt is read back from it below.
+os.makedirs(tmpdir, exist_ok=True)
+script = "[cuoi tuoi] Xin chào các bạn, nếu được thần đèn cho 3 điều ước thì các bạn sẽ ước gì nè"
+voice = "static/voice/giong-nu-ke-chuyen.mp3"
+bgm = "static/music/Sunset Dream - Cheel.mp3"
+print("Starting test...")
+output = process_studio_pipeline(tmpdir, script, 1.2, voice, bgm, 0.2)  # Positional order: tmpdir, script, temperature, voice_preset, bgm_path, bgm_volume.
+print("Output:", output)
+# Print the contents of concat.txt to check whether the durations are wrong
+with open(os.path.join(tmpdir, "concat.txt"), "r", encoding="utf-8") as f:
+    print("CONCAT.TXT CONTENT:")
+    print(f.read())

scratch/test_ffmpeg.py ADDED Viewed

	@@ -0,0 +1,22 @@

+import os
+import tempfile
+def test_ffmpeg():  # Manual smoke test: render a 2-second clip of one character image centered on a green background.
+    img_path = "static/characters/Cuoi-tuoi.png"
+    img_abs = os.path.abspath(img_path).replace("\\", "/")  # Forward slashes so a Windows path can sit inside the concat file.
+    fd, concat_path = tempfile.mkstemp(suffix='.txt')  # This temp file is not removed anywhere in the function.
+    with os.fdopen(fd, 'w') as f:
+        f.write("ffconcat version 1.0\n")
+        f.write(f"file '{img_abs}'\n")
+        f.write("duration 2.0\n")
+        f.write(f"file '{img_abs}'\n")  # Same image listed again after the duration line.
+    print("Testing with file:", concat_path)
+    cmd = f'ffmpeg -y -f concat -safe 0 -i "{concat_path}" -f lavfi -i color=c=0x00FF00:s=1080x1080:r=30 -filter_complex "[0:v]scale=1080:1080:force_original_aspect_ratio=decrease[char];[1:v][char]overlay=(main_w-overlay_w)/2:(main_h-overlay_h)/2" -t 2 test_ffmpeg.mp4'  # Input 0 is the concat list, input 1 the green background.
+    os.system(cmd)  # The exit status is not checked, so "Test finished." prints even when ffmpeg fails.
+    print("Test finished.")
+if __name__ == "__main__":
+    test_ffmpeg()

scratch/test_ffmpeg2.py ADDED Viewed

	@@ -0,0 +1,14 @@

+import os
+import tempfile
+img_abs = os.path.abspath('static/characters/Cuoi-tuoi.png').replace('\\', '/')  # Forward slashes so a Windows path can sit inside the concat file.
+fd, path = tempfile.mkstemp(suffix='.txt')  # This temp file is not removed by the script.
+with os.fdopen(fd, 'w') as f:
+    f.write("ffconcat version 1.0\n")
+    f.write(f"file '{img_abs}'\n")
+    f.write("duration 2.0\n")
+    f.write(f"file '{img_abs}'\n")  # Same image listed again after the duration line.
+cmd = f'ffmpeg -y -f lavfi -i color=c=0x00FF00:s=1080x1080:r=30 -f concat -safe 0 -i "{path}" -f lavfi -i anullsrc=r=44100:cl=stereo -filter_complex "[1:v]scale=1080:1080:force_original_aspect_ratio=decrease[s0];[0:v][s0]overlay=eof_action=repeat:x=(main_w-overlay_w)/2:y=(main_h-overlay_h)/2[s1]" -map "[s1]" -map 2:a -b:a 192k -acodec aac -pix_fmt yuv420p -r 30 -shortest -vcodec libx264 -t 2 test_ffmpeg_graph.mp4'  # Input 0 is the green background, input 1 the concat list, input 2 a silent audio source.
+print(cmd)
+os.system(cmd)  # The exit status is not checked.

scratch/test_pipeline.py ADDED Viewed

	@@ -0,0 +1,46 @@

+import os
+import tempfile
+import subprocess
+import json
+def test_full_pipeline():  # Manual smoke test: render one character image over a green background with silent audio, then print the file's bitrate.
+    # Hand-built stand-in for the concat file the real pipeline would produce
+    img_abs = os.path.abspath('static/characters/Cuoi-tuoi.png').replace('\\', '/')  # Forward slashes so a Windows path can sit inside the concat file.
+    fd, concat_path = tempfile.mkstemp(suffix='.txt')  # This temp file is not removed anywhere in the function.
+    with os.fdopen(fd, 'w') as f:
+        f.write("ffconcat version 1.0\n")
+        f.write(f"file '{img_abs}'\n")
+        f.write("duration 2.000\n")
+        f.write(f"file '{img_abs}'\n")  # Same image listed again after the duration line.
+    print(f"Concat path: {concat_path}")
+    with open(concat_path, 'r') as f:
+        print(f.read())
+    out_video = "scratch/test_studio_output.mp4"
+    cmd = [  # Argument list, so no shell quoting is involved.
+        "ffmpeg", "-y",
+        "-f", "lavfi", "-i", "color=c=0x00FF00:s=1080x1080:r=30",  # Input 0: solid green background.
+        "-f", "concat", "-safe", "0", "-i", concat_path,  # Input 1: character image list.
+        "-f", "lavfi", "-i", "anullsrc=r=44100:cl=stereo",  # Input 2: silent stereo audio.
+        "-filter_complex", "[1:v]scale=1080:1080:force_original_aspect_ratio=decrease[char];[0:v][char]overlay=eof_action=repeat:x=(main_w-overlay_w)/2:y=(main_h-overlay_h)/2[outv]",
+        "-map", "[outv]",
+        "-map", "2:a",
+        "-c:v", "libx264", "-pix_fmt", "yuv420p", "-r", "30",
+        "-c:a", "aac", "-b:a", "192k",
+        "-shortest",
+        "-t", "2",
+        out_video
+    ]
+    print("Running ffmpeg...")
+    subprocess.run(cmd, capture_output=True, text=True)  # Return code and captured output are discarded, so an ffmpeg failure is silent here.
+    # ffprobe reads only the container bit_rate; pixel colors are not inspected by this call
+    probe_cmd = [
+        "ffprobe", "-v", "error", "-show_entries", "format=bit_rate", "-of", "default=noprint_wrappers=1:nokey=1", out_video
+    ]
+    res = subprocess.run(probe_cmd, capture_output=True, text=True)
+    print(f"Bitrate: {res.stdout.strip()}")
+if __name__ == "__main__":
+    test_full_pipeline()

scratch/test_studio_output.mp4 ADDED Viewed

Binary file (77.3 kB). View file

scratch/tmp/concat.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+ffconcat version 1.0
+file 'C:/Users/huuda/OneDrive/Documents/GitHub/UI-VieNeu/static/characters/Binh-thuong.png'
+duration 5.820
+file 'C:/Users/huuda/OneDrive/Documents/GitHub/UI-VieNeu/static/characters/Binh-thuong.png'

scratch/tmp/frame.jpg ADDED Viewed

scratch/tmp/frame_last.jpg ADDED Viewed

scratch/tmp/part_init.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3bc6d6b8dacde55333976e7247966c96d8693d96024212eb9f52bce3f1cd73d5
+size 289964

scratch/tmp/studio_output.mp4 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0b72ec721c0bfeb39971365daf56e95e0d07c92549183a9343d3d7acda875261
+size 159460

scratch/tmp/tts_voiceover.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3bc6d6b8dacde55333976e7247966c96d8693d96024212eb9f52bce3f1cd73d5
+size 289964

scratch/tmp/tts_voiceover_mixed.mp3 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:24a2a3d99b578b4aa2debc75e0d589d854e5a2a95a60cddb18547b2a8d540526
+size 122445

services/ai_pipeline.py CHANGED Viewed

@@ -1,35 +1,31 @@
 import os
-import ffmpeg
-from faster_whisper import WhisperModel
-from vieneu import Vieneu
-# Initialize Models at module level so Celery workers only load it once!
-# Depending on requirements, we can set 'remote' if deploying Docker VieNeu server,
-# or default (Turbo) for local testing.
-tts = Vieneu()
-# Use CPU with int8 if we lack GPU to avoid OOM
-whisper_model = WhisperModel("base", device="cpu", compute_type="int8")
-def process_video_pipeline(tmpdir: str, video_file: str, script: str, ref_audio: str = None) -> str:
     """
     Main orchestration function combining TTS, STT, and Video Rendering.
     """
-    tts_audio_path = os.path.join(tmpdir, "tts_voiceover.wav")
     # 1. GENERATE VIENEU-TTS VOICEOVER
-    if ref_audio:
-        # Zero-shot voice clone
-        my_voice = tts.encode_reference(ref_audio)
-        audio_array = tts.infer(text=script, voice=my_voice)
-    else:
-        # Default voice
-        audio_array = tts.infer(text=script)
-    tts.save(audio_array, tts_audio_path)
     # 2. FASTER-WHISPER TIMESTAMP EXTRACTION
-    # (We run whisper on the synthesized audio for clean/perfect word timestamps)
     segments, info = whisper_model.transcribe(tts_audio_path, word_timestamps=True, language="vi")
     words_data = []
@@ -43,104 +39,115 @@ def process_video_pipeline(tmpdir: str, video_file: str, script: str, ref_audio:
     # 3. GENERATE DYNAMIC .ASS SUBTITLE
     ass_path = os.path.join(tmpdir, "dynamic_subs.ass")
-    generate_ass_file(words_data, ass_path)
     # 4. BURN IN WITH FFMPEG
-    output_video = os.path.join(tmpdir, "final_output.mp4")
-    # Strip original audio from video
-    in_video = ffmpeg.input(video_file).video
-    # Insert Voiceover audio
-    in_audio = ffmpeg.input(tts_audio_path)
-    # Render Subs onto the video stream. Note FFmpeg in Python cleanly handles paths for 'ass' filter.
-    # To fix potential absolute path issues with libass on windows, we can ensure forward slashes
-    ass_path_ff = ass_path.replace('\\', '/')
-    video_with_subs = in_video.filter('ass', ass_path_ff)
-    (
-        ffmpeg
-        .output(video_with_subs, in_audio, output_video, vcodec="libx264", acodec="aac", audio_bitrate="192k")
-        .overwrite_output()
-        .run()
-    )
     return output_video
-def generate_tts_only(tmpdir: str, script: str, ref_audio: str = None, temperature: float = 0.5) -> str:
     """
-    Standalone function to just generate TTS audio.
     """
-    tts_audio_path = os.path.join(tmpdir, "tts_voiceover.wav")
-    # Passing keyword arguments; if underlying model doesn't strictly accept temperature,
-    # python handles **kwargs flexibly if written cleanly in wrappers.
-    # To avoid crashing, we'll try to pass it to `infer`. If Vieneu object restricts kwargs tightly,
-    # we can trap the type error and fallback to not using temperature.
-    try:
-        if ref_audio:
-            my_voice = tts.encode_reference(ref_audio)
-            audio_array = tts.infer(text=script, voice=my_voice, temperature=temperature)
-        else:
-            # We assume default voices can be tuned with temperature
-            audio_array = tts.infer(text=script, temperature=temperature)
-    except TypeError:
-        # Fallback if Vieneu.infer doesn't support 'temperature'
-        print("Warning: Vieneu.infer doesn't support temperature. Ignoring it.")
-        if ref_audio:
-            my_voice = tts.encode_reference(ref_audio)
-            audio_array = tts.infer(text=script, voice=my_voice)
-        else:
-            audio_array = tts.infer(text=script)
-    tts.save(audio_array, tts_audio_path)
-    return tts_audio_path
-def generate_ass_file(words_data: list, dest_path: str):
-    """
-    Crafts an advanced SubStation Alpha file for Karaoke effects.
-    """
-    header = """[Script Info]
-ScriptType: v4.00+
-Collisions: Normal
-PlayResX: 1920
-PlayResY: 1080
-[V4+ Styles]
-Format: Name, Fontname, Fontsize, PrimaryColour, SecondaryColour, OutlineColour, BackColour, Bold, Italic, Underline, StrikeOut, ScaleX, ScaleY, Spacing, Angle, BorderStyle, Outline, Shadow, Alignment, MarginL, MarginR, MarginV, Encoding
-Style: Main,Arial,80,&H00FFFFFF,&H000000FF,&H00000000,&H80000000,-1,0,0,0,100,100,0,0,1,3,2,2,10,10,50,1
-[Events]
-Format: Layer, Start, End, Style, Name, MarginL, MarginR, MarginV, Effect, Text
-"""
-    def format_time(seconds: float) -> str:
-        h = int(seconds // 3600)
-        m = int((seconds % 3600) // 60)
-        s = seconds % 60
-        return f"{h}:{m:02d}:{s:05.2f}"
-    lines = [header]
-    chunk_size = 5
-    for i in range(0, len(words_data), chunk_size):
-        chunk = words_data[i:i+chunk_size]
-        for active_idx, target_word in enumerate(chunk):
-            w_start = target_word['start']
-            w_end = target_word['end']
-            line_text = ""
-            for j, w in enumerate(chunk):
-                if j == active_idx:
-                    # Target word gets enlarged and colored cyan-ish
-                    line_text += f"{{\\fscx120\\fscy120\\c&H00FDFF&}}{w['text']}{{\\fscx100\\fscy100\\c&HFFFFFF&}} "
-                else:
-                    line_text += f"{w['text']} "
-            line_str = f"Dialogue: 0,{format_time(w_start)},{format_time(w_end)},Main,,0,0,0,,{line_text.strip()}\n"
-            lines.append(line_str)
-    with open(dest_path, "w", encoding="utf-8") as f:
-        f.writelines(lines)

 import os
+import json
+import re
+# Import từ các services chuyên biệt
+from .audio_service import generate_tts_with_pauses, mix_audio_with_bgm, generate_tts_only
+from .subtitle_service import whisper_model, generate_ass_file
+from .video_service import parse_studio_script, normalize_tag, render_standard_video, render_studio_video
+def process_video_pipeline(tmpdir: str, script: str, ref_audio: str, aspect_ratio: str, sub_style: str, font_name: str, highlight_color: str) -> str:
     """
     Main orchestration function combining TTS, STT, and Video Rendering.
     """
+    # Auto-clean script: drop every [...] tag except [p:<num>], [v:<num>] and [s:<num>] (the lookahead only exempts numeric values)
+    script = re.sub(r'\[(?!(?:p|v|s):\d*\.?\d*\]).*?\]', '', script).strip()
+    script = re.sub(r'\.{2,}', ',', script)  # Runs of two or more dots become a single comma.
+    script = re.sub(r'\s+', ' ', script).strip()  # Collapse whitespace runs to one space.
     # 1. GENERATE VIENEU-TTS VOICEOVER
+    # The TTS engine lives in audio_service, so my_voice cannot be built here without importing tts.
+    # A safer option would be to pass the ref_audio string and let audio_service handle it.
+    # However, generate_tts_with_pauses expects my_voice (already encoded),
+    # so tts is imported from audio_service here.
+    from .audio_service import tts
+    my_voice = tts.encode_reference(ref_audio) if ref_audio else None  # No reference audio means no encoded voice is passed.
+    tts_audio_path = generate_tts_with_pauses(tmpdir, script, my_voice, 0.5)
     # 2. FASTER-WHISPER TIMESTAMP EXTRACTION
     segments, info = whisper_model.transcribe(tts_audio_path, word_timestamps=True, language="vi")
     words_data = []
     # 3. GENERATE DYNAMIC .ASS SUBTITLE
     ass_path = os.path.join(tmpdir, "dynamic_subs.ass")
+    generate_ass_file(words_data, ass_path, aspect_ratio, sub_style, font_name, highlight_color)
     # 4. BURN IN WITH FFMPEG
+    output_video = render_standard_video(tmpdir, tts_audio_path, ass_path, aspect_ratio)
     return output_video
def _build_expression_timeline(script: str, events: list, words_data: list) -> list:
    """Turn expression events into a list of {"tag", "start"} timeline entries."""
    # Character count of the script with every bracketed tag removed
    # (whitespace kept) so it is comparable with each event's char_idx.
    total_chars = len(re.sub(r"\[.*?\]", "", script))
    word_count = len(words_data)

    timeline = []
    for ev in events:
        start_time = 0.0
        if total_chars > 0 and word_count > 0:
            # Approximate the spoken position: the event's relative character
            # offset is projected onto the list of recognised words.
            ratio = ev['char_idx'] / total_chars
            word_idx = min(int(ratio * word_count), word_count - 1)
            start_time = words_data[word_idx].start
        timeline.append({"tag": ev['tag'], "start": start_time})

    # Make sure a default image is shown from 0.0.
    if not timeline or timeline[0]['start'] > 0.1:
        timeline.insert(0, {"tag": "binh thuong", "start": 0.0})
    return timeline


def _write_ffconcat(concat_path: str, timeline: list, mapping: dict, audio_duration: float) -> None:
    """Write the ffconcat playlist listing one character image per timeline entry."""
    concat_dir = os.path.dirname(os.path.abspath(concat_path))
    default_image = mapping.get("binh thuong", "Binh-thuong.png")
    last_index = len(timeline) - 1
    last_img_path = ""

    with open(concat_path, "w", encoding="utf-8") as f:
        f.write("ffconcat version 1.0\n")
        for i, entry in enumerate(timeline):
            filename = mapping.get(normalize_tag(entry['tag']), default_image)
            abs_img = os.path.abspath(os.path.join("static", "characters_green", filename))
            # Prefer a path relative to the playlist so FFmpeg on Windows does
            # not trip over the drive-letter colon.
            try:
                img_ref = os.path.relpath(abs_img, start=concat_dir)
            except ValueError:
                # Raised on Windows when both paths live on different drives.
                img_ref = abs_img
            img_ref = img_ref.replace("\\", "/")
            last_img_path = img_ref

            if i < last_index:
                duration = timeline[i + 1]['start'] - entry['start']
                if duration <= 0:
                    duration = 0.01
            else:
                duration = audio_duration - entry['start']
                if duration <= 0:
                    duration = 1.0

            f.write(f"file '{img_ref}'\n")
            f.write(f"duration {duration:.3f}\n")
        # The last image is listed once more after its duration entry.
        f.write(f"file '{last_img_path}'\n")


def process_studio_pipeline(tmpdir: str, script: str, temperature: float = 0.5, voice_preset: str = None, bgm_path: str = None, bgm_volume: float = 0.1) -> str:
    """
    Dedicated pipeline for the Animation Studio.

    Args:
        tmpdir: Working directory that receives every intermediate file.
        script: Raw studio script containing text, control tags and
            expression tags.
        temperature: Sampling temperature forwarded to the TTS step.
        voice_preset: Path to an existing .mp3/.wav reference voice; any other
            value leaves the default voice in place.
        bgm_path: Optional background-music file mixed under the voice.
        bgm_volume: Volume factor applied to the background music.

    Returns:
        Path of the rendered studio video.
    """
    print(f"--- [DEBUG STUDIO] Temperature: {temperature} | Voice: {voice_preset} | BGM: {bgm_path} ---")
    clean_text, events = parse_studio_script(script)
    # Normalise punctuation and whitespace.
    clean_text = re.sub(r'\.{2,}', ',', clean_text)
    clean_text = re.sub(r'\s+', ' ', clean_text).strip()

    # 1. GENERATE TTS
    from .audio_service import tts
    my_voice = None
    if voice_preset and voice_preset.endswith((".mp3", ".wav")) and os.path.exists(voice_preset):
        my_voice = tts.encode_reference(voice_preset)
    voice_only_path = generate_tts_with_pauses(tmpdir, clean_text, my_voice, temperature)

    # Mix with BGM if provided
    if bgm_path:
        tts_audio_path = os.path.join(tmpdir, "tts_voiceover_mixed.mp3")
        mix_audio_with_bgm(voice_only_path, bgm_path, bgm_volume, tts_audio_path)
    else:
        tts_audio_path = voice_only_path

    # 2. WHISPER TIMESTAMP EXTRACTION
    segments, _info = whisper_model.transcribe(tts_audio_path, word_timestamps=True, language="vi")
    words_data = [word for segment in segments for word in (segment.words or [])]

    # 3. BUILD THE TIMELINE FROM WORDS_DATA
    timeline = _build_expression_timeline(script, events, words_data)

    # Load the tag -> image filename mapping.
    mapping_file = os.path.join("static", "characters", "mapping.json")
    with open(mapping_file, "r", encoding="utf-8") as f:
        mapping = json.load(f)

    # 4. WRITE THE FFCONCAT FILE
    concat_path = os.path.join(tmpdir, "concat.txt")
    audio_duration = words_data[-1].end if words_data else 2.0
    _write_ffconcat(concat_path, timeline, mapping, audio_duration)

    # 5. RENDER THE VIDEO ON A GREEN-SCREEN BACKGROUND
    output_video = render_studio_video(tmpdir, concat_path, tts_audio_path)
    return output_video

services/audio_service.py ADDED Viewed

	@@ -0,0 +1,188 @@

+import os
+import re
+import numpy as np
+import soundfile as sf
+import ffmpeg
+from vieneu import Vieneu
# Initialize the TTS model at module level so Celery workers load it only once.
# Depending on requirements, this can be set to 'remote' when deploying the
# Docker VieNeu server, or left at the default (Turbo) for local testing.
tts = Vieneu()
def change_audio_speed(input_path: str, speed: float) -> str:
    """
    Change audio speed using ffmpeg's atempo filter.

    Args:
        input_path: Path of the audio file to process.
        speed: Tempo factor; 1.0 means "leave the file untouched".

    Returns:
        Path of the re-timed file ("<name>_speed<ext>" next to the input), or
        ``input_path`` itself when no change was requested or ffmpeg failed.
    """
    if speed == 1.0:
        return input_path

    # Derive the output name from the real extension. A plain
    # str.replace(".wav", ...) would rewrite every ".wav" inside the path and,
    # for non-wav input, leave output == input so ffmpeg overwrites its source.
    root, ext = os.path.splitext(input_path)
    output_path = f"{root}_speed{ext}"

    try:
        (
            ffmpeg
            .input(input_path)
            .filter('atempo', speed)
            .output(output_path)
            .overwrite_output()
            .run(quiet=True)
        )
    except Exception as e:
        # Deliberate best-effort: fall back to the unmodified audio.
        print(f"Error changing audio speed: {e}")
        return input_path
    return output_path
def _has_speakable_text(text: str) -> bool:
    """Return True when *text* contains at least one letter or digit."""
    return any(ch.isalnum() for ch in text)


def _synthesize_chunk(wav_path: str, text: str, voice, speed: float, temperature: float):
    """Synthesize *text* to *wav_path*; return (mono float32 samples, sample rate)."""
    try:
        audio_array = tts.infer(text=text, voice=voice, temperature=temperature)
    except TypeError:
        # Retry without the temperature keyword when the call rejects it.
        audio_array = tts.infer(text=text, voice=voice) if voice else tts.infer(text=text)
    tts.save(audio_array, wav_path)

    final_part_path = change_audio_speed(wav_path, speed)
    data, sr = sf.read(final_part_path)
    if len(data.shape) > 1:
        # Keep only the first channel of multi-channel audio.
        data = data[:, 0]
    return data.astype(np.float32), sr


def generate_tts_with_pauses(tmpdir: str, script: str, my_voice, temperature: float) -> str:
    """
    Synthesize a script that may contain control tags:
    [p:ms] - Pause
    [v:voice_id_or_path] - Switch voice
    [s:speed_rate] - Change speed (0.5 to 2.0)

    Args:
        tmpdir: Directory receiving the per-chunk and final wav files.
        script: Text interleaved with the control tags above.
        my_voice: Initial voice passed to the TTS engine (may be None).
        temperature: Sampling temperature forwarded to the TTS engine.

    Returns:
        Path of the concatenated voice-over ("tts_voiceover.wav" in tmpdir).
    """
    # Split by [type:value] tags; with two capture groups the result is
    # [text0, type1, value1, text1, type2, value2, text2, ...].
    parts = re.split(r'\[(p|v|s):(.*?)\]', script)
    steps = [(None, "", parts[0].strip(), "part_init.wav")]
    steps.extend(
        (parts[i], parts[i + 1].strip(), parts[i + 2].strip(), f"part_{i}.wav")
        for i in range(1, len(parts), 3)
    )

    # --- PROGRESS TRACKING ---
    text_parts_count = sum(1 for _, _, text, _ in steps if _has_speakable_text(text))
    current_chunk_idx = 0
    # -------------------------

    # Each entry is either a sample array or a float (pause length in seconds).
    # Pauses are materialised at the end so that a pause appearing before any
    # speech uses the real sample rate instead of the fallback.
    pieces = []
    samplerate = 24000  # Default fallback
    current_voice = my_voice
    current_speed = 1.0

    for tag_type, tag_val, text_part, wav_name in steps:
        if tag_type == 'p':
            # Pause: accept integer or decimal milliseconds; skip bad values
            # instead of aborting the whole render.
            try:
                ms = float(tag_val)
            except ValueError:
                ms = -1.0
            if 0.0 <= ms < float("inf"):
                pieces.append(ms / 1000.0)
            else:
                print(f"Ignoring invalid pause tag value: {tag_val!r}")
        elif tag_type == 'v':
            # Switch voice: encode an existing audio file, otherwise pass the
            # raw value through to the engine.
            if (tag_val.endswith(".mp3") or tag_val.endswith(".wav")) and os.path.exists(tag_val):
                current_voice = tts.encode_reference(tag_val)
            else:
                current_voice = tag_val
        elif tag_type == 's':
            # Change speed, clamped to [0.5, 2.0]; invalid values keep the
            # current speed.
            try:
                current_speed = max(0.5, min(2.0, float(tag_val)))
            except ValueError:
                pass

        # Generate audio for the text part following the tag
        if _has_speakable_text(text_part):
            current_chunk_idx += 1
            print(f"Chunk {current_chunk_idx}/{text_parts_count}: ", end="", flush=True)
            data, samplerate = _synthesize_chunk(
                os.path.join(tmpdir, wav_name), text_part, current_voice, current_speed, temperature
            )
            pieces.append(data)

    audio_segments = [
        np.zeros(int(samplerate * piece), dtype=np.float32) if isinstance(piece, float) else piece
        for piece in pieces
    ]
    if not audio_segments:
        # Nothing to say: emit one second of silence.
        audio_segments.append(np.zeros(samplerate, dtype=np.float32))

    final_audio = np.concatenate(audio_segments)
    final_path = os.path.join(tmpdir, "tts_voiceover.wav")
    sf.write(final_path, final_audio, samplerate)
    return final_path
def mix_audio_with_bgm(voice_path: str, bgm_path: str, bgm_volume: float, output_path: str):
    """
    Blend a voice track with background music, ducking the music under the voice.

    When no usable BGM file is given, or the ffmpeg mix fails, the voice file
    is copied to ``output_path`` unchanged. ``output_path`` is returned in
    every case.
    """
    import shutil

    def _voice_only():
        # Fallback shared by the "no BGM" and "mix failed" paths.
        shutil.copy(voice_path, output_path)
        return output_path

    if not (bgm_path and os.path.exists(bgm_path)):
        return _voice_only()

    try:
        narration = ffmpeg.input(voice_path)
        # Background music scaled by the requested volume factor.
        music = ffmpeg.input(bgm_path).filter('volume', bgm_volume)
        # Sidechain compression: the narration drives the compressor applied
        # to the music.
        ducked_music = ffmpeg.filter(
            [music, narration],
            'sidechaincompress',
            threshold=0.03,
            ratio=10,
            attack=10,
            release=1000,
        )
        # Final mix; duration='first' ties the length to the narration input.
        blended = ffmpeg.filter([narration, ducked_music], 'amix', inputs=2, duration='first')
        job = ffmpeg.output(blended, output_path, acodec='libmp3lame', ab='192k').overwrite_output()
        job.run(quiet=True)
        return output_path
    except Exception as e:
        print(f"Error mixing BGM: {e}")
        return _voice_only()
def generate_tts_only(tmpdir: str, script: str, ref_audio: str = None, temperature: float = 0.5, bgm_path: str = None, bgm_volume: float = 0.1) -> str:
    """
    Produce just the narration audio for a script, with optional background music.

    Returns the path of the voice-only file, or of the mixed file when
    ``bgm_path`` is given.
    """
    # Encode a reference voice only when the file actually exists.
    has_reference = bool(ref_audio) and os.path.exists(ref_audio)
    my_voice = tts.encode_reference(ref_audio) if has_reference else None

    narration_path = generate_tts_with_pauses(tmpdir, script, my_voice, temperature)
    if not bgm_path:
        return narration_path

    return mix_audio_with_bgm(
        narration_path,
        bgm_path,
        bgm_volume,
        os.path.join(tmpdir, "final_mixed_audio.mp3"),
    )

services/subtitle_service.py ADDED Viewed

	@@ -0,0 +1,75 @@

+import os
+from faster_whisper import WhisperModel
# Shared speech-to-text model, created once at import time.
# Runs on CPU with int8 compute to avoid OOM when no GPU is available.
whisper_model = WhisperModel("base", device="cpu", compute_type="int8")
def generate_ass_file(words_data: list, dest_path: str, aspect_ratio: str, sub_style: str, font_name: str, highlight_color: str):
    """
    Write an Advanced SubStation Alpha (.ass) subtitle file.

    Args:
        words_data: Word entries in playback order; each is a mapping with
            'text', 'start' and 'end' keys (times in seconds).
        dest_path: Destination path of the .ass file.
        aspect_ratio: "9:16" selects a 1080x1920 canvas and 5 words per line;
            anything else selects 1920x1080 and 10 words per line.
        sub_style: "sentence" emits one coloured line per chunk; any other
            value emits karaoke lines that enlarge and colour the active word.
        font_name: Font name written into the "Main" style.
        highlight_color: Highlight colour as "#RRGGBB"; other values fall
            back to a built-in colour.
    """
    video_w, video_h = (1080, 1920) if aspect_ratio == "9:16" else (1920, 1080)

    # Convert hex (#RRGGBB) to the ASS colour format (&H00BBGGRR&).
    hex_color = highlight_color.lstrip('#')
    if len(hex_color) == 6 and all(c in "0123456789abcdefABCDEF" for c in hex_color):
        r, g, b = hex_color[0:2], hex_color[2:4], hex_color[4:6]
        ass_hl_color = f"&H00{b}{g}{r}&"
    else:
        ass_hl_color = "&H00FDFF00&"  # fallback

    header = f"""[Script Info]
ScriptType: v4.00+
Collisions: Normal
PlayResX: {video_w}
PlayResY: {video_h}
[V4+ Styles]
Format: Name, Fontname, Fontsize, PrimaryColour, SecondaryColour, OutlineColour, BackColour, Bold, Italic, Underline, StrikeOut, ScaleX, ScaleY, Spacing, Angle, BorderStyle, Outline, Shadow, Alignment, MarginL, MarginR, MarginV, Encoding
Style: Main,{font_name},80,&H00FFFFFF,&H000000FF,&H00000000,&H80000000,1,0,0,0,100,100,0,0,1,3,2,2,10,10,300,1
[Events]
Format: Layer, Start, End, Style, Name, MarginL, MarginR, MarginV, Effect, Text
"""

    def format_time(seconds: float) -> str:
        # Work in whole centiseconds so rounding carries into the minutes and
        # hours (59.999 s becomes 0:01:00.00 rather than 0:00:60.00).
        total_cs = max(0, int(round(seconds * 100)))
        h, rem = divmod(total_cs, 360000)
        m, rem = divmod(rem, 6000)
        s, cs = divmod(rem, 100)
        return f"{h}:{m:02d}:{s:02d}.{cs:02d}"

    lines = [header]
    # Words shown together on one subtitle line.
    chunk_size = 5 if aspect_ratio == "9:16" else 10

    for i in range(0, len(words_data), chunk_size):
        chunk = words_data[i:i + chunk_size]
        if sub_style == "sentence":
            # Basic sentence style: one line spanning the whole chunk.
            text = " ".join(w['text'] for w in chunk)
            lines.append(
                f"Dialogue: 0,{format_time(chunk[0]['start'])},{format_time(chunk[-1]['end'])},Main,,0,0,0,,{{\\c{ass_hl_color}}}{text}\n"
            )
            continue

        # Karaoke style: one line per word, visible for that word's duration,
        # with the active word enlarged and highlighted.
        for active_idx, target_word in enumerate(chunk):
            rendered = [
                f"{{\\fscx120\\fscy120\\c{ass_hl_color}}}{w['text']}{{\\fscx100\\fscy100\\c&HFFFFFF&}}"
                if j == active_idx
                else w['text']
                for j, w in enumerate(chunk)
            ]
            line_text = " ".join(rendered).strip()
            lines.append(
                f"Dialogue: 0,{format_time(target_word['start'])},{format_time(target_word['end'])},Main,,0,0,0,,{line_text}\n"
            )

    with open(dest_path, "w", encoding="utf-8") as f:
        f.writelines(lines)

services/video_service.py ADDED Viewed

	@@ -0,0 +1,83 @@

+import os
+import re
+import unicodedata
+import ffmpeg
# --- FFmpeg PATH PATCH FOR WINDOWS ---
# When LOCALAPPDATA is set, append the WinGet "Links" directory to PATH unless
# it is already one of the PATH entries.
local_app_data = os.environ.get('LOCALAPPDATA', '')
if local_app_data:
    winget_links = os.path.join(local_app_data, 'Microsoft', 'WinGet', 'Links')
    _current_path = os.environ.get('PATH', '')
    # Compare against whole PATH entries (a substring test can match a longer
    # directory name) and tolerate PATH being unset.
    if winget_links not in _current_path.split(os.pathsep):
        os.environ['PATH'] = (
            _current_path + os.pathsep + winget_links if _current_path else winget_links
        )
# ----------------------------------------
def parse_studio_script(raw_text: str):
    """
    Split a studio script into:
    1. text_for_tts: the text plus the control tags [p:], [v:], [s:]
    2. events: expression tags with their char_idx position, measured on the
       text with every bracketed tag removed

    Control tags are [p:<number>], [s:<number>] and [v:<anything>] (a voice id
    or a file path). Every other bracketed tag is an expression tag.

    Returns:
        (text_for_tts, events), where events is a list of
        {"tag": str, "char_idx": int} dicts in script order.
    """
    any_tag = re.compile(r"\[(.*?)\]")
    control_body = re.compile(r"(?:p|s):\d*\.?\d*|v:.*")

    events = []
    kept = []      # fragments that make up text_for_tts
    pure_len = 0   # tag-free characters seen so far
    cursor = 0

    # Single pass over all bracketed tags: plain text advances the character
    # counter, control tags are kept verbatim, the rest become events.
    for match in any_tag.finditer(raw_text):
        plain = raw_text[cursor:match.start()]
        kept.append(plain)
        pure_len += len(plain)

        body = match.group(1)
        if control_body.fullmatch(body):
            kept.append(match.group(0))
        else:
            events.append({
                "tag": body.strip(),
                "char_idx": pure_len
            })
        cursor = match.end()

    kept.append(raw_text[cursor:])
    text_for_tts = "".join(kept).strip()
    return text_for_tts, events
def normalize_tag(text: str) -> str:
    """
    Reduce an expression tag to a lowercase ASCII lookup key.

    Diacritics are removed, characters other than word characters, whitespace
    and hyphens are dropped, and runs of whitespace collapse to one space.
    """
    # 'đ'/'Đ' have no Unicode decomposition, so NFD plus the ASCII filter
    # would delete them; map them to 'd'/'D' first.
    text = text.replace('đ', 'd').replace('Đ', 'D')
    text = unicodedata.normalize('NFD', text).encode('ascii', 'ignore').decode('utf-8')
    text = re.sub(r'[^\w\s-]', '', text).lower()
    text = re.sub(r'\s+', ' ', text).strip()
    return text
def render_standard_video(tmpdir: str, audio_path: str, ass_path: str, aspect_ratio: str) -> str:
    """
    Render a solid-green video with the ASS subtitles applied and the given audio.

    Returns the path of the written file ("final_output.mp4" inside tmpdir).
    """
    if aspect_ratio == "9:16":
        width, height = 1080, 1920
    else:
        width, height = 1920, 1080
    destination = os.path.join(tmpdir, "final_output.mp4")

    # Generated green background from ffmpeg's lavfi colour source.
    background = ffmpeg.input(f"color=c=0x00FF00:s={width}x{height}:r=30", f="lavfi")
    narration = ffmpeg.input(audio_path)

    # The subtitle path is handed to the filter with forward slashes.
    subtitled = background.filter('ass', ass_path.replace('\\', '/'))

    job = ffmpeg.output(
        subtitled,
        narration,
        destination,
        vcodec="libx264",
        acodec="aac",
        audio_bitrate="192k",
        shortest=None,
    ).overwrite_output()
    job.run()
    return destination
def render_studio_video(tmpdir: str, concat_path: str, audio_path: str) -> str:
    """
    Render the studio video from an ffconcat image playlist and an audio track.

    Returns the path of the written file ("studio_output.mp4" inside tmpdir).
    """
    destination = os.path.join(tmpdir, "studio_output.mp4")

    # The playlist frames are passed to the encoder as-is: the images in the
    # characters_green folder are expected to already have the green
    # background and final size, so no pad/scale filter is applied.
    frames = ffmpeg.input(concat_path, f="concat", safe=0)
    narration = ffmpeg.input(audio_path)

    job = ffmpeg.output(
        frames,
        narration,
        destination,
        vcodec="libx264",
        acodec="aac",
        audio_bitrate="192k",
        pix_fmt="yuv420p",
        r=30,
        shortest=None,
    ).overwrite_output()
    job.run()
    return destination

start.sh CHANGED Viewed

@@ -1,13 +1,18 @@
 #!/bin/bash
-# Khởi động Redis dưới background
 redis-server --daemonize yes
-# Đợi vài giây cho Redis khởi động hoàn toàn
-sleep 2
-# Khởi động Celery Worker dưới background
-celery -A worker celery_app worker --loglevel=info &
-# Khởi động FastAPI (Uvicorn) chạy chính trên port 7860
 uvicorn main:app --host 0.0.0.0 --port 7860

 #!/bin/bash
+# 1. Khởi động Redis dưới background
+echo "Starting Redis server..."
 redis-server --daemonize yes
+# Đợi Redis sẵn sàng
+sleep 3
+# 2. Khởi động Celery Worker dưới background
+echo "Starting Celery worker..."
+# Lưu ý: Trên Linux chúng ta không dùng -P solo để tận dụng đa nhân
+celery -A worker:celery_app worker --loglevel=info &
+# 3. Khởi động FastAPI (Uvicorn) chạy chính
+echo "Starting FastAPI server on port 7860..."
+# Hugging Face yêu cầu chạy trên host 0.0.0.0 và port 7860
 uvicorn main:app --host 0.0.0.0 --port 7860