Spaces:

minh9972t12
/

chatbot_test

Running

App Files Files Community

minh9972t12 commited on Oct 18

Commit

fdc8d37

verified ·

1 Parent(s): ac5bf8b

Update app.py

Browse files

Files changed (1) hide show

app.py +133 -719

app.py CHANGED Viewed

@@ -1,744 +1,158 @@
-from fastapi import FastAPI, File, UploadFile, HTTPException, Query, BackgroundTasks
-import numpy as np
-import cv2
-from PIL import Image
-import io
-from typing import List, Dict, Any, Optional, Tuple
-from pydantic import BaseModel
-import logging
-from pathlib import Path
-import time
-import hashlib
-from concurrent.futures import ThreadPoolExecutor
-from collections import defaultdict
-from dataclasses import dataclass, field
-import warnings
-from fastapi.middleware.cors import CORSMiddleware
-import torch
-from torchvision import transforms
-import onnxruntime as ort
-from sklearn.cluster import KMeans
-import uvicorn
-# PaddleOCR for Vietnamese
-try:
-    from paddleocr import PaddleOCR
-    PADDLEOCR_AVAILABLE = True
-except ImportError:
-    PADDLEOCR_AVAILABLE = False
-    logger.warning("PaddleOCR not available. Install: pip install paddleocr")
-warnings.filterwarnings("ignore")
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
-app = FastAPI(
-    title="Fixed Seat Extraction API - Smart Color Detection",
-    description="Detects ALL colors except pure black and white",
-    version="6.0.0"
-)
-app.add_middleware(
-    CORSMiddleware,
-    allow_origins=["*"],
-    allow_credentials=True,
-    allow_methods=["*"],
-    allow_headers=["*"],
-)
-CACHE_DIR = Path("cache")
-CACHE_DIR.mkdir(exist_ok=True)
-RESULTS_CACHE = {}
-MAX_CACHE_SIZE = 100
-extractor = None
-class PolygonResponse(BaseModel):
-    polygons: List[List[List[float]]]
-    confidence_scores: List[float]
-    areas: List[float]
-    bounding_boxes: List[List[float]]
-    labels: List[str]
-    seat_groups: Dict[str, List[int]]
-    processing_info: Dict[str, Any]
-    cache_hit: bool = False
-    detected_text: List[Dict[str, Any]] = []
-    geojson: Optional[Dict[str, Any]] = None
-@dataclass
-class OptimizationConfig:
-    """Fixed configuration - detect all colors except black/white"""
-    use_background_removal: bool = True
-    use_ocr: bool = True
-    # Color detection - NEW LOGIC
-    # Loại BỎ thuần đen và thuần trắng, GIỮ LẠI tất cả còn lại
-    exclude_pure_black: bool = True  # V < 20 in HSV
-    exclude_pure_white: bool = True  # V > 235 AND S < 25 in HSV
-    # Clustering để group màu giống nhau
-    use_color_clustering: bool = True
-    n_color_clusters: int = 20  # Số lượng nhóm màu
-    # Detection thresholds
-    min_section_area: int = 500  # Diện tích tối thiểu
-    max_section_area: int = 50000
-    min_solidity: float = 0.3  # Shape quality
-    # Morphology
-    morphology_kernel_size: int = 3
-    # OCR
-    ocr_languages: List[str] = field(default_factory=lambda: ["vi", "en"])
-    ocr_gpu: bool = True
-class BackgroundRemover:
-    """Background removal using BiRefNet ONNX"""
-    def __init__(self):
-        self.session = None
-        self.input_name = None
-        self.output_name = None
-        self.transform = transforms.Compose([
-            transforms.Resize((1024, 1024)),
-            transforms.ToTensor(),
-            transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]),
-        ])
-    def load_model(self):
-        if self.session is None:
-            try:
-                providers = []
-                if ort.get_device() == 'GPU' and 'CUDAExecutionProvider' in ort.get_available_providers():
-                    providers.append('CUDAExecutionProvider')
-                providers.append('CPUExecutionProvider')
-                model_path = "models/BiRefNet.onnx"
-                self.session = ort.InferenceSession(model_path, providers=providers)
-                self.input_name = self.session.get_inputs()[0].name
-                self.output_name = self.session.get_outputs()[0].name
-                logger.info(f"✅ BiRefNet loaded: {self.session.get_providers()}")
-            except Exception as e:
-                logger.error(f"BiRefNet load failed: {e}")
-                self.session = None
-    def remove_background(self, image: Image.Image) -> Tuple[Image.Image, np.ndarray]:
-        if self.session is None:
-            if image.mode != 'RGB':
-                image = image.convert('RGB')
-            return image, None
-        if image.mode != 'RGB':
-            image = image.convert('RGB')
-        image_size = image.size
-        input_tensor = self.transform(image).unsqueeze(0)
-        input_numpy = input_tensor.numpy()
-        try:
-            outputs = self.session.run([self.output_name], {self.input_name: input_numpy})
-            pred_numpy = outputs[0][0]
-            pred_numpy = 1 / (1 + np.exp(-pred_numpy))
-            if len(pred_numpy.shape) == 3:
-                pred_numpy = pred_numpy[0]
-            pred_numpy = (pred_numpy * 255).astype(np.uint8)
-            pred_pil = Image.fromarray(pred_numpy, mode='L')
-            mask = pred_pil.resize(image_size)
-        except Exception as e:
-            logger.error(f"ONNX inference failed: {e}")
-            return image, None
-        mask_np = np.array(mask)
-        if len(mask_np.shape) == 3:
-            mask_np = mask_np[:, :, 0]
-        image_array = np.array(image)
-        if len(image_array.shape) == 2:
-            image_array = cv2.cvtColor(image_array, cv2.COLOR_GRAY2RGB)
-        elif image_array.shape[2] == 4:
-            image_array = cv2.cvtColor(image_array, cv2.COLOR_RGBA2RGB)
-        masked_array = np.zeros_like(image_array)
-        mask_normalized = mask_np.astype(np.float32) / 255.0
-        for c in range(3):
-            masked_array[:, :, c] = (image_array[:, :, c] * mask_normalized).astype(np.uint8)
-        processed_image = Image.fromarray(masked_array)
-        return processed_image, mask_np
-class TextDetector:
-    """OCR with Vietnamese support using PaddleOCR"""
-    def __init__(self, config: OptimizationConfig):
-        self.config = config
-        self.ocr = None
-    def load_models(self):
-        if not PADDLEOCR_AVAILABLE:
-            logger.error("PaddleOCR not available")
-            return
-        try:
-            # Initialize PaddleOCR với mobile lite models cho Vietnamese
-            self.ocr = PaddleOCR(
-                lang='latin',  # Vietnamese sử dụng latin script
-                # Sử dụng PP-OCRv4 mobile models (lightweight)
-                text_detection_model_name="PP-OCRv4_mobile_det",
-                text_recognition_model_name="PP-OCRv4_mobile_rec",
-                # Tắt các features không cần thiết để tăng tốc
-                use_angle_cls=False,
-                use_doc_orientation_classify=False,
-                use_doc_unwarping=False,
-                use_textline_orientation=False,
-                # GPU settings
-                use_gpu=torch.cuda.is_available() and self.config.ocr_gpu,
-                # Giảm batch size cho lightweight
-                det_db_box_thresh=0.5,  # Detection threshold
-                det_db_unclip_ratio=1.6,  # Unclip ratio cho bbox
-                # Rec settings
-                rec_batch_num=1,
-                drop_score=0.3,  # Confidence threshold thấp để catch nhiều text
-                # Tắt logging
-                show_log=False
-            )
-            logger.info("✅ PaddleOCR loaded (PP-OCRv4_mobile) for Vietnamese")
-            logger.info(f"   GPU enabled: {torch.cuda.is_available() and self.config.ocr_gpu}")
-        except Exception as e:
-            logger.error(f"PaddleOCR load failed: {e}")
-            import traceback
-            traceback.print_exc()
-            self.ocr = None
-    def preprocess_for_vietnamese_ocr(self, image: np.ndarray) -> np.ndarray:
-        """
-        Preprocessing tối ưu cho Vietnamese OCR với PaddleOCR
-        """
-        if len(image.shape) == 3:
-            gray = cv2.cvtColor(image, cv2.COLOR_RGB2GRAY)
-        else:
-            gray = image.copy()
-        # 1. Denoise
-        denoised = cv2.fastNlMeansDenoising(gray, h=7)
-        # 2. Sharpen để diacritics rõ hơn
-        kernel_sharpen = np.array([[-1,-1,-1],
-                                   [-1, 9,-1],
-                                   [-1,-1,-1]])
-        sharpened = cv2.filter2D(denoised, -1, kernel_sharpen)
-        # 3. CLAHE
-        clahe = cv2.createCLAHE(clipLimit=2.5, tileGridSize=(8, 8))
-        enhanced = clahe.apply(sharpened)
-        # 4. Contrast
-        alpha = 1.3
-        beta = 10
-        adjusted = cv2.convertScaleAbs(enhanced, alpha=alpha, beta=beta)
-        # PaddleOCR có thể nhận grayscale hoặc RGB
-        # Trả về RGB để consistent
-        rgb = cv2.cvtColor(adjusted, cv2.COLOR_GRAY2RGB)
-        return rgb
-    def detect_language(self, text: str) -> str:
-        """Detect Vietnamese by diacritics"""
-        vietnamese_chars = 'àáạảãâầấậẩẫăằắặẳẵèéẹẻẽêềếệểễìíịỉĩòóọỏõôồốộổỗơờớợởỡùúụủũưừứựửữỳýỵỷỹđ'
-        if any(c in vietnamese_chars for c in text.lower()):
-            return 'vi'
-        return 'en'
-    def detect_text(self, image: np.ndarray) -> List[Dict]:
-        text_regions = []
-        if self.ocr is None:
-            logger.warning("PaddleOCR not initialized")
-            return text_regions
-        try:
-            # Preprocessing
-            preprocessed = self.preprocess_for_vietnamese_ocr(image)
-            # PaddleOCR inference
-            # result[0] là list của page đầu tiên
-            # Mỗi item: [bbox_points, (text, confidence)]
-            result = self.ocr.ocr(preprocessed, cls=False)
-            if result is None or len(result) == 0:
-                logger.warning("PaddleOCR returned no results")
-                return text_regions
-            # Parse kết quả
-            for line in result[0]:
-                if line is None:
-                    continue
-                bbox_points, (text, confidence) = line
-                # bbox_points format: [[x1,y1], [x2,y2], [x3,y3], [x4,y4]]
-                x_coords = [point[0] for point in bbox_points]
-                y_coords = [point[1] for point in bbox_points]
-                if confidence > 0.2:  # Threshold thấp để catch nhiều text
-                    # Detect language
-                    language = self.detect_language(text)
-                    text_regions.append({
-                        'bbox': [int(min(x_coords)), int(min(y_coords)),
-                                int(max(x_coords)), int(max(y_coords))],
-                        'text': text,
-                        'confidence': float(confidence),
-                        'language': language
-                    })
-                    logger.info(f"OCR: '{text}' (conf: {confidence:.2f}, lang: {language})")
-            logger.info(f"✅ Detected {len(text_regions)} text regions")
-        except Exception as e:
-            logger.error(f"PaddleOCR failed: {e}")
-            import traceback
-            traceback.print_exc()
-        return text_regions
-class SmartColorDetector:
-    """
-    LOGIC MỚI: Detect TẤT CẢ màu NGOẠI TRỪ đen thuần và trắng thuần
-    """
-    def __init__(self, config: OptimizationConfig):
-        self.config = config
-    def create_valid_color_mask(self, image: np.ndarray) -> np.ndarray:
-        """
-        Tạo mask cho TẤT CẢ pixel có màu (không phải đen/trắng/xám thuần)
-        Trong HSV:
-        - Đen thuần: V (value) rất thấp (0-20)
-        - Trắng thuần: V rất cao (235-255) VÀ S (saturation) rất thấp (0-25)
-        - Xám thuần: S rất thấp (0-30) - không phân biệt hue
-        - MỌI màu khác: VALID!
-        """
-        hsv = cv2.cvtColor(image, cv2.COLOR_RGB2HSV)
-        h, s, v = cv2.split(hsv)
-        # Tạo mask GIỮ LẠI tất cả pixel
-        valid_mask = np.ones(image.shape[:2], dtype=np.uint8) * 255
-        # Loại BỎ đen thuần: V < 20
-        if self.config.exclude_pure_black:
-            black_mask = v < 20
-            valid_mask[black_mask] = 0
-            logger.info(f"Excluded {np.sum(black_mask)} pure black pixels")
-        # Loại BỎ trắng thuần: V > 235 AND S < 25
-        if self.config.exclude_pure_white:
-            white_mask = (v > 235) & (s < 25)
-            valid_mask[white_mask] = 0
-            logger.info(f"Excluded {np.sum(white_mask)} pure white pixels")
-        # Loại BỎ xám thuần: S < 30 (màu không có saturation = màu xám)
-        # Nhưng KHÔNG loại nếu đã là đen hoặc trắng thuần (đã loại ở trên)
-        gray_mask = (s < 30) & (v >= 20) & (v <= 235)
-        valid_mask[gray_mask] = 0
-        logger.info(f"Excluded {np.sum(gray_mask)} gray pixels")
-        logger.info(f"Valid colored pixels: {np.sum(valid_mask > 0)}")
-        return valid_mask
-    def cluster_colors(self, image: np.ndarray, valid_mask: np.ndarray) -> List[np.ndarray]:
-        """
-        Group các màu giống nhau bằng K-means clustering
-        """
-        masks = []
-        # Lấy tất cả pixel hợp lệ
-        valid_pixels = image[valid_mask > 0]
-        if len(valid_pixels) < 100:
-            logger.warning("Not enough valid pixels for clustering")
-            return [valid_mask]
-        # K-means clustering
-        pixels_flat = valid_pixels.reshape(-1, 3).astype(np.float32)
-        n_clusters = min(self.config.n_color_clusters, len(pixels_flat) // 100)
-        if n_clusters < 2:
-            return [valid_mask]
-        logger.info(f"Clustering into {n_clusters} color groups...")
-        try:
-            kmeans = KMeans(n_clusters=n_clusters, random_state=42, n_init=10)
-            labels = kmeans.fit_predict(pixels_flat)
-            centers = kmeans.cluster_centers_.astype(np.uint8)
-            # Tạo mask cho mỗi cluster
-            pixel_coords = np.argwhere(valid_mask > 0)
-            for cluster_id in range(n_clusters):
-                cluster_mask = np.zeros(image.shape[:2], dtype=np.uint8)
-                cluster_pixels = pixel_coords[labels == cluster_id]
-                if len(cluster_pixels) < 50:
-                    continue
-                for coord in cluster_pixels:
-                    cluster_mask[coord[0], coord[1]] = 255
-                # Clean up mask
-                kernel = cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (3, 3))
-                cluster_mask = cv2.morphologyEx(cluster_mask, cv2.MORPH_CLOSE, kernel, iterations=2)
-                cluster_mask = cv2.morphologyEx(cluster_mask, cv2.MORPH_OPEN, kernel, iterations=1)
-                if np.sum(cluster_mask) > 100:
-                    masks.append(cluster_mask)
-                    logger.info(f"  Cluster {cluster_id}: {np.sum(cluster_mask)} pixels, "
-                              f"center color: {centers[cluster_id]}")
-        except Exception as e:
-            logger.error(f"Clustering failed: {e}")
-            return [valid_mask]
-        return masks
-class EnhancedSeatExtractor:
-    def __init__(self, config: OptimizationConfig = OptimizationConfig()):
-        self.config = config
-        self.executor = ThreadPoolExecutor(max_workers=4)
-        self.bg_remover = BackgroundRemover()
-        self.text_detector = TextDetector(config)
-        self.color_detector = SmartColorDetector(config)
-        logger.info("✅ Enhanced Extractor with Smart Color Detection initialized")
-    def compute_image_hash(self, image: np.ndarray) -> str:
-        return hashlib.md5(image.tobytes()).hexdigest()
-    def detect_sections_in_mask(self, mask: np.ndarray, text_regions: List[Dict]) -> List[Dict]:
-        """Detect sections from a color mask"""
-        sections = []
-        if np.sum(mask) < self.config.min_section_area:
-            return sections
-        # KHÔNG loại bỏ text regions - giữ nguyên sections hoàn chỉnh
-        # Text là PART OF section, không phải noise cần loại bỏ
-        text_excluded_mask = mask.copy()
-        # Morphological operations - GIảM iterations để không "ăn mòn" sections
-        kernel = cv2.getStructuringElement(
-            cv2.MORPH_ELLIPSE,
-            (self.config.morphology_kernel_size, self.config.morphology_kernel_size)
-        )
-        # Chỉ CLOSE để nối các vùng gần nhau, không OPEN để tránh làm nhỏ sections
-        cleaned_mask = cv2.morphologyEx(text_excluded_mask, cv2.MORPH_CLOSE, kernel, iterations=2)
-        # Find contours
-        contours, _ = cv2.findContours(cleaned_mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
-        for contour in contours:
-            area = cv2.contourArea(contour)
-            if area < self.config.min_section_area or area > self.config.max_section_area:
-                continue
-            # Check solidity (shape quality)
-            hull = cv2.convexHull(contour)
-            hull_area = cv2.contourArea(hull)
-            solidity = area / hull_area if hull_area > 0 else 0
-            if solidity < self.config.min_solidity:
-                continue
-            # Simplify contour
-            epsilon = 0.01 * cv2.arcLength(contour, True)
-            approx = cv2.approxPolyDP(contour, epsilon, True)
-            if len(approx) >= 3:
-                x, y, w, h = cv2.boundingRect(contour)
-                sections.append({
-                    'contour': approx,
-                    'bbox': [x, y, x + w, y + h],
-                    'area': area,
-                    'confidence': min(1.0, solidity),
-                    'center': (x + w // 2, y + h // 2),
-                    'solidity': solidity
-                })
-        return sections
-    def extract_polygons_enhanced(self, image: np.ndarray) -> PolygonResponse:
-        """Main extraction pipeline"""
-        start_time = time.time()
-        # Check cache
-        image_hash = self.compute_image_hash(image)
-        if image_hash in RESULTS_CACHE:
-            logger.info("Returning cached results")
-            cached_result = RESULTS_CACHE[image_hash]
-            cached_result.cache_hit = True
-            return cached_result
-        # Ensure RGB
-        if len(image.shape) == 2:
-            image = cv2.cvtColor(image, cv2.COLOR_GRAY2RGB)
-        elif len(image.shape) == 3:
-            if image.shape[2] == 4:
-                image = cv2.cvtColor(image, cv2.COLOR_RGBA2RGB)
-        # Step 1: Background Removal
-        if self.config.use_background_removal:
-            logger.info("🔄 Removing background...")
-            pil_image = Image.fromarray(image).convert('RGB')
-            processed_image, bg_mask = self.bg_remover.remove_background(pil_image)
-            image = np.array(processed_image)
-            if len(image.shape) != 3 or image.shape[2] != 3:
-                if len(image.shape) == 2:
-                    image = cv2.cvtColor(image, cv2.COLOR_GRAY2RGB)
-        # Step 2: OCR Text Detection
-        text_regions = []
-        if self.config.use_ocr:
-            logger.info("🔄 Detecting text...")
-            text_regions = self.text_detector.detect_text(image)
-        # Step 3: Smart Color Detection
-        logger.info("🔄 Detecting all colors (excluding black/white)...")
-        valid_color_mask = self.color_detector.create_valid_color_mask(image)
-        # Step 4: Cluster Colors
-        all_sections = []
-        if self.config.use_color_clustering:
-            logger.info("🔄 Clustering colors...")
-            color_masks = self.color_detector.cluster_colors(image, valid_color_mask)
-            logger.info(f"Found {len(color_masks)} color groups")
-            # Detect sections in each color group
-            for i, mask in enumerate(color_masks):
-                logger.info(f"Processing color group {i + 1}/{len(color_masks)}...")
-                sections = self.detect_sections_in_mask(mask, text_regions)
-                for section in sections:
-                    section['color_group'] = i
-                all_sections.extend(sections)
-                logger.info(f"  Found {len(sections)} sections in group {i}")
         else:
-            # Single pass without clustering
-            all_sections = self.detect_sections_in_mask(valid_color_mask, text_regions)
-        # Step 5: Remove overlapping sections
-        filtered_sections = self.remove_overlapping_sections(all_sections)
-        # Convert to response format
-        polygons = []
-        confidence_scores = []
-        areas = []
-        bounding_boxes = []
-        labels = []
-        for i, section in enumerate(filtered_sections):
-            contour = section['contour']
-            polygon = contour.reshape(-1, 2).tolist()
-            polygons.append(polygon)
-            confidence_scores.append(section['confidence'])
-            areas.append(section['area'])
-            bounding_boxes.append(section['bbox'])
-            labels.append(f"Section_{i + 1}")
-        # Group sections
-        seat_groups = self.group_sections(filtered_sections)
-        processing_time = time.time() - start_time
-        geojson_output = self.to_geojson(filtered_sections)
-        response = PolygonResponse(
-            polygons=polygons,
-            confidence_scores=confidence_scores,
-            areas=areas,
-            bounding_boxes=bounding_boxes,
-            labels=labels,
-            seat_groups=seat_groups,
-            detected_text=[{
-                'text': t['text'],
-                'confidence': t['confidence'],
-                'bbox': t['bbox'],
-                'language': t.get('language', 'unknown')
-            } for t in text_regions],
-            processing_info={
-                "total_sections": len(polygons),
-                "total_text_regions": len(text_regions),
-                "vietnamese_text": sum(1 for t in text_regions if t.get('language') == 'vi'),
-                "english_text": sum(1 for t in text_regions if t.get('language') == 'en'),
-                "processing_time": processing_time,
-                "clustering_enabled": self.config.use_color_clustering
-            },
-            cache_hit=False,
-            geojson=geojson_output
-        )
-        # Cache result
-        if len(RESULTS_CACHE) >= MAX_CACHE_SIZE:
-            RESULTS_CACHE.pop(next(iter(RESULTS_CACHE)))
-        RESULTS_CACHE[image_hash] = response
-        return response
-    def remove_overlapping_sections(self, sections: List[Dict]) -> List[Dict]:
-        if not sections:
-            return sections
-        sorted_sections = sorted(sections, key=lambda x: x['confidence'], reverse=True)
-        filtered = []
-        for section in sorted_sections:
-            overlap = False
-            for accepted in filtered:
-                if self.calculate_overlap(section['bbox'], accepted['bbox']) > 0.5:
-                    overlap = True
-                    break
-            if not overlap:
-                filtered.append(section)
-        return filtered
-    def calculate_overlap(self, bbox1: List, bbox2: List) -> float:
-        x1_1, y1_1, x2_1, y2_1 = bbox1
-        x1_2, y1_2, x2_2, y2_2 = bbox2
-        x1_int = max(x1_1, x1_2)
-        y1_int = max(y1_1, y1_2)
-        x2_int = min(x2_1, x2_2)
-        y2_int = min(y2_1, y2_2)
-        if x2_int <= x1_int or y2_int <= y1_int:
-            return 0.0
-        intersection = (x2_int - x1_int) * (y2_int - y1_int)
-        area1 = (x2_1 - x1_1) * (y2_1 - y1_1)
-        area2 = (x2_2 - x1_2) * (y2_2 - y1_2)
-        union = area1 + area2 - intersection
-        return intersection / union if union > 0 else 0.0
-    def group_sections(self, sections: List[Dict]) -> Dict[str, List[int]]:
-        groups = defaultdict(list)
-        for idx, section in enumerate(sections):
-            group_id = section.get('color_group', 0)
-            groups[f"ColorGroup_{group_id}"].append(idx)
-        return dict(groups)
-    def to_geojson(self, sections: List[Dict]) -> Dict[str, Any]:
-        features = []
-        for section in sections:
-            contour = section['contour'].reshape(-1, 2).tolist()
-            features.append({
-                "type": "Feature",
-                "properties": {
-                    "confidence": section.get("confidence"),
-                    "area": section.get("area"),
-                    "color_group": section.get("color_group")
-                },
-                "geometry": {
-                    "type": "Polygon",
-                    "coordinates": [[list(map(float, p)) for p in contour]]
-                }
-            })
-        return {
-            "type": "FeatureCollection",
-            "features": features
-        }
-@app.on_event("startup")
-async def startup_event():
-    global extractor
     try:
-        config = OptimizationConfig(
-            use_background_removal=True,
-            use_ocr=True,
-            exclude_pure_black=True,
-            exclude_pure_white=True,
-            use_color_clustering=True,
-            n_color_clusters=20,
-            min_section_area=500,
-            max_section_area=50000,
-            ocr_languages=["vi", "en"],  # For info only
-            ocr_gpu=True
         )
-        extractor = EnhancedSeatExtractor(config)
-        logger.info("Loading BiRefNet...")
-        extractor.bg_remover.load_model()
-        logger.info("Loading PaddleOCR (PP-OCRv4_mobile)...")
-        extractor.text_detector.load_models()
-        logger.info("✅ System initialized successfully")
-        logger.info("✅ Using PaddleOCR lite for Vietnamese")
-        logger.info("✅ Color detection: ALL colors except pure black/white/gray")
     except Exception as e:
-        logger.error(f"Initialization failed: {e}")
-        import traceback
-        traceback.print_exc()
-@app.post("/extract-seats/", response_model=PolygonResponse)
-async def extract_seats_endpoint(
-    file: UploadFile = File(...),
-    use_background_removal: bool = Query(True),
-    use_ocr: bool = Query(True),
-    use_clustering: bool = Query(True),
-    n_clusters: int = Query(20, ge=2, le=50)
-):
-    """
-    Extract sections with smart color detection
-    Detects ALL colors except:
-    - Pure black (V < 20 in HSV)
-    - Pure white (V > 235 AND S < 25 in HSV)
-    """
-    if extractor is None:
-        raise HTTPException(status_code=503, detail="System not initialized")
-    if not file.content_type.startswith("image/"):
-        raise HTTPException(status_code=400, detail="Must be an image")
-    try:
-        contents = await file.read()
-        image = Image.open(io.BytesIO(contents))
-        image_array = np.array(image)
-        # Update config
-        extractor.config.use_background_removal = use_background_removal
-        extractor.config.use_ocr = use_ocr
-        extractor.config.use_color_clustering = use_clustering
-        extractor.config.n_color_clusters = n_clusters
-        result = extractor.extract_polygons_enhanced(image_array)
-        return result
-    except Exception as e:
-        logger.error(f"Processing failed: {e}")
-        import traceback
-        traceback.print_exc()
-        raise HTTPException(status_code=500, detail=f"Failed: {str(e)}")
 if __name__ == "__main__":
     import os

+"""
+Test script for Event Tags Generator API
+"""
+import requests
+import json
+# API endpoint
+BASE_URL = "http://localhost:8001"
+def test_generate_tags():
+    """Test single event tag generation"""
+    print("=" * 60)
+    print("Testing Event Tags Generator")
+    print("=" * 60)
+    # Test data
+    event_data = {
+        "event_name": "Vietnam Music Festival 2025",
+        "category": "Âm nhạc",
+        "short_description": "Lễ hội âm nhạc quốc tế lớn nhất Việt Nam năm 2025",
+        "detailed_description": """
+        Vietnam Music Festival 2025 là sự kiện âm nhạc đỉnh cao quy tụ các nghệ sĩ
+        nổi tiếng trong nước và quốc tế. Sự kiện diễn ra trong 3 ngày với hơn 50
+        nghệ sĩ tham gia, từ nhạc pop, rock, EDM đến acoustic. Đặc biệt có sự góp
+        mặt của các DJ hàng đầu thế giới. Không gian festival rộng 10,000m2 tại
+        trung tâm Hà Nội với hệ thống âm thanh ánh sáng hiện đại. Dự kiến thu hút
+        hơn 30,000 khán giả mỗi ngày.
+        """,
+        "max_tags": 12,
+        "language": "vi"
+    }
+    print("\n📤 REQUEST:")
+    print(json.dumps(event_data, indent=2, ensure_ascii=False))
+    try:
+        # Call API
+        response = requests.post(
+            f"{BASE_URL}/generate-tags",
+            json=event_data,
+            headers={"Content-Type": "application/json"}
+        )
+        if response.status_code == 200:
+            result = response.json()
+            print("\n✅ SUCCESS!")
+            print("\n📥 RESPONSE:")
+            print(json.dumps(result, indent=2, ensure_ascii=False))
+            print("\n" + "=" * 60)
+            print("GENERATED METADATA:")
+            print("=" * 60)
+            print(f"\n🏷️  TAGS ({len(result['generated_tags'])} tags):")
+            for tag in result['generated_tags']:
+                print(f"   • {tag}")
+            print(f"\n📁 PRIMARY CATEGORY: {result['primary_category']}")
+            if result['secondary_categories']:
+                print(f"\n📂 SECONDARY CATEGORIES:")
+                for cat in result['secondary_categories']:
+                    print(f"   • {cat}")
+            if result['keywords']:
+                print(f"\n🔍 SEO KEYWORDS:")
+                for kw in result['keywords']:
+                    print(f"   • {kw}")
+            if result['hashtags']:
+                print(f"\n#️⃣  HASHTAGS:")
+                for ht in result['hashtags']:
+                    print(f"   • {ht}")
+            if result['target_audience']:
+                print(f"\n👥 TARGET AUDIENCE:")
+                for aud in result['target_audience']:
+                    print(f"   • {aud}")
+            print(f"\n😊 SENTIMENT: {result['sentiment']}")
+            print(f"💯 CONFIDENCE: {result['confidence_score']}")
+            print(f"⏱️  GENERATION TIME: {result['generation_time']}")
+            print(f"🤖 MODEL USED: {result['model_used']}")
         else:
+            print(f"\n❌ ERROR: {response.status_code}")
+            print(response.text)
+    except requests.exceptions.ConnectionError:
+        print("\n❌ ERROR: Cannot connect to API")
+        print("Make sure the server is running: python event_tags_generator.py")
+    except Exception as e:
+        print(f"\n❌ ERROR: {str(e)}")
+def test_batch_generation():
+    """Test batch event tag generation"""
+    print("\n\n" + "=" * 60)
+    print("Testing Batch Tag Generation")
+    print("=" * 60)
+    events = [
+        {
+            "event_name": "Tech Summit Vietnam 2025",
+            "category": "Công nghệ",
+            "short_description": "Hội nghị công nghệ lớn nhất Đông Nam Á",
+            "detailed_description": "Sự kiện quy tụ các chuyên gia AI, Blockchain, Cloud Computing từ Google, Microsoft, Amazon...",
+            "max_tags": 10,
+            "language": "vi"
+        },
+        {
+            "event_name": "Food Festival Saigon",
+            "category": "Ẩm thực",
+            "short_description": "Lễ hội ẩm thực đường phố Sài Gòn",
+            "detailed_description": "Khám phá hơn 100 món ăn đường phố đặc trưng của Sài Gòn với các đầu bếp nổi tiếng...",
+            "max_tags": 8,
+            "language": "vi"
+        }
+    ]
+    print(f"\n📤 Generating tags for {len(events)} events...")
     try:
+        response = requests.post(
+            f"{BASE_URL}/generate-tags/batch",
+            json=events,
+            headers={"Content-Type": "application/json"}
         )
+        if response.status_code == 200:
+            result = response.json()
+            print(f"\n✅ Batch completed!")
+            print(f"   Total: {result['total']}")
+            print(f"   Successful: {result['successful']}")
+            print(f"   Failed: {result['failed']}")
+            for item in result['results']:
+                if item['success']:
+                    print(f"\n✓ {item['event_name']}")
+                    print(f"   Tags: {', '.join(item['data']['generated_tags'][:5])}...")
+                else:
+                    print(f"\n✗ {item['event_name']}")
+                    print(f"   Error: {item['error']}")
+        else:
+            print(f"\n❌ ERROR: {response.status_code}")
+            print(response.text)
     except Exception as e:
+        print(f"\n❌ ERROR: {str(e)}")
 if __name__ == "__main__":
     import os