Spaces:

danicor
/

TR2

Sleeping

App Files Community

danicor committed on Sep 25, 2025

Commit

e9d25da

verified ·

1 Parent(s): ef551b0

Update app.py

Browse files

Files changed (1) hide show

app.py +43 -42

app.py CHANGED Viewed

@@ -8,7 +8,7 @@ from datetime import datetime, timedelta
 from concurrent.futures import ThreadPoolExecutor
 from typing import Dict, List, Optional, Any
 import json
 from fastapi import FastAPI, HTTPException, BackgroundTasks
 from fastapi.middleware.cors import CORSMiddleware
 from fastapi.responses import JSONResponse
@@ -17,25 +17,11 @@ import torch
 from transformers import M2M100ForConditionalGeneration, M2M100Tokenizer
 import requests
-os.environ['HF_HOME'] = '/home/user/.cache/huggingface'
-os.environ['HUGGINGFACE_HUB_CACHE'] = '/home/user/.cache/huggingface/hub'
-# ایجاد مسیرهای کش
-cache_paths = [
-    '/home/user/.cache',
-    '/home/user/.cache/huggingface',
-    '/home/user/.cache/huggingface/hub'
-]
-for path in cache_paths:
-    os.makedirs(path, exist_ok=True)
-    # تنظیم مجوزهای مناسب
-    try:
-        os.chmod(path, 0o755)
-    except:
-        pass
-print(f"✅ مسیرهای کش تنظیم شد: {cache_paths}")
 # تنظیمات اولیه
 MODEL_NAME = "facebook/m2m100_418M"
@@ -311,23 +297,26 @@ class MultilingualTranslator:
         print("در حال راه‌اندازی مترجم...")
         try:
-            # استفاده از tokenizer و model با تنظیمات minimal
-            print("🚀 در حال بارگذاری سریع مدل...")
             self.tokenizer = M2M100Tokenizer.from_pretrained(
                 MODEL_NAME,
-                use_fast=True,  # استفاده از tokenizer سریع
-                trust_remote_code=False
             )
             self.model = M2M100ForConditionalGeneration.from_pretrained(
                 MODEL_NAME,
-                device_map="auto",  # مدیریت خودکار دستگاه
-                trust_remote_code=False,
-                low_cpu_mem_usage=True
             )
-            # اگر device_map کار نکرد، دستی انتقال دهید
             if not hasattr(self.model, 'device'):
                 self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
                 self.model.to(self.device)
@@ -336,34 +325,46 @@ class MultilingualTranslator:
             self.model.eval()
-            print(f"✅ مدل روی {self.device} بارگذاری شد")
         except Exception as e:
-            print(f"⚠️ خطا: {str(e)}")
-            print("🔧 استفاده از حالت fallback...")
-            # حالت fallback بسیار ساده
-            from transformers import pipeline
-            self.translator_pipeline = pipeline(
-                "translation",
-                model=MODEL_NAME,
-                device=0 if torch.cuda.is_available() else -1
-            )
-            self.use_pipeline = True
-            self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-            print("✅ مدل از طریق pipeline بارگذاری شد")
-        # بقیه کد بدون تغییر...
         self.cache = TranslationCache(cache_expiry_minutes)
         self.chunker = TextChunker()
         self.queue = TranslationQueue()
         self.translation_sessions: Dict[str, Dict] = {}
         self.completed_translations: Dict[str, Dict] = {}
         self.translation_requests: Dict[str, Dict] = {}
         self.total_requests = 0
         self.lock = threading.Lock()
-        print("🎊 مترجم آماده است!")
     def _normalize_language(self, lang: str) -> str:
         """تبدیل نام زبان به کد دوحرفی"""

 from concurrent.futures import ThreadPoolExecutor
 from typing import Dict, List, Optional, Any
 import json
+import tempfile
 from fastapi import FastAPI, HTTPException, BackgroundTasks
 from fastapi.middleware.cors import CORSMiddleware
 from fastapi.responses import JSONResponse
 from transformers import M2M100ForConditionalGeneration, M2M100Tokenizer
 import requests
+temp_cache_dir = tempfile.mkdtemp()
+os.environ['HF_HOME'] = temp_cache_dir
+os.environ['HUGGINGFACE_HUB_CACHE'] = os.path.join(temp_cache_dir, 'hub')
+print(f"✅ مسیر کش موقت ایجاد شد: {temp_cache_dir}")
 # تنظیمات اولیه
 MODEL_NAME = "facebook/m2m100_418M"
         print("در حال راه‌اندازی مترجم...")
         try:
+            print("🚀 در حال بارگذاری مدل M2M100...")
+            # روش 1: استفاده از device_map="auto" برای مدیریت خودکار حافظه
             self.tokenizer = M2M100Tokenizer.from_pretrained(
                 MODEL_NAME,
+                use_fast=True,
+                cache_dir=None,  # عدم استفاده از کش دائمی
+                local_files_only=False
             )
             self.model = M2M100ForConditionalGeneration.from_pretrained(
                 MODEL_NAME,
+                device_map="auto",  # مدیریت خودکار دستگاه و حافظه
+                torch_dtype=torch.float16,  # استفاده از float16 برای صرفه‌جویی در حافظه
+                low_cpu_mem_usage=True,
+                cache_dir=None,
+                local_files_only=False
             )
+            # اگر device_map کار نکند، از روش سنتی استفاده می‌کنیم
             if not hasattr(self.model, 'device'):
                 self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
                 self.model.to(self.device)
             self.model.eval()
+            print(f"✅ مدل با موفقیت روی {self.device} بارگذاری شد")
         except Exception as e:
+            print(f"❌ خطا در بارگذاری مدل: {str(e)}")
+            # روش جایگزین: استفاده از pipeline
+            try:
+                print("🔄 استفاده از pipeline به عنوان راه‌حل جایگزین...")
+                from transformers import pipeline
+                self.translation_pipeline = pipeline(
+                    "translation",
+                    model=MODEL_NAME,
+                    tokenizer=MODEL_NAME,
+                    device=0 if torch.cuda.is_available() else -1,
+                    torch_dtype=torch.float16
+                )
+                self.use_pipeline = True
+                self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+                print("✅ pipeline ترجمه با موفقیت ایجاد شد")
+            except Exception as e2:
+                print(f"❌ خطا در ایجاد pipeline: {str(e2)}")
+                raise RuntimeError("امکان بارگذاری مدل ترجمه وجود ندارد")
+        # اجزای کمکی
         self.cache = TranslationCache(cache_expiry_minutes)
         self.chunker = TextChunker()
         self.queue = TranslationQueue()
+        # ذخیره وضعیت ترجمه‌ها
         self.translation_sessions: Dict[str, Dict] = {}
         self.completed_translations: Dict[str, Dict] = {}
         self.translation_requests: Dict[str, Dict] = {}
+        # آمار
         self.total_requests = 0
         self.lock = threading.Lock()
+        print("🎉 مترجم با موفقیت راه‌اندازی شد!")
     def _normalize_language(self, lang: str) -> str:
         """تبدیل نام زبان به کد دوحرفی"""