Spaces:

sonygod
/

flash

Sleeping

App Files Files Community

sonygod commited on Jan 24, 2025

Commit

1ba7fb7

1 Parent(s): 3afb208

111

Browse files

Files changed (3) hide show

Dockerfile +14 -0
app.py +471 -0
requirements.txt +7 -0

Dockerfile ADDED Viewed

	@@ -0,0 +1,14 @@

+FROM python:3.9-slim
+WORKDIR /app
+COPY ./requirements.txt /app/requirements.txt
+COPY ./app.py /app/app.py
+RUN pip install --no-cache-dir -r requirements.txt
+EXPOSE 7860
+CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]

app.py ADDED Viewed

	@@ -0,0 +1,471 @@

+from fastapi import FastAPI, HTTPException, UploadFile, File, Form
+from fastapi.middleware.cors import CORSMiddleware
+from fastapi.responses import HTMLResponse
+from pydantic import BaseModel
+from fastapi import FastAPI, HTTPException, Request
+from asyncio import TimeoutError
+import asyncio
+from typing import Optional
+import requests
+import uvicorn
+import shutil
+import datetime  # Add this import
+import logging
+from logging.handlers import RotatingFileHandler
+import time
+from typing import List, Dict, Optional
+import json
+import os
+import psutil
+import sys
+from typing import Dict
+import tempfile
+import re
+import random
+import aiohttp
+app = FastAPI()
+# Add USER_AGENTS constant
+USER_AGENTS = [
+    "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36",
+    "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36",
+    "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/121.0.0.0 Safari/537.36"
+]
+# Configure logging
+# Configure detailed logging
+logging.basicConfig(
+    level=logging.INFO,
+    format='%(asctime)s - %(levelname)s - %(message)s'
+)
+logger = logging.getLogger(__name__)
+# Request counter
+request_counter = {
+    "analyze": 0,
+    "compareAnalyze": 0,
+    "total": 0
+}
+# Add CORS middleware
+# Add CORS middleware with both HTTP and HTTPS
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=[
+        "http://*",
+        "https://*"
+    ],
+    allow_credentials=True,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+class AskRequest(BaseModel):
+    prompt: str
+    model: str = "GEMINI"
+@app.get("/")
+async def health_check():
+    return {
+        "health": "ok",
+        "timestamp": datetime.datetime.now().isoformat(),
+        "service": "AI API Forwarding Service",
+        "version": "1.0"
+    }
+@app.post("/ask")
+async def forward_ask(request: AskRequest):
+    request_counter["total"] += 1
+    try:
+        response = requests.post(
+            "http://s5.serv00.com:9081/ask",
+            headers={'Content-Type': 'application/json'},
+            json=request.dict()
+        )
+        return response.json()
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
+@app.post("/analyze")
+async def forward_analyze(image: UploadFile = File(...), model: str = Form(...)):
+    request_counter["analyze"] += 1
+    request_counter["total"] += 1
+    try:
+        files = {'image': (image.filename, image.file, image.content_type)}
+        data = {'model': model}
+        response = requests.post(
+            "http://s5.serv00.com:9081/analyze",
+            files=files,
+            data=data
+        )
+        return response.json()
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
+@app.post("/compareAnalyze")
+async def forward_compare_analyze(image: UploadFile = File(...)):
+    request_counter["compareAnalyze"] += 1
+    request_counter["total"] += 1
+    try:
+        files = {'image': (image.filename, image.file, image.content_type)}
+        response = requests.post(
+            "http://s5.serv00.com:9081/compareAnalyze",
+            files=files
+        )
+        return response.json()
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
+@app.get("/status")
+async def forward_status():
+    start_time = time.time()
+    logger.info(f"Received status request at {datetime.datetime.now()}")
+    logger.info(f"Current request counter: {request_counter}")
+    try:
+        logger.info("Attempting to contact upstream server...")
+        response = requests.get("http://s5.serv00.com:9081/status")
+        elapsed_time = time.time() - start_time
+        logger.info(f"Upstream server responded in {elapsed_time:.2f} seconds")
+        logger.info(f"Response status code: {response.status_code}")
+        logger.info(f"Response content: {response.text[:200]}...")
+        return response.json()
+    except Exception as e:
+        logger.error(f"Error occurred: {str(e)}")
+        logger.error(f"Error type: {type(e).__name__}")
+        return {
+            "status": "running",
+            "requests": request_counter,
+            "error": str(e),
+            "timestamp": datetime.datetime.now().isoformat()
+        }
+@app.get("/check", response_class=HTMLResponse)
+async def forward_check():
+    try:
+        response = requests.get("http://s5.serv00.com:9081/check")
+        return response.text
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
+# Add new models
+class Translation(BaseModel):
+    translation: str
+    type: str
+class Phrase(BaseModel):
+    phrase: str
+    translation: str
+class Word(BaseModel):
+    word: str
+    translations: List[dict]  # Changed to accept dictionary format
+    phrases: List[Phrase] = []  # Made optional with default empty list
+    level: str = ""  # Add level field with default empty string
+# Add global word map
+word_map: Dict[str, Word] = {}
+def get_level_from_filename(filename: str) -> str:
+    # Extract level from filenames like "1-初中-顺序.json"
+    match = re.match(r'\d+-(.+?)-顺序\.json', filename)
+    return match.group(1) if match else "unknown"
+# Add initialization function
+def init_word_map():
+    current_dir = os.path.dirname(os.path.abspath(__file__))
+    json_dir = os.path.join(current_dir, "json")
+    stats = {
+        "total_words": 0,
+        "total_files": 0,
+        "file_stats": {}
+    }
+    try:
+        for filename in os.listdir(json_dir):
+            if filename.endswith('.json'):
+                try:
+                    level = get_level_from_filename(filename)
+                    with open(os.path.join(json_dir, filename), 'r', encoding='utf-8') as f:
+                        words = json.load(f)
+                        word_count = len(words)
+                        stats["total_words"] += word_count
+                        stats["total_files"] += 1
+                        stats["file_stats"][filename] = word_count
+                        for word_data in words:
+                            # Convert legacy format to new format
+                            if 'translations' not in word_data:
+                                word_data['translations'] = [{
+                                    'translation': word_data.get('translation', ''),
+                                    'type': word_data.get('type', '')
+                                }]
+                            if 'phrases' not in word_data:
+                                word_data['phrases'] = []
+                            word_data['level'] = level
+                            word = Word(**word_data)
+                            word_map[word.word.lower()] = word
+                    logger.info(f"Loaded {filename}: {word_count} words")
+                except Exception as e:
+                    logger.error(f"Error loading {filename}: {str(e)}")
+                    continue
+        logger.info(f"Dictionary initialization complete:")
+        logger.info(f"Total files processed: {stats['total_files']}")
+        logger.info(f"Total words loaded: {stats['total_words']}")
+        return stats
+    except Exception as e:
+        logger.error(f"Fatal error in init_word_map: {str(e)}")
+        return stats
+# Add cache configuration
+# Update cache file location
+CACHE_DIR = os.path.join(tempfile.gettempdir(), "flash_api_cache")
+CACHE_FILE = os.path.join(CACHE_DIR, "ai_translation_cache.json")
+ai_cache: Dict[str, dict] = {}
+# Load cache on startup
+def save_cache():
+    try:
+        # Create cache directory if it doesn't exist
+        os.makedirs(CACHE_DIR, exist_ok=True)
+        with open(CACHE_FILE, 'w', encoding='utf-8') as f:
+            json.dump(ai_cache, f, ensure_ascii=False, indent=2)
+            logger.info(f"Cache saved to: {CACHE_FILE}")
+    except PermissionError as pe:
+        logger.error(f"Permission denied writing to cache: {pe}")
+    except Exception as e:
+        logger.error(f"Error saving cache: {e}")
+def load_cache():
+    global ai_cache
+    try:
+        if os.path.exists(CACHE_FILE):
+            with open(CACHE_FILE, 'r', encoding='utf-8') as f:
+                ai_cache = json.load(f)
+                logger.info(f"Loaded {len(ai_cache)} cached translations from: {CACHE_FILE}")
+    except Exception as e:
+        logger.error(f"Error loading cache: {e}")
+        ai_cache = {}
+# Add translate endpoint
+@app.get("/translate/{word}")
+async def translate_word(word: str):
+    start_time = time.time()
+    logger.info(f"Translation request received for word: {word}")
+    try:
+        word = word.lower().strip()
+        logger.debug(f"Processed word: {word}")
+        # Check word map
+        # if word in word_map:
+        #     logger.info(f"Word found in map: {word}")
+        #     word_data = word_map[word]
+        #     logger.debug(f"Word data: {word_data}")
+        #     # Format all translations
+        #     translations_text = []
+        #     for trans in word_data.translations:
+        #         translation = trans['translation']
+        #         type_info = trans['type']
+        #         translations_text.append(f"({type_info}) {translation}")
+        #     # Join translations with separators
+        #     translations_combined = " | ".join(translations_text)
+        #     logger.debug(f"Combined translations: {translations_combined}")
+        #     # Handle examples
+        #     examples = []
+        #     if word_data.phrases:
+        #         examples = [f"{p.phrase}: {p.translation}" for p in word_data.phrases[:3]]
+        #         logger.debug(f"Examples found: {examples}")
+        #     # Build response with proper formatting
+        #     formatted_response = f"{word} [{word_data.level}]: {translations_combined}"
+        #     if examples:
+        #         formatted_response += f"\n\n例句：\n{chr(10).join(examples)}"
+        #     elapsed = time.time() - start_time
+        #     logger.info(f"Word map translation completed in {elapsed:.2f}s")
+        #     return {
+        #         "status": 200,
+        #         "data": {
+        #             "response": formatted_response,
+        #             "word": word,
+        #             "level": word_data.level,  # Add level info here
+        #             "translations": word_data.translations,
+        #             "examples": examples
+        #         }
+        #     }
+        # Check AI cache
+        # if word in ai_cache:
+        #     logger.info(f"Word found in AI cache: {word}")
+        #     elapsed = time.time() - start_time
+        #     logger.info(f"Cache hit completed in {elapsed:.2f}s")
+        #     return ai_cache[word]
+        # Fallback to AI translation
+        logger.info("Word not found in cache, calling AI API")
+        # Fallback to AI translation
+        logger.info("Word not found in map, falling back to AI translation")
+        try:
+            request = AskRequest(
+                prompt=f'''翻译以下英文
+            {word}
+            每行一个 格式参考,不要任何md格式,分别要有音标，单词属性(名词，动词，形容词),中文翻译，英文解析，例句，近义词，反义词，词性
+            格式参考:
+            hello:/həˈləʊ/| n. vt. int.|你好，问候语，|例句：Hello, how are you? 你好，你好吗？|近义词：hi, hey, |反义词:sick, bad.''',
+                model="GEMINI"
+            )
+            logger.debug(f"AI Request: {request}")
+            result = await forward_ask(request)
+             # Cache the result
+            #ai_cache[word] = result
+           #save_cache()
+            logger.debug(f"AI Response: {result}")
+            elapsed = time.time() - start_time
+            logger.info(f"AI translation completed in {elapsed:.2f}s")
+            return result
+        except Exception as e:
+            logger.error(f"AI translation error: {str(e)}", exc_info=True)
+            raise HTTPException(status_code=500, detail=str(e))
+    except Exception as e:
+        logger.error(f"Translation error: {str(e)}", exc_info=True)
+        raise HTTPException(status_code=500, detail=str(e))
+# Add cleanup functions
+def cleanup_temp_files():
+    try:
+        # Clean temp directory
+        temp_dir = os.path.join(tempfile.gettempdir(), "flash_api_cache")
+        if os.path.exists(temp_dir):
+            shutil.rmtree(temp_dir)
+            logger.info(f"Cleaned up temp directory: {temp_dir}")
+    except Exception as e:
+        logger.error(f"Error cleaning temp files: {e}")
+def cleanup_cache():
+    global ai_cache
+    ai_cache = {}
+    logger.info("Cache cleared")
+# Initialize word map on startup
+@app.on_event("startup")
+async def startup_event():
+    #init_word_map()// waste of memory
+    #load_cache()
+    cleanup_temp_files()
+    cleanup_cache()
+    logger.info(f"Memory usage after init: {get_memory_usage()}")
+@app.on_event("shutdown")
+async def shutdown_event():
+    # Cleanup on shutdown
+    cleanup_temp_files()
+    cleanup_cache()
+    logger.info("Application shutdown cleanup complete")
+def get_memory_usage():
+    process = psutil.Process()
+    memory_info = process.memory_info()
+    # Get system memory info
+    system = psutil.virtual_memory()
+    return {
+        "process": {
+            "rss": f"{memory_info.rss / 1024 / 1024:.2f} MB",
+            "rss_percent": f"{memory_info.rss / system.total * 100:.2f}%",
+            "vms": f"{memory_info.vms / 1024 / 1024:.2f} MB",
+            "vms_percent": f"{memory_info.vms / system.total * 100:.2f}%"
+        },
+        "system": {
+            "total": f"{system.total / 1024 / 1024:.2f} MB",
+            "available": f"{system.available / 1024 / 1024:.2f} MB",
+            "used_percent": f"{system.percent:.2f}%"
+        },
+        "word_map": {
+            "entries": len(word_map),
+            "memory": f"{sys.getsizeof(word_map) / 1024 / 1024:.2f} MB",
+            "memory_percent": f"{sys.getsizeof(word_map) / system.total * 100:.4f}%"
+        }
+    }
+@app.get("/memory")
+async def memory_status():
+    return get_memory_usage()
+# Add new endpoint
+@app.get("/proxy")
+async def proxy_request(url: str, request: Request):
+    try:
+        # Get random user agent
+        user_agent = random.choice(USER_AGENTS)
+        #print url
+        logger.info(f"Proxy request received for: {url}")
+        # Prepare headers
+        headers = {
+            'User-Agent': user_agent,
+            'Accept': 'application/json, text/plain, */*',
+            'Accept-Language': 'en-US,en;q=0.9',
+            'Origin': 'https://www.youtube.com',
+            'Referer': 'https://www.youtube.com/',
+            'Sec-Fetch-Dest': 'empty',
+            'Sec-Fetch-Mode': 'cors',
+            'Sec-Fetch-Site': 'same-site',
+            'Connection': 'keep-alive'
+        }
+        # Set timeout
+        timeout = aiohttp.ClientTimeout(total=10)  # 10 seconds timeout
+        async with aiohttp.ClientSession(timeout=timeout) as session:
+            async with session.get(url, headers=headers) as response:
+                # Check HTTP status
+                if response.status != 200:
+                    raise HTTPException(
+                        status_code=response.status,
+                        detail=f"HTTP error: {response.status}"
+                    )
+                # Parse JSON response
+                data = await response.json()
+                #print data's length
+                logger.info(f"Received youtube subtile data: {len(data)} bytes")
+                # Validate data format
+                if not data or 'events' not in data:
+                    raise HTTPException(
+                        status_code=400,
+                        detail="Invalid subtitle data format"
+                    )
+                return data
+    except TimeoutError:
+        raise HTTPException(status_code=408, detail="Request timeout")
+    except Exception as e:
+        logger.error(f"Proxy error: {str(e)}")
+        raise HTTPException(status_code=500, detail=str(e))
+if __name__ == "__main__":
+    uvicorn.run(app, host="0.0.0.0", port=7860)

requirements.txt ADDED Viewed

	@@ -0,0 +1,7 @@

+fastapi
+uvicorn
+requests
+python-multipart
+pydantic
+psutil
+aiohttp>=3.8.0