Spaces:

MyanmarSwe
/

medium

Running

App Files Files Community

MyanmarSwe committed 2 days ago

Commit

c60549e

verified ·

1 Parent(s): 04fa3a5

Update main.py

Browse files

Files changed (1) hide show

main.py +40 -48

main.py CHANGED Viewed

@@ -31,7 +31,7 @@ CACHE_TTL = 1800
 client = httpx.AsyncClient(
     timeout=httpx.Timeout(60.0, read=None),
     follow_redirects=True,
-    limits=httpx.Limits(max_connections=200, max_keepalive_connections=50)
 )
 @app.get("/")
@@ -64,6 +64,28 @@ def get_clean_filename(url):
     name = decoded_url.split('/')[-1].split('?')[0]
     return name if (name and '.' in name) else "video.mp4"
 @app.get("/download")
 async def download_proxy(request: Request, url: str, key: str = None):
     if key != ACCESS_KEY:
@@ -76,56 +98,28 @@ async def download_proxy(request: Request, url: str, key: str = None):
     # --- MediaFire Section ---
     if "mediafire.com" in clean_url:
-        target_link = None
         cached = MEDIAFIRE_CACHE.get(clean_url)
-        if cached and (current_time - cached['time']) < CACHE_TTL:
-            target_link = cached['link']
         if not target_link:
-            try:
-                headers = {
-                    'User-Agent': ua.random,
-                    'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8',
-                    'Accept-Language': 'en-US,en;q=0.5',
-                    'Referer': 'https://www.mediafire.com/'
-                }
-                async with httpx.AsyncClient(headers=headers, follow_redirects=True, timeout=20.0) as temp_client:
-                    r = await temp_client.get(clean_url)
-                    if r.status_code == 200:
-                        # 1. Regex ရှာဖွေခြင်း (ပိုမိုကျယ်ပြန့်သော Pattern)
-                        match = re.search(r'https?://download[^\s"\']+mediafire\.com/[^\s"\']+', r.text)
-                        if match:
-                            target_link = match.group(0).strip()
-                        # 2. BeautifulSoup နဲ့ ထပ်မံရှာဖွေခြင်း
-                        if not target_link:
-                            soup = BeautifulSoup(r.text, 'html.parser')
-                            # Download link ရှာရန် ဖြစ်နိုင်သမျှ နည်းလမ်းအားလုံးသုံးခြင်း
-                            link_tags = soup.find_all('a', href=True)
-                            for tag in link_tags:
-                                href = tag['href']
-                                if 'download' in href and 'mediafire.com' in href:
-                                    target_link = href
-                                    break
-                            # aria-label ထဲတွင် ဝှက်ထားသော link ကိုရှာခြင်း
-                            if not target_link:
-                                download_btn = soup.find('a', {'aria-label': re.compile(r'Download', re.I)})
-                                if download_btn: target_link = download_btn.get('href')
-                        if target_link:
-                            # // နဲ့စရင် https: ထည့်ပေးခြင်း
-                            if target_link.startswith("//"): target_link = f"https:{target_link}"
-                            MEDIAFIRE_CACHE[clean_url] = {'link': target_link, 'time': current_time}
-            except Exception as e:
-                print(f"Scraper Error: {e}")
         if target_link:
-            return await stream_file(target_link, range_header, filename, referer=clean_url)
         else:
-            # 404 ပြန်ရခြင်းအကြောင်းရင်းမှာ Scraper က link ရှာမတွေ့လို့ပါ
-            raise HTTPException(status_code=404, detail="Direct link not found in MediaFire page.")
     # --- Google Drive Section ---
     elif "drive.google.com" in clean_url:
@@ -164,11 +158,9 @@ async def stream_file(target_url, range_header, filename, referer=None):
         req = client.build_request("GET", target_url, headers=headers)
         r = await client.send(req, stream=True)
-        # HTML ပြန်ကျလာရင် (Block ခံရရင်) Cache ရှင်းပြီး Error ပြန်ပေးရန်
         if "text/html" in r.headers.get("Content-Type", "").lower() and r.status_code == 200:
             await r.aclose()
-            for key, val in list(MEDIAFIRE_CACHE.items()):
-                if val['link'] == target_url: del MEDIAFIRE_CACHE[key]
             raise HTTPException(status_code=415, detail="MediaFire detection triggered.")
         return await process_response(r, filename)

 client = httpx.AsyncClient(
     timeout=httpx.Timeout(60.0, read=None),
     follow_redirects=True,
+    limits=httpx.Limits(max_connections=300, max_keepalive_connections=100)
 )
 @app.get("/")
     name = decoded_url.split('/')[-1].split('?')[0]
     return name if (name and '.' in name) else "video.mp4"
+async def scrape_mediafire(url):
+    """MediaFire Direct Link ကို ပိုမိုတိကျစွာ ရှာဖွေပေးခြင်း"""
+    try:
+        headers = {
+            'User-Agent': ua.random,
+            'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8',
+            'Referer': 'https://www.mediafire.com/'
+        }
+        async with httpx.AsyncClient(headers=headers, follow_redirects=True, timeout=20.0) as temp_client:
+            r = await temp_client.get(url)
+            if r.status_code == 200:
+                # Regex ရှာဖွေခြင်း
+                match = re.search(r'https?://download[^\s"\']+mediafire\.com/[^\s"\']+', r.text)
+                if match: return match.group(0).strip()
+                # BS4 နဲ့ ထပ်ရှာခြင်း
+                soup = BeautifulSoup(r.text, 'html.parser')
+                btn = soup.find('a', {'id': 'downloadButton'}) or soup.find('a', {'aria-label': re.compile(r'Download', re.I)})
+                if btn: return btn.get('href')
+    except: pass
+    return None
 @app.get("/download")
 async def download_proxy(request: Request, url: str, key: str = None):
     if key != ACCESS_KEY:
     # --- MediaFire Section ---
     if "mediafire.com" in clean_url:
         cached = MEDIAFIRE_CACHE.get(clean_url)
+        target_link = cached['link'] if (cached and (current_time - cached['time']) < CACHE_TTL) else None
         if not target_link:
+            target_link = await scrape_mediafire(clean_url)
+            if target_link:
+                if target_link.startswith("//"): target_link = f"https:{target_link}"
+                MEDIAFIRE_CACHE[clean_url] = {'link': target_link, 'time': current_time}
         if target_link:
+            # Retry Logic: Block ခံရရင် တစ်ကြိမ်ထပ်ကြိုးစားမည်
+            try:
+                return await stream_file(target_link, range_header, filename, referer=clean_url)
+            except HTTPException as e:
+                if e.status_code == 415: # HTML Blocked ဖြစ်ခဲ့ရင် Cache ဖျက်ပြီး အသစ်တခါပြန်ရှာ
+                    del MEDIAFIRE_CACHE[clean_url]
+                    new_link = await scrape_mediafire(clean_url)
+                    if new_link:
+                        return await stream_file(new_link, range_header, filename, referer=clean_url)
+                raise e
         else:
+            raise HTTPException(status_code=404, detail="Direct link failure")
     # --- Google Drive Section ---
     elif "drive.google.com" in clean_url:
         req = client.build_request("GET", target_url, headers=headers)
         r = await client.send(req, stream=True)
+        # HTML Blocked Detection
         if "text/html" in r.headers.get("Content-Type", "").lower() and r.status_code == 200:
             await r.aclose()
             raise HTTPException(status_code=415, detail="MediaFire detection triggered.")
         return await process_response(r, filename)