q6 committed on
Commit
d7d9d98
·
1 Parent(s): d639071
Files changed (2) hide show
  1. API/app.py +5 -6
  2. Client/Extract Pixiv/ai_search.py +6 -4
API/app.py CHANGED
@@ -6,6 +6,8 @@ import time
6
  import os
7
  from pydantic import BaseModel
8
  from typing import List, Dict
 
 
9
 
10
  img_base = 'https://i.pximg.net/img-original/img/'
11
 
@@ -17,6 +19,7 @@ class PixifDownloadModel(BaseModel):
17
 
18
  env_path = os.path.dirname(os.path.realpath(__file__)) + "/../.env"
19
 
 
20
  PHPSESSID = os.getenv("PHPSESSID")
21
 
22
  cookies = {"PHPSESSID": PHPSESSID}
@@ -44,11 +47,10 @@ async def search(raw, pages, ai_only=True, real_only=True, cookies=None, headers
44
 
45
  post_ids = []
46
  tasks = []
47
- prev_first_id = None
48
 
49
  async with aiohttp.ClientSession(cookies=cookies, headers=headers) as session:
50
  for page in range(1, pages + 1):
51
- page_url = f"{url}&p={page}"
52
  task = fetch_page(session, page_url)
53
  tasks.append(task)
54
 
@@ -67,10 +69,6 @@ async def search(raw, pages, ai_only=True, real_only=True, cookies=None, headers
67
  posts = data['body']['illustManga']['data']
68
  if not posts:
69
  break
70
- current_first_id = posts[0]['id']
71
- if prev_first_id and current_first_id == prev_first_id:
72
- break
73
- prev_first_id = current_first_id
74
  post_ids.extend([post['id'] for post in posts])
75
 
76
  return post_ids, requests.utils.unquote(keywords, encoding='utf-8')
@@ -95,6 +93,7 @@ async def search_endpoint(
95
  pages: int = Query(1, description="Number of pages to fetch."),
96
  ai_only: bool = Query(True, description="Filter for AI-generated content.")
97
  ):
 
98
  try:
99
  post_ids, keywords = await search(raw, pages, ai_only, cookies=cookies, headers=headers)
100
  return {"post_ids": post_ids, "filename": base26_time() + "_" + keywords}
 
6
  import os
7
  from pydantic import BaseModel
8
  from typing import List, Dict
9
+ from dotenv import load_dotenv
10
+
11
 
12
  img_base = 'https://i.pximg.net/img-original/img/'
13
 
 
19
 
20
  env_path = os.path.dirname(os.path.realpath(__file__)) + "/../.env"
21
 
22
+ load_dotenv(env_path)
23
  PHPSESSID = os.getenv("PHPSESSID")
24
 
25
  cookies = {"PHPSESSID": PHPSESSID}
 
47
 
48
  post_ids = []
49
  tasks = []
 
50
 
51
  async with aiohttp.ClientSession(cookies=cookies, headers=headers) as session:
52
  for page in range(1, pages + 1):
53
+ page_url = f"{url.strip()}&p={page}"
54
  task = fetch_page(session, page_url)
55
  tasks.append(task)
56
 
 
69
  posts = data['body']['illustManga']['data']
70
  if not posts:
71
  break
 
 
 
 
72
  post_ids.extend([post['id'] for post in posts])
73
 
74
  return post_ids, requests.utils.unquote(keywords, encoding='utf-8')
 
93
  pages: int = Query(1, description="Number of pages to fetch."),
94
  ai_only: bool = Query(True, description="Filter for AI-generated content.")
95
  ):
96
+ print(raw, pages, ai_only, cookies, headers)
97
  try:
98
  post_ids, keywords = await search(raw, pages, ai_only, cookies=cookies, headers=headers)
99
  return {"post_ids": post_ids, "filename": base26_time() + "_" + keywords}
Client/Extract Pixiv/ai_search.py CHANGED
@@ -1,7 +1,7 @@
1
  import requests
2
  import os
3
 
4
- local = 0
5
  if local:
6
  endpoint = "http://127.0.0.1:7860"
7
  else:
@@ -11,7 +11,7 @@ os.chdir(os.path.dirname(os.path.abspath(__file__)))
11
 
12
  input_url = input("Enter the URL: ")
13
 
14
- pages = 300 // 60
15
 
16
  params = {
17
  'raw': input_url,
@@ -23,5 +23,7 @@ params = {
23
  response = requests.get(f'{endpoint}/search', params=params)
24
 
25
  data = response.json()
26
- with open(f"../{data['filename']}.txt", "w") as f:
27
- f.write("\n".join(data['post_ids']))
 
 
 
1
  import requests
2
  import os
3
 
4
+ local = 1
5
  if local:
6
  endpoint = "http://127.0.0.1:7860"
7
  else:
 
11
 
12
  input_url = input("Enter the URL: ")
13
 
14
+ pages = 3
15
 
16
  params = {
17
  'raw': input_url,
 
23
  response = requests.get(f'{endpoint}/search', params=params)
24
 
25
  data = response.json()
26
+ # with open(f"../{data['filename']}.txt", "w") as f:
27
+ # f.write("\n".join(data['post_ids']))
28
+
29
+ print(data)