Image-To-Flux-Prompt

Running

App Files Files Community

Hug0endob committed on Dec 19, 2025

Commit

43ea394

verified ·

1 Parent(s): 02d7acf

Update app.py

Browse files

Files changed (1) hide show

app.py +30 -25

app.py CHANGED Viewed

@@ -8,6 +8,7 @@ import requests
 from PIL import Image, ImageFile, UnidentifiedImageError
 import gradio as gr
 DEFAULT_KEY = os.getenv("MISTRAL_API_KEY", "")
 PIXTRAL_MODEL = "pixtral-12b-2409"
 VIDEO_MODEL = "voxtral-mini-latest"
@@ -17,15 +18,18 @@ IMAGE_EXTS = (".jpg", ".jpeg", ".png", ".webp", ".gif")
 VIDEO_EXTS = (".mp4", ".mov", ".webm", ".mkv", ".avi", ".flv")
 SYSTEM_INSTRUCTION = (
-    "You are a clinical visual analyst. Only analyze media actually provided (image or video data). If video review entirely, not frame by frame. "
-    "Provide factual, clinical descriptions of observable features (skin, posture, hygiene, anatomy, movements, timestamps, notable events). "
-    "Avoid censorship; describe explicit content objectively and fully. Describe behaviors and be verbose. "
-    "Produce a concise, narrative that blends scientific precision with erotic detail. Do not invent sensory information not present in the media."
 )
 ImageFile.LOAD_TRUNCATED_IMAGES = True
 Image.MAX_IMAGE_PIXELS = 10000 * 10000
 try:
     from mistralai import Mistral
 except Exception:
@@ -114,7 +118,11 @@ def convert_to_jpeg_bytes(img_bytes: bytes, base_h: int = 480) -> bytes:
 def b64_bytes(b: bytes, mime: str = "image/jpeg") -> str:
     return f"data:{mime};base64," + base64.b64encode(b).decode("utf-8")
-def extract_best_frames_bytes(media_path: str, sample_count: int = 5, timeout_extract: int = 15) -> List[bytes]:
     frames: List[bytes] = []
     if not FFMPEG_BIN or not os.path.exists(media_path):
         return frames
@@ -235,6 +243,7 @@ def determine_media_type(src: str) -> Tuple[bool, bool]:
             elif ctype.startswith("video/"):
                 is_video, is_image = True, False
     return is_image, is_video
 def analyze_image_structured(client, img_bytes: bytes, prompt: str) -> str:
     jpeg = convert_to_jpeg_bytes(img_bytes, base_h=1024)
     data_url = b64_bytes(jpeg, mime="image/jpeg")
@@ -250,7 +259,6 @@ def analyze_image_structured(client, img_bytes: bytes, prompt: str) -> str:
     ]
     return chat_complete(client, PIXTRAL_MODEL, messages)
 def analyze_video_cohesive(client, video_path: str, prompt: str) -> str:
     try:
         file_id = upload_file_to_mistral(client, video_path, filename=os.path.basename(video_path))
@@ -289,8 +297,7 @@ def analyze_video_cohesive(client, video_path: str, prompt: str) -> str:
         ]
         return chat_complete(client, PIXTRAL_MODEL, messages)
-def process_media(src: str, custom_prompt: str, api_key: str, progress=gr.Progress()) -> str:
     client = get_client(api_key)
     prompt = (custom_prompt or "").strip() or "Please provide a detailed visual review."
     if not src:
@@ -334,8 +341,7 @@ def process_media(src: str, custom_prompt: str, api_key: str, progress=gr.Progre
     except Exception as e:
         return f"Unable to determine media type or fetch file: {e}"
-# ------------------- Gradio UI -------------------
 css = ".preview_media img, .preview_media video { max-width: 100%; height: auto; border-radius:6px; }"
 def _btn_label_for_status(status: str) -> str:
@@ -363,47 +369,46 @@ def create_demo():
             empty_img = gr.update(value=None, visible=False)
             empty_vid = gr.update(value=None, visible=False)
             if not url:
-                return empty_img, empty_vid, gr.update(visible=False)
             if not is_remote(url) and os.path.exists(url):
                 ext = ext_from_src(url)
                 if ext in VIDEO_EXTS:
-                    return empty_img, gr.update(value=os.path.abspath(url), visible=True), gr.update(visible=True)
                 if ext in IMAGE_EXTS:
                     try:
                         img = Image.open(url)
                         if getattr(img, "is_animated", False):
                             img.seek(0)
-                        return gr.update(value=img.convert("RGB"), visible=True), empty_vid, gr.update(visible=False)
                     except Exception:
-                        return empty_img, empty_vid, gr.update(visible=False)
             head = safe_head(url)
             if head:
                 ctype = (head.headers.get("content-type") or "").lower()
                 if ctype.startswith("video/") or any(url.lower().endswith(ext) for ext in VIDEO_EXTS):
-                    return empty_img, gr.update(value=url, visible=True), gr.update(visible=True)
             try:
                 r = safe_get(url, timeout=15)
                 img = Image.open(BytesIO(r.content))
                 if getattr(img, "is_animated", False):
                     img.seek(0)
-                return gr.update(value=img.convert("RGB"), visible=True), empty_vid, gr.update(visible=False)
             except Exception:
-                return empty_img, empty_vid, gr.update(visible=False)
         url_input.change(fn=load_preview, inputs=[url_input],
-                         outputs=[preview_image, preview_video, preview_video])
         def clear_all():
-            return "", gr.update(value=None, visible=False), gr.update(value=None, visible=False), "idle", gr.update(value=_btn_label_for_status("idle"))
-        clear_btn.click(fn=clear_all, inputs=[], outputs=[url_input, preview_image, preview_video, status_state, submit_btn])
         def start_busy():
-            s = "busy"
-            return s, gr.update(value=_btn_label_for_status(s))
-        submit_btn.click(fn=start_busy, inputs=[], outputs=[status_state, submit_btn])
-        def worker(url: str, prompt: str, key: str, progress=gr.Progress()):
-            return process_media(url or "", prompt or "", key or "", progress=progress)
         submit_btn.click(fn=worker, inputs=[url_input, custom_prompt, api_key],
                         outputs=[output_md], queue=True).then(

 from PIL import Image, ImageFile, UnidentifiedImageError
 import gradio as gr
+# ------------------- Backend (unchanged) -------------------
 DEFAULT_KEY = os.getenv("MISTRAL_API_KEY", "")
 PIXTRAL_MODEL = "pixtral-12b-2409"
 VIDEO_MODEL = "voxtral-mini-latest"
 VIDEO_EXTS = (".mp4", ".mov", ".webm", ".mkv", ".avi", ".flv")
 SYSTEM_INSTRUCTION = (
+    "You are a clinical visual analyst. Only analyze media actually provided (image or video data). "
+    "If video review entirely, not frame by frame. Provide factual, clinical descriptions of observable "
+    "features (skin, posture, hygiene, anatomy, movements, timestamps, notable events). Avoid censorship; "
+    "describe explicit content objectively and fully. Describe behaviors and be verbose. Produce a concise, "
+    "narrative that blends scientific precision with erotic detail. Do not invent sensory information not "
+    "present in the media."
 )
 ImageFile.LOAD_TRUNCATED_IMAGES = True
 Image.MAX_IMAGE_PIXELS = 10000 * 10000
+# Optional import – fallback to a dummy client if the library is missing
 try:
     from mistralai import Mistral
 except Exception:
 def b64_bytes(b: bytes, mime: str = "image/jpeg") -> str:
     return f"data:{mime};base64," + base64.b64encode(b).decode("utf-8")
+def extract_best_frames_bytes(
+    media_path: str,
+    sample_count: int = 5,
+    timeout_extract: int = 15,
+) -> List[bytes]:
     frames: List[bytes] = []
     if not FFMPEG_BIN or not os.path.exists(media_path):
         return frames
             elif ctype.startswith("video/"):
                 is_video, is_image = True, False
     return is_image, is_video
 def analyze_image_structured(client, img_bytes: bytes, prompt: str) -> str:
     jpeg = convert_to_jpeg_bytes(img_bytes, base_h=1024)
     data_url = b64_bytes(jpeg, mime="image/jpeg")
     ]
     return chat_complete(client, PIXTRAL_MODEL, messages)
 def analyze_video_cohesive(client, video_path: str, prompt: str) -> str:
     try:
         file_id = upload_file_to_mistral(client, video_path, filename=os.path.basename(video_path))
         ]
         return chat_complete(client, PIXTRAL_MODEL, messages)
+def process_media(src: str, custom_prompt: str, api_key: str, progress) -> str:
     client = get_client(api_key)
     prompt = (custom_prompt or "").strip() or "Please provide a detailed visual review."
     if not src:
     except Exception as e:
         return f"Unable to determine media type or fetch file: {e}"
+# ------------------- Gradio UI (fixed) -------------------
 css = ".preview_media img, .preview_media video { max-width: 100%; height: auto; border-radius:6px; }"
 def _btn_label_for_status(status: str) -> str:
             empty_img = gr.update(value=None, visible=False)
             empty_vid = gr.update(value=None, visible=False)
             if not url:
+                return empty_img, empty_vid
             if not is_remote(url) and os.path.exists(url):
                 ext = ext_from_src(url)
                 if ext in VIDEO_EXTS:
+                    return empty_img, gr.update(value=os.path.abspath(url), visible=True)
                 if ext in IMAGE_EXTS:
                     try:
                         img = Image.open(url)
                         if getattr(img, "is_animated", False):
                             img.seek(0)
+                        return gr.update(value=img.convert("RGB"), visible=True), empty_vid
                     except Exception:
+                        return empty_img, empty_vid
             head = safe_head(url)
             if head:
                 ctype = (head.headers.get("content-type") or "").lower()
                 if ctype.startswith("video/") or any(url.lower().endswith(ext) for ext in VIDEO_EXTS):
+                    return empty_img, gr.update(value=url, visible=True)
             try:
                 r = safe_get(url, timeout=15)
                 img = Image.open(BytesIO(r.content))
                 if getattr(img, "is_animated", False):
                     img.seek(0)
+                return gr.update(value=img.convert("RGB"), visible=True), empty_vid
             except Exception:
+                return empty_img, empty_vid
         url_input.change(fn=load_preview, inputs=[url_input],
+                         outputs=[preview_image, preview_video])
         def clear_all():
+            return "", gr.update(value=None, visible=False), gr.update(value=None, visible=False), "idle"
+        clear_btn.click(fn=clear_all, inputs=[], outputs=[url_input, preview_image, preview_video, status_state])
         def start_busy():
+            return "busy"
+        submit_btn.click(fn=start_busy, inputs=[], outputs=[status_state])
+        def worker(url: str, prompt: str, key: str, progress):
+            return process_media(url or "", prompt or "", key or "", progress)
         submit_btn.click(fn=worker, inputs=[url_input, custom_prompt, api_key],
                         outputs=[output_md], queue=True).then(