Spaces:

GLAkavya
/

ADDENEATOR

Running

App Files Community

GLAkavya committed 9 days ago

Commit

7dfb42b

verified ·

1 Parent(s): 6595df8

Update app.py

Browse files

Files changed (1) hide show

app.py +28 -46

app.py CHANGED Viewed

@@ -12,63 +12,45 @@ from diffusers import StableVideoDiffusionPipeline
 from diffusers.utils import export_to_video
 # ── ENV SETUP ────────────────────────────────────────────────────────────────
-HF_TOKEN = (
-    os.environ.get("HF_TOKEN", "")
-    or os.environ.get("HF_KEY", "")
 ).strip()
-if HF_TOKEN:
-    login(token=HF_TOKEN)
-    print(f"✅ HF login OK — token starts: {HF_TOKEN[:8]}...")
 else:
-    print("⚠️  No HF token found.")
-# ── DEBUG: Print ALL env vars that contain KEY or TOKEN ──────────────────────
-print("\n=== ENV DEBUG (secrets check) ===")
-for k, v in os.environ.items():
-    if any(word in k.upper() for word in ["KEY", "TOKEN", "GEMINI", "API"]):
-        masked = v[:6] + "..." + v[-4:] if len(v) > 10 else "TOO_SHORT"
-        print(f"  {k} = {masked}  (len={len(v)})")
-print("=================================\n")
-# ── DEVICE SETUP ─────────────────────────────────────────────────────────────
 DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
 DTYPE  = torch.float16 if DEVICE == "cuda" else torch.float32
-print(f"🖥️  Using device: {DEVICE}")
-# ── LOAD SVD MODEL ONCE ──────────────────────────────────────────────────────
-print("⏳  Loading Stable Video Diffusion …")
 svd_pipe = StableVideoDiffusionPipeline.from_pretrained(
     "stabilityai/stable-video-diffusion-img2vid-xt",
     torch_dtype=DTYPE,
     variant="fp16" if DEVICE == "cuda" else None,
 )
 svd_pipe = svd_pipe.to(DEVICE)
-print("✅  SVD model ready.")
-# ── GEMINI HELPER ─────────────────────────────────────────────────────────────
 def call_gemini(pil_image: Image.Image, user_desc: str, language: str, style: str) -> dict:
-    # Try every possible env var name user might have used
-    api_key = (
-        os.environ.get("GEMINI_API_KEY", "")
-        or os.environ.get("GEMINI_KEY", "")
-        or os.environ.get("GOOGLE_API_KEY", "")
-        or os.environ.get("API_KEY", "")
-    ).strip()
-    print(f"[Gemini] Using key: {api_key[:6]}...{api_key[-4:]} (len={len(api_key)})")
-    if not api_key:
-        raise ValueError(
-            "No Gemini API key found! Tried: GEMINI_API_KEY, GEMINI_KEY, "
-            "GOOGLE_API_KEY, API_KEY. Please set one in Space Secrets."
-        )
-    if len(api_key) < 20:
-        raise ValueError(f"Key looks too short (len={len(api_key)}). Check for copy-paste errors.")
-    client = genai.Client(api_key=api_key)
     lang_map = {
         "English":  "Write everything in English.",
@@ -87,7 +69,7 @@ def call_gemini(pil_image: Image.Image, user_desc: str, language: str, style: st
 Language rule : {lang_map.get(language, lang_map['English'])}
 Style rule     : {style_map.get(style, style_map['Fun'])}
-CRITICAL: Return ONLY a raw JSON object. No markdown. No ```json. No explanation. Pure JSON only.
 {{
   "hook":         "attention-grabbing opening line (1-2 sentences)",
   "script":       "full 15-20 second voiceover script",
@@ -117,7 +99,7 @@ CRITICAL: Return ONLY a raw JSON object. No markdown. No ```json. No explanation
     return json.loads(raw)
-# ── VIDEO GENERATION ──────────────────────────────────────────────────────────
 def generate_video(pil_image: Image.Image) -> str:
     img = pil_image.convert("RGB").resize((1024, 576))
     frames = svd_pipe(
@@ -132,7 +114,7 @@ def generate_video(pil_image: Image.Image) -> str:
     return tmp.name
-# ── MAIN PIPELINE ─────────────────────────────────────────────────────────────
 def generate_ad(image, user_desc, language, style):
     if image is None:
         return None, "⚠️ Please upload a product image.", "", ""
@@ -156,7 +138,7 @@ def generate_ad(image, user_desc, language, style):
     return video_path, hook, script, cta
-# ── GRADIO UI ─────────────────────────────────────────────────────────────────
 css = """
 #title { text-align:center; font-size:2.2rem; font-weight:800; margin-bottom:.2rem; }
 #sub   { text-align:center; color:#888; margin-bottom:1.5rem; }
@@ -201,7 +183,7 @@ with gr.Blocks(css=css, theme=gr.themes.Soft(primary_hue="violet")) as demo:
     gr.Markdown(
         "---\n**How it works:** "
         "1️⃣ Gemini 2.5 Flash reads your image → hook, script, CTA. "
-        "2️⃣ Stable Video Diffusion → short cinematic video clip. "
         "3️⃣ Ready-to-post reel! 🎉"
     )

 from diffusers.utils import export_to_video
 # ── ENV SETUP ────────────────────────────────────────────────────────────────
+# genai.Client() auto-reads GOOGLE_API_KEY — so we map our secret to it
+gemini_key = (
+    os.environ.get("GEMINI_API_KEY", "")
+    or os.environ.get("GOOGLE_API_KEY", "")
 ).strip()
+if gemini_key:
+    os.environ["GOOGLE_API_KEY"] = gemini_key  # ensure Client() finds it
+    print(f"✅ Gemini key loaded: {gemini_key[:6]}...{gemini_key[-4:]} (len={len(gemini_key)})")
 else:
+    print("❌ No Gemini key found!")
+hf_token = (
+    os.environ.get("HF_TOKEN", "")
+    or os.environ.get("HF_KEY", "")
+).strip()
+if hf_token:
+    login(token=hf_token)
+    print("✅ HuggingFace login OK")
+# ── DEVICE ───────────────────────────────────────────────────────────────────
 DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
 DTYPE  = torch.float16 if DEVICE == "cuda" else torch.float32
+print(f"🖥️  Device: {DEVICE}")
+# ── LOAD SVD ONCE ─────────────────────────────────────────────────────────────
+print("⏳ Loading Stable Video Diffusion …")
 svd_pipe = StableVideoDiffusionPipeline.from_pretrained(
     "stabilityai/stable-video-diffusion-img2vid-xt",
     torch_dtype=DTYPE,
     variant="fp16" if DEVICE == "cuda" else None,
 )
 svd_pipe = svd_pipe.to(DEVICE)
+print("✅ SVD ready.")
+# ── GEMINI ────────────────────────────────────────────────────────────────────
 def call_gemini(pil_image: Image.Image, user_desc: str, language: str, style: str) -> dict:
+    # genai.Client() reads GOOGLE_API_KEY automatically — no manual key passing!
+    client = genai.Client()
     lang_map = {
         "English":  "Write everything in English.",
 Language rule : {lang_map.get(language, lang_map['English'])}
 Style rule     : {style_map.get(style, style_map['Fun'])}
+CRITICAL: Return ONLY raw JSON. No markdown. No ```json. No explanation. Pure JSON only.
 {{
   "hook":         "attention-grabbing opening line (1-2 sentences)",
   "script":       "full 15-20 second voiceover script",
     return json.loads(raw)
+# ── VIDEO ─────────────────────────────────────────────────────────────────────
 def generate_video(pil_image: Image.Image) -> str:
     img = pil_image.convert("RGB").resize((1024, 576))
     frames = svd_pipe(
     return tmp.name
+# ── PIPELINE ──────────────────────────────────────────────────────────────────
 def generate_ad(image, user_desc, language, style):
     if image is None:
         return None, "⚠️ Please upload a product image.", "", ""
     return video_path, hook, script, cta
+# ── UI ────────────────────────────────────────────────────────────────────────
 css = """
 #title { text-align:center; font-size:2.2rem; font-weight:800; margin-bottom:.2rem; }
 #sub   { text-align:center; color:#888; margin-bottom:1.5rem; }
     gr.Markdown(
         "---\n**How it works:** "
         "1️⃣ Gemini 2.5 Flash reads your image → hook, script, CTA. "
+        "2️⃣ Stable Video Diffusion → short cinematic clip. "
         "3️⃣ Ready-to-post reel! 🎉"
     )