|
|
import streamlit as st |
|
|
import google.generativeai as genai |
|
|
from huggingface_hub import InferenceClient |
|
|
import requests |
|
|
from PIL import Image |
|
|
import io |
|
|
import json |
|
|
import time |
|
|
import zipfile |
|
|
import tempfile |
|
|
import os |
|
|
from gtts import gTTS |
|
|
|
|
|
|
|
|
st.set_page_config( |
|
|
page_title="AI Video Script & Storyboard Generator", |
|
|
page_icon="🎬", |
|
|
layout="wide" |
|
|
) |
|
|
|
|
|
if 'generated_script' not in st.session_state: |
|
|
st.session_state.generated_script = None |
|
|
if 'storyboard_images' not in st.session_state: |
|
|
st.session_state.storyboard_images = [] |
|
|
if 'gif_preview' not in st.session_state: |
|
|
st.session_state.gif_preview = None |
|
|
|
|
|
|
|
|
def load_api_keys(): |
|
|
"""Load API keys from secrets or environment""" |
|
|
try: |
|
|
gemini_api_key = st.secrets.get("GEMINI_API_KEY") or os.getenv("GEMINI_API_KEY") |
|
|
hf_token = st.secrets.get("HF_TOKEN") or os.getenv("HF_TOKEN") |
|
|
|
|
|
if not gemini_api_key or not hf_token: |
|
|
st.error("❌ API Keys not found. Please configure GEMINI_API_KEY and HF_TOKEN") |
|
|
st.stop() |
|
|
|
|
|
return gemini_api_key, hf_token |
|
|
except Exception as e: |
|
|
st.error(f"❌ Error loading API keys: {str(e)}") |
|
|
st.stop() |
|
|
|
|
|
|
|
|
gemini_api_key, hf_token = load_api_keys() |
|
|
|
|
|
|
|
|
genai.configure(api_key=gemini_api_key) |
|
|
|
|
|
|
|
|
client = InferenceClient(token=hf_token) |
|
|
|
|
|
|
|
|
st.title("🎬 AI Video Script & Storyboard Generator") |
|
|
st.markdown("Create professional video scripts and visual storyboards with AI assistance") |
|
|
|
|
|
|
|
|
st.header("📝 Video Specifications") |
|
|
|
|
|
col1, col2 = st.columns(2) |
|
|
|
|
|
with col1: |
|
|
video_topic = st.text_area( |
|
|
"Video Topic", |
|
|
placeholder="Enter your video topic or detailed description...", |
|
|
height=100 |
|
|
) |
|
|
|
|
|
video_length = st.selectbox( |
|
|
"Video Length", |
|
|
["30 seconds", "1 minute", "2 minutes", "3 minutes", "5 minutes", "Custom"] |
|
|
) |
|
|
|
|
|
if video_length == "Custom": |
|
|
custom_length = st.number_input("Custom length (seconds)", min_value=10, max_value=600, value=60) |
|
|
video_length = f"{custom_length} seconds" |
|
|
|
|
|
style = st.selectbox( |
|
|
"Video Style", |
|
|
["Explainer", "Cinematic", "Tutorial", "Vlog", "Animation", "Documentary", "Commercial"] |
|
|
) |
|
|
|
|
|
with col2: |
|
|
tone = st.selectbox( |
|
|
"Tone/Emotion", |
|
|
["Professional", "Funny", "Serious", "Dramatic", "Inspirational", "Casual", "Educational"] |
|
|
) |
|
|
|
|
|
platform = st.selectbox( |
|
|
"Target Platform", |
|
|
["YouTube", "TikTok", "Instagram Reels", "LinkedIn", "Presentation", "General"] |
|
|
) |
|
|
|
|
|
art_style = st.selectbox( |
|
|
"Storyboard Art Style", |
|
|
["Realistic", "Cartoon", "Cinematic", "Minimalistic", "Sketch", "Digital Art"] |
|
|
) |
|
|
|
|
|
|
|
|
def generate_script_with_gemini(topic, length, style, tone, platform): |
|
|
"""Generate video script using Gemini API""" |
|
|
try: |
|
|
model = genai.GenerativeModel('gemini-1.5-flash') |
|
|
|
|
|
prompt = f""" |
|
|
Create a detailed video script for the following specifications: |
|
|
|
|
|
Topic: {topic} |
|
|
Length: {length} |
|
|
Style: {style} |
|
|
Tone: {tone} |
|
|
Platform: {platform} |
|
|
|
|
|
Format the output as JSON with the following structure: |
|
|
{{ |
|
|
"title": "Video Title", |
|
|
"total_duration": "{length}", |
|
|
"scenes": [ |
|
|
{{ |
|
|
"scene_number": 1, |
|
|
"duration": "10 seconds", |
|
|
"description": "Visual description for storyboard", |
|
|
"dialogue": "Script/narration text", |
|
|
"camera_angle": "Wide shot/Close-up/etc", |
|
|
"visual_elements": "Key visual elements to include" |
|
|
}} |
|
|
] |
|
|
}} |
|
|
|
|
|
Make sure the scenes add up to the total duration and are engaging for {platform}. |
|
|
Include specific visual descriptions that can be used to generate storyboard images. |
|
|
Return only valid JSON, no additional text. |
|
|
""" |
|
|
|
|
|
response = model.generate_content(prompt) |
|
|
response_text = response.text.strip() |
|
|
|
|
|
|
|
|
if response_text.startswith("```json"): |
|
|
response_text = response_text[7:-3] |
|
|
elif response_text.startswith("```"): |
|
|
response_text = response_text[3:-3] |
|
|
|
|
|
script_data = json.loads(response_text) |
|
|
return script_data |
|
|
|
|
|
except Exception as e: |
|
|
st.error(f"Error generating script: {str(e)}") |
|
|
return generate_fallback_script(topic, length, style, tone, platform) |
|
|
|
|
|
def generate_fallback_script(topic, length, style, tone, platform): |
|
|
"""Generate a simple fallback script""" |
|
|
try: |
|
|
|
|
|
if "second" in length.lower(): |
|
|
total_seconds = int(length.split()[0]) |
|
|
elif "minute" in length.lower(): |
|
|
minutes = int(length.split()[0]) |
|
|
total_seconds = minutes * 60 |
|
|
else: |
|
|
total_seconds = 60 |
|
|
|
|
|
|
|
|
num_scenes = max(3, min(8, total_seconds // 10)) |
|
|
scene_duration = total_seconds // num_scenes |
|
|
|
|
|
scenes = [] |
|
|
scene_types = ["opening", "main content", "detail", "conclusion"] |
|
|
|
|
|
for i in range(num_scenes): |
|
|
scene_type = scene_types[min(i, len(scene_types)-1)] |
|
|
scene = { |
|
|
"scene_number": i + 1, |
|
|
"duration": f"{scene_duration} seconds", |
|
|
"description": f"A {style.lower()} {scene_type} scene about {topic}, showing professional visuals in {art_style.lower()} style", |
|
|
"dialogue": f"Engaging {tone.lower()} narration about {topic} for scene {i+1}", |
|
|
"camera_angle": ["Wide shot", "Medium shot", "Close-up", "Over shoulder"][i % 4], |
|
|
"visual_elements": f"Professional visuals related to {topic}, {style.lower()} cinematography" |
|
|
} |
|
|
scenes.append(scene) |
|
|
|
|
|
return { |
|
|
"title": f"{topic} - {style} Video", |
|
|
"total_duration": length, |
|
|
"scenes": scenes |
|
|
} |
|
|
except Exception as e: |
|
|
st.error(f"Error creating fallback script: {str(e)}") |
|
|
return None |
|
|
|
|
|
def generate_storyboard_image_stable(scene_description, art_style, max_retries=3): |
|
|
"""Generate storyboard image with better error handling""" |
|
|
|
|
|
style_prompts = { |
|
|
"Realistic": "photorealistic, professional, high quality, detailed", |
|
|
"Cartoon": "cartoon style, animated, colorful, illustration, Disney-like", |
|
|
"Cinematic": "cinematic, dramatic lighting, film still, movie scene", |
|
|
"Minimalistic": "minimalist, clean, simple, modern design", |
|
|
"Sketch": "pencil sketch, hand-drawn, artistic, line art", |
|
|
"Digital Art": "digital art, concept art, vibrant colors, detailed" |
|
|
} |
|
|
|
|
|
|
|
|
base_prompt = f"{scene_description}" |
|
|
style_enhancement = style_prompts.get(art_style, "professional, high quality") |
|
|
enhanced_prompt = f"{base_prompt}, {style_enhancement}, storyboard frame" |
|
|
|
|
|
|
|
|
approaches = [ |
|
|
enhanced_prompt, |
|
|
f"storyboard illustration: {base_prompt}, {style_enhancement}", |
|
|
f"{base_prompt}, simple illustration, clean design" |
|
|
] |
|
|
|
|
|
for attempt, prompt in enumerate(approaches): |
|
|
try: |
|
|
|
|
|
image = client.text_to_image( |
|
|
prompt, |
|
|
model="runwayml/stable-diffusion-v1-5" |
|
|
) |
|
|
|
|
|
if image and hasattr(image, 'size'): |
|
|
return image |
|
|
else: |
|
|
raise Exception("Invalid image returned") |
|
|
|
|
|
except Exception as e: |
|
|
if attempt < len(approaches) - 1: |
|
|
time.sleep(2) |
|
|
continue |
|
|
else: |
|
|
|
|
|
return create_placeholder_image(f"Scene: {scene_description[:50]}...") |
|
|
|
|
|
return None |
|
|
|
|
|
def create_placeholder_image(text): |
|
|
"""Create a placeholder image with text""" |
|
|
try: |
|
|
from PIL import Image, ImageDraw, ImageFont |
|
|
|
|
|
|
|
|
img = Image.new('RGB', (512, 384), color=(200, 200, 200)) |
|
|
draw = ImageDraw.Draw(img) |
|
|
|
|
|
|
|
|
try: |
|
|
font = ImageFont.load_default() |
|
|
except: |
|
|
font = None |
|
|
|
|
|
|
|
|
text_lines = text.split(' ') |
|
|
line_height = 30 |
|
|
y_pos = 150 |
|
|
|
|
|
for i in range(0, len(text_lines), 4): |
|
|
line = ' '.join(text_lines[i:i+4]) |
|
|
draw.text((50, y_pos), line, fill=(50, 50, 50), font=font) |
|
|
y_pos += line_height |
|
|
if y_pos > 300: |
|
|
break |
|
|
|
|
|
return img |
|
|
except Exception: |
|
|
return None |
|
|
|
|
|
def create_gif_preview(images, script_data): |
|
|
"""Create a GIF preview""" |
|
|
try: |
|
|
|
|
|
valid_images = [img for img in images if img is not None] |
|
|
if not valid_images: |
|
|
return None |
|
|
|
|
|
|
|
|
target_size = (400, 300) |
|
|
resized_images = [] |
|
|
|
|
|
for image in valid_images: |
|
|
try: |
|
|
resized_img = image.resize(target_size, Image.Resampling.LANCZOS) |
|
|
resized_images.append(resized_img) |
|
|
except Exception: |
|
|
continue |
|
|
|
|
|
if not resized_images: |
|
|
return None |
|
|
|
|
|
|
|
|
gif_buffer = io.BytesIO() |
|
|
resized_images[0].save( |
|
|
gif_buffer, |
|
|
format='GIF', |
|
|
save_all=True, |
|
|
append_images=resized_images[1:] if len(resized_images) > 1 else [], |
|
|
duration=2500, |
|
|
loop=0 |
|
|
) |
|
|
gif_buffer.seek(0) |
|
|
return gif_buffer |
|
|
|
|
|
except Exception as e: |
|
|
st.error(f"Error creating GIF: {str(e)}") |
|
|
return None |
|
|
|
|
|
def text_to_speech(text, language='en'): |
|
|
"""Convert text to speech using gTTS""" |
|
|
try: |
|
|
|
|
|
if len(text) > 500: |
|
|
text = text[:500] + "..." |
|
|
|
|
|
tts = gTTS(text=text, lang=language, slow=False) |
|
|
audio_buffer = io.BytesIO() |
|
|
tts.write_to_fp(audio_buffer) |
|
|
audio_buffer.seek(0) |
|
|
return audio_buffer |
|
|
except Exception as e: |
|
|
st.error(f"Error generating speech: {str(e)}") |
|
|
return None |
|
|
|
|
|
def create_download_zip(images, script_data): |
|
|
"""Create a ZIP file with all content""" |
|
|
try: |
|
|
zip_buffer = io.BytesIO() |
|
|
|
|
|
with zipfile.ZipFile(zip_buffer, 'w', zipfile.ZIP_DEFLATED) as zip_file: |
|
|
|
|
|
script_json = json.dumps(script_data, indent=2) |
|
|
zip_file.writestr("script.json", script_json) |
|
|
|
|
|
|
|
|
script_text = f"Title: {script_data.get('title', '')}\n" |
|
|
script_text += f"Duration: {script_data.get('total_duration', '')}\n\n" |
|
|
|
|
|
for i, scene in enumerate(script_data.get('scenes', []), 1): |
|
|
script_text += f"=== SCENE {i} ===\n" |
|
|
script_text += f"Duration: {scene.get('duration', '')}\n" |
|
|
script_text += f"Camera: {scene.get('camera_angle', '')}\n" |
|
|
script_text += f"Description: {scene.get('description', '')}\n" |
|
|
script_text += f"Dialogue: {scene.get('dialogue', '')}\n" |
|
|
script_text += f"Visual Elements: {scene.get('visual_elements', '')}\n\n" |
|
|
|
|
|
zip_file.writestr("script.txt", script_text) |
|
|
|
|
|
|
|
|
for i, image in enumerate(images): |
|
|
if image: |
|
|
img_buffer = io.BytesIO() |
|
|
try: |
|
|
image.save(img_buffer, format='PNG') |
|
|
zip_file.writestr(f"scene_{i+1:02d}.png", img_buffer.getvalue()) |
|
|
except Exception: |
|
|
continue |
|
|
|
|
|
zip_buffer.seek(0) |
|
|
return zip_buffer |
|
|
except Exception as e: |
|
|
st.error(f"Error creating ZIP file: {str(e)}") |
|
|
return None |
|
|
|
|
|
|
|
|
if st.button("🚀 Generate Video Script & Storyboard", type="primary"): |
|
|
if not video_topic.strip(): |
|
|
st.error("Please enter a video topic") |
|
|
else: |
|
|
|
|
|
with st.spinner("🤖 Generating script with AI..."): |
|
|
script_data = generate_script_with_gemini(video_topic, video_length, style, tone, platform) |
|
|
|
|
|
if script_data: |
|
|
st.session_state.generated_script = script_data |
|
|
st.success("✅ Script generated successfully!") |
|
|
|
|
|
|
|
|
st.info("🎨 Generating storyboard images (this may take a few minutes)...") |
|
|
images = [] |
|
|
|
|
|
|
|
|
progress_container = st.container() |
|
|
with progress_container: |
|
|
progress_bar = st.progress(0) |
|
|
status_text = st.empty() |
|
|
|
|
|
total_scenes = len(script_data['scenes']) |
|
|
|
|
|
for i, scene in enumerate(script_data['scenes']): |
|
|
status_text.text(f"Generating image {i+1}/{total_scenes}: Scene {i+1}") |
|
|
|
|
|
try: |
|
|
image = generate_storyboard_image_stable( |
|
|
scene['description'], |
|
|
art_style |
|
|
) |
|
|
images.append(image) |
|
|
|
|
|
if image: |
|
|
st.success(f"✅ Scene {i+1} generated successfully") |
|
|
else: |
|
|
st.warning(f"⚠️ Scene {i+1} failed, using placeholder") |
|
|
|
|
|
except Exception as e: |
|
|
st.error(f"❌ Error generating scene {i+1}: {str(e)}") |
|
|
images.append(None) |
|
|
|
|
|
progress_bar.progress((i + 1) / total_scenes) |
|
|
|
|
|
|
|
|
if i < total_scenes - 1: |
|
|
time.sleep(3) |
|
|
|
|
|
status_text.text("✅ Storyboard generation complete!") |
|
|
|
|
|
st.session_state.storyboard_images = images |
|
|
st.success(f"✅ Generated {len([img for img in images if img is not None])} out of {len(images)} storyboard images!") |
|
|
|
|
|
else: |
|
|
st.error("Failed to generate script. Please try again.") |
|
|
|
|
|
|
|
|
if st.session_state.generated_script: |
|
|
script_data = st.session_state.generated_script |
|
|
|
|
|
st.header("📜 Generated Script") |
|
|
st.subheader(f"🎬 {script_data.get('title', 'Video Title')}") |
|
|
st.write(f"**Duration:** {script_data.get('total_duration', 'N/A')}") |
|
|
|
|
|
|
|
|
tab1, tab2, tab3 = st.tabs(["📝 Script Details", "🖼️ Storyboard", "📥 Export"]) |
|
|
|
|
|
with tab1: |
|
|
for i, scene in enumerate(script_data.get('scenes', []), 1): |
|
|
with st.expander(f"Scene {i} - {scene.get('duration', 'N/A')}", expanded=False): |
|
|
col1, col2 = st.columns(2) |
|
|
|
|
|
with col1: |
|
|
st.write("**Visual Description:**") |
|
|
st.write(scene.get('description', 'N/A')) |
|
|
st.write("**Camera Angle:**") |
|
|
st.write(scene.get('camera_angle', 'N/A')) |
|
|
|
|
|
with col2: |
|
|
st.write("**Dialogue/Narration:**") |
|
|
st.write(scene.get('dialogue', 'N/A')) |
|
|
st.write("**Visual Elements:**") |
|
|
st.write(scene.get('visual_elements', 'N/A')) |
|
|
|
|
|
|
|
|
dialogue = scene.get('dialogue', '') |
|
|
if dialogue and st.button(f"🔊 Play Audio - Scene {i}", key=f"audio_{i}"): |
|
|
with st.spinner("Generating audio..."): |
|
|
audio_buffer = text_to_speech(dialogue) |
|
|
if audio_buffer: |
|
|
st.audio(audio_buffer.getvalue(), format='audio/mp3') |
|
|
|
|
|
with tab2: |
|
|
if st.session_state.storyboard_images: |
|
|
st.subheader("🎨 Storyboard Images") |
|
|
|
|
|
|
|
|
cols_per_row = 2 |
|
|
for i in range(0, len(st.session_state.storyboard_images), cols_per_row): |
|
|
cols = st.columns(cols_per_row) |
|
|
|
|
|
for j, col in enumerate(cols): |
|
|
idx = i + j |
|
|
if idx < len(st.session_state.storyboard_images): |
|
|
image = st.session_state.storyboard_images[idx] |
|
|
scene = script_data['scenes'][idx] if idx < len(script_data['scenes']) else {} |
|
|
|
|
|
with col: |
|
|
if image: |
|
|
st.image(image, caption=f"Scene {idx+1}", use_container_width=True) |
|
|
else: |
|
|
st.write(f"❌ Scene {idx+1} - Image failed to generate") |
|
|
|
|
|
st.write(f"**Duration:** {scene.get('duration', 'N/A')}") |
|
|
st.write(f"**Description:** {scene.get('description', 'N/A')[:100]}...") |
|
|
|
|
|
|
|
|
st.subheader("📱 Animated Preview") |
|
|
col1, col2 = st.columns([1, 2]) |
|
|
|
|
|
with col1: |
|
|
if st.button("🎬 Create GIF Preview"): |
|
|
with st.spinner("Creating animated preview..."): |
|
|
gif_buffer = create_gif_preview( |
|
|
st.session_state.storyboard_images, |
|
|
script_data |
|
|
) |
|
|
if gif_buffer: |
|
|
st.session_state.gif_preview = gif_buffer |
|
|
st.success("GIF preview created!") |
|
|
else: |
|
|
st.error("Failed to create GIF preview") |
|
|
|
|
|
with col2: |
|
|
if st.session_state.gif_preview: |
|
|
st.image(st.session_state.gif_preview.getvalue(), caption="Storyboard Preview") |
|
|
else: |
|
|
st.info("Generate storyboard images first using the button above.") |
|
|
|
|
|
with tab3: |
|
|
st.subheader("📥 Download Options") |
|
|
|
|
|
col1, col2, col3 = st.columns(3) |
|
|
|
|
|
with col1: |
|
|
|
|
|
script_json = json.dumps(script_data, indent=2) |
|
|
st.download_button( |
|
|
label="📄 Download Script (JSON)", |
|
|
data=script_json, |
|
|
file_name=f"script_{int(time.time())}.json", |
|
|
mime="application/json" |
|
|
) |
|
|
|
|
|
with col2: |
|
|
|
|
|
if st.session_state.storyboard_images: |
|
|
zip_data = create_download_zip(st.session_state.storyboard_images, script_data) |
|
|
if zip_data: |
|
|
st.download_button( |
|
|
label="📦 Download Complete Package", |
|
|
data=zip_data.getvalue(), |
|
|
file_name=f"storyboard_package_{int(time.time())}.zip", |
|
|
mime="application/zip" |
|
|
) |
|
|
|
|
|
with col3: |
|
|
|
|
|
if st.session_state.gif_preview: |
|
|
st.download_button( |
|
|
label="🎬 Download GIF Preview", |
|
|
data=st.session_state.gif_preview.getvalue(), |
|
|
file_name=f"storyboard_preview_{int(time.time())}.gif", |
|
|
mime="image/gif" |
|
|
) |
|
|
|
|
|
|
|
|
with st.sidebar: |
|
|
st.markdown("### 📚 How to Use") |
|
|
st.markdown(""" |
|
|
1. **Enter Details**: Describe your video topic and preferences |
|
|
2. **Generate**: Click the generate button and wait |
|
|
3. **Review**: Check the script and storyboard images |
|
|
4. **Export**: Download your files |
|
|
""") |
|
|
|
|
|
st.markdown("### 🔧 Features") |
|
|
st.markdown(""" |
|
|
- ✅ AI-powered script generation |
|
|
- ✅ Visual storyboard creation |
|
|
- ✅ Text-to-speech narration |
|
|
- ✅ GIF preview generation |
|
|
- ✅ Complete package download |
|
|
""") |
|
|
|
|
|
st.markdown("### 🐛 Debug Info") |
|
|
if st.button("🧪 Test Image Generation"): |
|
|
with st.spinner("Testing image generation..."): |
|
|
test_image = generate_storyboard_image_stable( |
|
|
"A simple test scene with a person", |
|
|
"Cartoon" |
|
|
) |
|
|
if test_image: |
|
|
st.image(test_image, caption="Test Image", width=200) |
|
|
st.success("✅ Image generation working!") |
|
|
else: |
|
|
st.error("❌ Image generation failed!") |
|
|
|
|
|
st.markdown("### ⚙️ Settings") |
|
|
st.markdown(""" |
|
|
**Required API Keys:** |
|
|
- GEMINI_API_KEY |
|
|
- HF_TOKEN (Hugging Face) |
|
|
|
|
|
**Models Used:** |
|
|
- Script: Gemini 1.5 Flash |
|
|
- Images: Stable Diffusion v1.5 |
|
|
- Speech: Google TTS |
|
|
""") |
|
|
|
|
|
|
|
|
st.markdown("---") |
|
|
st.markdown("🤖 **Powered by**: Gemini AI • Hugging Face • Google TTS") |
|
|
st.markdown("💡 **Tips**: Be specific in your descriptions for better results!") |