Spaces:

kader1997
/

AutoCaptionPro

Sleeping

App Files Files Community

kader1997 committed on Dec 21, 2025

Commit

4881671

verified ·

1 Parent(s): 051777c

Upload 3 files

Browse files

Files changed (3) hide show

main.py +115 -0
packages.txt +2 -0
requirements.txt +6 -0

main.py ADDED Viewed

	@@ -0,0 +1,115 @@

+import os
+import json
+import gradio as gr
+import pandas as pd  # أضفنا هذا السطر
+from faster_whisper import WhisperModel
+from moviepy import VideoFileClip, TextClip, CompositeVideoClip
+from arabic_reshaper import reshape
+from bidi.algorithm import get_display
+# --- Fixed settings ---
+JSON_DATA = "captions_data.json"  # NOTE(review): not referenced anywhere in the visible code
+# On Linux, use a font that is available on the system, or ship a font file with the project.
+FONT_PATH = "Arial" # Or leave it empty and ImageMagick will pick the default font. NOTE(review): the TextClip call below uses moviepy 2.x-style keywords, which reportedly render through Pillow and expect a font file path — confirm that "Arial" resolves on the deployment image.
+# Load the speech-to-text model (runs once, at import time).
+model = WhisperModel("small", device="cpu", compute_type="int8")
+def process_arabic_text(text):
+    """Return ``text`` shaped and reordered for display, with trailing padding.
+
+    The text is passed through ``arabic_reshaper.reshape`` and then through
+    ``bidi.algorithm.get_display``. A newline followed by a single space is
+    appended to the result (presumably so the rendered caption is not clipped
+    at the bottom -- confirm against the renderer).
+    """
+    return get_display(reshape(text)) + "\n "
+def step_1_extract_words(video_path):
+    """Transcribe a video and return its words with per-word timestamps.
+
+    Args:
+        video_path: Path of the uploaded video; falsy when nothing was uploaded.
+
+    Returns:
+        A ``(dataframe, status_message)`` pair. The dataframe has one row per
+        word (text, start, end -- times rounded to 2 decimals) and is ``None``
+        when no video was supplied.
+    """
+    if not video_path:
+        return None, "الرجاء رفع ملف فيديو أولاً."
+
+    print("جاري استخراج الكلمات...")
+    segment_stream, _info = model.transcribe(
+        video_path, word_timestamps=True, language="ar"
+    )
+
+    # One [text, start, end] row per recognised word, in transcript order.
+    rows = [
+        [token.word.strip(), round(token.start, 2), round(token.end, 2)]
+        for chunk in segment_stream
+        for token in chunk.words
+    ]
+
+    # A DataFrame is what the Gradio table component consumes.
+    column_names = ["الكلمة", "البداية (ثانية)", "النهاية (ثانية)"]
+    table_data = pd.DataFrame(rows, columns=column_names)
+    return table_data, "تم الاستخراج! عدل الكلمات في الجدول ثم اضغط 'إنتاج الفيديو'."
+def step_2_render_video(video_path, df_edited):
+    """Burn the (possibly user-edited) word captions into the video.
+
+    Args:
+        video_path: Path of the source video, handed to ``VideoFileClip``.
+        df_edited: DataFrame whose first three columns are the word text, its
+            start time and its end time (seconds).
+
+    Returns:
+        A ``(output_path, status_message)`` pair. ``output_path`` is ``None``
+        when the video or the table data is missing.
+    """
+    # Guard: nothing to render without both a video and caption rows.
+    if video_path is None or df_edited is None or df_edited.empty:
+        return None, "تأكد من وجود الفيديو والبيانات في الجدول."
+    output_path = "final_captioned_video.mp4"
+    video = VideoFileClip(video_path)
+    overlays = []
+    final_video = None
+    try:
+        w, h = int(video.w), int(video.h)
+        # Convert the DataFrame to a list of rows for processing.
+        words_list = df_edited.values.tolist()
+        print(f"جاري دمج {len(words_list)} كلمة...")
+        for row in words_list:
+            # The table is user-editable, so rows may be blank or half-filled;
+            # skip them instead of crashing or rendering the literal "nan".
+            if len(row) < 3 or any(pd.isna(cell) for cell in row[:3]):
+                continue
+            word_text = str(row[0])
+            if not word_text.strip():
+                continue
+            try:
+                start_t = float(row[1])
+                end_t = float(row[2])
+            except (TypeError, ValueError):
+                continue
+            clean_text = process_arabic_text(word_text)
+            # Text with no background box (transparent); the black stroke is
+            # what keeps it readable on top of the video.
+            txt_clip = TextClip(
+                text=clean_text,
+                font_size=85,  # slightly larger to make up for the missing background
+                color='yellow',
+                font=FONT_PATH,
+                stroke_color='black',
+                stroke_width=2,  # thicker outline for more contrast
+                method='caption',
+                size=(int(w * 0.8), None),  # leave enough horizontal room
+                text_align='center'
+            )
+            txt_clip = (txt_clip
+                        .with_start(start_t)
+                        .with_duration(max(0.1, end_t - start_t))  # always a positive duration
+                        .with_position(('center', int(h * 0.7))))
+            overlays.append(txt_clip)
+        final_video = CompositeVideoClip([video, *overlays], size=(w, h))
+        final_video.write_videofile(output_path, codec="libx264", audio_codec="aac", fps=video.fps, logger='bar')
+    finally:
+        # Release clip resources even when rendering fails; this function runs
+        # repeatedly inside a long-lived server process.
+        if final_video is not None:
+            final_video.close()
+        for clip in overlays:
+            clip.close()
+        video.close()
+    return output_path, "مبروك! تم إنتاج الفيديو بنجاح."
+# --- Build the user interface ---
+with gr.Blocks(title="Caption Pro") as app:
+    gr.Markdown("# 🎬 محرر الكابشن العربي الاحترافي")
+    with gr.Row():
+        video_in = gr.Video(label="فيديو المدخلات")  # source video uploaded by the user
+        video_out = gr.Video(label="الفيديو النهائي")  # rendered result
+    status = gr.Textbox(label="الحالة", interactive=False)  # read-only status line
+    # Editable table built with Gradio's Dataframe component
+    table = gr.Dataframe(
+        headers=["الكلمة", "البداية (ثانية)", "النهاية (ثانية)"],
+        datatype=["str", "number", "number"],
+        interactive=True
+    )
+    btn_extract = gr.Button("1. استخراج الكلمات", variant="primary")
+    btn_render = gr.Button("2. إنتاج الفيديو النهائي", variant="secondary")
+    btn_extract.click(step_1_extract_words, inputs=[video_in], outputs=[table, status])  # step 1 fills the table and the status box
+    btn_render.click(step_2_render_video, inputs=[video_in, table], outputs=[video_out, status])  # step 2 renders from the video plus the table contents
+if __name__ == "__main__":
+    app.launch()

packages.txt ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ imagemagick
2	+ ffmpeg

requirements.txt ADDED Viewed

	@@ -0,0 +1,6 @@

+faster-whisper
+moviepy
+arabic-reshaper
+python-bidi
+gradio
+pandas