Spaces:

kader1997
/

AutoCaptionPro

Sleeping

App Files Community

kader1997 committed on Dec 22, 2025

Commit

04fb6eb

verified ·

1 Parent(s): db158f3

Update app.py

Browse files

Files changed (1) hide show

app.py +36 -46

app.py CHANGED Viewed

@@ -16,38 +16,32 @@ def step_1_extract_words(video_path, progress=gr.Progress()):
     if not video_path:
         return None, "الرجاء رفع فيديو أولاً."
-    progress(0, desc="جاري تحميل النموذج...")
     segments, _ = model.transcribe(video_path, word_timestamps=True, language="ar")
     words_data = []
-    progress(0.5, desc="جاري تحليل الصوت واستخراج الكلمات...")
     for segment in segments:
         for word in segment.words:
             words_data.append([word.word.strip(), round(word.start, 2), round(word.end, 2)])
     df = pd.DataFrame(words_data, columns=["الكلمة", "البداية", "النهاية"])
-    return df, "تم الاستخراج بنجاح!"
 def step_2_render_video(video_path, df_edited, font_selection, text_color, font_size, progress=gr.Progress()):
     if video_path is None or df_edited is None or df_edited.empty:
         return None, "بيانات ناقصة."
-    # حل مشكلة الألوان: التأكد أن اللون بصيغة نصية واضحة
-    if text_color.startswith('rgba'):
-        # تحويل بسيط لضمان قبول اللون
-        final_color = "yellow"
-    else:
-        final_color = text_color
-    output_path = "final_clean_video.mp4"
     video = VideoFileClip(video_path)
     w, h = int(video.w), int(video.h)
     clips = [video]
     words_list = df_edited.values.tolist()
     chunk_size = 3
-    progress(0.1, desc="جاري إنتاج الفيديو...")
     for i in range(0, len(words_list), chunk_size):
         current_chunk = words_list[i : i + chunk_size]
@@ -58,63 +52,59 @@ def step_2_render_video(video_path, df_edited, font_selection, text_color, font_
         c_end = float(current_chunk[-1][2])
         duration = max(0.1, c_end - c_start)
-        txt_clip = TextClip(
             text=clean_sentence,
-            font_size=font_size,
-            color=final_color,
             stroke_color='black',
-            stroke_width=2,
             method='caption',
-            font=font_selection,
-            size=(int(w * 0.9), None),
             text_align='center'
         ).with_start(c_start).with_duration(duration).with_position(('center', int(h * 0.65)))
-        clips.append(txt_clip)
     final_video = CompositeVideoClip(clips, size=(w, h))
     final_video.write_videofile(
         output_path,
         codec="libx264",
         audio_codec="aac",
         fps=video.fps,
-        logger='bar'
     )
-    return output_path, "تم إنتاج الفيديو بنجاح!"
-# --- بناء الواجهة ---
-with gr.Blocks(title="Caption Pro Final") as app:
-    gr.Markdown("# 🎬 Caption Pro - Stable Version")
     with gr.Row():
-        video_in = gr.Video(label="فيديو المدخلات")
-        video_out = gr.Video(label="الفيديو الناتج")
     with gr.Row():
-        # استخدام القائمة المنسدلة للخطوط
-        font_dropdown = gr.Dropdown(
-            choices=["arialbd.ttf", "Cairo-Bold.ttf", "Almarai-Bold.ttf", "Tajawal-Bold.ttf"],
             value="arialbd.ttf",
-            label="اختر الخط (تأكد من وجود الملف)"
         )
-        # تحديد لون النص عبر الكلمات أو Hex لضمان الاستقرار
-        color_input = gr.ColorPicker(value="#FFFF00", label="اختر لون النص")
-        size_slider = gr.Slider(minimum=30, maximum=120, value=70, step=5, label="حجم الخط")
-    status = gr.Textbox(label="الحالة", interactive=False)
-    table = gr.Dataframe(headers=["الكلمة", "البداية", "النهاية"], datatype=["str", "number", "number"], interactive=True)
-    btn_ex = gr.Button("1. استخراج الكلمات", variant="primary")
-    btn_re = gr.Button("2. إنتاج الفيديو", variant="secondary")
-    btn_ex.click(step_1_extract_words, inputs=[video_in], outputs=[table, status])
-    btn_re.click(
-        step_2_render_video,
-        inputs=[video_in, table, font_dropdown, color_input, size_slider],
-        outputs=[video_out, status]
-    )
-if __name__ == "__main__":
-    app.launch()

     if not video_path:
         return None, "الرجاء رفع فيديو أولاً."
+    progress(0, desc="جاري استخراج الكلمات...")
     segments, _ = model.transcribe(video_path, word_timestamps=True, language="ar")
     words_data = []
     for segment in segments:
         for word in segment.words:
             words_data.append([word.word.strip(), round(word.start, 2), round(word.end, 2)])
     df = pd.DataFrame(words_data, columns=["الكلمة", "البداية", "النهاية"])
+    return df, "تم الاستخراج!"
 def step_2_render_video(video_path, df_edited, font_selection, text_color, font_size, progress=gr.Progress()):
     if video_path is None or df_edited is None or df_edited.empty:
         return None, "بيانات ناقصة."
+    # التأكد من مسار الخط: إذا لم يجد الملف المرفوع سيستخدم Arial الافتراضي
+    actual_font = font_selection if os.path.exists(font_selection) else "Arial-Bold"
+    output_path = "output_final.mp4"
     video = VideoFileClip(video_path)
     w, h = int(video.w), int(video.h)
     clips = [video]
     words_list = df_edited.values.tolist()
     chunk_size = 3
+    progress(0.1, desc="جاري معالجة النصوص بالإعدادات الجديدة...")
     for i in range(0, len(words_list), chunk_size):
         current_chunk = words_list[i : i + chunk_size]
         c_end = float(current_chunk[-1][2])
         duration = max(0.1, c_end - c_start)
+        # إنشاء الكليب مع التأكد من تمرير اللون والخط بشكل صريح
+        txt = TextClip(
             text=clean_sentence,
+            font_size=int(font_size),
+            color=text_color, # سيأخذ اللون من ColorPicker مباشرة
             stroke_color='black',
+            stroke_width=1.5,
+            font=actual_font,
             method='caption',
+            size=(int(w * 0.85), None),
             text_align='center'
         ).with_start(c_start).with_duration(duration).with_position(('center', int(h * 0.65)))
+        clips.append(txt)
     final_video = CompositeVideoClip(clips, size=(w, h))
+    # تحسين سرعة المعالجة وتقليل المشاكل
     final_video.write_videofile(
         output_path,
         codec="libx264",
         audio_codec="aac",
         fps=video.fps,
+        logger='bar',
+        threads=4 # استخدام تعدد الخيوط لتسريع العملية
     )
+    return output_path, f"تم الحفظ! اللون: {text_color}، الخط: {actual_font}"
+# --- الواجهة ---
+with gr.Blocks() as app:
+    gr.Markdown("### 🎬 Caption Pro: تخصيص كامل")
     with gr.Row():
+        v_in = gr.Video()
+        v_out = gr.Video()
     with gr.Row():
+        # تأكد من رفع هذه الملفات في Hugging Face (مثلاً Cairo-Bold.ttf)
+        font_opt = gr.Dropdown(
+            choices=["arialbd.ttf", "Cairo-Bold.ttf", "Almarai-Bold.ttf"],
             value="arialbd.ttf",
+            label="نوع الخط"
         )
+        color_opt = gr.ColorPicker(value="#FFFF00", label="لون النص")
+        size_opt = gr.Slider(30, 150, value=70, label="حجم الخط")
+    btn_1 = gr.Button("1. استخراج")
+    table = gr.Dataframe(headers=["الكلمة", "البداية", "النهاية"], interactive=True)
+    btn_2 = gr.Button("2. إنتاج الفيديو")
+    status = gr.Textbox(label="الحالة")
+    btn_1.click(step_1_extract_words, inputs=[v_in], outputs=[table, status])
+    btn_2.click(step_2_render_video, inputs=[v_in, table, font_opt, color_opt, size_opt], outputs=[v_out, status])
+app.launch()