Spaces:

kader1997
/

AutoCaptionPro

Sleeping

App Files Files Community

kader1997 committed on Dec 23, 2025

Commit

7d91661

verified ·

1 Parent(s): 3d500a1

Update app.py

Browse files

Files changed (1) hide show

app.py +18 -19

app.py CHANGED Viewed

@@ -8,13 +8,16 @@ from moviepy import VideoFileClip, TextClip, CompositeVideoClip
 from arabic_reshaper import reshape
 # --- الإعدادات ---
-# استخدمنا cpu و int8 لضمان العمل على أغلب الأجهزة، يمكن تغييره لـ cuda إذا توفر GPU
 model = WhisperModel("large-v3", device="cpu", compute_type="int8")
 def process_arabic_text(text):
     if not text: return ""
-    # معالجة النصوص العربية لتعرض بشكل صحيح (من اليمين لليسار وبدون حروف مقطعة)
-    return reshape(text)
 def clean_color(color_str):
     if color_str.startswith('rgba'):
@@ -26,8 +29,6 @@ def clean_color(color_str):
 def step_1_extract_words(video_path, progress=gr.Progress()):
     if not video_path: return None, "الرجاء رفع فيديو."
-    # تفعيل word_timestamps=True هو السر لاستخراج توقيت كل كلمة
     segments, _ = model.transcribe(video_path, word_timestamps=True, language="ar")
     words_data = []
@@ -35,7 +36,7 @@ def step_1_extract_words(video_path, progress=gr.Progress()):
         for word in segment.words:
             words_data.append([word.word.strip(), round(word.start, 2), round(word.end, 2)])
-    return pd.DataFrame(words_data, columns=["الكلمة", "البداية", "النهاية"]), "تم استخراج الكلمات بدقة!"
 def step_2_render_video(video_path, df_edited, font_selection, text_color, font_size, progress=gr.Progress()):
     if video_path is None or df_edited is None: return None, "بيانات ناقصة."
@@ -43,14 +44,13 @@ def step_2_render_video(video_path, df_edited, font_selection, text_color, font_
     safe_color = clean_color(text_color)
     actual_font = font_selection if os.path.exists(font_selection) else "DejaVu-Sans-Bold"
-    output_path = "final_word_by_word.mp4"
     video = VideoFileClip(video_path)
     w, h = video.size
     clips = [video]
     words_list = df_edited.values.tolist()
-    # تحويل كل صف في الجدول (كلمة) إلى Clip مستقل يظهر في وقته
     for row in words_list:
         word_text = str(row[0])
         t_start = float(row[1])
@@ -58,38 +58,37 @@ def step_2_render_video(video_path, df_edited, font_selection, text_color, font_
         if not word_text.strip(): continue
         clean_word = process_arabic_text(word_text)
-        # إنشاء كليب للكلمة الواحدة
         txt = TextClip(
             text=clean_word,
             font_size=int(font_size),
             color=safe_color,
             stroke_color='black',
-            stroke_width=2,
             font=actual_font,
-            method='label', # 'label' أفضل للكلمات المنفردة للحفاظ على جودتها
-        ).with_start(t_start).with_duration(max(0.1, t_end - t_start)).with_position(('center', int(h * 0.5))) # وضعها في منتصف الشاشة تقريباً
         clips.append(txt)
-    # دمج كل الكلمات فوق الفيديو الأصلي
     final = CompositeVideoClip(clips, size=(w, h))
     final.write_videofile(output_path, codec="libx264", audio_codec="aac", fps=video.fps, logger='bar')
-    return output_path, "تم إنتاج الفيديو بنظام كلمة بكلمة!"
 # --- الواجهة ---
 with gr.Blocks() as app:
-    gr.Markdown("## 🎬 Word-by-Word Captioner (Like Pro Apps)")
     with gr.Row():
         v_in = gr.Video(); v_out = gr.Video()
     with gr.Row():
         font_opt = gr.Dropdown(choices=["arialbd.ttf"], value="arialbd.ttf", label="الخط")
-        color_opt = gr.ColorPicker(value="#00FF00", label="لون الكلمة (مثلاً أخضر)")
-        size_opt = gr.Slider(50, 250, value=120, label="حجم الكلمة")
-    btn_1 = gr.Button("1. تحليل الكلمات المنطوقة"); table = gr.Dataframe(interactive=True)
-    btn_2 = gr.Button("2. إنشاء الفيديو النهائي"); status = gr.Textbox()
     btn_1.click(step_1_extract_words, [v_in], [table, status])
     btn_2.click(step_2_render_video, [v_in, table, font_opt, color_opt, size_opt], [v_out, status])

 from arabic_reshaper import reshape
 # --- الإعدادات ---
 model = WhisperModel("large-v3", device="cpu", compute_type="int8")
 def process_arabic_text(text):
     if not text: return ""
+    # 1. إضافة الشكل الجمالي (النقاط)
+    decorated_text = f"• {text} •"
+    # 2. إعادة تشكيل الحروف العربية لتظهر متصلة وصحيحة
+    reshaped = reshape(decorated_text)
+    # 3. إضافة سطر فارغ في الأسفل لمنع قص النقاط السفلية (مثل الياء والباء)
+    return reshaped + "\n "
 def clean_color(color_str):
     if color_str.startswith('rgba'):
 def step_1_extract_words(video_path, progress=gr.Progress()):
     if not video_path: return None, "الرجاء رفع فيديو."
     segments, _ = model.transcribe(video_path, word_timestamps=True, language="ar")
     words_data = []
         for word in segment.words:
             words_data.append([word.word.strip(), round(word.start, 2), round(word.end, 2)])
+    return pd.DataFrame(words_data, columns=["الكلمة", "البداية", "النهاية"]), "تم استخراج الكلمات!"
 def step_2_render_video(video_path, df_edited, font_selection, text_color, font_size, progress=gr.Progress()):
     if video_path is None or df_edited is None: return None, "بيانات ناقصة."
     safe_color = clean_color(text_color)
     actual_font = font_selection if os.path.exists(font_selection) else "DejaVu-Sans-Bold"
+    output_path = "final_fixed_dots_video.mp4"
     video = VideoFileClip(video_path)
     w, h = video.size
     clips = [video]
     words_list = df_edited.values.tolist()
     for row in words_list:
         word_text = str(row[0])
         t_start = float(row[1])
         if not word_text.strip(): continue
+        # النص هنا يحتوي الآن على السطر الفارغ الإضافي
         clean_word = process_arabic_text(word_text)
         txt = TextClip(
             text=clean_word,
             font_size=int(font_size),
             color=safe_color,
             stroke_color='black',
+            stroke_width=2.5,
             font=actual_font,
+            method='label' # 'label' تحافظ على حجم الكلمة وتتأثر بالسطر الجديد المضاف
+        ).with_start(t_start).with_duration(max(0.1, t_end - t_start)).with_position(('center', int(h * 0.5)))
         clips.append(txt)
     final = CompositeVideoClip(clips, size=(w, h))
     final.write_videofile(output_path, codec="libx264", audio_codec="aac", fps=video.fps, logger='bar')
+    return output_path, "تم الحفظ بنجاح مع ضمان ظهور النقاط السفلية!"
 # --- الواجهة ---
 with gr.Blocks() as app:
+    gr.Markdown("## 🎬 محرر الفيديو: حل مشكلة النقاط السفلية")
     with gr.Row():
         v_in = gr.Video(); v_out = gr.Video()
     with gr.Row():
         font_opt = gr.Dropdown(choices=["arialbd.ttf"], value="arialbd.ttf", label="الخط")
+        color_opt = gr.ColorPicker(value="#FF8C00", label="لون ذهبي برتقالي")
+        size_opt = gr.Slider(50, 250, value=130, label="حجم الكلمة")
+    btn_1 = gr.Button("1. تحليل الكلمات"); table = gr.Dataframe(interactive=True)
+    btn_2 = gr.Button("2. إنتاج الفيديو"); status = gr.Textbox()
     btn_1.click(step_1_extract_words, [v_in], [table, status])
     btn_2.click(step_2_render_video, [v_in, table, font_opt, color_opt, size_opt], [v_out, status])