Spaces:

Shatha2030
/

Faheem

Sleeping

App Files Files Community

Shatha2030 committed on Feb 26, 2025

Commit

d5d66d6

verified ·

1 Parent(s): e281787

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -8

app.py CHANGED Viewed

@@ -67,24 +67,26 @@ def convert_audio_to_text(uploaded_file):
         # معالجة ملفات الفيديو
         if input_path.split('.')[-1].lower() in ['mp4', 'avi', 'mov', 'mkv']:
-            VideoFileClip(input_path).audio.write_audiofile(output_path, codec='pcm_s16le')
         else:
             output_path = input_path
         audio, rate = librosa.load(output_path, sr=16000)
         transcripts = []
-        # معالجة الصوت على شكل مقاطع
         for start in np.arange(0, len(audio)/rate, 30):
             end = min(start + 30, len(audio)/rate)
             segment = audio[int(start*rate):int(end*rate)]
             sf.write(f"/tmp/segment_{int(start)}.wav", segment, rate)
             transcripts.append(pipe(f"/tmp/segment_{int(start)}.wav")["text"])
         return " ".join(transcripts)
     except Exception as e:
         return f"⛔ خطأ: {str(e)}"
 def process_example_audio():
     try:
         if not os.path.exists(EXAMPLE_AUDIO_PATH):
@@ -106,10 +108,25 @@ def summarize_text(text):
 def answer_question(text, question):
     if not question.strip() or not text.strip():
-        return "⛔ الرجاء إدخال النص والسؤال بشكل صحيح"
-    result = qa_pipeline({'question': question, 'context': context})
-    return result['answer']
 def text_to_speech(text):
     if not text.strip():

         # معالجة ملفات الفيديو
         if input_path.split('.')[-1].lower() in ['mp4', 'avi', 'mov', 'mkv']:
+            video = VideoFileClip(input_path)
+            if video.audio:
+                video.audio.write_audiofile(output_path, codec='pcm_s16le')
+            else:
+                return "⛔ لا يوجد صوت في الفيديو!"
         else:
             output_path = input_path
         audio, rate = librosa.load(output_path, sr=16000)
         transcripts = []
+        # تقسيم الصوت إلى مقاطع للتعامل مع الملفات الكبيرة
         for start in np.arange(0, len(audio)/rate, 30):
             end = min(start + 30, len(audio)/rate)
             segment = audio[int(start*rate):int(end*rate)]
             sf.write(f"/tmp/segment_{int(start)}.wav", segment, rate)
             transcripts.append(pipe(f"/tmp/segment_{int(start)}.wav")["text"])
         return " ".join(transcripts)
     except Exception as e:
         return f"⛔ خطأ: {str(e)}"
 def process_example_audio():
     try:
         if not os.path.exists(EXAMPLE_AUDIO_PATH):
 def answer_question(text, question):
     """Answer *question* from *text* by querying the QA model chunk by chunk.

     The text is split on whitespace into consecutive chunks of at most
     256 words. ``qa_pipeline`` is called once per chunk, and the answer
     from the chunk with the strictly highest ``score`` is returned.

     Args:
         text: The context to search for an answer.
         question: The question to ask about the context.

     Returns:
         The highest-scoring answer string, or a user-facing error message
         when either the question or the text is blank.
     """
     # Guard clause: both inputs must contain non-whitespace characters.
     if not (question.strip() and text.strip()):
         return "⛔️ الرجاء إدخال النص والسؤال بشكل صحيح"

     tokens = text.split()
     window = 256  # maximum number of words handed to the model per call

     top_answer, top_score = None, -1
     for offset in range(0, len(tokens), window):
         context = " ".join(tokens[offset:offset + window])
         outcome = qa_pipeline({'question': question, 'context': context})
         score = outcome['score']
         # Strict comparison: on ties the earliest chunk's answer wins.
         if score > top_score:
             top_score, top_answer = score, outcome['answer']
     return top_answer
 def text_to_speech(text):
     if not text.strip():