Spaces:

Woziii
/

scribe

Running

App Files Community

Woziii committed on Aug 21, 2024

Commit

f4cc38c

verified ·

1 Parent(s): 3209254

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -0

app.py CHANGED Viewed

@@ -178,6 +178,10 @@ def transcribe_and_diarize(file_path, task, progress=gr.Progress()):
     return "Transcription terminée!", transcription_result['text'], speaker_transcription
 def format_to_markdown(transcription_text, speaker_transcription, audio_duration=None, location=None, speaker_age=None, context=None, num_speakers=None, speaker_names=None):
     metadata = {
         "Date de traitement": datetime.now().strftime('%d/%m/%Y %H:%M'),
         "Durée de l'audio": f"{audio_duration}" if audio_duration else "[à remplir]",
@@ -199,15 +203,20 @@ def format_to_markdown(transcription_text, speaker_transcription, audio_duration
             elif isinstance(row, (list, tuple)) and len(row) == 2:
                 custom_names[row[0]] = row[1]
     metadata_text = "\n".join([f"- **{key}** : '{value}'" for key, value in metadata.items()])
     try:
         if isinstance(speaker_transcription, str):
             speaker_transcription = parse_simplified_diarization(speaker_transcription)
         formatted_transcription = []
         for speaker, text in speaker_transcription:
             custom_name = custom_names.get(speaker, speaker)
             formatted_transcription.append(f"**{custom_name}**: {text}")
         transcription_text = "\n\n".join(formatted_transcription)
     except Exception as e:
@@ -223,6 +232,7 @@ def format_to_markdown(transcription_text, speaker_transcription, audio_duration
 ## Transcription
 {transcription_text}
 """
     return formatted_output
 def _return_yt_html_embed(yt_url):

     return "Transcription terminée!", transcription_result['text'], speaker_transcription
 def format_to_markdown(transcription_text, speaker_transcription, audio_duration=None, location=None, speaker_age=None, context=None, num_speakers=None, speaker_names=None):
+    print("Début de format_to_markdown")
+    print("speaker_names reçu :", speaker_names)
+    print("num_speakers reçu :", num_speakers)
     metadata = {
         "Date de traitement": datetime.now().strftime('%d/%m/%Y %H:%M'),
         "Durée de l'audio": f"{audio_duration}" if audio_duration else "[à remplir]",
             elif isinstance(row, (list, tuple)) and len(row) == 2:
                 custom_names[row[0]] = row[1]
+    print("custom_names créé :", custom_names)
     metadata_text = "\n".join([f"- **{key}** : '{value}'" for key, value in metadata.items()])
     try:
         if isinstance(speaker_transcription, str):
             speaker_transcription = parse_simplified_diarization(speaker_transcription)
+        print("speaker_transcription après parsing :", speaker_transcription)
         formatted_transcription = []
         for speaker, text in speaker_transcription:
             custom_name = custom_names.get(speaker, speaker)
+            print(f"Utilisation du nom : {custom_name} pour le speaker : {speaker}")
             formatted_transcription.append(f"**{custom_name}**: {text}")
         transcription_text = "\n\n".join(formatted_transcription)
     except Exception as e:
 ## Transcription
 {transcription_text}
 """
+    print("Fin de format_to_markdown")
     return formatted_output
 def _return_yt_html_embed(yt_url):