MMS_1_10

Sleeping

bomolopuu committed on Oct 12, 2024

Commit

5d13184

1 Parent(s): d3bad75

remove loop

Files changed (3) hide show

asr.py CHANGED Viewed

@@ -46,21 +46,22 @@ def safe_process_file(file_obj):
 def transcribe_multiple_files(audio_files, lang, transcription):
     transcriptions = []
-    for audio_file in audio_files:
-        try:
-            audio_samples, sr, safe_name = safe_process_file(audio_file)
-            logger.debug(f"Transcribing file: {safe_name}")
-            logger.debug(f"Language selected: {lang}")
-            logger.debug(f"User-provided transcription: {transcription}")
-            result = transcribe_file(model, audio_samples, lang, transcription)
-            logger.debug(f"Transcription result: {result}")
-            transcriptions.append(f"File: {safe_name}\nTranscription: {result}\n")
-        except Exception as e:
-            logger.error(f"Error in transcription process: {str(e)}")
-            transcriptions.append(f"Error processing file: {str(e)}\n")
-    return "\n".join(transcriptions)
 @spaces.GPU
 def transcribe_file(model, audio_samples, lang, user_transcription):

 def transcribe_multiple_files(audio_files, lang, transcription):
     transcriptions = []
+    # for audio_file in audio_files:
+    try:
+        audio_samples, sr, safe_name = safe_process_file(audio_files)
+        logger.debug(f"Transcribing file: {safe_name}")
+        logger.debug(f"Language selected: {lang}")
+        logger.debug(f"User-provided transcription: {transcription}")
+        result = transcribe_file(model, audio_samples, lang, transcription)
+        logger.debug(f"Transcription result: {result}")
+        transcriptions.append(f"File: {safe_name}\nTranscription: {result}\n")
+    except Exception as e:
+        logger.error(f"Error in transcription process: {str(e)}")
+        transcriptions.append(f"Error processing file: {str(e)}\n")
+    # return "\n".join(transcriptions)
 @spaces.GPU
 def transcribe_file(model, audio_samples, lang, user_transcription):

audio_plus_hash_uniq_07102024.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

csv_processor.py CHANGED Viewed

@@ -14,7 +14,7 @@ def hash_md5(filepath):
 import csv
-def update_csv(file_path, search_hash, new_path, new_transcription):
     # Use read/write mode to modify the relevant line or append if not found
     with open(file_path, mode='r+', newline='', encoding='utf-8') as file:
         reader = csv.DictReader(file)
@@ -24,8 +24,8 @@ def update_csv(file_path, search_hash, new_path, new_transcription):
         # Locate the row with the matching hash
         for i, row in enumerate(rows):
-            if row['hash'] == search_hash:
-                rows[i]['filepath'] = new_path
                 rows[i]['transcription'] = new_transcription
                 found = True
                 break
@@ -42,6 +42,7 @@ def update_csv(file_path, search_hash, new_path, new_transcription):
         writer = csv.DictWriter(append_file, fieldnames=fieldnames)
         writer.writerow({
             'hash': search_hash,
             'filepath': new_path,
             'transcription': new_transcription
         })

 import csv
+def update_csv(file_path, search_hash, hash_16000, new_path, new_transcription):
     # Use read/write mode to modify the relevant line or append if not found
     with open(file_path, mode='r+', newline='', encoding='utf-8') as file:
         reader = csv.DictReader(file)
         # Locate the row with the matching hash
         for i, row in enumerate(rows):
+            if row['hash'] == search_hash or row['hash_16000'] == search_hash:
+                rows[i]['hash_16000'] = hash_16000
                 rows[i]['transcription'] = new_transcription
                 found = True
                 break
         writer = csv.DictWriter(append_file, fieldnames=fieldnames)
         writer.writerow({
             'hash': search_hash,
+            'hash_16000': hash_16000,
             'filepath': new_path,
             'transcription': new_transcription
         })