Dibiddo committed on
Commit
9ec90b2
·
verified ·
1 Parent(s): e3c4891

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -2
app.py CHANGED
@@ -3,7 +3,7 @@ from transformers import AutoModelForSpeechSeq2Seq, AutoProcessor, pipeline
3
  from datasets import load_dataset
4
  import spacy
5
  import gradio as gr
6
- import numpy as np # 確保導入 Numpy
7
 
8
  # 設置設備和環境變數(如有需要)
9
  device = "cuda:0" if torch.cuda.is_available() else "cpu"
@@ -36,9 +36,19 @@ except Exception as e:
36
 
37
  def process_audio(audio_file):
38
 
 
 
 
 
 
 
 
 
 
 
39
  # 語音轉文字
40
 
41
- result= whisper_pipe(audio_file)["text"]
42
 
43
  # 使用 T5 作為替代模型
44
 
 
3
  from datasets import load_dataset
4
  import spacy
5
  import gradio as gr
6
+ from pydub import AudioSegment # 引入 pydub 庫
7
 
8
  # 設置設備和環境變數(如有需要)
9
  device = "cuda:0" if torch.cuda.is_available() else "cpu"
 
36
 
37
  def process_audio(audio_file):
38
 
39
+ # 將 MP3 轉換為 WAV
40
+
41
+ try:
42
+ audio_segment = AudioSegment.from_mp3(audio_file)
43
+ wav_path = audio_file.replace(".mp3", ".wav")
44
+ audio_segment.export(wav_path, format="wav")
45
+
46
+ except Exception as e:
47
+ print(f"MP3 轉 WAV 時出現錯誤:{e}")
48
+
49
  # 語音轉文字
50
 
51
+ result= whisper_pipe(wav_path)["text"]
52
 
53
  # 使用 T5 作為替代模型
54