inoryQwQ committed on
Commit
02707b5
·
1 Parent(s): 4fd2d31

fix gradio bug

Browse files
Files changed (3) hide show
  1. .gitignore +2 -1
  2. gradio_demo.py +4 -10
  3. server.py +1 -1
.gitignore CHANGED
@@ -1 +1,2 @@
1
- __pycache__
 
 
1
+ __pycache__
2
+ .gradio
gradio_demo.py CHANGED
@@ -6,7 +6,7 @@ from print_utils import rich_transcription_postprocess
6
  from download_utils import download_model
7
 
8
  use_itn = True # 标点符号预测
9
- max_len = 68
10
 
11
  model_path = os.path.join("sensevoice_ax650", "sensevoice.axmodel")
12
  bpemodel = "chn_jpn_yue_eng_ko_spectok.bpe.model"
@@ -19,7 +19,7 @@ pipeline = SenseVoiceAx(model_path,
19
  language="auto",
20
  use_itn=use_itn,
21
  tokenizer=tokenizer)
22
- # 你实现的语言转文本函数
23
  def speech_to_text(audio_path, lang):
24
  """
25
  audio_path: 音频文件路径
@@ -31,8 +31,7 @@ def speech_to_text(audio_path, lang):
31
  pipeline.choose_language(language=lang)
32
  asr_res = pipeline.infer(audio_path, print_rtf=True)
33
  res = " ".join([rich_transcription_postprocess(i) for i in asr_res])
34
- # TODO: 这里写你的语音识别逻辑
35
- # 返回一个示例文本
36
  return res
37
 
38
 
@@ -47,7 +46,7 @@ def main():
47
 
48
  with gr.Row():
49
  audio_input = gr.Audio(
50
- sources=["microphone"],
51
  type="filepath",
52
  label="录制或上传音频",
53
  format="mp3"
@@ -58,9 +57,6 @@ def main():
58
  label="选择音频语言"
59
  )
60
 
61
-
62
-
63
-
64
  audio_input.change(
65
  fn=speech_to_text,
66
  inputs=[audio_input, lang_dropdown],
@@ -69,8 +65,6 @@ def main():
69
 
70
  demo.launch(
71
  server_name="0.0.0.0",
72
- server_port=7860,
73
- ssl_certfile="./cert.pem", ssl_keyfile="./key.pem", ssl_verify=False
74
  )
75
 
76
  if __name__ == "__main__":
 
6
  from download_utils import download_model
7
 
8
  use_itn = True # 标点符号预测
9
+ max_len = 256
10
 
11
  model_path = os.path.join("sensevoice_ax650", "sensevoice.axmodel")
12
  bpemodel = "chn_jpn_yue_eng_ko_spectok.bpe.model"
 
19
  language="auto",
20
  use_itn=use_itn,
21
  tokenizer=tokenizer)
22
+
23
  def speech_to_text(audio_path, lang):
24
  """
25
  audio_path: 音频文件路径
 
31
  pipeline.choose_language(language=lang)
32
  asr_res = pipeline.infer(audio_path, print_rtf=True)
33
  res = " ".join([rich_transcription_postprocess(i) for i in asr_res])
34
+
 
35
  return res
36
 
37
 
 
46
 
47
  with gr.Row():
48
  audio_input = gr.Audio(
49
+ sources=["upload"],
50
  type="filepath",
51
  label="录制或上传音频",
52
  format="mp3"
 
57
  label="选择音频语言"
58
  )
59
 
 
 
 
60
  audio_input.change(
61
  fn=speech_to_text,
62
  inputs=[audio_input, lang_dropdown],
 
65
 
66
  demo.launch(
67
  server_name="0.0.0.0",
 
 
68
  )
69
 
70
  if __name__ == "__main__":
server.py CHANGED
@@ -32,7 +32,7 @@ async def load_model():
32
  # 模型加载
33
  language = "auto"
34
  use_itn = True # 标点符号预测
35
- max_len = 68
36
 
37
  model_path = os.path.join("sensevoice_ax650", "sensevoice.axmodel")
38
  bpemodel = "chn_jpn_yue_eng_ko_spectok.bpe.model"
 
32
  # 模型加载
33
  language = "auto"
34
  use_itn = True # 标点符号预测
35
+ max_len = 256
36
 
37
  model_path = os.path.join("sensevoice_ax650", "sensevoice.axmodel")
38
  bpemodel = "chn_jpn_yue_eng_ko_spectok.bpe.model"