david committed on
Commit
0d81579
·
1 Parent(s): 3556e74

add string replace

Browse files
config.py CHANGED
@@ -1,6 +1,8 @@
1
  import pathlib
2
  import re
3
  import logging
 
 
4
 
5
  DEBUG = False
6
  LOG_LEVEL = logging.DEBUG if DEBUG else logging.INFO
@@ -73,4 +75,4 @@ LLM_SYS_PROMPT_EN = """
73
  """
74
 
75
  hotwords_file = MODEL_DIR / 'hotwords.txt'
76
- hotwords_json = MODEL_DIR / 'hotwords.json'
 
1
  import pathlib
2
  import re
3
  import logging
4
+ import json
5
+
6
 
7
  DEBUG = False
8
  LOG_LEVEL = logging.DEBUG if DEBUG else logging.INFO
 
75
  """
76
 
77
  hotwords_file = MODEL_DIR / 'hotwords.txt'
78
+ hotwords_json = json.loads((MODEL_DIR / 'hotwords.json').read_text())
transcribe/pipelines/pipe_vad.py CHANGED
@@ -28,10 +28,10 @@ class VadPipe(BasePipe):
28
  def init(cls):
29
  if cls.vac is None:
30
  cls.vac = FixedVADIterator(
31
- threshold=0.5,
32
  sampling_rate=cls.sample_rate,
33
  # speech_pad_ms=10
34
- min_silence_duration_ms = 100,
35
  # speech_pad_ms = 30,
36
  )
37
  cls.vac.reset_states()
 
28
  def init(cls):
29
  if cls.vac is None:
30
  cls.vac = FixedVADIterator(
31
+ threshold=0.6,
32
  sampling_rate=cls.sample_rate,
33
  # speech_pad_ms=10
34
+ min_silence_duration_ms = 80,
35
  # speech_pad_ms = 30,
36
  )
37
  cls.vac.reset_states()
transcribe/utils.py CHANGED
@@ -67,25 +67,13 @@ def replace_hotwords(text: str) -> str:
67
  Returns:
68
  The string with hotwords replaced.
69
  """
70
- # Using the provided absolute path for simplicity in this example
71
- hotwords_path = config.hotwords_file.as_posix()
72
-
73
- try:
74
- with open(hotwords_path, 'r', encoding='utf-8') as f:
75
- hotwords = json.load(f)
76
- except FileNotFoundError:
77
- print(f"Error: hotwords.json not found at {hotwords_path}")
78
- return text
79
- except json.JSONDecodeError:
80
- print(f"Error: Could not decode JSON from {hotwords_path}")
81
- return text
82
 
83
  processed_text = text
84
  # Iterate through the hotwords dictionary
85
- for key, value in hotwords.items():
86
  # Replace all occurrences of the key with the value in the text
87
  processed_text = processed_text.replace(key, value)
88
-
89
  return processed_text
90
 
91
 
 
67
  Returns:
68
  The string with hotwords replaced.
69
  """
 
 
 
 
 
 
 
 
 
 
 
 
70
 
71
  processed_text = text
72
  # Iterate through the hotwords dictionary
73
+ for key, value in config.hotwords_json.items():
74
  # Replace all occurrences of the key with the value in the text
75
  processed_text = processed_text.replace(key, value)
76
+ logging.debug(f"Replace string: {text} => {processed_text}")
77
  return processed_text
78
 
79