Update modules/whisper/whisper_base.py
Browse files
modules/whisper/whisper_base.py
CHANGED
|
@@ -224,7 +224,10 @@ class WhisperBase(ABC):
|
|
| 224 |
files = [files]
|
| 225 |
if files and isinstance(files[0], gr.utils.NamedString):
|
| 226 |
files = [file.name for file in files]
|
| 227 |
-
|
|
|
|
|
|
|
|
|
|
| 228 |
## Load model to detect language
|
| 229 |
model = whisper.load_model("base")
|
| 230 |
|
|
@@ -235,8 +238,6 @@ class WhisperBase(ABC):
|
|
| 235 |
for file in files:
|
| 236 |
|
| 237 |
## Detect language
|
| 238 |
-
#params = WhisperParameters.as_value(*whisper_params)
|
| 239 |
-
#model = whisper.load_model(params.model_size)
|
| 240 |
mel = whisper.log_mel_spectrogram(whisper.pad_or_trim(whisper.load_audio(file))).to(model.device)
|
| 241 |
_, probs = model.detect_language(mel)
|
| 242 |
file_language = ""
|
|
@@ -274,7 +275,8 @@ class WhisperBase(ABC):
|
|
| 274 |
input_list_dict=transcribed_segments,
|
| 275 |
model_size=translate_model,
|
| 276 |
src_lang=file_language,
|
| 277 |
-
tgt_lang=target_lang
|
|
|
|
| 278 |
)
|
| 279 |
|
| 280 |
## Get preview as txt
|
|
|
|
| 224 |
files = [files]
|
| 225 |
if files and isinstance(files[0], gr.utils.NamedString):
|
| 226 |
files = [file.name for file in files]
|
| 227 |
+
|
| 228 |
+
## Load parameters related with whisper
|
| 229 |
+
params = WhisperParameters.as_value(*whisper_params)
|
| 230 |
+
|
| 231 |
## Load model to detect language
|
| 232 |
model = whisper.load_model("base")
|
| 233 |
|
|
|
|
| 238 |
for file in files:
|
| 239 |
|
| 240 |
## Detect language
|
|
|
|
|
|
|
| 241 |
mel = whisper.log_mel_spectrogram(whisper.pad_or_trim(whisper.load_audio(file))).to(model.device)
|
| 242 |
_, probs = model.detect_language(mel)
|
| 243 |
file_language = ""
|
|
|
|
| 275 |
input_list_dict=transcribed_segments,
|
| 276 |
model_size=translate_model,
|
| 277 |
src_lang=file_language,
|
| 278 |
+
tgt_lang=target_lang,
|
| 279 |
+
speaker_diarization=params.is_diarize
|
| 280 |
)
|
| 281 |
|
| 282 |
## Get preview as txt
|