Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -20,7 +20,12 @@ pipe = pipeline(task="automatic-speech-recognition", model=model_repo_id, device
|
|
| 20 |
def infer(
|
| 21 |
audio
|
| 22 |
):
|
| 23 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 24 |
|
| 25 |
css = """
|
| 26 |
#col-container {
|
|
|
|
| 20 |
def infer(audio):
    """Transcribe an audio clip to text with the module-level ASR ``pipe``.

    Args:
        audio: A ``(sampling_rate, samples)`` pair where ``samples`` is a
            NumPy array. Arrays with more than one dimension are averaged
            over axis 1 (presumably the channel axis -- TODO confirm against
            the UI component that feeds this function). ``None`` is accepted
            and treated as "no audio supplied".

    Returns:
        The ``'text'`` field of the pipeline result, or ``""`` when there is
        no audio to transcribe (``audio`` is ``None`` or has zero samples).
    """
    # Nothing was recorded/uploaded: unpacking None would raise TypeError.
    if audio is None:
        return ""

    sampling_rate, wav = audio

    # A zero-length clip would make np.max raise ValueError below.
    if wav.size == 0:
        return ""

    # Down-mix multi-dimensional input to a single 1-D signal.
    if wav.ndim > 1:
        wav = wav.mean(axis=1)

    # astype returns a new array, so the in-place division below never
    # mutates the caller's buffer.
    wav = wav.astype(np.float32)

    # Peak-normalise, but only when there is a non-zero peak: dividing an
    # all-silent clip by 0 would fill it with NaN and feed garbage to the
    # model.
    peak = np.max(np.abs(wav))
    if peak > 0:
        wav /= peak

    result = pipe(
        {"sampling_rate": sampling_rate, "raw": wav},
        generate_kwargs={'language': 'chinese'},
    )
    return result['text']
|
| 29 |
|
| 30 |
css = """
|
| 31 |
#col-container {
|