Luis J Camargo committed on
Commit
40f26b2
·
1 Parent(s): 7c2c8fa

feat: add audio normalization for int16 and int32 audio input arrays

Browse files
Files changed (1) hide show
  1. app.py +10 -0
app.py CHANGED
@@ -99,6 +99,16 @@ def predict_language(audio):
99
  sample_rate, audio_array = audio
100
  audio_len_sec = len(audio_array) / sample_rate
101
 
 
 
 
 
 
 
 
 
 
 
102
  # Resampling
103
  if sample_rate != 16000:
104
  print(f"[LOG] Step 2: Resampling {sample_rate}Hz -> 16000Hz...")
 
99
  sample_rate, audio_array = audio
100
  audio_len_sec = len(audio_array) / sample_rate
101
 
102
+ # Normalization
103
+ print("[LOG] Step 1: Normalizing audio...")
104
+ if audio_array.dtype == np.int16:
105
+ print("was npint16")
106
+ audio_array = audio_array.astype(np.float32) / 32768.0
107
+ elif audio_array.dtype == np.int32:
108
+ print("was npint32")
109
+ audio_array = audio_array.astype(np.float32) / 2147483648.0
110
+ print(f"[LOG] Memory after normalization: {get_mem_usage():.2f} MB")
111
+
112
  # Resampling
113
  if sample_rate != 16000:
114
  print(f"[LOG] Step 2: Resampling {sample_rate}Hz -> 16000Hz...")