Phospheneser committed on
Commit
17b249b
·
verified ·
1 Parent(s): d7c95ea

Update utils.py

Browse files
Files changed (1) hide show
  1. utils.py +7 -1
utils.py CHANGED
@@ -1912,7 +1912,13 @@ def extract_speech_token(model, feature_extractor, utts, batch_size=128):
1912
  # make sure kernel also on device
1913
  if hasattr(_resample_buffer[sample_rate], "kernel"):
1914
  _resample_buffer[sample_rate].kernel = _resample_buffer[sample_rate].kernel.to(device)
1915
- audio = _resample_buffer[sample_rate](audio)
 
 
 
 
 
 
1916
  # if audio.shape[0] > 1:
1917
  # audio = audio[:1]
1918
  audio = audio[0]
 
1912
  # make sure kernel also on device
1913
  if hasattr(_resample_buffer[sample_rate], "kernel"):
1914
  _resample_buffer[sample_rate].kernel = _resample_buffer[sample_rate].kernel.to(device)
1915
+ if torchaudio.__version__ == "2.8.0":
1916
+ audio_device = audio.device
1917
+ audio = audio.cpu()
1918
+ audio = _resample_buffer[sample_rate](audio)
1919
+ audio = audio.to(audio_device)
1920
+ else:
1921
+ audio = _resample_buffer[sample_rate](audio)
1922
  # if audio.shape[0] > 1:
1923
  # audio = audio[:1]
1924
  audio = audio[0]