Phospheneser committed on
Commit
8f84585
·
verified ·
1 Parent(s): d3c20ea

Update utils.py

Browse files
Files changed (1) hide show
  1. utils.py +3 -1
utils.py CHANGED
@@ -1912,8 +1912,10 @@ def extract_speech_token(model, feature_extractor, utts, batch_size=128):
1912
  # make sure kernel also on device
1913
  if hasattr(_resample_buffer[sample_rate], "kernel"):
1914
  _resample_buffer[sample_rate].kernel = _resample_buffer[sample_rate].kernel.to(device)
1915
-
 
1916
  audio = _resample_buffer[sample_rate](audio)
 
1917
  # if audio.shape[0] > 1:
1918
  # audio = audio[:1]
1919
  audio = audio[0]
 
1912
  # make sure kernel also on device
1913
  if hasattr(_resample_buffer[sample_rate], "kernel"):
1914
  _resample_buffer[sample_rate].kernel = _resample_buffer[sample_rate].kernel.to(device)
1915
+
1916
+ audio = audio.cpu()
1917
  audio = _resample_buffer[sample_rate](audio)
1918
+ audio = audio.to(device)
1919
  # if audio.shape[0] > 1:
1920
  # audio = audio[:1]
1921
  audio = audio[0]