speechbrain · goexle · Feb 16, 2022 · May 24, 2022 · May 24, 2022 · May 24, 2022
diff --git a/speechbrain/pretrained/interfaces.py b/speechbrain/pretrained/interfaces.py
@@ -219,18 +219,15 @@ def _prepare_modules(self, freeze_params):
             for p in self.mods.parameters():
                 p.requires_grad = False
 
-    def load_audio(self, path, savedir="."):
-        """Load an audio file with this model"s input spec
+    def load_audio(self, path):
+        """Load an audio file with this model's input spec
 
         When using a speech model, it is important to use the same type of data,
         as was used to train the model. This means for example using the same
         sampling rate and number of channels. It is, however, possible to
         convert a file from a higher sampling rate to a lower one (downsampling).
         Similarly, it is simple to downmix a stereo file to mono.
-        The path can be a local path, a web url, or a link to a huggingface repo.
         """
-        source, fl = split_path(path)
-        path = fetch(fl, source=source, savedir=savedir)
         signal, sr = torchaudio.load(str(path), channels_first=False)
         return self.audio_normalizer(signal, sr)
 

diff --git a/tests/unittests/test_interfaces.py b/tests/unittests/test_interfaces.py
@@ -0,0 +1,17 @@
+import torch
+
+
+def test_load_audio(tmpdir):  # tmpdir: presumably the pytest fixture
+    from speechbrain.pretrained.interfaces import Pretrained
+
+    verification = Pretrained.from_hparams(  # object under test
+        source="speechbrain/spkrec-ecapa-voxceleb",
+        savedir=tmpdir.mkdir("savedir"),  # fresh subdirectory of tmpdir
+    )
+    audio1 = verification.load_audio(  # relative path, depends on cwd
+        "samples/voxceleb_samples/wav/id10002/xTV-jFAUKcw/00001.wav"
+    )
+    audio2 = verification.load_audio(  # a second, different sample file
+        "samples/voxceleb_samples/wav/id10001/1zcIwhmdeo4/00001.wav"
+    )
+    assert not torch.equal(audio1, audio2)  # the two loads must differ