Skip to content

Commit

Permalink
Merge pull request #1419 from mravanelli/sample_refactor
Browse files (browse the repository at this point in the history)
Clean up of samples and integration tests
  • Loading branch information
mravanelli authored May 31, 2022
2 parents be3628a + f87e40e commit 421fb46
Show file tree
Hide file tree
Showing 172 changed files with 230 additions and 708 deletions.
6 changes: 0 additions & 6 deletions samples/audio_samples/csv_example3.csv

This file was deleted.

4 changes: 0 additions & 4 deletions samples/audio_samples/csv_example_multichannel.csv

This file was deleted.

Binary file removed samples/audio_samples/example_fr.wav
Binary file not shown.
Binary file removed samples/audio_samples/example_multichannel.wav
Binary file not shown.
Binary file removed samples/audio_samples/example_noisy.wav
Binary file not shown.
9 changes: 0 additions & 9 deletions samples/audio_samples/nn_training_samples/debug.csv

This file was deleted.

3 changes: 0 additions & 3 deletions samples/audio_samples/nn_training_samples/dev.csv

This file was deleted.

Binary file removed samples/audio_samples/nn_training_samples/spk1_snt1.pkl
Binary file not shown.
Binary file removed samples/audio_samples/nn_training_samples/spk1_snt2.pkl
Binary file not shown.
Binary file removed samples/audio_samples/nn_training_samples/spk1_snt3.pkl
Binary file not shown.
Binary file removed samples/audio_samples/nn_training_samples/spk1_snt4.pkl
Binary file not shown.
Binary file removed samples/audio_samples/nn_training_samples/spk1_snt5.pkl
Binary file not shown.
Binary file removed samples/audio_samples/nn_training_samples/spk1_snt6.pkl
Binary file not shown.
Binary file removed samples/audio_samples/nn_training_samples/spk2_snt1.pkl
Binary file not shown.
Binary file removed samples/audio_samples/nn_training_samples/spk2_snt2.pkl
Binary file not shown.
Binary file removed samples/audio_samples/nn_training_samples/spk2_snt3.pkl
Binary file not shown.
Binary file removed samples/audio_samples/nn_training_samples/spk2_snt4.pkl
Binary file not shown.
Binary file removed samples/audio_samples/nn_training_samples/spk2_snt5.pkl
Binary file not shown.
Binary file removed samples/audio_samples/nn_training_samples/spk2_snt6.pkl
Binary file not shown.
3 changes: 0 additions & 3 deletions samples/audio_samples/nn_training_samples/test.csv

This file was deleted.

9 changes: 0 additions & 9 deletions samples/audio_samples/nn_training_samples/train.csv

This file was deleted.

This file was deleted.

This file was deleted.

This file was deleted.

This file was deleted.

9 changes: 0 additions & 9 deletions samples/audio_samples/test_csv_merge.csv

This file was deleted.

Binary file removed samples/audio_samples/test_mixture.wav
Binary file not shown.
3 changes: 0 additions & 3 deletions samples/label_samples/hyp.csv

This file was deleted.

3 changes: 0 additions & 3 deletions samples/label_samples/ref.csv

This file was deleted.

7 changes: 0 additions & 7 deletions samples/noise_samples/noise.csv

This file was deleted.

4 changes: 0 additions & 4 deletions samples/noise_samples/noise_multichannel.csv

This file was deleted.

Binary file removed samples/noise_samples/noise_multichannel.wav
Binary file not shown.
3 changes: 0 additions & 3 deletions samples/rir_samples/rir_multichannel.csv

This file was deleted.

Binary file removed samples/rir_samples/rir_multichannel.wav
Binary file not shown.
6 changes: 0 additions & 6 deletions samples/rir_samples/rirs.csv

This file was deleted.

Binary file removed samples/text_samples/hdf5_example.h5
Binary file not shown.
Binary file removed samples/text_samples/label_dict.pkl
Binary file not shown.
9 changes: 0 additions & 9 deletions samples/text_samples/readme.txt

This file was deleted.

6 changes: 0 additions & 6 deletions samples/voxceleb_samples/meta/iden_split.txt

This file was deleted.

4 changes: 0 additions & 4 deletions samples/voxceleb_samples/readme.txt

This file was deleted.

4 changes: 0 additions & 4 deletions samples/voxceleb_samples/wav/dev.csv

This file was deleted.

Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
7 changes: 0 additions & 7 deletions samples/voxceleb_samples/wav/train.csv

This file was deleted.

2 changes: 1 addition & 1 deletion speechbrain/alignment/ctc_segmentation.py
Original file line number Diff line number Diff line change
Expand Up @@ -185,7 +185,7 @@ class CTCSegmentation:
>>> asr_model = EncoderDecoderASR.from_hparams(source=pre_trained)
>>> aligner = CTCSegmentation(asr_model, kaldi_style_text=False)
>>> # load data
>>> audio_path = "./samples/audio_samples/example1.wav"
>>> audio_path = "tests/samples/single-mic/example1.wav"
>>> text = ["THE BIRCH CANOE", "SLID ON THE", "SMOOTH PLANKS"]
>>> segments = aligner(audio_path, text, name="example1")
Expand Down
8 changes: 4 additions & 4 deletions speechbrain/dataio/dataio.py
Original file line number Diff line number Diff line change
Expand Up @@ -772,7 +772,7 @@ def get_md5(file):
Example
-------
>>> get_md5('samples/audio_samples/example1.wav')
>>> get_md5('tests/samples/single-mic/example1.wav')
'c482d0081ca35302d30d12f1136c34e5'
"""
# Lets read stuff in 64kb chunks!
Expand Down Expand Up @@ -803,7 +803,7 @@ def save_md5(files, out_file):
None
Example:
>>> files = ['samples/audio_samples/example1.wav']
>>> files = ['tests/samples/single-mic/example1.wav']
>>> tmpdir = getfixture('tmpdir')
>>> save_md5(files, os.path.join(tmpdir, "md5.pkl"))
"""
Expand Down Expand Up @@ -983,8 +983,8 @@ def merge_csvs(data_folder, csv_lst, merged_csv):
Example
-------
>>> merge_csvs("samples/audio_samples/",
... ["csv_example.csv", "csv_example2.csv"],
>>> merge_csvs("tests/samples/annotation/",
... ["speech.csv", "speech.csv"],
... "test_csv_merge.csv")
"""
write_path = os.path.join(data_folder, merged_csv)
Expand Down
6 changes: 3 additions & 3 deletions speechbrain/dataio/preprocess.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,14 +20,14 @@ class AudioNormalizer:
Example
-------
>>> import torchaudio
>>> example_file = 'samples/audio_samples/example_multichannel.wav'
>>> example_file = 'tests/samples/multi-mic/speech_-0.82918_0.55279_-0.082918.flac'
>>> signal, sr = torchaudio.load(example_file, channels_first = False)
>>> normalizer = AudioNormalizer(sample_rate=8000)
>>> normalized = normalizer(signal, sr)
>>> signal.shape
torch.Size([33882, 2])
torch.Size([160000, 4])
>>> normalized.shape
torch.Size([16941])
torch.Size([80000])
NOTE
----
Expand Down
14 changes: 7 additions & 7 deletions speechbrain/pretrained/interfaces.py
Original file line number Diff line number Diff line change
Expand Up @@ -379,7 +379,7 @@ class EndToEndSLU(Pretrained):
... source="speechbrain/slu-timers-and-such-direct-librispeech-asr",
... savedir=tmpdir,
... )
>>> slu_model.decode_file("samples/audio_samples/example6.wav")
>>> slu_model.decode_file("tests/samples/single-mic/example6.wav")
"{'intent': 'SimpleMath', 'slots': {'number1': 37.67, 'number2': 75.7, 'op': ' minus '}}"
"""

Expand Down Expand Up @@ -495,7 +495,7 @@ class EncoderDecoderASR(Pretrained):
... source="speechbrain/asr-crdnn-rnnlm-librispeech",
... savedir=tmpdir,
... )
>>> asr_model.transcribe_file("samples/audio_samples/example2.flac")
>>> asr_model.transcribe_file("tests/samples/single-mic/example2.flac")
"MY FATHER HAS REVEALED THE CULPRIT'S NAME"
"""

Expand Down Expand Up @@ -743,7 +743,7 @@ class EncoderClassifier(Pretrained):
... )
>>> # Compute embeddings
>>> signal, fs = torchaudio.load("samples/audio_samples/example1.wav")
>>> signal, fs = torchaudio.load("tests/samples/single-mic/example1.wav")
>>> embeddings = classifier.encode_batch(signal)
>>> # Classification
Expand Down Expand Up @@ -896,8 +896,8 @@ class SpeakerRecognition(EncoderClassifier):
... )
>>> # Perform verification
>>> signal, fs = torchaudio.load("samples/audio_samples/example1.wav")
>>> signal2, fs = torchaudio.load("samples/audio_samples/example2.flac")
>>> signal, fs = torchaudio.load("tests/samples/single-mic/example1.wav")
>>> signal2, fs = torchaudio.load("tests/samples/single-mic/example2.flac")
>>> score, prediction = verification.verify_batch(signal, signal2)
"""

Expand Down Expand Up @@ -994,7 +994,7 @@ class VAD(Pretrained):
... )
>>> # Perform VAD
>>> boundaries = VAD.get_speech_segments("samples/audio_samples/example1.wav")
>>> boundaries = VAD.get_speech_segments("tests/samples/single-mic/example1.wav")
"""

HPARAMS_NEEDED = ["sample_rate", "time_resolution", "device"]
Expand Down Expand Up @@ -2033,7 +2033,7 @@ class SpectralMaskEnhancement(Pretrained):
... source="speechbrain/mtl-mimic-voicebank",
... savedir=tmpdir,
... )
>>> noisy, fs = torchaudio.load("samples/audio_samples/example_noisy.wav")
>>> noisy, fs = torchaudio.load("tests/samples/single-mic/example1.wav")
>>> # Channel dimension is interpreted as batch dimension here
>>> enhanced = enhancer.enhance_batch(noisy)
"""
Expand Down
8 changes: 4 additions & 4 deletions speechbrain/processing/decomposition.py
Original file line number Diff line number Diff line change
Expand Up @@ -140,9 +140,9 @@ def svdl(a):
>>> from speechbrain.dataio.dataio import read_audio_multichannel
>>> xs_speech = read_audio_multichannel(
... 'samples/audio_samples/multi_mic/speech_-0.82918_0.55279_-0.082918.flac'
... 'tests/samples/multi-mic/speech_-0.82918_0.55279_-0.082918.flac'
... )
>>> xs_noise = read_audio_multichannel('samples/audio_samples/multi_mic/noise_diffuse.flac')
>>> xs_noise = read_audio_multichannel('tests/samples/multi-mic/noise_diffuse.flac')
>>> xs = xs_speech + 0.05 * xs_noise
>>> xs = xs.unsqueeze(0).float()
>>>
Expand Down Expand Up @@ -378,9 +378,9 @@ def inv(x):
>>> from speechbrain.processing.decomposition import inv
>>>
>>> xs_speech = read_audio(
... 'samples/audio_samples/multi_mic/speech_-0.82918_0.55279_-0.082918.flac'
... 'tests/samples/multi-mic/speech_-0.82918_0.55279_-0.082918.flac'
... )
>>> xs_noise = read_audio('samples/audio_samples/multi_mic/noise_0.70225_-0.70225_0.11704.flac')
>>> xs_noise = read_audio('tests/samples/multi-mic/noise_0.70225_-0.70225_0.11704.flac')
>>> xs = xs_speech + 0.05 * xs_noise
>>> xs = xs.unsqueeze(0).float()
>>>
Expand Down
Loading

0 comments on commit 421fb46

Please sign in to comment.