Skip to content

Commit

Permalink
Merge pull request #4799 from YoshikiMas/update_enh_recipes
Browse files Browse the repository at this point in the history
Fix an audio format issue in some enh recipes
  • Loading branch information
sw005320 committed Dec 3, 2022
2 parents cb06bb1 + a52159b commit 1a50788
Show file tree
Hide file tree
Showing 7 changed files with 60 additions and 9 deletions.
16 changes: 13 additions & 3 deletions egs2/sms_wsj/enh1/conf/tuning/train_enh_beamformer_no_wpe.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -25,9 +25,6 @@ scheduler_conf:
mode: min
factor: 0.5
patience: 1
model_conf:
loss_type: mask_mse
mask_type: PSM^2
encoder: stft
encoder_conf:
n_fft: 512
Expand Down Expand Up @@ -60,3 +57,16 @@ separator_conf:
use_noise_mask: True
beamformer_type: mvdr_souden
bdropout_rate: 0.0


criterions:
# The first criterion
- name: mse
conf:
compute_on_mask: True
mask_type: PSM^2
# the wrapper for the current criterion
# unlike the single-talker case (which simply uses the fixed_order wrapper), the pit wrapper is used here
wrapper: pit
wrapper_conf:
weight: 1.0
1 change: 1 addition & 0 deletions egs2/sms_wsj/enh1/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -26,4 +26,5 @@ test_sets="test_eval92"
--use_dereverb_ref false \
--use_noise_ref true \
--inference_model "valid.loss.best.pth" \
--audio_format wav \
"$@"
1 change: 1 addition & 0 deletions egs2/wham/enh1/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -25,4 +25,5 @@ test_sets="tt_mix_both_min_8k"
--use_dereverb_ref false \
--use_noise_ref true \
--inference_model "valid.loss.best.pth" \
--audio_format wav \
"$@"
18 changes: 18 additions & 0 deletions egs2/whamr/enh1/README.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,18 @@
# MVDR beamformer (mask_mse loss)
## Environments
- date: `Thu Dec 1 19:01:36 UTC 2022`
- python version: `3.7.4 (default, Aug 13 2019, 20:35:49) [GCC 7.3.0]`
- espnet version: `espnet 202209`
- pytorch version: `pytorch 1.10.1+cu111`
- Git hash: `4ba0ccb6c5ee0dd6751fdd88d4d6a8f0cd61d87c`
- Commit date: ``


## enh_train_enh_beamformer_mvdr_raw

config: ./conf/tuning/train_enh_beamformer_mvdr.yaml

|dataset|STOI|SAR|SDR|SIR|SI_SNR|
|---|---|---|---|---|---|
|enhanced_cv_mix_single_reverb_min_8k|77.35|4.11|4.11|0.00|3.81|
|enhanced_tt_mix_single_reverb_min_8k|79.26|3.44|3.44|0.00|3.17|
16 changes: 13 additions & 3 deletions egs2/whamr/enh1/conf/tuning/train_enh_beamformer_mvdr.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -25,9 +25,6 @@ scheduler_conf:
mode: min
factor: 0.5
patience: 1
model_conf:
loss_type: mask_mse
mask_type: PSM^2
encoder: stft
encoder_conf:
n_fft: 512
Expand Down Expand Up @@ -60,3 +57,16 @@ separator_conf:
use_noise_mask: True
beamformer_type: mvdr_souden
bdropout_rate: 0.0


criterions:
# The first criterion
- name: mse
conf:
compute_on_mask: True
mask_type: PSM^2
# the wrapper for the current criterion
# for the single-talker case, we simply use the fixed_order wrapper
wrapper: fixed_order
wrapper_conf:
weight: 1.0
16 changes: 13 additions & 3 deletions egs2/whamr/enh1/conf/tuning/train_enh_beamformer_wmpdr.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -25,9 +25,6 @@ scheduler_conf:
mode: min
factor: 0.5
patience: 1
model_conf:
loss_type: mask_mse
mask_type: PSM^2
encoder: stft
encoder_conf:
n_fft: 512
Expand Down Expand Up @@ -62,3 +59,16 @@ separator_conf:
rtf_iterations: 3
bdropout_rate: 0.0
shared_power: True


criterions:
# The first criterion
- name: mse
conf:
compute_on_mask: True
mask_type: PSM^2
# the wrapper for the current criterion
# for the single-talker case, we simply use the fixed_order wrapper
wrapper: fixed_order
wrapper_conf:
weight: 1.0
1 change: 1 addition & 0 deletions egs2/whamr/enh1/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -26,4 +26,5 @@ test_sets="tt_mix_single_reverb_min_8k"
--use_dereverb_ref false \
--use_noise_ref true \
--inference_model "valid.loss.best.pth" \
--audio_format wav \
"$@"

0 comments on commit 1a50788

Please sign in to comment.