From e9229a10064821815dac4925edeee797d0e94b18 Mon Sep 17 00:00:00 2001 From: Di Wu <1176705630@qq.com> Date: Tue, 8 Dec 2020 11:31:09 +0800 Subject: [PATCH] [fix] remove unused spaces in text --- examples/aishell/s0/run.sh | 11 +++++++++-- 1 file changed, 9 insertions(+), 2 deletions(-) diff --git a/examples/aishell/s0/run.sh b/examples/aishell/s0/run.sh index 7459daaf3..bd4f4e902 100644 --- a/examples/aishell/s0/run.sh +++ b/examples/aishell/s0/run.sh @@ -27,11 +27,10 @@ train_config=conf/train_conformer.yaml checkpoint= cmvn=true dir=exp/sp_spec_aug - # use average_checkpoint will get better result average_checkpoint=true decode_checkpoint=$dir/final.pt -average_num=5 +average_num=10 . utils/parse_options.sh || exit 1; @@ -47,6 +46,14 @@ if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ]; then utils/perturb_data_dir_speed.sh 0.9 data/train data/train_sp0.9 utils/perturb_data_dir_speed.sh 1.1 data/train data/train_sp1.1 utils/combine_data.sh data/train_sp data/train data/train_sp0.9 data/train_sp1.1 + # Remove the space in Mandarin text + for x in train_sp dev test; do + cp data/${x}/text data/${x}/text.org + paste -d " " <(cut -f 1 -d" " data/${x}/text.org) <(cut -f 2- -d" " data/${x}/text.org | tr -d " ") \ + > data/${x}/text + rm data/${x}/text.org + done + fi if [ ${stage} -le 1 ] && [ ${stop_stage} -ge 1 ]; then