From 0165c450ade50e90ca3fea2d246b9d71eb86bb4a Mon Sep 17 00:00:00 2001 From: Junkun Date: Thu, 17 Feb 2022 16:40:25 -0800 Subject: [PATCH 1/5] update script --- examples/ted_en_zh/st1/local/data.sh | 10 +++++++--- 1 file changed, 7 insertions(+), 3 deletions(-) diff --git a/examples/ted_en_zh/st1/local/data.sh b/examples/ted_en_zh/st1/local/data.sh index f9c876b1..511ebd23 100755 --- a/examples/ted_en_zh/st1/local/data.sh +++ b/examples/ted_en_zh/st1/local/data.sh @@ -198,10 +198,14 @@ if [ ${stage} -le 2 ] && [ ${stop_stage} -ge 2 ]; then fi if [ ${stage} -le 3 ] && [ ${stop_stage} -ge 3 ]; then + x=(${feat_tr_dir} ${feat_dt_dir} ${feat_trans_dir}) # feature dirs, index-aligned with y + y=(train dev test) echo "stage 3: Format the Json Data" - python3 local/espnet_json_to_manifest.py --json-file ${feat_tr_dir}/data_${bpemode}${nbpe}.json --manifest-file data/manifest.train - python3 local/espnet_json_to_manifest.py --json-file ${feat_dt_dir}/data_${bpemode}${nbpe}.json --manifest-file data/manifest.dev - python3 local/espnet_json_to_manifest.py --json-file ${feat_trans_dir}/data_${bpemode}${nbpe}.json --manifest-file data/manifest.test + for (( i=0; i<${#x[*]}; ++i)); do # one manifest per (x[i], y[i]) pair + python3 ${MAIN_ROOT}/utils/espnet_json_to_manifest.py \ + --json-file ${x[$i]}/data_${bpemode}${nbpe}.json \ + --manifest-file data/manifest.${y[$i]} + done fi echo "Ted En-Zh Data preparation done." 
exit 0 From af2b20650e650bb44de0fc7e2a0ac9d07420cf23 Mon Sep 17 00:00:00 2001 From: Junkun Date: Thu, 17 Feb 2022 21:51:35 -0800 Subject: [PATCH 2/5] update mustc v1 --- examples/mustc/st1/cmd.sh | 89 ++++++++ examples/mustc/st1/conf/fbank.conf | 2 + examples/mustc/st1/conf/pitch.conf | 1 + examples/mustc/st1/local/augmentation.json | 19 ++ examples/mustc/st1/local/data.sh | 201 ++++++++++++++++++ examples/mustc/st1/local/data_prep.sh | 163 ++++++++++++++ examples/mustc/st1/local/divide_lang.sh | 52 +++++ .../mustc/st1/local/remove_punctuation.pl | 25 +++ examples/mustc/st1/local/test.sh | 48 +++++ examples/mustc/st1/local/train.sh | 40 ++++ examples/mustc/st1/path.sh | 29 +++ examples/mustc/st1/run.sh | 39 ++++ examples/mustc/st1/steps | 1 + examples/mustc/st1/utils | 1 + 14 files changed, 710 insertions(+) create mode 100644 examples/mustc/st1/cmd.sh create mode 100644 examples/mustc/st1/conf/fbank.conf create mode 100644 examples/mustc/st1/conf/pitch.conf create mode 100644 examples/mustc/st1/local/augmentation.json create mode 100755 examples/mustc/st1/local/data.sh create mode 100644 examples/mustc/st1/local/data_prep.sh create mode 100644 examples/mustc/st1/local/divide_lang.sh create mode 100755 examples/mustc/st1/local/remove_punctuation.pl create mode 100755 examples/mustc/st1/local/test.sh create mode 100755 examples/mustc/st1/local/train.sh create mode 100644 examples/mustc/st1/path.sh create mode 100755 examples/mustc/st1/run.sh create mode 120000 examples/mustc/st1/steps create mode 120000 examples/mustc/st1/utils diff --git a/examples/mustc/st1/cmd.sh b/examples/mustc/st1/cmd.sh new file mode 100644 index 00000000..7b70ef5e --- /dev/null +++ b/examples/mustc/st1/cmd.sh @@ -0,0 +1,89 @@ +# ====== About run.pl, queue.pl, slurm.pl, and ssh.pl ====== +# Usage: <cmd>.pl [options] JOB=1:<nj> <log> <command...> +# e.g. +# run.pl --mem 4G JOB=1:10 echo.JOB.log echo JOB +# +# Options: +# --time