diff --git a/examples/ted_en_zh/st0/local/data.sh b/examples/ted_en_zh/st0/local/data.sh
index 097cd3a8..7ea185db 100755
--- a/examples/ted_en_zh/st0/local/data.sh
+++ b/examples/ted_en_zh/st0/local/data.sh
@@ -42,7 +42,7 @@ if [ ${stage} -le -1 ] && [ ${stop_stage} -ge -1 ]; then
     # generate manifests
     python3 ${TARGET_DIR}/ted_en_zh/ted_en_zh.py \
     --manifest_prefix="data/manifest" \
-    --src_dir="${data_dir}"
+    --src-dir="${data_dir}"
 
     echo "Complete raw data pre-process."
 fi
diff --git a/paddlespeech/s2t/frontend/utility.py b/paddlespeech/s2t/frontend/utility.py
index 175727e1..50fced25 100644
--- a/paddlespeech/s2t/frontend/utility.py
+++ b/paddlespeech/s2t/frontend/utility.py
@@ -102,9 +102,9 @@ def read_manifest(
     with jsonlines.open(manifest_path, 'r') as reader:
         for json_data in reader:
             feat_len = json_data["input"][0]["shape"][
-                0] if 'shape' in json_data["input"][0] else 1.0
+                0] if "input" in json_data and "shape" in json_data["input"][0] else 1.0
             token_len = json_data["output"][0]["shape"][
-                0] if 'shape' in json_data["output"][0] else 1.0
+                0] if "output" in json_data and "shape" in json_data["output"][0] else 1.0
             conditions = [
                 feat_len >= min_input_len,
                 feat_len <= max_input_len,