diff --git a/README.md b/README.md
index b20c75f9..bb1815c0 100644
--- a/README.md
+++ b/README.md
@@ -1,10 +1,8 @@
 # Deep Speech 2 on PaddlePaddle
 
-## Quick Start
+## Installation
 
-### Installation
-
-Please replace `$PADDLE_INSTALL_DIR` with your paddle installation directory.
+Please replace `$PADDLE_INSTALL_DIR` with your own paddle installation directory.
 
 ```
 pip install -r requirements.txt
@@ -13,7 +11,9 @@ export LD_LIBRARY_PATH=$PADDLE_INSTALL_DIR/Paddle/third_party/install/warpctc/li
 
 For some machines, we also need to install libsndfile1. Details to be added.
 
-### Preparing Dataset(s)
+## Usage
+
+### Preparing Data
 
 ```
 cd data
diff --git a/data/librispeech.py b/data/librispeech.py
index 676bbec5..838fee59 100644
--- a/data/librispeech.py
+++ b/data/librispeech.py
@@ -15,7 +15,7 @@ import argparse
 import soundfile
 import json
 
-DATA_HOME = os.path.expanduser('~/.cache2/paddle/dataset/speech')
+DATA_HOME = os.path.expanduser('~/.cache/paddle/dataset/speech')
 
 URL_ROOT = "http://www.openslr.org/resources/12"
 URL_TEST_CLEAN = URL_ROOT + "/test-clean.tar.gz"
@@ -30,7 +30,7 @@ MD5_TEST_CLEAN = "32fa31d27d2e1cad72775fee3f4849a9"
 MD5_DEV_CLEAN = "42e2234ba48799c1f50f24a7926300a1"
 MD5_TRAIN_CLEAN_100 = "2a93770f6d5c6c964bc36631d331a522"
 MD5_TRAIN_CLEAN_360 = "c0e676e450a7ff2f54aeade5171606fa"
-MD5_TRAIN_CLEAN_500 = "d1a0fd59409feb2c614ce4d30c387708"
+MD5_TRAIN_OTHER_500 = "d1a0fd59409feb2c614ce4d30c387708"
 
 parser = argparse.ArgumentParser(
     description='Downloads and prepare LibriSpeech dataset.')