JSON format
{
"duration": length_of_speech_in_secs,
"text": label,
"key": path to the wave file
}
# vocabulary file: one phone per line; the line number of a phone is its token index
phone1
phone2
...
# Launch rnnt/train.py with the timit_graves13_CTC-3L-250H configuration.
# Run this from the directory that contains rnnt/: both the script path and
# PYTHONPATH are taken relative to the current working directory.
#
# Required variables:
#   TIMIT_DATA_PATH - data directory; timit_61.phone is read from it
#   CONFIG          - directory holding the *.conf configuration files
#
# NOTE(review): the cmvn and corpus file names are passed as bare names;
# presumably train.py resolves them against --paths-data-path — confirm.

# Assign and export separately so a failing `pwd` is not masked by `export`.
PYTHONPATH=$(pwd)
export PYTHONPATH

# -u keeps Python's stdout/stderr unbuffered.
# Expansions are quoted so that a path containing spaces or glob characters
# is still passed to train.py as a single argument.
python -u rnnt/train.py \
  --paths-data-path="${TIMIT_DATA_PATH}" \
  --config="${CONFIG}/timit_graves13_CTC-3L-250H.conf" \
  --paths-vocab="${TIMIT_DATA_PATH}/timit_61.phone" \
  --paths-cmvn-mean=train_core_corpus_61_graves13.mean \
  --paths-cmvn-std=train_core_corpus_61_graves13.std \
  --paths-train-corpus=train_core_corpus_61.json \
  --paths-valid-corpus=valid_noncore_50spk_61.json \
  --paths-test-corpus=test_core_corpus_61.json