author | Jan Trmal <jtrmal@gmail.com> | |
Sat, 12 Oct 2013 00:15:20 +0000 (00:15 +0000) | ||
committer | Jan Trmal <jtrmal@gmail.com> | |
Sat, 12 Oct 2013 00:15:20 +0000 (00:15 +0000) |
git-svn-id: https://svn.code.sf.net/p/kaldi/code/sandbox/tacc_kaldi@3074 5e6a8d80-dfce-4ca6-a32a-6e07a63d50c8
diff --cc egs/babel/s5/conf/common.limitedLP
index a04babc29d7804938034751333bd198b899c7af0,a04babc29d7804938034751333bd198b899c7af0..33c1465f06a3fe381c6727fa655986cc6bfd5fd5
babel_type=limited
use_pitch=false
++use_ffv=false
lmwt_plp_extra_opts=( --min-lmwt 8 --max-lmwt 12 )
lmwt_bnf_extra_opts=( --min-lmwt 13 --max-lmwt 18 )
icu_opt=(--use-icu true --icu-transform Any-Lower)
if [[ `hostname` == *.tacc.utexas.edu ]] ; then
-- dnn_train_extra_opts=(--num-threads 6 --parallel-opts "-pe smp 6" --num-jobs-nnet 16 --stage 0)
++ dnn_train_extra_opts=(--num-threads 6 --parallel-opts "-pe smp 6" --num-jobs-nnet 16 )
decode_extra_opts=( --num-threads 4 --parallel-opts "-pe smp 4" )
sgmm_train_extra_opts=( )
sgmm_group_extra_opts=( )
index e4d22cdb4162c38c0c87f25aa372b17a2ba3cb6d,e4d22cdb4162c38c0c87f25aa372b17a2ba3cb6d..6e04e9afe2350d72c7f2907be064685fef50f08b
. conf/common.limitedLP || exit 1;
#speech corpora files location
--train_data_dir=/export/babel/data/107-vietnamese/release-current/conversational/training/
--train_data_list=/export/babel/data/splits/Vietnamese_Babel107/train.LimitedLP.list
--train_nj=16
++train_data_dir=/work/02359/jtrmal/107-vietnamese/release-current/conversational/training/
++train_data_list=/work/02359/jtrmal/splits/Vietnamese_Babel107/train.LimitedLP.list
++train_nj=12
#RADICAL DEV data files
--dev2h_data_dir=/export/babel/data/107-vietnamese/release-current/conversational/dev
--dev2h_data_list=/export/babel/data/splits/Vietnamese_Babel107/dev.2hr.list
--dev2h_data_cmudb=/export/babel/data/splits/Vietnamese_Babel107/uem/conv-eval/db-v8-utt.dat
--dev2h_stm_file=/export/babel/data/scoring/IndusDB/babel107b-v0.7_conv-dev/babel107b-v0.7_conv-dev.stm
--dev2h_ecf_file=/export/babel/data/scoring/IndusDB/babel107b-v0.7_conv-dev.ecf.xml
--dev2h_rttm_file=/export/babel/data/scoring/IndusDB/babel107b-v0.7_conv-dev/babel107b-v0.7_conv-dev.mitllfa3.rttm
--dev2h_kwlist_file=/export/babel/data/splits/Vietnamese_Babel107/keywords.expanded.cmu.v2.xml
++dev2h_data_dir=/work/02359/jtrmal/107-vietnamese/release-current/conversational/dev
++dev2h_data_list=/work/02359/jtrmal/splits/Vietnamese_Babel107/dev.2hr.list
++dev2h_data_cmudb=/work/02359/jtrmal/splits/Vietnamese_Babel107/uem/conv-eval/db-v8-utt.dat
++dev2h_stm_file=/work/02359/jtrmal/scoring/IndusDB/babel107b-v0.7_conv-dev/babel107b-v0.7_conv-dev.stm
++dev2h_ecf_file=/work/02359/jtrmal/scoring/IndusDB/babel107b-v0.7_conv-dev.ecf.xml
++dev2h_rttm_file=/work/02359/jtrmal/scoring/IndusDB/babel107b-v0.7_conv-dev/babel107b-v0.7_conv-dev.mitllfa3.rttm
++dev2h_kwlist_file=/work/02359/jtrmal/splits/Vietnamese_Babel107/keywords.expanded.cmu.v2.xml
dev2h_subset_ecf=true
dev2h_nj=27
#Official DEV data files
--dev10h_data_dir=/export/babel/data/107-vietnamese/release-current/conversational/dev/
--dev10h_data_list=/export/babel/data/splits/Vietnamese_Babel107/dev.list
--dev10h_data_cmudb=/export/babel/data/splits/Vietnamese_Babel107/uem/conv-eval/db-v8-utt.dat
--dev10h_stm_file=/export/babel/data/scoring/IndusDB/babel107b-v0.7_conv-dev/babel107b-v0.7_conv-dev.stm
--dev10h_ecf_file=/export/babel/data/scoring/IndusDB/babel107b-v0.7_conv-dev.ecf.xml
--dev10h_rttm_file=/export/babel/data/scoring/IndusDB/babel107b-v0.7_conv-dev/babel107b-v0.7_conv-dev.mitllfa3.rttm
--dev10h_kwlist_file=/export/babel/data/splits/Vietnamese_Babel107/keywords.expanded.cmu.v2.xml
++dev10h_data_dir=/work/02359/jtrmal/107-vietnamese/release-current/conversational/dev/
++dev10h_data_list=/work/02359/jtrmal/splits/Vietnamese_Babel107/dev.list
++dev10h_data_cmudb=/work/02359/jtrmal/splits/Vietnamese_Babel107/uem/conv-eval/db-v8-utt.dat
++dev10h_stm_file=/work/02359/jtrmal/scoring/IndusDB/babel107b-v0.7_conv-dev/babel107b-v0.7_conv-dev.stm
++dev10h_ecf_file=/work/02359/jtrmal/scoring/IndusDB/babel107b-v0.7_conv-dev.ecf.xml
++dev10h_rttm_file=/work/02359/jtrmal/scoring/IndusDB/babel107b-v0.7_conv-dev/babel107b-v0.7_conv-dev.mitllfa3.rttm
++dev10h_kwlist_file=/work/02359/jtrmal/splits/Vietnamese_Babel107/keywords.expanded.cmu.v2.xml
dev10h_nj=32
#Official EVAL period evaluation data files
--eval_data_dir=/export/babel/data/107-vietnamese/release-current/conversational/eval/
--eval_data_list=/export/babel/data/splits/Vietnamese_Babel107/eval.list
--eval_data_cmudb=/export/babel/data/splits/Vietnamese_Babel107/uem/conv-eval/db-v8-utt.dat
--eval_ecf_file=/export/babel/data/scoring/IndusDB.20130424/babel107b-v0.7_conv-eval.ecf.xml
--eval_kwlist_file=/export/babel/data/scoring/IndusDB.20130424/babel107b-v0.7_conv-eval.kwlist3.xml
++eval_data_dir=/work/02359/jtrmal/107-vietnamese/release-current/conversational/eval/
++eval_data_list=/work/02359/jtrmal/splits/Vietnamese_Babel107/eval.list
++eval_data_cmudb=/work/02359/jtrmal/splits/Vietnamese_Babel107/uem/conv-eval/db-v8-utt.dat
++eval_ecf_file=/work/02359/jtrmal/scoring/IndusDB.20130424/babel107b-v0.7_conv-eval.ecf.xml
++eval_kwlist_file=/work/02359/jtrmal/scoring/IndusDB.20130424/babel107b-v0.7_conv-eval.kwlist3.xml
eval_nj=81
#Official (POST-)EVAL evaluation data portion
# Lexicon and Language Model parameters
oovSymbol="<unk>"
lexiconFlags="--oov <unk>"
--use_pitch=true
++use_pitch=false
# Scoring protocols (dummy GLM file to appease the scoring script)
#glmFile=./conf/glm
--lexicon_file=/export/babel/data/107-vietnamese/release-current/conversational/reference_materials/lexicon.sub-train.txt
++lexicon_file=/work/02359/jtrmal/107-vietnamese/release-current/conversational/reference_materials/lexicon.sub-train.txt
phoneme_mapping="i@U=i @ U;oaI=o a I;oaI:=o a I:;u@I=u @ I;uI@= u I @;1@I=1 @ I;1@U=1 @ U;
a:I=a: I; a:U=a: U; aU=a U; @U=@ U; aI=a I; @I=@ I; EU=E U; eU=e U; i@=i @; iU=i U; Oa:=O a: ; Oa=O a;
diff --cc egs/babel/s5/run-2a-nnet.sh
index 00a3b44fe2e572ee237d7cf6524411d19e929c31,00a3b44fe2e572ee237d7cf6524411d19e929c31..3b8e71bbefdccf9574376aa23475482d47a3c725
if [ ! -f exp/tri6_nnet/.done ]; then
-- steps/train_nnet_cpu.sh \
++ bash -x steps/train_nnet_cpu.sh \
--mix-up "$dnn_mixup" \
--initial-learning-rate "$dnn_initial_learning_rate" \
--final-learning-rate "$dnn_final_learning_rate" \
diff --cc tools/Makefile
index 870a3021182f6f1a5f3a9760cf46315c8b6c6290,870a3021182f6f1a5f3a9760cf46315c8b6c6290..4a46384a4cdae73116b0cae46a7690b3d277e8a7
--- 1/tools/Makefile
--- 2/tools/Makefile
+++ b/tools/Makefile
# SHELL += -x
--all: check_required_programs sph2pipe atlas irstlm_tgt sclite_tgt openfst_tgt
++all: check_required_programs sph2pipe atlas irstlm_tgt openfst_tgt
check_required_programs: