# Configuration for the Assamese (Babel 102) LimitedLP setup.
#
# This file only sets shell variables and is meant to be sourced by a bash
# script: it uses bash array syntax, and it calls `exit 1` (terminating the
# sourcing shell) if the common settings file cannot be loaded.
#
# Every statement is on its own line on purpose. In bash a `#` that starts a
# word comments out the REST OF THE PHYSICAL LINE, so joining these lines
# silently disables every assignment that follows a comment.

# Include common settings for limitedLP systems.
. conf/common.limitedLP || exit 1;

# Speech corpora files location
train_data_dir=/export/babel/data/102-assamese/release-current/conversational/training
train_data_list=/export/babel/data/splits/Assamese_Babel102/train.LimitedLP.list
train_nj=16

# RADICAL DEV data files
dev2h_data_dir=/export/babel/data/102-assamese/release-current/conversational/dev
dev2h_data_list=/export/babel/data/splits/Assamese_Babel102/dev.2hr.list
dev2h_data_cmudb=/export/babel/data/splits/Assamese_Babel102/uem/db-dev-jhuseg-v7-utt.dat
dev2h_stm_file=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-dev/IARPA-babel102b-v0.5a_conv-dev.stm
dev2h_ecf_file=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-dev.ecf.xml
dev2h_rttm_file=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-dev/IARPA-babel102b-v0.5a_conv-dev.mitllfa3.rttm
dev2h_kwlist_file=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-dev.kwlist.xml
# NOTE(review): `[name]=value` is a keyed array assignment. Bash only treats
# the key as a string if the variable was declared with `declare -A` before
# this file is sourced; otherwise the subscript is evaluated arithmetically.
# Presumably the declaration lives in the common settings or the calling
# script -- confirm. The same applies to the other *_more_kwlists variables.
dev2h_more_kwlists=(
  [limitedLP]=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-dev.kwlist2.xml
)
dev2h_subset_ecf=true
dev2h_nj=24

# Official DEV data files
dev10h_data_dir=/export/babel/data/102-assamese/release-current/conversational/dev
dev10h_data_list=/export/babel/data/splits/Assamese_Babel102//dev.list
dev10h_data_cmudb=/export/babel/data/splits/Assamese_Babel102/uem/db-dev-jhuseg-v7-utt.dat
dev10h_stm_file=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-dev/IARPA-babel102b-v0.5a_conv-dev.stm
dev10h_ecf_file=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-dev.ecf.xml
dev10h_rttm_file=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-dev/IARPA-babel102b-v0.5a_conv-dev.mitllfa3.rttm
dev10h_kwlist_file=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-dev.kwlist.xml
dev10h_more_kwlists=(
  [limitedLP]=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-dev.kwlist2.xml
)
dev10h_nj=32

# Official EVAL period evaluation data files
eval_data_dir=/export/babel/data/IARPA-BABEL_OP1_dev_eval/BABEL_OP1_102/conversational/eval/
eval_data_list=/export/babel/data/splits/Assamese_Babel102/eval.list
eval_data_cmudb=/export/babel/data/splits/Assamese_Babel102/uem/db-shadow-jhuseg-v7-utt.dat
eval_ecf_file=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-eval.ecf.xml
eval_kwlist_file=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-eval.kwlist4.xml
eval_nj=32

# Shadow data files
# The two arrays below are positional: the dev entry comes first and the eval
# entry second in both the directory list and the file-list list.
shadow_data_dir=(
  /export/babel/data/102-assamese/release-current/conversational/dev
  /export/babel/data/IARPA-BABEL_OP1_dev_eval/BABEL_OP1_102/conversational/eval/
)
shadow_data_list=(
  /export/babel/data/splits/Assamese_Babel102/dev.list
  /export/babel/data/splits/Assamese_Babel102/eval.list
)
shadow_data_cmudb=/export/babel/data/splits/Assamese_Babel102/uem/102-shadow-v0-utt.dat
shadow_ecf_file=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-dev.ecf.xml
shadow_kwlist_file=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-eval.kwlist4.xml
shadow_more_kwlists=(
  [FullLPdev]=/export/babel/data/scoring/IndusDB/IARPA-babel102b-v0.5a_conv-dev.kwlist.xml
)
shadow_nj=32

# Untranscribed ("unsup") data files
# Two directories paired with two file lists, in the same order.
unsup_data_dir=(
  /export/babel/data/102-assamese//release-current/conversational/training/
  /export/babel/data/102-assamese//release-current/conversational/untranscribed-training/
)
unsup_data_list=(
  /export/babel/data/splits/Assamese_Babel102/train.LimitedLP.untranscribed.list
  /export/babel/data/splits/Assamese_Babel102/train.untranscribed.list
)
unsup_nj=64

# Acoustic model parameters
numLeavesTri1=1000
numGaussTri1=10000
numLeavesTri2=2500
numGaussTri2=36000
numLeavesTri3=2500
numGaussTri3=36000
numLeavesMLLT=2500
numGaussMLLT=36000
numLeavesSAT=2500
numGaussSAT=36000
numGaussUBM=750
numLeavesSGMM=5000
numGaussSGMM=18000

# Lexicon and Language Model parameters
# NOTE(review): oovSymbol is empty and `--oov` below is not followed by any
# value. This looks like an angle-bracketed token was stripped from both
# strings at some point -- confirm the intended OOV symbol before relying on
# these settings. The values are kept exactly as found.
oovSymbol=""
lexiconFlags="--romanized --oov "

lexicon_file=/export/babel/data/102-assamese/release-current/conversational/reference_materials/lexicon.sub-train.txt
cer=0

max_index_states=150000
word_ins_penalty=0.5

# Keyword search settings
duptime=0.5
case_insensitive=true