#---------------------------------------------------------------#
# htrain.env    SWBD Training Environment File                  #
#                                                               #
# This version is for:                                          #
#                                                               #
#      htrain triphone training script                          #
#                                                               #
# Written in csh/tcsh syntax (set / setenv / foreach / @).      #
# It only defines shell and environment variables; presumably   #
# it is sourced by the htrain script -- confirm with the caller.#
#---------------------------------------------------------------#

echo "Enter htrain.env"

#---------------------------------------------------------------#
# CPU export configuration                                      #
#---------------------------------------------------------------#

# If USE_EXPORT is set, the variable ncpus is used to decide how
# many CPUs the job will be partitioned on.
set USE_EXPORT=1
#unset USE_EXPORT
set ncpus=4

# CPUs to use for training: if USE_EXPORT is set, and cpus is also set,
# then the export is restricted to the cpus in the list.
set cpus = ( s02 s03 s04 s05 s06 s07 s08 s09 s10 s11 s12 s13 s14 s15 s16 s17 s18 s19 s20 )
# unset cpus

# Note that label editing and model editing will be done on a single
# CPU.

# Build export_opt with one "-attr <host>" entry per listed CPU.
# If export_opt is already defined when this file is read, the new
# entries are appended to the existing value.
# NOTE(review): entries after the first are joined with
# "-attr OR -attr <host>", while the commented-out -uselocal block
# below joins with a bare "OR". Confirm which form the export tool
# expects; the string is kept exactly as it was.
if ( $?USE_EXPORT && $?cpus ) then
    foreach host ( $cpus )
        if ( ! $?export_opt ) then
            set export_opt = "-attr $host"
        else
            set export_opt = "$export_opt -attr OR -attr $host"
        endif
    end
endif

# Replace the host list in cpus with the single string
# "cpu1 cpu2 ... cpu<ncpus>".
if ( $?USE_EXPORT ) then
    set cpus = "cpu${ncpus}"
    @ t = $ncpus - 1
    # "> 0" (rather than a bare "$t") keeps the loop from running
    # forever when ncpus is smaller than 1.
    while ( $t > 0 )
        set cpus = "cpu$t $cpus"
        @ t -= 1
    end
endif

# Uncomment the next statement if you wish to use your local CPU as well.
#if ( $?export_opt ) then
#    set export_opt = "$export_opt OR -uselocal"
#else
#    set export_opt = "-uselocal"
#endif

# export_opt only exists when USE_EXPORT and cpus were both set above;
# referencing an undefined variable is a fatal error in csh, so guard it.
if ( $?export_opt ) then
    echo "$export_opt"
endif

#---------------------------------------------------------------#
# Directories and tool locations                                #
#---------------------------------------------------------------#

# Main directory location
set maindir = /export/q/ws96/mordow/HTK_TRAIN

# To save space, results of intermediate iterations of HERest are
# deleted if SAVE_SPACE is set.
set SAVE_SPACE

# Switchboard toolkit library location
#set swbdlib = /export/p/ws96/WS96_TOOLS/HMM_Tools96
set swbdlib = /export/q/ws96/mordow

set HTE = $swbdlib/train_scripts/HTE.train

# Triphone type that will be used:
#     wintri  --> Word Internal
#     xwrdtri --> Cross word
set tritype = wintri

#---------------------------------------------------------------#
# Input data format                                             #
#---------------------------------------------------------------#

# Define input file coercions. This must agree with HMM definitions.
#setenv HCOERCE MFCC_E_D_A_Z
setenv HCOERCE USER

# Set feature dimension (after coercion)
set Feature_Dim = 38

# Set the following to read data from ESPS files
# setenv HFORMAT ESPS
# setenv HSAMPKIND
# setenv HCOERCE

#---------------------------------------------------------------#
# Training data, model lists, labels and dictionary             #
#---------------------------------------------------------------#

# Define training script files. Script files are ascii files which
# contain file names with complete paths.
# Flat-start training files
set trnscpfs = /export/n/ws96/SWB/Lists/swb.htk.8hr.cut0.plplist
# Full training file list
set trnscp = /export/n/ws96/SWB/Lists/swb.htk.8hr.cut0.plplist

# Define HMM lists. These must cover the phones in the test and
# training sets.
# Flat-start monophones
set hmmlist_fs = $maindir/phon_lists/mono-sp
# Baseline monophones
set hmmlist_mono = $maindir/phon_lists/mono
# All triphones that can ever occur in training and testing
set hmmlist_tri = $maindir/phon_lists/allcd

# Define phone-level training Master Label Files
# Flat-start monophone labels
set trainmlf_fs = $maindir/train.mono-sp.mlf
# Monophone labels
set trainmlf_mono = $maindir/train.mono.mlf

# Define Word-level Master Label Files for alignment during training
set wordmlf = /export/p/ws96/WS96_DATA/SWB_TRANS/TRAINING.word.mlf

# Define the dictionary for words in the training data
set dict = $maindir/WS96AMDict.icsi56.ver1.spsil

#---------------------------------------------------------------#
# Model editing and clustering                                  #
#---------------------------------------------------------------#

# Minimum variance (variance floor) as a fraction of global data
# variance
set minvFloor = 0.002

# Script for cloning monophones to triphones and tying transition
# matrices
set hhed = $maindir/edit_scripts/${tritype}.hed

# HHEd state-clustering threshold for state-clustered triphones.
# See HTK V2.0 manual and HHEd.c source code.
set ro_thresh = 250
set dt_thresh = 300

# Main edit script for decision tree clustering
set treehed = $maindir/edit_scripts/tree.hed

# HLEd script for creating triphone transcription from monophone
# transcription
set led_to_tri = $swbdlib/edit_scripts/${tritype}.led

#---------------------------------------------------------------#
# HERest training iterations                                    #
#---------------------------------------------------------------#

# Flat-start
set fsits = 4
# Monophone iterations before alignment
set monoitsb = 4
# Total number of monophone iterations
set monoitsa = 9
# Triphone iterations before clustering
set triits_bc = 3
#set triits_bc = 2
# Total number of triphone iterations after clustering
set triits_ac = 4
# Number of state-clustered triphone iterations
set tricits = 4

# Mixture growing sequence. State-clustered triphone mixtures are
# increased in this sequence. tricits (above) determines the number
# of HERest iterations performed after each increase in mixture count.
set mixtures = (2 4 5 7)

echo "Exit htrain.env"

#---------------------------------------------------------------#
#                END OF ENVIRONMENT DEFINITION                  #
#---------------------------------------------------------------#