# Origin: www.pudn.com > sphinx_recipe.zip > align_trans.sh
# Align the transcriptions using sphinx and previously trained
# Resource Management acoustic model.
#
# Required environment variables:
#   CMU_RM1     - directory containing model_parameters/ and
#                 model_architecture/ for the RM1 acoustic model
#   CMU_ROOT    - directory whose bin/ holds the sphinx3_align executable
#   CMU_SCRIPTS - directory holding PruneToAligned.pl and
#                 PruneToIntersection.pl
#
# All etc/... and feat paths are relative to the current working directory.

# Abort early with a clear message instead of expanding an unset variable
# to an empty string (which would yield paths such as /bin/sphinx3_align).
: "${CMU_RM1:?CMU_RM1 must be set}"
: "${CMU_ROOT:?CMU_ROOT must be set}"
: "${CMU_SCRIPTS:?CMU_SCRIPTS must be set}"

MODEL_PARAM=$CMU_RM1/model_parameters/rm1.cd_cont_1000_8
MODEL_ARCH=$CMU_RM1/model_architecture/rm1.1000.mdef

# NOTE(review): -beam 1e-100 looks like a deliberately very wide beam,
# presumably to keep as many utterances as possible -- confirm against the
# sphinx3_align documentation.
# No 'set -e' on purpose: the next step prunes utterances that failed to
# align, and the aligner's exit status in that situation is not known here.
"$CMU_ROOT/bin/sphinx3_align" \
  -ctl etc/wsj_all_train_pruned.fileids \
  -insent etc/wsj_all_train.align \
  -mdef "$MODEL_ARCH" \
  -mean "$MODEL_PARAM/means" \
  -var "$MODEL_PARAM/variances" \
  -mixw "$MODEL_PARAM/mixture_weights" \
  -tmat "$MODEL_PARAM/transition_matrices" \
  -dict etc/wsj_all.dic \
  -fdict etc/wsj_all.filler \
  -cepdir feat \
  -outsent etc/wsj_all_train_pruned_aligned.transcription \
  -logfn align.log \
  -beam 1e-100

# Prune out any utterances that didn't get force aligned
perl "$CMU_SCRIPTS/PruneToAligned.pl" \
  etc/wsj_all_train_pruned_aligned.transcription \
  etc/wsj_all_train_pruned.fileids \
  >etc/wsj_all_train_pruned_aligned.fileids

# Create SI-284 only file list and transcription file
perl "$CMU_SCRIPTS/PruneToIntersection.pl" \
  etc/wsj_all_train_pruned_aligned.fileids \
  etc/wsj_all_train_pruned_aligned.transcription \
  etc/wsj_si284_train.fileids \
  etc/wsj_si284_train_pruned_aligned.fileids \
  etc/wsj_si284_train_pruned_aligned.transcription

# Create SI-84 only file list and transcription file
perl "$CMU_SCRIPTS/PruneToIntersection.pl" \
  etc/wsj_all_train_pruned_aligned.fileids \
  etc/wsj_all_train_pruned_aligned.transcription \
  etc/wsj_si84_train.fileids \
  etc/wsj_si84_train_pruned_aligned.fileids \
  etc/wsj_si84_train_pruned_aligned.transcription