# Origin: www.pudn.com > sphinx_recipe.zip > align_trans.sh



# Align the transcriptions using sphinx and previously trained
# Resource Management acoustic model.
#
# Required environment variables:
#   CMU_RM1     - directory containing model_parameters/ and model_architecture/
#   CMU_ROOT    - directory whose bin/ subdirectory holds sphinx3_align
#   CMU_SCRIPTS - directory holding PruneToAligned.pl and PruneToIntersection.pl
#
# All etc/ and feat paths are relative, so run this from the directory that
# contains them.

# Fail fast with a clear message instead of silently expanding an unset
# variable to an empty string (which would yield paths like /bin/sphinx3_align).
: "${CMU_RM1:?CMU_RM1 must be set}"
: "${CMU_ROOT:?CMU_ROOT must be set}"
: "${CMU_SCRIPTS:?CMU_SCRIPTS must be set}"

MODEL_PARAM=$CMU_RM1/model_parameters/rm1.cd_cont_1000_8
MODEL_ARCH=$CMU_RM1/model_architecture/rm1.1000.mdef

# Expansions are quoted so install paths containing whitespace or glob
# characters are passed through as single arguments.
"$CMU_ROOT/bin/sphinx3_align" \
  -ctl etc/wsj_all_train_pruned.fileids \
  -insent etc/wsj_all_train.align \
  -mdef "$MODEL_ARCH" \
  -mean "$MODEL_PARAM/means" \
  -var "$MODEL_PARAM/variances" \
  -mixw "$MODEL_PARAM/mixture_weights" \
  -tmat "$MODEL_PARAM/transition_matrices" \
  -dict etc/wsj_all.dic \
  -fdict etc/wsj_all.filler \
  -cepdir feat \
  -outsent etc/wsj_all_train_pruned_aligned.transcription \
  -logfn align.log \
  -beam 1e-100

# Prune out any utterances that didn't get force aligned
perl "$CMU_SCRIPTS/PruneToAligned.pl" \
  etc/wsj_all_train_pruned_aligned.transcription \
  etc/wsj_all_train_pruned.fileids \
  >etc/wsj_all_train_pruned_aligned.fileids

# Create SI-284 only file list and transcription file
# NOTE(review): the last two arguments appear to be the output file list and
# output transcription -- confirm against PruneToIntersection.pl.
perl "$CMU_SCRIPTS/PruneToIntersection.pl" \
  etc/wsj_all_train_pruned_aligned.fileids \
  etc/wsj_all_train_pruned_aligned.transcription \
  etc/wsj_si284_train.fileids \
  etc/wsj_si284_train_pruned_aligned.fileids \
  etc/wsj_si284_train_pruned_aligned.transcription

# Create SI-84 only file list and transcription file
perl "$CMU_SCRIPTS/PruneToIntersection.pl" \
  etc/wsj_all_train_pruned_aligned.fileids \
  etc/wsj_all_train_pruned_aligned.transcription \
  etc/wsj_si84_train.fileids \
  etc/wsj_si84_train_pruned_aligned.fileids \
  etc/wsj_si84_train_pruned_aligned.transcription