106 changes: 106 additions & 0 deletions egs/fisher_english/s5/local/chain/compare_wer_general.sh
@@ -0,0 +1,106 @@
#!/bin/bash

# This script compares decoding results (WERs) between systems.
# e.g. local/chain/compare_wer_general.sh exp/chain_cleaned/tdnn_{c,d}_sp
# For discriminatively trained systems, specify the epoch after a colon,
# for instance:
# local/chain/compare_wer_general.sh exp/chain_cleaned/tdnn_c_sp exp/chain_cleaned/tdnn_c_sp_smbr:{1,2,3}


echo "# $0 $*"

include_looped=false
if [ "$1" == "--looped" ]; then
include_looped=true
shift
fi

used_epochs=false

# The function set_names separates the epoch-related part of a name
# [for discriminative training] from the regular part.
# If called with a colon-free directory name, like:
# set_names exp/chain_cleaned/tdnn_lstm1e_sp_bi_smbr
# it will set dir=exp/chain_cleaned/tdnn_lstm1e_sp_bi_smbr and epoch_infix=""
# If called with something like:
# set_names exp/chain_cleaned/tdnn_d_sp_smbr:3
# it will set dir=exp/chain_cleaned/tdnn_d_sp_smbr and epoch_infix="_epoch3"


set_names() {
if [ $# != 1 ]; then
echo "compare_wer_general.sh: internal error"
exit 1
fi
dirname=$(echo $1 | cut -d: -f1)
epoch=$(echo $1 | cut -s -d: -f2)
if [ -z "$epoch" ]; then
epoch_infix=""
else
used_epochs=true
epoch_infix=_epoch${epoch}
fi
}
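
# e.g. for tdnn_d_sp_smbr:3, the WERs below are read from
# exp/chain_cleaned/tdnn_d_sp_smbr/decode_dev_epoch3 and decode_test_epoch3.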



echo -n "# System "
for x in $*; do printf "% 10s" " $(basename $x)"; done
echo

strings=("# WER on dev " "# WER on test ")

for n in 0 1; do
echo -n "${strings[$n]}"
for x in $*; do
set_names $x # sets $dirname and $epoch_infix
decode_names=(dev${epoch_infix} test${epoch_infix})
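# utils/best_wer.sh picks the best WER line, which typically looks like
# "%WER 15.32 [ ... ]"; field 2 is therefore the WER value itself.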
wer=$(grep WER $dirname/decode_${decode_names[$n]}/wer* | utils/best_wer.sh | awk '{print $2}')
printf "% 10s" $wer
done
echo
if $include_looped; then
echo -n "# [looped:] "
for x in $*; do
set_names $x # sets $dirname and $epoch_infix
decode_names=(dev${epoch_infix} test${epoch_infix})
wer=$(grep WER $dirname/decode_looped_${decode_names[$n]}/wer* | utils/best_wer.sh | awk '{print $2}')
printf "% 10s" $wer
done
echo
fi
done


if $used_epochs; then
exit 0; # the diagnostics aren't comparable between regular and discriminatively trained systems.
fi
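
# The probabilities below are parsed from the "Overall" lines of
# compute_prob_{train,valid}.final.log; the chain objective and the xent
# (cross-entropy) branch are reported separately, hence the grep filters.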

echo -n "# Final train prob "
for x in $*; do
prob=$(grep Overall $x/log/compute_prob_train.final.log | grep -v xent | awk '{printf("%.4f", $8)}')
printf "% 10s" $prob
done
echo

echo -n "# Final valid prob "
for x in $*; do
prob=$(grep Overall $x/log/compute_prob_valid.final.log | grep -v xent | awk '{printf("%.4f", $8)}')
printf "% 10s" $prob
done
echo

echo -n "# Final train prob (xent)"
for x in $*; do
prob=$(grep Overall $x/log/compute_prob_train.final.log | grep -w xent | awk '{printf("%.4f", $8)}')
printf "% 10s" $prob
done
echo

echo -n "# Final valid prob (xent)"
for x in $*; do
prob=$(grep Overall $x/log/compute_prob_valid.final.log | grep -w xent | awk '{printf("%.4f", $8)}')
printf "% 10s" $prob
done

echo
148 changes: 148 additions & 0 deletions egs/fisher_english/s5/local/chain/run_semisupervised.sh
@@ -0,0 +1,148 @@
#!/bin/bash

set -e -o pipefail

stage=-2
nj=30
decode_nj=30
base_train_set=train_comb350k # for reference

unsupervised_set=train_unsup250k # set this to your choice of unsupervised data
supervised_set=train_sup
semi_affix=350k # affix relating to the train-set splitting proportion

tdnn_affix=_sup1a # affix for the supervised chain-model directory
train_supervised_opts="--stage -10 --train-stage -10"

# combination options
decode_affix=
egs_affix= # affix for the egs generated from unsupervised data and for the combined egs dir
comb_affix=_comb1a # affix for the new chain-model directory trained on the combined supervised+unsupervised subsets
unsup_frames_per_eg= # if empty, defaults to the frames-per-eg in the supervised model's egs config -- you will need to change minibatch_size for the combined training accordingly
unsup_egs_weight=1.0
lattice_lm_scale=0.0 # scale on the LM scores of the unsupervised lattices when they are used as supervision (0.0 ignores them)
lattice_prune_beam=2.0 # if supplied, the lattices are pruned with this beam before generating egs from the unsupervised data
left_tolerance=2
right_tolerance=2
train_combined_opts="--num-epochs 4.5"
graph_affix= # can be used to decode the unsupervised data with a different LM/graph
phone_insertion_penalty=
# to tune:
# frames_per_eg for unsupervised
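
# Example invocation (hypothetical option values; the variables above become
# command-line options via utils/parse_options.sh, with underscores mapped to
# hyphens), for instance:
#   local/chain/run_semisupervised.sh --stage 0 \
#     --lattice-lm-scale 0.5 --egs-affix _lmscale0.5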

# End configuration section.
echo "$0 $@" # Print the command line for logging

. ./cmd.sh
. ./path.sh
. ./utils/parse_options.sh

nnet3_affix=_semi${semi_affix} # affix for nnet3 and chain dirs
decode_affix=${decode_affix}${graph_affix}

if ! cuda-compiled; then
cat <<EOF && exit 1
This script is intended to be used with GPUs, but you have not compiled Kaldi with CUDA.
If you want to use GPUs (and have them), go to src/, and configure and make on a machine
where "nvcc" is installed.
EOF
fi

if [ $stage -le -2 ]; then
ali_dir=exp/tri4a_ali_$supervised_set
if [ ! -f $ali_dir/ali.1.gz ]; then
steps/align_fmllr.sh --nj 30 --cmd "queue.pl" data/$supervised_set data/lang exp/tri4a $ali_dir
fi
echo "$0: chain training on the supervised subset data/${supervised_set}"
local/chain/run_tdnn.sh $train_supervised_opts --remove-egs false \
--train-set $supervised_set \
--build-tree-ali-dir $ali_dir \
--nnet3-affix $nnet3_affix --tdnn-affix $tdnn_affix
fi

if [ $stage -le -1 ] && [ ! -f exp/nnet3${nnet3_affix}/ivectors_${unsupervised_set}_hires/ivector_online.scp ]; then
echo "$0: getting ivectors for the hires unsupervised data data/${unsupervised_set}_hires"
steps/online/nnet2/extract_ivectors_online.sh --cmd "$train_cmd" --nj "$nj" \
data/${unsupervised_set}_hires exp/nnet3${nnet3_affix}/extractor \
exp/nnet3${nnet3_affix}/ivectors_${unsupervised_set}_hires
fi

chaindir=exp/chain${nnet3_affix}/tdnn${tdnn_affix}_sp
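
# Read the context and frames-per-eg settings from the supervised model's egs
# dir, so that the unsupervised egs generated below are compatible with the
# supervised egs when the two are combined.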

left_context=$(cat $chaindir/egs/info/left_context)
right_context=$(cat $chaindir/egs/info/right_context)
left_context_initial=$(cat $chaindir/egs/info/left_context_initial)
right_context_final=$(cat $chaindir/egs/info/right_context_final)
[ -z "$unsup_frames_per_eg" ] && unsup_frames_per_eg=$(cat $chaindir/egs/info/frames_per_eg)
frame_subsampling_factor=$(cat $chaindir/frame_subsampling_factor)
cmvn_opts=$(cat $chaindir/cmvn_opts)

if [ $stage -le 0 ]; then
echo "$0: getting the decoding lattices for the unsupervised subset using the chain model at: $chaindir"
graphdir=$chaindir/graph${graph_affix}
if [ ! -f $graphdir/HCLG.fst ]; then
utils/mkgraph.sh --self-loop-scale 1.0 data/lang_test${graph_affix} $chaindir $graphdir
fi
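# Chain models are decoded with --acwt 1.0; --post-decode-acwt 10.0 scales up
# the acoustic scores in the output lattices so that the usual LM-weight range
# applies at scoring time.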
steps/nnet3/decode.sh --num-threads 4 --nj $decode_nj --cmd "$decode_cmd" \
--acwt 1.0 --post-decode-acwt 10.0 \
--online-ivector-dir exp/nnet3${nnet3_affix}/ivectors_${unsupervised_set}_hires \
--scoring-opts "--min-lmwt 5 " \
$graphdir data/${unsupervised_set}_hires $chaindir/decode_${unsupervised_set}${decode_affix}
ln -s ../final.mdl $chaindir/decode_${unsupervised_set}${decode_affix}/final.mdl || true
fi

if [ $stage -le 1 ]; then
echo "$0: generating egs from the unsupervised data"
steps/nnet3/chain/get_egs.sh --cmd "$decode_cmd" --alignment-subsampling-factor 1 \
--left-tolerance $left_tolerance --right-tolerance $right_tolerance \
--left-context $left_context --right-context $right_context \
--left-context-initial $left_context_initial --right-context-final $right_context_final \
--frames-per-eg $unsup_frames_per_eg --frames-per-iter 1500000 \
--frame-subsampling-factor $frame_subsampling_factor \
--cmvn-opts "$cmvn_opts" --lattice-lm-scale $lattice_lm_scale \
--lattice-prune-beam "$lattice_prune_beam" \
--egs-weight $unsup_egs_weight \
--phone-insertion-penalty "$phone_insertion_penalty" \
--online-ivector-dir exp/nnet3${nnet3_affix}/ivectors_${unsupervised_set}_hires \
data/${unsupervised_set}_hires $chaindir \
${chaindir}/decode_${unsupervised_set}${decode_affix} $chaindir/unsup_egs${decode_affix}${egs_affix}
fi

sup_egs_dir=$chaindir/egs
unsup_egs_dir=$chaindir/unsup_egs${decode_affix}${egs_affix}
comb_egs_dir=$chaindir/comb_egs${decode_affix}${egs_affix}
if [ $stage -le 2 ]; then
echo "$0: combining supervised/unsupervised egs"
n1=$(cat $sup_egs_dir/info/num_archives)
n2=$(cat $unsup_egs_dir/info/num_archives)
num_archives=$(($n2>$n1?$n2:$n1))
num_archives=$((num_archives*3/2))
mkdir -p $comb_egs_dir/log
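# The train/valid diagnostics come from the supervised egs only; the info/
# bookkeeping (num_frames, egs_per_archive) is summed over both sets.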
cp {$sup_egs_dir,$comb_egs_dir}/train_diagnostic.cegs
cp {$sup_egs_dir,$comb_egs_dir}/valid_diagnostic.cegs
nnet3-chain-copy-egs "ark:cat $sup_egs_dir/combine.cegs $unsup_egs_dir/combine.cegs |" ark:$comb_egs_dir/combine.cegs
cp {$sup_egs_dir,$comb_egs_dir}/cmvn_opts
cp -r $sup_egs_dir/info $comb_egs_dir
echo $num_archives > $comb_egs_dir/info/num_archives
cat {$sup_egs_dir,$unsup_egs_dir}/info/num_frames | awk '{s+=$1} END{print s}' > $comb_egs_dir/info/num_frames
cat {$sup_egs_dir,$unsup_egs_dir}/info/egs_per_archive | awk '{s+=$1} END{print s}' > $comb_egs_dir/info/egs_per_archive
out_egs_list=
egs_list=
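# Pool every supervised and unsupervised archive into one input list;
# nnet3-chain-copy-egs with multiple output wspecifiers then distributes the
# egs across the $num_archives combined archives.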
for n in $(seq $num_archives); do
[ -f $sup_egs_dir/cegs.$n.ark ] && egs_list="$egs_list $sup_egs_dir/cegs.$n.ark"
[ -f $unsup_egs_dir/cegs.$n.ark ] && egs_list="$egs_list $unsup_egs_dir/cegs.$n.ark"
out_egs_list="$out_egs_list ark:$comb_egs_dir/cegs.$n.ark"
done
$decode_cmd $comb_egs_dir/log/combine.log \
nnet3-chain-copy-egs "ark:cat $egs_list|" $out_egs_list
fi

if [ $stage -le 3 ]; then
echo "$0: training on the supervised+unsupervised subset"
# the train-set and gmm options do not matter here, since we provide the egs directly via --common-egs-dir
local/chain/run_tdnn.sh --stage 12 --remove-egs false --train-set $supervised_set \
--nnet3-affix $nnet3_affix \
--tdnn-affix ${tdnn_affix}${decode_affix}${egs_affix}${comb_affix} \
--common-egs-dir $comb_egs_dir $train_combined_opts
fi