some aesthetic changes; not final yet

kaldi-asr · danpovey · Nov 23, 2017 · Sep 18, 2017 · Sep 20, 2017 · Sep 22, 2017
commit 483450dc80eb35c3e4acc9ab5c788f243d041b14
diff --git a/egs/swbd/s5/local/rnnlm/run_rescoring.sh b/egs/swbd/s5/local/rnnlm/run_rescoring.sh
@@ -20,7 +20,7 @@ for decode_set in eval2000; do
   decode_dir=${dir}/decode_${decode_set}_$LM
 
   # Lattice rescoring
-  steps/lmrescore_rnnlm_lat.sh \
+  rnnlm/lmrescore_rnnlm_lat.sh \
     --cmd "$decode_cmd --mem 16G" \
     --rnnlm-ver kaldirnnlm  --weight 0.5 --max-ngram-order $ngram_order \
     data/lang_$LM $rnndir \

diff --git a/scripts/rnnlm/lmrescore_rnnlm_lat.sh b/scripts/rnnlm/lmrescore_rnnlm_lat.sh
@@ -0,0 +1,121 @@
+#!/bin/bash
+
+# Copyright 2015  Guoguo Chen
+#           2017  Hainan Xu
+# Apache 2.0
+
+# This script rescores lattices with an RNNLM.  For every lattice it applies
+# the old LM with scale -<weight> and then the RNNLM with scale +<weight>.
+# See also rnnlmrescore.sh which is an older script using n-best lists.
+
+# Begin configuration section.
+cmd=run.pl
+skip_scoring=false
+max_ngram_order=4
+N=10         # Unused here; kept so that --N is still accepted.
+inv_acwt=12  # Unused here; kept so that --inv-acwt is still accepted.
+weight=1.0   # Interpolation weight for RNNLM.
+rnnlm_ver=   # "kaldirnnlm" selects lattice-lmrescore-kaldi-rnnlm.
+#layer_string=
+# End configuration section.
+
+echo "$0 $@"  # Print the command line for logging
+
+. ./utils/parse_options.sh
+
+if [ $# != 5 ]; then
+   echo "Does language model rescoring of lattices (remove old LM, add new LM)"
+   echo "with RNNLM."
+   echo ""
+   echo "Usage: $0 [options] <old-lang-dir> <rnnlm-dir> \\"
+   echo "                   <data-dir> <input-decode-dir> <output-decode-dir>"
+   echo " e.g.: $0 data/lang_tg ./rnnlm data/test \\"
+   echo "                   exp/tri3/test_tg exp/tri3/test_rnnlm"
+   echo "options: [--cmd (run.pl|queue.pl [queue opts])]"
+   exit 1;
+fi
+
+[ -f path.sh ] && . ./path.sh;
+
+oldlang=$1
+rnnlm_dir=$2
+data=$3
+indir=$4
+outdir=$5
+
+# Binary for the second (RNNLM) stage of the pipeline below.
+# NOTE(review): the arguments passed below follow the order that
+# lattice-lmrescore-kaldi-rnnlm reads them in; confirm that the default binary
+# accepts the same arguments before running without --rnnlm-ver kaldirnnlm.
+rescoring_binary=lattice-lmrescore-rnnlm
+if [ "$rnnlm_ver" == "kaldirnnlm" ]; then
+  rescoring_binary="lattice-lmrescore-kaldi-rnnlm"
+fi
+
+# Use G.carpa when it exists, otherwise fall back to G.fst.
+oldlm=$oldlang/G.fst
+if [ -f $oldlang/G.carpa ]; then
+  oldlm=$oldlang/G.carpa
+elif [ ! -f $oldlm ]; then
+  echo "$0: expecting either $oldlang/G.fst or $oldlang/G.carpa to exist" &&\
+    exit 1;
+fi
+
+[ ! -f $rnnlm_dir/final.raw ] && echo "$0: Missing file $rnnlm_dir/final.raw" && exit 1;
+[ ! -f $rnnlm_dir/config/words.txt ] && echo "$0: Missing file $rnnlm_dir/config/words.txt" && exit 1;
+[ ! -f $rnnlm_dir/feat_embedding.final.mat ] && [ ! -f $rnnlm_dir/word_embedding.final.mat ] && echo "$0: Missing word embedding file" && exit 1;
+
+[ ! -f $oldlang/words.txt ] &&\
+  echo "$0: Missing file $oldlang/words.txt" && exit 1;
+! ls $indir/lat.*.gz >/dev/null &&\
+  echo "$0: No lattices in input directory $indir" && exit 1;
+awk -v n="$0" -v w="$weight" 'BEGIN {if (w < 0 || w > 1) {
+  print n": Interpolation weight should be in the range of [0, 1]"; exit 1;}}' \
+  || exit 1;
+
+oldlm_command="fstproject --project_output=true $oldlm |"
+
+# Read the word-embedding matrix directly when it exists; otherwise derive it
+# from the feature embedding via a piped rnnlm-get-word-embedding command.
+word_embedding=
+if [ -f $rnnlm_dir/word_embedding.final.mat ]; then
+  word_embedding=$rnnlm_dir/word_embedding.final.mat
+else
+  [ ! -f $rnnlm_dir/word_feats.txt ] && echo "$0: Missing file $rnnlm_dir/word_feats.txt" && exit 1;
+  word_embedding="\"rnnlm-get-word-embedding $rnnlm_dir/word_feats.txt $rnnlm_dir/feat_embedding.final.mat -|\""
+fi
+
+mkdir -p $outdir/log
+nj=`cat $indir/num_jobs` || exit 1;
+cp $indir/num_jobs $outdir
+
+# The old LM is applied with a negative scale so that its scores are removed.
+oldlm_weight=`perl -e "print -1.0 * $weight;"`
+if [ "$oldlm" == "$oldlang/G.fst" ]; then
+  $cmd JOB=1:$nj $outdir/log/rescorelm.JOB.log \
+    lattice-lmrescore --lm-scale=$oldlm_weight \
+    "ark:gunzip -c $indir/lat.JOB.gz|" "$oldlm_command" ark:-  \| \
+    $rescoring_binary --lm-scale=$weight \
+    --max-ngram-order=$max_ngram_order \
+    $oldlang/words.txt ark:- $rnnlm_dir/config/words.txt $word_embedding "$rnnlm_dir/final.raw" \
+    "ark,t:|gzip -c>$outdir/lat.JOB.gz" || exit 1;
+else
+  $cmd JOB=1:$nj $outdir/log/rescorelm.JOB.log \
+    lattice-lmrescore-const-arpa --lm-scale=$oldlm_weight \
+    "ark:gunzip -c $indir/lat.JOB.gz|" "$oldlm" ark:-  \| \
+    $rescoring_binary --lm-scale=$weight \
+    --max-ngram-order=$max_ngram_order \
+    $oldlang/words.txt ark:- $rnnlm_dir/config/words.txt $word_embedding "$rnnlm_dir/final.raw" \
+    "ark,t:|gzip -c>$outdir/lat.JOB.gz" || exit 1;
+fi
+
+if ! $skip_scoring ; then
+  err_msg="Not scoring because local/score.sh does not exist or not executable."
+  [ ! -x local/score.sh ] && echo $err_msg && exit 1;
+  local/score.sh --cmd "$cmd" $data $oldlang $outdir
+else
+  echo "Not scoring because requested so..."
+fi
+
+exit 0;
+
diff --git a/scripts/rnnlm/train_rnnlm.sh b/scripts/rnnlm/train_rnnlm.sh
@@ -221,11 +221,8 @@ if [ $stage -le $num_iters ]; then
   echo "$0: best iteration (out of $num_iters) was $best_iter, linking it to final iteration."
   ln -sf $embedding_type.$best_iter.mat $dir/$embedding_type.final.mat
   ln -sf $best_iter.raw $dir/final.raw
-  ln -sf $best_iter.raw $dir/rnnlm  # to make it consistent with other RNNLMs
 fi
 
-touch $dir/unk.probs
-
 # Now get some diagnostics about the evolution of the objective function.
 if [ $stage -le $[num_iters+1] ]; then
   (

diff --git a/src/latbin/lattice-lmrescore-kaldi-rnnlm.cc b/src/latbin/lattice-lmrescore-kaldi-rnnlm.cc
@@ -1,8 +1,8 @@
 // latbin/lattice-lmrescore-kaldi-rnnlm.cc
 
 // Copyright 2017 Johns Hopkins University (author: Daniel Povey)
-//                Hainan Xu
-//                Yiming Wang
+//           2017 Hainan Xu
+//           2017 Yiming Wang
 
 // See ../../COPYING for clarification regarding multiple authors
 //
@@ -66,10 +66,10 @@ int main(int argc, char *argv[]) {
     std::string lats_rspecifier, rnn_wordlist, word_embedding_rxfilename,
         word_symbols_rxfilename, rnnlm_rxfilename, lats_wspecifier;
 
-    word_embedding_rxfilename = po.GetArg(1);
-    rnn_wordlist = po.GetArg(2);
-    word_symbols_rxfilename = po.GetArg(3);
-    lats_rspecifier = po.GetArg(4);
+    word_symbols_rxfilename = po.GetArg(1);
+    lats_rspecifier = po.GetArg(2);
+    rnn_wordlist = po.GetArg(3);
+    word_embedding_rxfilename = po.GetArg(4);
     rnnlm_rxfilename = po.GetArg(5);
     lats_wspecifier = po.GetArg(6);
 
@@ -85,8 +85,8 @@ int main(int argc, char *argv[]) {
     CuMatrix<BaseFloat> word_embedding_mat;
     ReadKaldiObject(word_embedding_rxfilename, &word_embedding_mat);
 
-    const nnet3::DecodableRnnlmSimpleLoopedComputationOptions opts;
-    const nnet3::DecodableRnnlmSimpleLoopedInfo info(opts, rnnlm, word_embedding_mat);
+    const nnet3::RnnlmSimpleLoopedComputationOptions opts;
+    const nnet3::RnnlmSimpleLoopedInfo info(opts, rnnlm, word_embedding_mat);
 
     // Reads and writes as compact lattice.
     SequentialCompactLatticeReader compact_lattice_reader(lats_rspecifier);

diff --git a/src/rnnlm/Makefile b/src/rnnlm/Makefile
@@ -10,7 +10,7 @@ TESTFILES = sampler-test sampling-lm-test rnnlm-example-test
 OBJFILES = sampler.o rnnlm-example.o rnnlm-example-utils.o \
            rnnlm-core-training.o rnnlm-embedding-training.o rnnlm-core-compute.o \
            rnnlm-utils.o rnnlm-training.o rnnlm-test-utils.o sampling-lm-estimate.o \
-           sampling-lm.o rnnlm-decodable-simple-looped.o rnnlm-lattice-rescoring.o
+           sampling-lm.o rnnlm-simple-looped.o rnnlm-lattice-rescoring.o
 
 LIBNAME = kaldi-rnnlm
 

diff --git a/src/rnnlm/rnnlm-lattice-rescoring.cc b/src/rnnlm/rnnlm-lattice-rescoring.cc
@@ -1,8 +1,8 @@
 // rnnlm/rnnlm-lattice-rescoring.cc
 
-// Copyright 2017 Johns Hopkins University (author: Daniel Povey)
-//                Yiming Wang
-//                Hainan Xu
+// Copyright 2017 Johns Hopkins University (author: Daniel Povey)
+//           2017 Yiming Wang
+//           2017 Hainan Xu
 //
 // See ../../COPYING for clarification regarding multiple authors
 //
@@ -64,7 +64,9 @@ void KaldiRnnlmDeterministicFst::ReadFstWordSymbolTableAndRnnWordlist(
     int32 i = 0;
     while (ifile >> word >> id) {
       if (word == "</s>") {
-        final_word_index_ = id;
+        eos_index_ = id;
+      } else if (word == "<s>") {
+        bos_index_ = id;
       }
       KALDI_ASSERT(i == id);
       i++;
@@ -95,18 +97,18 @@ void KaldiRnnlmDeterministicFst::ReadFstWordSymbolTableAndRnnWordlist(
 KaldiRnnlmDeterministicFst::KaldiRnnlmDeterministicFst(int32 max_ngram_order,
     const std::string &rnn_wordlist,
     const std::string &word_symbol_table_rxfilename,
-    const DecodableRnnlmSimpleLoopedInfo &info) {
+    const RnnlmSimpleLoopedInfo &info) {
   max_ngram_order_ = max_ngram_order;
   ReadFstWordSymbolTableAndRnnWordlist(rnn_wordlist,
                                        word_symbol_table_rxfilename);
 
-  std::vector<Label> bos;
-  bos.push_back(0); // 0 for <s>
-  state_to_wseq_.push_back(bos);
-  DecodableRnnlmSimpleLooped decodable_rnnlm(info);
-  decodable_rnnlm.TakeFeatures(std::vector<Label>(1, bos[0]));
+  std::vector<Label> bos_seq;
+  bos_seq.push_back(bos_index_);
+  state_to_wseq_.push_back(bos_seq);
+  RnnlmSimpleLooped decodable_rnnlm(info);
+  decodable_rnnlm.TakeFeatures(bos_seq);
   state_to_decodable_rnnlm_.push_back(decodable_rnnlm);
-  wseq_to_state_[bos] = 0;
+  wseq_to_state_[bos_seq] = 0;
   start_state_ = 0;
 }
 
@@ -115,7 +117,7 @@ fst::StdArc::Weight KaldiRnnlmDeterministicFst::Final(StateId s) {
   KALDI_ASSERT(static_cast<size_t>(s) < state_to_wseq_.size());
 
   // log prob of end of sentence
-  BaseFloat logprob = state_to_decodable_rnnlm_[s].GetOutput(0, final_word_index_);
+  BaseFloat logprob = state_to_decodable_rnnlm_[s].GetOutput(0, eos_index_);
   return Weight(-logprob);
 }
 
@@ -125,7 +127,7 @@ bool KaldiRnnlmDeterministicFst::GetArc(StateId s, Label ilabel,
   KALDI_ASSERT(static_cast<size_t>(s) < state_to_wseq_.size());
 
   std::vector<Label> wseq = state_to_wseq_[s];
-  DecodableRnnlmSimpleLooped decodable_rnnlm = state_to_decodable_rnnlm_[s];
+  RnnlmSimpleLooped decodable_rnnlm = state_to_decodable_rnnlm_[s];
   int32 rnn_word = fst_label_to_rnn_label_[ilabel];
 
   BaseFloat logprob = decodable_rnnlm.GetOutput(0, rnn_word);

diff --git a/src/rnnlm/rnnlm-lattice-rescoring.h b/src/rnnlm/rnnlm-lattice-rescoring.h
@@ -1,8 +1,8 @@
 // rnnlm/rnnlm-lattice-rescoring.h
 //
 // Copyright 2017 Johns Hopkins University (author: Daniel Povey) 
-//                Yiming Wang
-//                Hainan Xu
+//           2017 Yiming Wang
+//           2017 Hainan Xu
 //
 // See ../../COPYING for clarification regarding multiple authors
 //
@@ -27,7 +27,7 @@
 
 #include "base/kaldi-common.h"
 #include "fstext/deterministic-fst.h"
-#include "rnnlm/rnnlm-decodable-simple-looped.h"
+#include "rnnlm/rnnlm-simple-looped.h"
 #include "util/common-utils.h"
 
 namespace kaldi {
@@ -44,7 +44,7 @@ class KaldiRnnlmDeterministicFst
   KaldiRnnlmDeterministicFst(int32 max_ngram_order,
       const std::string &rnn_wordlist,
       const std::string &word_symbol_table_rxfilename,
-      const DecodableRnnlmSimpleLoopedInfo &info);
+      const RnnlmSimpleLoopedInfo &info);
 
   // We cannot use "const" because the pure virtual function in the interface is
   // not const.
@@ -66,7 +66,8 @@ class KaldiRnnlmDeterministicFst
   std::vector<std::string> fst_label_to_word_;
   int32 full_voc_size_;
   int32 out_OOS_index_;
-  int32 final_word_index_;
+  int32 bos_index_;
+  int32 eos_index_;
 
   typedef unordered_map
       <std::vector<Label>, StateId, VectorHasher<Label> > MapType;
@@ -75,7 +76,7 @@ class KaldiRnnlmDeterministicFst
   std::vector<std::vector<Label> > state_to_wseq_;
 
   int32 max_ngram_order_;
-  std::vector<DecodableRnnlmSimpleLooped> state_to_decodable_rnnlm_;
+  std::vector<RnnlmSimpleLooped> state_to_decodable_rnnlm_;
 
   void ReadFstWordSymbolTableAndRnnWordlist(const std::string &rnn_in_wordlist,
 //      const std::string &rnn_out_wordlist,