Skip to content

Commit 1d61f1c

Browse files
authored
[src,scripts,egs] Misc small fixes, including fix to TDNN-F results in mini_librispeech (kaldi-asr#2565)
1 parent a630dd2 commit 1d61f1c

File tree

8 files changed

+51
-35
lines changed

8 files changed

+51
-35
lines changed

.travis.yml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,7 @@ addons:
2121
- gfortran-4.9
2222
- liblapack-dev
2323
- clang-3.8
24+
- sox
2425

2526
branches:
2627
only:

egs/mini_librispeech/s5/local/chain/tuning/run_tdnn_1h.sh

Lines changed: 19 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -1,25 +1,26 @@
11
#!/bin/bash
22

33
# 1h is as 1g but a re-tuned model based on resnet-style TDNN-F layers with
4-
# bypass connections. Below, 1h2 is just a rerun of 1h with a different --affix
5-
# option, to give some idea of the run-to-run variation.
6-
7-
# local/chain/compare_wer.sh --online exp/chain/tdnn1g_sp exp/chain/tdnn1h_sp exp/chain/tdnn1h2_sp
8-
# System tdnn1g_sp tdnn1h_sp tdnn1h2_sp
9-
#WER dev_clean_2 (tgsmall) 13.50 13.18 13.04
10-
# [online:] 13.52 13.03 12.97
11-
#WER dev_clean_2 (tglarge) 9.79 9.18 9.16
12-
# [online:] 9.79 9.29 9.24
13-
# Final train prob -0.0460 -0.0531 -0.0590
14-
# Final valid prob -0.0892 -0.0844 -0.0865
15-
# Final train prob (xent) -1.1739 -1.5244 -1.7771
16-
# Final valid prob (xent) -1.4487 -1.7447 -1.9611
17-
# Num-params 6234672 3512112 3512112
18-
19-
# steps/info/chain_dir_info.pl exp/chain/tdnn1{g,h,h2}_sp
4+
# bypass connections. Below, 1h2 and 1h3 are just reruns of 1h with different
5+
# --affix options, to give some idea of the run-to-run variation.
6+
7+
# local/chain/compare_wer.sh --online exp/chain/tdnn1g_sp exp/chain/tdnn1h_sp exp/chain/tdnn1h2_sp exp/chain/tdnn1h3_sp
8+
# System tdnn1g_sp tdnn1h_sp tdnn1h2_sp tdnn1h3_sp
9+
#WER dev_clean_2 (tgsmall) 13.50 12.09 12.23 12.19
10+
# [online:] 13.52 12.11 12.25 12.14
11+
#WER dev_clean_2 (tglarge) 9.79 8.59 8.64 8.73
12+
# [online:] 9.79 8.76 8.65 8.78
13+
# Final train prob -0.0460 -0.0493 -0.0490 -0.0493
14+
# Final valid prob -0.0892 -0.0805 -0.0803 -0.0813
15+
# Final train prob (xent) -1.1739 -1.1730 -1.1742 -1.1749
16+
# Final valid prob (xent) -1.4487 -1.3872 -1.3857 -1.3913
17+
# Num-params 6234672 5207856 5207856 5207856
18+
19+
2020
# exp/chain/tdnn1g_sp: num-iters=25 nj=2..5 num-params=6.2M dim=40+100->2328 combine=-0.056->-0.055 (over 3) xent:train/valid[15,24,final]=(-1.50,-1.23,-1.17/-1.73,-1.52,-1.45) logprob:train/valid[15,24,final]=(-0.063,-0.051,-0.046/-0.101,-0.094,-0.089)
21-
# exp/chain/tdnn1h_sp: num-iters=34 nj=2..5 num-params=3.5M dim=40+100->2328 combine=-0.055->-0.050 (over 4) xent:train/valid[21,33,final]=(-1.97,-1.57,-1.52/-2.11,-1.78,-1.74) logprob:train/valid[21,33,final]=(-0.080,-0.061,-0.053/-0.106,-0.096,-0.084)
22-
# exp/chain/tdnn1h2_sp: num-iters=34 nj=2..5 num-params=3.5M dim=40+100->2328 combine=-0.062->-0.056 (over 4) xent:train/valid[21,33,final]=(-2.21,-1.78,-1.78/-2.34,-1.96,-1.96) logprob:train/valid[21,33,final]=(-0.086,-0.066,-0.059/-0.110,-0.098,-0.087)
21+
# exp/chain/tdnn1h_sp: num-iters=34 nj=2..5 num-params=5.2M dim=40+100->2328 combine=-0.049->-0.046 (over 4) xent:train/valid[21,33,final]=(-1.50,-1.22,-1.17/-1.66,-1.44,-1.39) logprob:train/valid[21,33,final]=(-0.068,-0.055,-0.049/-0.097,-0.088,-0.080)
22+
# exp/chain/tdnn1h2_sp: num-iters=34 nj=2..5 num-params=5.2M dim=40+100->2328 combine=-0.049->-0.046 (over 4) xent:train/valid[21,33,final]=(-1.50,-1.22,-1.17/-1.67,-1.43,-1.39) logprob:train/valid[21,33,final]=(-0.068,-0.055,-0.049/-0.096,-0.087,-0.080)
23+
# exp/chain/tdnn1h3_sp: num-iters=34 nj=2..5 num-params=5.2M dim=40+100->2328 combine=-0.050->-0.046 (over 4) xent:train/valid[21,33,final]=(-1.51,-1.23,-1.17/-1.67,-1.45,-1.39) logprob:train/valid[21,33,final]=(-0.068,-0.055,-0.049/-0.097,-0.089,-0.081)
2324

2425
# Set -e here so that we catch if any executable fails immediately
2526
set -euo pipefail

egs/wsj/s5/steps/decode.sh

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -80,7 +80,7 @@ if [ $(basename $model) != final.alimdl ] ; then
8080
fi
8181

8282
for f in $sdata/1/feats.scp $sdata/1/cmvn.scp $model $graphdir/HCLG.fst; do
83-
[ ! -f $f ] && echo "decode.sh: no such file $f" && exit 1;
83+
[ ! -f $f ] && echo "$0: Error: no such file $f" && exit 1;
8484
done
8585

8686
if [ -f $srcdir/final.mat ]; then feat_type=lda; else feat_type=delta; fi
@@ -96,13 +96,13 @@ thread_string=
9696
case $feat_type in
9797
delta) feats="ark,s,cs:apply-cmvn $cmvn_opts --utt2spk=ark:$sdata/JOB/utt2spk scp:$sdata/JOB/cmvn.scp scp:$sdata/JOB/feats.scp ark:- | add-deltas $delta_opts ark:- ark:- |";;
9898
lda) feats="ark,s,cs:apply-cmvn $cmvn_opts --utt2spk=ark:$sdata/JOB/utt2spk scp:$sdata/JOB/cmvn.scp scp:$sdata/JOB/feats.scp ark:- | splice-feats $splice_opts ark:- ark:- | transform-feats $srcdir/final.mat ark:- ark:- |";;
99-
*) echo "Invalid feature type $feat_type" && exit 1;
99+
*) echo "$0: Error: Invalid feature type $feat_type" && exit 1;
100100
esac
101101
if [ ! -z "$transform_dir" ]; then # add transforms to features...
102102
echo "Using fMLLR transforms from $transform_dir"
103103
[ ! -f $transform_dir/trans.1 ] && echo "Expected $transform_dir/trans.1 to exist."
104104
[ ! -s $transform_dir/num_jobs ] && \
105-
echo "$0: expected $transform_dir/num_jobs to contain the number of jobs." && exit 1;
105+
echo "$0: Error: expected $transform_dir/num_jobs to contain the number of jobs." && exit 1;
106106
nj_orig=$(cat $transform_dir/num_jobs)
107107
if [ $nj -ne $nj_orig ]; then
108108
# Copy the transforms into an archive with an index.
@@ -119,7 +119,7 @@ fi
119119
if [ $stage -le 0 ]; then
120120
if [ -f "$graphdir/num_pdfs" ]; then
121121
[ "`cat $graphdir/num_pdfs`" -eq `am-info --print-args=false $model | grep pdfs | awk '{print $NF}'` ] || \
122-
{ echo "Mismatch in number of pdfs with $model"; exit 1; }
122+
{ echo "$0: Error: Mismatch in number of pdfs with $model"; exit 1; }
123123
fi
124124
$cmd --num-threads $num_threads JOB=1:$nj $dir/log/decode.JOB.log \
125125
gmm-latgen-faster$thread_string --max-active=$max_active --beam=$beam --lattice-beam=$lattice_beam \
@@ -134,9 +134,9 @@ fi
134134

135135
if ! $skip_scoring ; then
136136
[ ! -x local/score.sh ] && \
137-
echo "Not scoring because local/score.sh does not exist or not executable." && exit 1;
137+
echo "$0: Not scoring because local/score.sh does not exist or not executable." && exit 1;
138138
local/score.sh --cmd "$cmd" $scoring_opts $data $graphdir $dir ||
139-
{ echo "$0: Scoring failed. (ignore by '--skip-scoring true')"; exit 1; }
139+
{ echo "$0: Error: scoring failed. (ignore by '--skip-scoring true')"; exit 1; }
140140
fi
141141

142142
exit 0;
Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
../nnet2/remove_egs.sh

src/nnet3/convolution.cc

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -988,7 +988,7 @@ static void ComputeTempMatrixSize(const ConvolutionComputationOptions &opts,
988988
temp_rows = new_num_t_out * computation->num_images;
989989
BaseFloat new_num_megabytes = (4 * temp_rows * temp_cols) / 1000000.0;
990990
// make sure we're within the memory limit.
991-
if (new_num_megabytes > megabyte_limit) {
991+
if (new_num_megabytes > 1.01 * megabyte_limit) {
992992
KALDI_WARN << "Memory consumed in convolution is more than requested "
993993
<< "(maybe very long time sequence?)";
994994
}

src/nnet3/nnet-analyze.cc

Lines changed: 18 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1441,22 +1441,35 @@ int64 GetMaxMemoryUse(const NnetComputation &computation) {
14411441
max_memory_use = 0;
14421442
int32 num_commands = computation.commands.size(),
14431443
num_submatrices = computation.submatrices.size();
1444+
// the vector 'num_compressed_bytes' is used to remember the number of bytes
1445+
// in the compressed matrices for each submatrix (this will only be used for
1446+
// those that correspond to a 'whole matrix). It's needed because the
1447+
// decompression command doesn't tell us what compression type was used for
1448+
// that matrix.
1449+
std::vector<int32> num_compressed_bytes(num_submatrices, -100000000);
14441450
for (int32 command_index = 0; command_index < num_commands; ++command_index) {
14451451
const NnetComputation::Command &c = computation.commands[command_index];
14461452
int64 this_num_bytes = -100000000,
14471453
this_compressed_num_bytes = -10000000;
1454+
1455+
14481456
if (c.arg1 >= 0 && c.arg1 < num_submatrices) {
14491457
// if arg1 could plausibly be a sub-matrix index...
14501458
const NnetComputation::SubMatrixInfo &submat_info =
14511459
computation.submatrices[c.arg1];
14521460
this_num_bytes = static_cast<int64>(sizeof(BaseFloat)) *
14531461
submat_info.num_rows * submat_info.num_cols;
14541462

1455-
this_compressed_num_bytes =
1456-
((c.arg2 == static_cast<int32>(kCompressedMatrixInt8) ||
1457-
c.arg2 == static_cast<int32>(kCompressedMatrixUint8)) ?
1458-
1 : 2) * static_cast<int64>(submat_info.num_rows) *
1459-
submat_info.num_cols;
1463+
if (c.command_type == kCompressMatrix) {
1464+
this_compressed_num_bytes =
1465+
((c.arg2 == static_cast<int32>(kCompressedMatrixInt8) ||
1466+
c.arg2 == static_cast<int32>(kCompressedMatrixUint8)) ?
1467+
1 : 2) * static_cast<int64>(submat_info.num_rows) *
1468+
submat_info.num_cols;
1469+
num_compressed_bytes[c.arg1] = this_compressed_num_bytes;
1470+
} else if (c.command_type == kDecompressMatrix) {
1471+
this_compressed_num_bytes = num_compressed_bytes[c.arg1];
1472+
}
14601473
}
14611474
switch (c.command_type) {
14621475
case kAllocMatrix:

src/nnet3/nnet-optimize-utils.cc

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4692,7 +4692,7 @@ class MemoryCompressionOptimizer {
46924692

46934693
/** @param [in] nnet The neural net the computation is for.
46944694
@param [in] memory_compression_level. The level of compression:
4695-
0 = no compression (the constructor should not be calle with this value).
4695+
0 = no compression (the constructor should not be called with this value).
46964696
1 = compression that doesn't affect the results (but still takes time).
46974697
2 = compression that affects the results only very slightly
46984698
3 = compression that affects the results a little more.

tools/extras/check_dependencies.sh

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -65,7 +65,7 @@ if ! echo "#include <zlib.h>" | $CXX -E - >&/dev/null; then
6565
add_packages zlib-devel zlib1g-dev zlib-devel
6666
fi
6767

68-
for f in make automake autoconf patch grep bzip2 gzip wget git; do
68+
for f in make automake autoconf patch grep bzip2 gzip wget git sox; do
6969
if ! which $f >&/dev/null; then
7070
echo "$0: $f is not installed."
7171
add_packages $f $f $f
@@ -100,7 +100,7 @@ if ! which python3 >&/dev/null; then
100100
pythonok=false
101101
fi
102102

103-
(
103+
(
104104
#Use a subshell so that sourcing env.sh does not have an influence on the rest of the script
105105
[ -f ./env.sh ] && . ./env.sh
106106
if $pythonok && ! which python2 >&/dev/null; then
@@ -111,14 +111,14 @@ if $pythonok && ! which python2 >&/dev/null; then
111111
fi
112112

113113
if [[ -f $PWD/python/.use_default_python && -f $PWD/python/python ]]; then
114-
rm $PWD/python/python
114+
rm $PWD/python/python
115115
fi
116116

117117
if $pythonok && which python >&/dev/null && [[ ! -f $PWD/python/.use_default_python ]]; then
118118
version=`python 2>&1 --version | awk '{print $2}' `
119119
if [[ $version != "2.7"* ]] ; then
120120
echo "$0: WARNING python 2.7 is not the default python. We fixed this by adding a correct symlink more prominently on the path."
121-
echo "$0: If you really want to use python $version as default, add an empty file $PWD/python/.use_default_python and run this script again."
121+
echo "$0: If you really want to use python $version as default, add an empty file $PWD/python/.use_default_python and run this script again."
122122
mkdir -p $PWD/python
123123
ln -s $(which python2.7) $PWD/python/python
124124
echo "export PATH=$PWD/python:\${PATH}" >> env.sh

0 commit comments

Comments (0)