Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Iam #2658

Merged
merged 38 commits into from
Sep 12, 2018
Merged

Iam #2658

Show file tree
Hide file tree
Changes from 1 commit
Commits
Show all changes
38 commits
Select commit Hold shift + click to select a range
a3a18e2
adding changes for language modelling
aarora8 Aug 30, 2018
91508b5
adding modifications for augmentation, topology, shearing, run.sh
aarora8 Aug 31, 2018
5f273d6
fixing bugs
aarora8 Aug 31, 2018
2645f14
fixing bug
aarora8 Aug 31, 2018
6ebfdb2
adding parameter tuning
aarora8 Sep 1, 2018
b532978
cosmetic fixes and updating results
aarora8 Sep 1, 2018
f383334
cosmetic fixes
aarora8 Sep 1, 2018
44c9e58
adding results
aarora8 Sep 1, 2018
2d11672
removing local/prepare_lang and adding gen_topo in run.sh
aarora8 Sep 1, 2018
4fc6705
fixing bugs
aarora8 Sep 1, 2018
8877530
updating result
aarora8 Sep 2, 2018
59e2c8b
updating documentation, results and parameter tuning
aarora8 Sep 2, 2018
5fc0d17
fixing chain scripts
aarora8 Sep 2, 2018
1138ee3
updating parameters
aarora8 Sep 2, 2018
b3532ce
updating parameters and results
aarora8 Sep 3, 2018
9b67d9d
adding overwrite option and punctuation topology
aarora8 Sep 3, 2018
89c9ec7
adding overwrite option
aarora8 Sep 4, 2018
c05cd4d
adding aachen splits
aarora8 Sep 4, 2018
5dfe8fc
fixing bugs
aarora8 Sep 4, 2018
d7448df
modification from review
aarora8 Sep 5, 2018
d7d5c22
updating parameter and result
aarora8 Sep 6, 2018
43e9af9
updating parameter and result
aarora8 Sep 6, 2018
17c506b
adding data preprocessing in test and val
aarora8 Sep 7, 2018
d640742
updating results
aarora8 Sep 7, 2018
7dfd0b5
Merge branch 'master' of https://github.com/kaldi-asr/kaldi into iam_4
aarora8 Sep 7, 2018
94a80ad
replacing prepend words with common prepend words
aarora8 Sep 7, 2018
711c3c9
updating remove_test_utterances_from_lob for aachen split
aarora8 Sep 7, 2018
5f2d960
removing data/val/text from train_lm
aarora8 Sep 7, 2018
7f2ad0b
cosmetic fixes in unk arc decoding
aarora8 Sep 7, 2018
8f2ac25
adding val data for decoding
aarora8 Sep 7, 2018
b8e71b2
modification from the review
aarora8 Sep 10, 2018
e9a75f6
modification from review
aarora8 Sep 10, 2018
ae674ed
modification from review
aarora8 Sep 10, 2018
7651f37
modification for downloading aachen splits
aarora8 Sep 10, 2018
417d97c
fixing bug in rescoring
aarora8 Sep 11, 2018
6a86531
hardcoding for removing only remaining long utterance
aarora8 Sep 12, 2018
ba07ff0
fix in hardcoding
aarora8 Sep 12, 2018
5398412
modification from review
aarora8 Sep 12, 2018
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Prev Previous commit
Next Next commit
fixing chain scripts
  • Loading branch information
aarora8 committed Sep 2, 2018
commit 5fc0d17914dcaf718c55c30455402a86a3bb0525
2 changes: 1 addition & 1 deletion egs/iam/v2/local/chain/tuning/run_cnn_1a.sh
Original file line number Diff line number Diff line change
Expand Up @@ -186,7 +186,7 @@ if [ $stage -le 5 ]; then
--chain.xent-regularize $xent_regularize \
--chain.leaky-hmm-coefficient=0.1 \
--chain.l2-regularize=0.00005 \
--chain.apply-deriv-weights=false \
--chain.apply-deriv-weights=true \
--chain.lm-opts="--num-extra-lm-states=500" \
--chain.frame-subsampling-factor=$frame_subsampling_factor \
--chain.alignment-subsampling-factor=$frame_subsampling_factor \
Expand Down
12 changes: 7 additions & 5 deletions egs/iam/v2/local/chain/tuning/run_cnn_chainali_1b.sh
Original file line number Diff line number Diff line change
Expand Up @@ -42,10 +42,10 @@ chunk_right_context=0
tdnn_dim=550
# training options
srand=0
remove_egs=false
lang_test=lang
remove_egs=true
lang_decode=data/lang
lang_rescore=data/lang_rescore_6g

dropout_schedule='0,[email protected],[email protected],0'
# End configuration section.
echo "$0 $@" # Print the command line for logging
Expand Down Expand Up @@ -120,10 +120,11 @@ if [ $stage -le 3 ]; then
# speed-perturbed data (local/nnet3/run_ivector_common.sh made them), so use
# those. The num-leaves is always somewhat less than the num-leaves from
# the GMM baseline.
if [ -f $tree_dir/final.mdl ]; then
echo "$0: $tree_dir/final.mdl already exists, refusing to overwrite it."
exit 1;
if [ -f $tree_dir/final.mdl ]; then
echo "$0: $tree_dir/final.mdl already exists, refusing to overwrite it."
exit 1;
fi

steps/nnet3/chain/build_tree.sh \
--frame-subsampling-factor $frame_subsampling_factor \
--context-opts "--context-width=2 --central-position=1" \
Expand Down Expand Up @@ -156,6 +157,7 @@ if [ $stage -le 4 ]; then
relu-batchnorm-dropout-layer name=tdnn1 input=Append(-4,-2,0,2,4) dim=$tdnn_dim $tdnn_opts dropout-proportion=0.0
relu-batchnorm-dropout-layer name=tdnn2 input=Append(-4,0,4) dim=$tdnn_dim $tdnn_opts dropout-proportion=0.0
relu-batchnorm-dropout-layer name=tdnn3 input=Append(-4,0,4) dim=$tdnn_dim $tdnn_opts dropout-proportion=0.0

## adding the layers for chain branch
relu-batchnorm-layer name=prefinal-chain dim=$tdnn_dim target-rms=0.5 $tdnn_opts
output-layer name=output include-log-softmax=false dim=$num_targets max-change=1.5 $output_opts
Expand Down
22 changes: 11 additions & 11 deletions egs/iam/v2/local/chain/tuning/run_e2e_cnn_1b.sh
Original file line number Diff line number Diff line change
Expand Up @@ -2,20 +2,20 @@
# Copyright 2017 Hossein Hadian

# This script does end2end chain training (i.e. from scratch)
# ./local/chain/compare_wer.sh exp/chain/e2e_cnn_1a/
# System e2e_cnn_1a
# WER 11.24
# WER (rescored) 10.80
# CER 5.32
# CER (rescored) 5.24
# Final train prob 0.0568
# Final valid prob 0.0381
# ./local/chain/compare_wer.sh exp/chain/e2e_cnn_1b/
# System e2e_cnn_1b
# WER 13.59
# WER (rescored) 13.27
# CER 6.92
# CER (rescored) 6.71
# Final train prob 0.0345
# Final valid prob 0.0269
# Final train prob (xent)
# Final valid prob (xent)
# Parameters 9.13M
# Parameters 9.52M

# steps/info/chain_dir_info.pl exp/chain/e2e_cnn_1a
# exp/chain/e2e_cnn_1a: num-iters=42 nj=2..4 num-params=9.1M dim=40->12640 combine=0.049->0.049 (over 1) logprob:train/valid[27,41,final]=(0.035,0.055,0.057/0.016,0.037,0.038)
# steps/info/chain_dir_info.pl exp/chain/e2e_cnn_1b
# exp/chain/e2e_cnn_1b: num-iters=42 nj=2..4 num-params=9.5M dim=40->12640 combine=0.041->0.041 (over 2) logprob:train/valid[27,41,final]=(0.032,0.035,0.035/0.025,0.026,0.027)
set -e

# configs for 'chain'
Expand Down