
Replace LDA layer with delta and delta-delta features #3490

Merged · 8 commits · Aug 2, 2019
added delta features script
desh2608 committed Jul 21, 2019
commit bb23ee927ca7cfea3e90cdc1b7e55a3446128356
16 changes: 13 additions & 3 deletions egs/swbd/s5c/local/chain/tuning/run_tdnn_7q.sh
@@ -32,7 +32,7 @@ stage=0
 train_stage=-10
 get_egs_stage=-10
 speed_perturb=true
-affix=7q
+affix=7r
 if [ -e data/rt03 ]; then maybe_rt03=rt03; else maybe_rt03= ; fi
 
 decode_iter=
@@ -131,13 +131,23 @@ if [ $stage -le 12 ]; then
   input dim=100 name=ivector
   input dim=40 name=input
 
+  no-op-component name=delta_1 input=Scale(-1.0, Offset(input, -1))
+  no-op-component name=delta_2 input=Scale(1.0, Offset(input, 1))
+  no-op-component name=delta_delta_1 input=Scale(-2.0, input)
+  no-op-component name=delta_delta_2 input=Scale(1.0, Offset(input,-2))
+  no-op-component name=delta_delta_3 input=Scale(1.0, Offset(input,2))
+
   # please note that it is important to have input layer with the name=input
   # as the layer immediately preceding the fixed-affine-layer to enable
   # the use of short notation for the descriptor
-  fixed-affine-layer name=lda input=Append(-1,0,1,ReplaceIndex(ivector, t, 0)) affine-transform-file=$dir/configs/lda.mat
+  #fixed-affine-layer name=lda input=Append(-1,0,1,ReplaceIndex(ivector, t, 0)) affine-transform-file=$dir/configs/lda.mat
+  no-op-component name=input2 input=Append(Offset(input,0), Sum(delta_1, delta_2), Sum(delta_delta_1, delta_delta_2, delta_delta_3))
 
+  batchnorm-component name=bn_input
+  no-op-component name=input3 input=Append(bn_input, Scale(1.0, ReplaceIndex(ivector, t, 0)))
+
   # the first splicing is moved before the lda layer, so no splicing here
-  relu-batchnorm-dropout-layer name=tdnn1 $affine_opts dim=1536
+  relu-batchnorm-dropout-layer name=tdnn1 $affine_opts dim=1536 input=input3
   tdnnf-layer name=tdnnf2 $tdnnf_opts dim=1536 bottleneck-dim=160 time-stride=1
   tdnnf-layer name=tdnnf3 $tdnnf_opts dim=1536 bottleneck-dim=160 time-stride=1
   tdnnf-layer name=tdnnf4 $tdnnf_opts dim=1536 bottleneck-dim=160 time-stride=1
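Taken together, the five no-op-component descriptors compute simple, unnormalized temporal differences: Sum(delta_1, delta_2) is x(t+1) - x(t-1), and Sum(delta_delta_1, delta_delta_2, delta_delta_3) is x(t-2) - 2·x(t) + x(t+2). For reference, here is a minimal numpy sketch of the same per-frame arithmetic. The replicate padding at utterance edges is an assumption for illustration (nnet3 resolves edges through the descriptors' time context rather than by padding), and note these are plain differences, not the normalized regression windows used by Kaldi's add-deltas:

```python
import numpy as np

def simple_deltas(x):
    """x: (T, D) feature matrix. Returns delta and delta-delta features
    matching the Sum(...) descriptors in the xconfig above."""
    # Replicate edge frames so every t has t-2 .. t+2 available
    # (an illustrative choice; not how nnet3 handles boundaries).
    xp = np.pad(x, ((2, 2), (0, 0)), mode='edge')
    # Sum(delta_1, delta_2) = x(t+1) - x(t-1)
    delta = xp[3:-1] - xp[1:-3]
    # Sum(delta_delta_1..3) = x(t-2) - 2*x(t) + x(t+2)
    delta_delta = xp[:-4] - 2 * xp[2:-2] + xp[4:]
    return delta, delta_delta

T, D = 100, 40                 # 40-dim input features, as in the config
x = np.random.randn(T, D)
d, dd = simple_deltas(x)
feats = np.concatenate([x, d, dd], axis=1)  # 120-dim, like input2 here
```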
16 changes: 13 additions & 3 deletions egs/wsj/s5/local/chain/tuning/run_tdnn_1g.sh
@@ -60,7 +60,7 @@ chunk_right_context=0
 
 # training options
 srand=0
-remove_egs=true
+remove_egs=false
 
 #decode options
 test_online_decoding=false  # if true, it will run the last decoding stage.
@@ -182,13 +182,23 @@ if [ $stage -le 15 ]; then
   input dim=100 name=ivector
   input dim=40 name=input
 
+  no-op-component name=delta_1 input=Scale(-1.0, Offset(input, -1))
+  no-op-component name=delta_2 input=Scale(1.0, Offset(input, 1))
+  no-op-component name=delta_delta_1 input=Scale(-2.0, input)
+  no-op-component name=delta_delta_2 input=Scale(1.0, Offset(input,-2))
+  no-op-component name=delta_delta_3 input=Scale(1.0, Offset(input,2))
+
   # please note that it is important to have input layer with the name=input
   # as the layer immediately preceding the fixed-affine-layer to enable
   # the use of short notation for the descriptor
-  fixed-affine-layer name=lda input=Append(-1,0,1,ReplaceIndex(ivector, t, 0)) affine-transform-file=$dir/configs/lda.mat
+  #fixed-affine-layer name=lda input=Append(-1,0,1,ReplaceIndex(ivector, t, 0)) affine-transform-file=$dir/configs/lda.mat
+  no-op-component name=input2 input=Append(Offset(input,0), Sum(delta_1, delta_2))
 
+  batchnorm-component name=bn_input
+  no-op-component name=input3 input=Append(bn_input, Scale(1.0, ReplaceIndex(ivector, t, 0)))
+
   # the first splicing is moved before the lda layer, so no splicing here
-  relu-batchnorm-dropout-layer name=tdnn1 $tdnn_opts dim=1024
+  relu-batchnorm-dropout-layer name=tdnn1 $tdnn_opts dim=1024 input=input3
   tdnnf-layer name=tdnnf2 $tdnnf_opts dim=1024 bottleneck-dim=128 time-stride=1
   tdnnf-layer name=tdnnf3 $tdnnf_opts dim=1024 bottleneck-dim=128 time-stride=1
   tdnnf-layer name=tdnnf4 $tdnnf_opts dim=1024 bottleneck-dim=128 time-stride=1
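Note the asymmetry between the two recipes in this commit: the swbd input2 appends both the delta and delta-delta sums, while the wsj input2 appends only the first-order deltas (the delta_delta components are defined there but left unused). A rough dimensionality check for the new tdnn1 inputs, using the 40-dim input and 100-dim i-vector from the configs (illustrative arithmetic, not part of the PR):

```python
# Feature dimensions taken from "input dim=40" / "input dim=100" above.
feat_dim, ivec_dim = 40, 100

swbd_input2 = 3 * feat_dim   # input + delta + delta-delta = 120
wsj_input2 = 2 * feat_dim    # input + delta only          = 80

# batchnorm-component preserves dimension; input3 appends the i-vector.
swbd_input3 = swbd_input2 + ivec_dim   # 220 -> tdnn1 input (swbd)
wsj_input3 = wsj_input2 + ivec_dim     # 180 -> tdnn1 input (wsj)
```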