@@ -62,15 +62,21 @@ class FactorizedTDNN(nn.Module):
     https://github.com/kaldi-asr/kaldi/blob/master/src/nnet3/nnet-utils.cc#L982
     '''
 
-    def __init__(self, dim, bottleneck_dim, time_stride):
+    def __init__(self, dim, bottleneck_dim, time_stride, bypass_scale=0.66):
         super().__init__()
+
         assert time_stride in [0, 1]
+        assert abs(bypass_scale) <= 1
+
+        self.bypass_scale = bypass_scale
 
         if time_stride == 0:
             kernel_size = 1
         else:
             kernel_size = 3
 
+        self.kernel_size = kernel_size
+
         # WARNING(fangjun): kaldi uses [-1, 0] for the first linear layer
         # and [0, 1] for the second affine layer;
         # We use [-1, 0, 1] for the first linear layer
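
The new bypass_scale argument turns each layer into a scaled residual block, y = bypass_scale * x + F(x); the assert abs(bypass_scale) <= 1 keeps the identity path from amplifying activations, and the 0.66 default matches the bypass scale Kaldi's TDNN-F recipes typically use. A minimal sketch of the idea, with a bare kernel-size-1 Conv1d standing in for the factorized layers this class actually builds:

    import torch
    import torch.nn as nn

    bypass_scale = 0.66                     # default added in this diff
    layer = nn.Conv1d(4, 4, kernel_size=1)  # hypothetical stand-in, preserves T

    x = torch.randn(2, 4, 10)               # [N, C, T]
    y = bypass_scale * x + layer(x)         # scaled skip connection
    assert y.shape == x.shape
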
@@ -90,6 +96,10 @@ def __init__(self, dim, bottleneck_dim, time_stride):
     def forward(self, x):
         # input x is of shape: [batch_size, feat_dim, seq_len] = [N, C, T]
         assert x.ndim == 3
+
+        # save it for skip connection
+        input_x = x
+
         x = self.conv(x)
         # at this point, x is [N, C, T]
 
@@ -109,6 +119,10 @@ def forward(self, x):
         # TODO(fangjun): implement GeneralDropoutComponent in PyTorch
 
         # at this point, x is [N, C, T]
+        if self.kernel_size == 3:
+            x = self.bypass_scale * input_x[:, :, 1:-1] + x
+        else:
+            x = self.bypass_scale * input_x + x
         return x
 
     def constraint_orthonormal(self):
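
Why the new bypass trims input_x[:, :, 1:-1] in the kernel_size == 3 branch: a Conv1d with kernel size 3 and no padding maps T input frames to T - 2 output frames, each centered on input frames 1 through T - 2, so the residual must drop one frame at each edge to stay aligned. A shape-only sketch, again with a plain Conv1d standing in for the factorized layers:

    import torch
    import torch.nn as nn

    x = torch.randn(2, 4, 10)              # [N, C, T] with T = 10
    conv = nn.Conv1d(4, 4, kernel_size=3)  # no padding, so T shrinks by 2
    out = conv(x)
    assert out.size(2) == x.size(2) - 2

    res = 0.66 * x[:, :, 1:-1] + out       # trim one frame per edge to align
    assert res.shape == out.shape
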
@@ -176,6 +190,10 @@ def _test_factorized_tdnn():
     y = model(x)
     assert y.size(2) == T - 2
 
+    model = FactorizedTDNN(dim=C, bottleneck_dim=2, time_stride=0)
+    y = model(x)
+    assert y.size(2) == T
+
 
 if __name__ == '__main__':
     torch.manual_seed(20200130)
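
The added test pins down the time_stride=0 branch, where kernel_size is 1, the convolutions preserve T, and the bypass adds input_x untrimmed; the existing time_stride=1 test above covers the trimmed branch. Both branches can be checked together with a sketch like this (the shapes below are hypothetical, assuming the N, C, T defined earlier in _test_factorized_tdnn):

    import torch

    N, C, T = 1, 8, 10                     # hypothetical shapes for the check
    x = torch.randn(N, C, T)

    for time_stride, expected_len in [(1, T - 2), (0, T)]:
        model = FactorizedTDNN(dim=C, bottleneck_dim=2, time_stride=time_stride)
        assert model(x).size(2) == expected_len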