Commit 475fdf1

Anirudh B H (AnirudhBHarish) authored and committed
This is a combination of 7 commits:
1. Conv1d and batchnorm1d layers
2. Created BatchNorm1d, TanhGate activation and dscnn blocks
3. Trials for the keyword spotting sub-modules
4. Update README
5. Keyword spotting network and test-benches created
6. Clocking keyword detection trials
7. Moving large files via git lfs
1 parent c7349dd commit 475fdf1

31 files changed, +1255 −3 lines

.gitattributes

Lines changed: 13 additions & 0 deletions
@@ -60,3 +60,16 @@ c_reference/models/q_scut_head_b_face4_model/mbconv2.h filter=lfs diff=lfs merge=lfs -text
 c_reference/models/q_scut_head_b_face4_model/mbconv4.h filter=lfs diff=lfs merge=lfs -text
 c_reference/models/q_scut_head_b_face4_model/rnn2.h filter=lfs diff=lfs merge=lfs -text
 c_reference/models/q_scut_head_b_face4_model/detection2.h filter=lfs diff=lfs merge=lfs -text
+c_reference/tests/kws/keyword_spotting_io_1.h filter=lfs diff=lfs merge=lfs -text
+c_reference/tests/kws/keyword_spotting_io_2.h filter=lfs diff=lfs merge=lfs -text
+c_reference/tests/kws/keyword_spotting_io_3.h filter=lfs diff=lfs merge=lfs -text
+c_reference/tests/conv1d/avg_pool/avg_io.h filter=lfs diff=lfs merge=lfs -text
+c_reference/tests/conv1d/conv1d_regular/conv_param.h filter=lfs diff=lfs merge=lfs -text
+c_reference/tests/conv1d/conv1d_lr/conv_param_lr.h filter=lfs diff=lfs merge=lfs -text
+c_reference/tests/conv1d/conv1d_lr_depthwise/conv_param_lr_depth.h filter=lfs diff=lfs merge=lfs -text
+c_reference/tests/conv1d/conv1d_depthwise/conv_param_depth.h filter=lfs diff=lfs merge=lfs -text
+c_reference/tests/kws/precnn_params.h filter=lfs diff=lfs merge=lfs -text
+c_reference/tests/kws/postcnn_params.h filter=lfs diff=lfs merge=lfs -text
+c_reference/tests/kws/rnn_params.h filter=lfs diff=lfs merge=lfs -text
+c_reference/tests/dscnn/dscnn_param_lr.h filter=lfs diff=lfs merge=lfs -text
+c_reference/tests/dscnn/dscnn_param_lr_depth_point.h filter=lfs diff=lfs merge=lfs -text

README.md

Lines changed: 1 addition & 0 deletions
@@ -17,6 +17,7 @@ Algorithms that shine in this setting in terms of both model size and compute, n
 - **EMI-RNN**: Training routine to recover the critical signature from time series data for faster and accurate RNN predictions.
 - **Shallow RNN**: A meta-architecture for training RNNs that can be applied to streaming data.
 - **FastRNN & FastGRNN - FastCells**: **F**ast, **A**ccurate, **S**table and **T**iny (**G**ated) RNN cells.
+- **Conv1D**: 1-D regular and low-rank convolution architectures for time-series data.
 - **DROCC**: **D**eep **R**obust **O**ne-**C**lass **C**lassification for training robust anomaly detectors.
 - **RNNPool**: An efficient non-linear pooling operator for RAM constrained inference.

c_reference/include/conv1d.h

Lines changed: 152 additions & 0 deletions

@@ -0,0 +1,152 @@
// Copyright (c) Microsoft Corporation. All rights reserved.
// Licensed under the MIT license.

#ifndef __CONVLAYERS_H__
#define __CONVLAYERS_H__

/**
 * @brief Model parameters for the 1D Convolution Layer
 * @var W pointer to the convolution weights W, size for regular = out_channels * in_channels * kernel_size, size for depthwise = out_channels * kernel_size
 * @var B pointer to the bias vector for the convolution, shape = [out_channels]
 */
typedef struct ConvLayers_Params {
  float* W;
  float* B;
} ConvLayers_Params;

/**
 * @brief Model definition for the 1D Convolution Layer
 * @param[out] output_signal pointer to the output signal, size = out_T * out_channels
 * @param[in] out_T number of time steps in the output
 * @param[in] out_channels number of output channels for the output of the conv layer
 * @param[in] input_signal pointer to the input signal, size = in_T * in_channels
 * @param[in] in_T number of time steps in the input
 * @param[in] in_channels number of input channels
 * @param[in] padding padding applied to the input before the conv is performed. Note: padding is applied to both the start and the end
 * @param[in] kernel_size kernel size of the conv filter
 * @param[in] params weights, bias and other essential parameters used to describe the layer
 * @param[in] activations an integer to choose the type of activation function.
 *            0: none
 *            1: sigmoid
 *            2: tanh
 *            3: relu
 */
int Conv1D(float* output_signal, unsigned out_T, unsigned out_channels, const float* input_signal,
  unsigned in_T, unsigned in_channels, int padding, unsigned kernel_size,
  const void* params, int activations);
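For orientation, a hypothetical usage sketch of Conv1D (not part of the committed header; all dimensions are made up). Since the API exposes no stride parameter, unit stride is assumed, giving out_T = in_T + 2 * padding - kernel_size + 1:

#include <stdlib.h>
#include "conv1d.h"

int conv1d_usage_sketch(void) {
  const unsigned in_T = 100, in_channels = 4, out_channels = 8, kernel_size = 5;
  const int padding = 2;
  const unsigned out_T = in_T + 2 * padding - kernel_size + 1; /* = 100 under the unit-stride assumption */

  float* input = (float*)calloc(in_T * in_channels, sizeof(float));   /* time-major [T][channels] */
  float* output = (float*)malloc(out_T * out_channels * sizeof(float));
  ConvLayers_Params params;
  params.W = (float*)calloc(out_channels * in_channels * kernel_size, sizeof(float));
  params.B = (float*)calloc(out_channels, sizeof(float));

  int ret = Conv1D(output, out_T, out_channels, input, in_T, in_channels,
    padding, kernel_size, &params, 3 /* relu */);

  free(params.W); free(params.B); free(input); free(output);
  return ret;
}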

/**
 * @brief Model definition for the 1D Depthwise Convolution Layer
 * @param[out] output_signal pointer to the output signal, size = out_T * in_channels
 * @param[in] out_T number of time steps in the output
 * @param[in] input_signal pointer to the input signal, size = in_T * in_channels
 * @param[in] in_T number of time steps in the input
 * @param[in] in_channels number of input channels. The output will have the same number of channels
 * @param[in] padding padding applied to the input before the conv is performed. Note: padding is applied to both the start and the end
 * @param[in] kernel_size kernel size of the conv filter
 * @param[in] params weights, bias and other essential parameters used to describe the layer
 * @param[in] activations an integer to choose the type of activation function.
 *            0: none
 *            1: sigmoid
 *            2: tanh
 *            3: relu
 */
int Conv1D_Depth(float* output_signal, unsigned out_T, const float* input_signal,
  unsigned in_T, unsigned in_channels, int padding, unsigned kernel_size,
  const void* params, int activations);

// Low Rank Convolution
/**
 * @brief Model parameters for the 1D Low Rank Convolution Layer
 * @var W1 pointer to the 1st low-rank component of the weights, size = out_channels * rank
 * @var W2 pointer to the 2nd low-rank component of the weights, size for regular = rank * in_channels * kernel_size, size for depthwise = rank * kernel_size
 * @var B pointer to the bias vector for the convolution, shape = [out_channels]
 * @var rank rank of the weight tensor. A low-rank decomposition is typically used to reduce computation and storage
 */
typedef struct ConvLayers_LR_Params {
  float* W1;
  float* W2;
  float* B;
  unsigned rank;
} ConvLayers_LR_Params;

/**
 * @brief Model definition for the 1D Low Rank Convolution Layer
 * @brief Identical to the non-low-rank form; the one modification is that the multiplication of the low-rank weight components is handled within the layer
 * @param[out] output_signal pointer to the output signal, size = out_T * out_channels
 * @param[in] out_T number of time steps in the output
 * @param[in] out_channels number of output channels for the output of the conv layer
 * @param[in] input_signal pointer to the input signal, size = in_T * in_channels
 * @param[in] in_T number of time steps in the input
 * @param[in] in_channels number of input channels
 * @param[in] padding padding applied to the input before the conv is performed. Note: padding is applied to both the start and the end
 * @param[in] kernel_size kernel size of the conv filter
 * @param[in] params weights, bias and other essential parameters used to describe the layer
 * @param[in] activations an integer to choose the type of activation function.
 *            0: none
 *            1: sigmoid
 *            2: tanh
 *            3: relu
 */
int Conv1D_LR(float* output_signal, unsigned out_T, unsigned out_channels, const float* input_signal,
  unsigned in_T, unsigned in_channels, int padding, unsigned kernel_size,
  const void* params, int activations);
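A quick worked example of the saving the low-rank factorization buys (numbers purely illustrative, not from this commit): with out_channels = 32, in_channels = 32, kernel_size = 5 and rank = 4, a full weight tensor holds 32 * 32 * 5 = 5120 floats, while W1 (32 * 4 = 128) and W2 (4 * 32 * 5 = 640) together hold only 768, roughly a 6.7x reduction; the layer recovers the effective kernel as the product W1 * W2 internally, per the second @brief above.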

/**
 * @brief Model definition for the 1D Low Rank Depthwise Convolution Layer
 * @brief Identical to the non-low-rank form; the one modification is that the multiplication of the low-rank weight components is handled within the layer
 * @param[out] output_signal pointer to the output signal, size = out_T * in_channels
 * @param[in] out_T number of time steps in the output
 * @param[in] input_signal pointer to the input signal, size = in_T * in_channels
 * @param[in] in_T number of time steps in the input
 * @param[in] in_channels number of input channels. The output will have the same number of channels
 * @param[in] padding padding applied to the input before the conv is performed. Note: padding is applied to both the start and the end
 * @param[in] kernel_size kernel size of the conv filter
 * @param[in] params weights, bias and other essential parameters used to describe the layer
 * @param[in] activations an integer to choose the type of activation function.
 *            0: none
 *            1: sigmoid
 *            2: tanh
 *            3: relu
 */
int Conv1D_Depth_LR(float* output_signal, unsigned out_T, const float* input_signal,
  unsigned in_T, unsigned in_channels, int padding, unsigned kernel_size,
  const void* params, int activations);

// Auxiliary Layers
/**
 * @brief Model definition for the 1D Average Pooling Layer
 * @param[out] output_signal pointer to the output signal, size = out_T * in_channels. Pass NULL/0 in case of in-place computation
 * @param[in] out_T number of time steps in the output
 * @param[in] input_signal pointer to the input signal, size = in_T * in_channels
 * @param[in] in_T number of time steps in the input
 * @param[in] in_channels number of input channels. The output will have the same number of channels
 * @param[in] padding padding applied to the input before the pool is performed. Note: padding is applied to both the start and the end
 * @param[in] kernel_size kernel size of the pool filter
 * @param[in] activations an integer to choose the type of activation function.
 *            0: none
 *            1: sigmoid
 *            2: tanh
 *            3: relu
 */
int AvgPool1D(float* output_signal, unsigned out_T, const float* input_signal, unsigned in_T,
  unsigned in_channels, int padding, unsigned kernel_size, int activations);
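A minimal sketch of the pooling arithmetic this declaration implies (not part of the committed header). Unit stride and the time-major [T][channels] layout are assumptions read off the size expressions; padding and the optional activation are omitted:

/* Sketch only: unit stride assumed; caller guarantees out_T + kernel_size - 1 <= in_T. */
void avg_pool_sketch(float* out, unsigned out_T, const float* in,
    unsigned in_channels, unsigned kernel_size) {
  for (unsigned t = 0; t < out_T; t++) {
    for (unsigned c = 0; c < in_channels; c++) {
      float sum = 0.0f;
      for (unsigned k = 0; k < kernel_size; k++) {
        sum += in[(t + k) * in_channels + c]; /* time-major [T][channels] */
      }
      out[t * in_channels + c] = sum / (float)kernel_size;
    }
  }
}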

/**
 * @brief Model definition for the 1D Batch Normalization Layer
 * @param[out] output_signal pointer to the output signal, size = in_T * in_channels. Pass NULL/0 in case of in-place computation
 * @param[in] input_signal pointer to the input signal, size = in_T * in_channels
 * @param[in] in_T number of time steps in the input
 * @param[in] in_channels number of input channels. The output will have the same number of channels
 * @param[in] mean pointer to the mean for the batch normalization, size = in_channels
 * @param[in] var pointer to the variance for the batch normalization, size = in_channels
 * @param[in] affine whether the affine operations are applied
 * @param[in] gamma pointer to the scaling factors for the post-norm affine operation, size = in_channels
 * @param[in] beta pointer to the scalar offsets for the post-norm affine operation, size = in_channels
 * @param[in] in_place in-place computation of the batchnorm, i.e. the output is stored in place of the input signal. Storage efficient
 * @param[in] eps a very small +ve value to avoid division by 0. For the default value, assign = 0.00001
 */
int BatchNorm1d(float* output_signal, float* input_signal, unsigned in_T, unsigned in_channels,
  float* mean, float* var, unsigned affine, float* gamma, float* beta, unsigned in_place, float eps);
#endif
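The normalization itself is standard; a minimal sketch of the per-channel computation the BatchNorm1d comment describes (not part of the committed header; the time-major layout and the out-of-place form are assumptions):

#include <math.h>

void batchnorm1d_sketch(float* out, const float* in, unsigned in_T, unsigned in_channels,
    const float* mean, const float* var, unsigned affine,
    const float* gamma, const float* beta, float eps) {
  for (unsigned t = 0; t < in_T; t++) {
    for (unsigned c = 0; c < in_channels; c++) {
      /* y = (x - mean) / sqrt(var + eps), then the optional affine step */
      float y = (in[t * in_channels + c] - mean[c]) / sqrtf(var[c] + eps);
      out[t * in_channels + c] = affine ? gamma[c] * y + beta[c] : y;
    }
  }
}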

c_reference/include/conv_utils.h

Lines changed: 27 additions & 0 deletions

@@ -0,0 +1,27 @@
// Copyright (c) Microsoft Corporation. All rights reserved.
// Licensed under the MIT license.

#ifndef __CONVLAYER_UTILS__
#define __CONVLAYER_UTILS__

/**
 * @brief Definition for the utility function for preparing the low-rank conv weights
 * @param[out] out pointer to the materialized full weights, size (regular) = out_channels * in_channels * kernel_size, size (depthwise) = out_channels * kernel_size
 * @param[in] W1 1st component of the low-rank weight tensor, size = out_channels * rank
 * @param[in] W2 2nd component of the low-rank weight tensor, size (regular) = rank * in_channels * kernel_size, size (depthwise) = rank * kernel_size
 * @param[in] rank rank of the low-rank weight tensor
 * @param[in] I dim 0 for W1, value = out_channels
 * @param[in] J dim 1 for W2, value = in_channels * kernel_size (or, for depthwise, = kernel_size)
 */
int MatMul(float* out, float* W1, float* W2, unsigned rank, unsigned I, unsigned J);
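Functionally, this is a plain (I x rank) * (rank x J) product that materializes the full kernel from its two factors; a sketch under a row-major assumption (not part of the committed file, and the real implementation may be organized differently):

void matmul_sketch(float* out, const float* W1, const float* W2,
    unsigned rank, unsigned I, unsigned J) {
  for (unsigned i = 0; i < I; i++) {
    for (unsigned j = 0; j < J; j++) {
      float sum = 0.0f;
      for (unsigned r = 0; r < rank; r++) {
        sum += W1[i * rank + r] * W2[r * J + j]; /* out = W1 * W2, row-major */
      }
      out[i * J + j] = sum;
    }
  }
}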

/**
 * @brief Definition for the custom non-linear layer: the TanhGate
 * @param[out] output_signal pointer to the output signal, size = in_T * (in_channels / 2)
 * @param[in] input_signal pointer to the input signal, size = in_T * in_channels
 * @param[in] in_T number of time steps in the input
 * @param[in] in_channels number of input channels. The output will have half the number of channels. Recommended: in_channels % 2 == 0
 */
int TanhGate(float* output_signal, float* input_signal, unsigned in_T, unsigned in_channels);

#endif
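The header does not spell out the gate's formula. A common form consistent with "half the channels" splits each time step's channel vector into two halves and multiplies a tanh of one by a sigmoid of the other; treat the sketch below, and especially the pairing, as an assumption rather than the actual implementation:

#include <math.h>

/* ASSUMPTION: out[t][c] = tanh(in[t][c]) * sigmoid(in[t][c + half]). */
void tanh_gate_sketch(float* out, const float* in, unsigned in_T, unsigned in_channels) {
  unsigned half = in_channels / 2; /* in_channels % 2 == 0 recommended */
  for (unsigned t = 0; t < in_T; t++) {
    for (unsigned c = 0; c < half; c++) {
      float a = in[t * in_channels + c];
      float b = in[t * in_channels + half + c];
      out[t * half + c] = tanhf(a) * (1.0f / (1.0f + expf(-b)));
    }
  }
}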

c_reference/include/dscnn.h

Lines changed: 92 additions & 0 deletions

@@ -0,0 +1,92 @@
// Copyright (c) Microsoft Corporation. All rights reserved.
// Licensed under the MIT license.

#ifndef __DSCNN__
#define __DSCNN__

#include "conv1d.h"
#include "conv_utils.h"
#include <stdlib.h>
#include <math.h>

/**
 * @brief Model definition for the 1D Convolution sub-block applied before the RNN
 * @brief sub-layers: BatchNorm1d -> Conv1D_LR
 *
 * @param[out] output_signal pointer to the final output signal, minimum size = out_T * cnn_hidden. out_T has to be calculated based on the reduction from all the conv and pool layers
 * @param[in] input_signal pointer to the input signal, size = in_T * in_channels
 * @param[in] in_T number of time steps in the input
 * @param[in] in_channels number of input channels
 *
 * @param[in] mean pointer to the mean for the batch normalization, size = in_channels
 * @param[in] var pointer to the variance for the batch normalization, size = in_channels
 * @param[in] affine whether the affine operations are applied
 * @param[in] gamma pointer to the scaling factors for the post-norm affine operation, size = in_channels
 * @param[in] beta pointer to the scalar offsets for the post-norm affine operation, size = in_channels
 * @param[in] in_place in-place computation of the batchnorm. Storage efficient
 *
 * @param[in] cnn_hidden hidden state/out_channels dimensions for the CNN
 * @param[in] cnn_padding padding for the CNN layer. Note: applied to both sides of the input
 * @param[in] cnn_kernel_size kernel size of the CNN
 * @param[in] cnn_params weights, bias and other essential parameters used to describe the CNN
 * @param[in] cnn_activations an integer to choose the type of activation function.
 *            0: none
 *            1: sigmoid
 *            2: tanh
 *            3: relu
 */
int DSCNN_LR(float* output_signal, float* input_signal, unsigned in_T, unsigned in_channels, float* mean, float* var,
  unsigned affine, float* gamma, float* beta, unsigned in_place, unsigned cnn_hidden, int cnn_padding, unsigned cnn_kernel_size,
  const void* cnn_params, int cnn_activations);
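Reading the sub-layer list, DSCNN_LR presumably wraps two calls from conv1d.h; a rough, hypothetical sketch of that sequence (buffer plumbing simplified, unit-stride out_T relation assumed, not the actual implementation):

#include "conv1d.h"

int dscnn_lr_sketch(float* output, float* input, unsigned in_T, unsigned in_channels,
    float* mean, float* var, unsigned affine, float* gamma, float* beta,
    unsigned cnn_hidden, int cnn_padding, unsigned cnn_kernel_size,
    const void* cnn_params, int cnn_activations) {
  /* Normalize in place (in_place = 1, default eps), then convolve into output. */
  BatchNorm1d(0, input, in_T, in_channels, mean, var, affine, gamma, beta, 1, 0.00001f);
  unsigned out_T = in_T + 2 * cnn_padding - cnn_kernel_size + 1; /* unit stride assumed */
  return Conv1D_LR(output, out_T, cnn_hidden, input, in_T, in_channels,
    cnn_padding, cnn_kernel_size, cnn_params, cnn_activations);
}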

/**
 * @brief Model definition for the 1D Convolution sub-block applied after the RNN
 * @brief sub-layers: TanhGate (custom) nonlinearity -> BatchNorm1d -> Conv1D_Depth -> Conv1D_LR -> AvgPool1D
 *
 * @param[out] output_signal pointer to the final output signal, minimum size = out_T * point_cnn_hidden. out_T has to be calculated based on the reduction from all the conv and pool layers
 * @param[in] input_signal pointer to the input signal, size = in_T * in_channels
 * @param[in] in_T number of time steps in the input
 * @param[in] in_channels number of input channels
 *
 * @param[in] mean pointer to the mean for the batch normalization, size = in_channels
 * @param[in] var pointer to the variance for the batch normalization, size = in_channels
 * @param[in] affine whether the affine operations are applied
 * @param[in] gamma pointer to the scaling factors for the post-norm affine operation, size = in_channels
 * @param[in] beta pointer to the scalar offsets for the post-norm affine operation, size = in_channels
 * @param[in] in_place in-place computation of the batchnorm. Storage efficient
 *
 * @param[in] depth_cnn_hidden hidden state/out_channels dimensions for the depth CNN
 * @param[in] depth_cnn_padding padding for the depth CNN layer. Note: applied to both sides of the input
 * @param[in] depth_cnn_kernel_size kernel size of the depth CNN
 * @param[in] depth_cnn_params weights, bias and other essential parameters used to describe the depth CNN
 * @param[in] depth_cnn_activations an integer to choose the type of activation function.
 *            0: none
 *            1: sigmoid
 *            2: tanh
 *            3: relu
 *
 * @param[in] point_cnn_hidden hidden state/out_channels dimensions for the point CNN
 * @param[in] point_cnn_padding padding for the point CNN layer. Note: applied to both sides of the input
 * @param[in] point_cnn_kernel_size kernel size of the point CNN
 * @param[in] point_cnn_params weights, bias and other essential parameters used to describe the point CNN
 * @param[in] point_cnn_activations an integer to choose the type of activation function.
 *            0: none
 *            1: sigmoid
 *            2: tanh
 *            3: relu
 *
 * @param[in] pool_padding padding for the pool layer. Note: applied to both sides of the input
 * @param[in] pool_kernel_size kernel size of the pool
 * @param[in] pool_activation an integer to choose the type of activation function.
 *            0: none
 *            1: sigmoid
 *            2: tanh
 *            3: relu
 */
int DSCNN_LR_Point_Depth(float* output_signal, float* input_signal, unsigned in_T, unsigned in_channels, float* mean, float* var,
  unsigned affine, float* gamma, float* beta, unsigned in_place, unsigned depth_cnn_hidden, int depth_cnn_padding,
  unsigned depth_cnn_kernel_size, const void* depth_cnn_params, int depth_cnn_activations, unsigned point_cnn_hidden,
  int point_cnn_padding, unsigned point_cnn_kernel_size, const void* point_cnn_params, int point_cnn_activations,
  int pool_padding, unsigned pool_kernel_size, int pool_activation);

#endif
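One sizing consequence of the sub-layer list above: TanhGate halves the channel count, so the batchnorm and the two convolutions presumably operate on in_channels / 2 channels, and output_signal must additionally absorb the time-step reductions of both convolutions and the final pool. This halving is an inference from the TanhGate contract in conv_utils.h, not something the header states explicitly.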

c_reference/src/Makefile

Lines changed: 10 additions & 1 deletion

@@ -6,7 +6,16 @@ include ../config.mk
 INCLUDE_DIR=../include
 IFLAGS = -I $(INCLUDE_DIR)

-all: utils.o fastgrnn.o classifier.o rnnpool.o quantized_utils.o quantized_fastgrnn.o quantized_rnnpool.o quantized_mbconv.o
+all: dscnn.o conv1d.o conv_utils.o utils.o fastgrnn.o classifier.o rnnpool.o quantized_utils.o quantized_fastgrnn.o quantized_rnnpool.o quantized_mbconv.o
+
+dscnn.o: dscnn.c
+	$(CC) -o $@ $(IFLAGS) $(CFLAGS) -c $^
+
+conv_utils.o: conv_utils.c
+	$(CC) -o $@ $(IFLAGS) $(CFLAGS) -c $^
+
+conv1d.o: conv1d.c
+	$(CC) -o $@ $(IFLAGS) $(CFLAGS) -c $^

 utils.o: utils.c
 	$(CC) -o $@ $(IFLAGS) $(CFLAGS) -c $^
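With these rules, a plain make in c_reference/src now also produces conv1d.o, conv_utils.o and dscnn.o alongside the existing objects; a test program would then compile with -I ../include and link those objects, presumably adding -lm for the math.h usage the new layers pull in (the exact test harness is not part of this diff).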
