
Commit aa6b787

Merge pull request #11 from sintel-dev/process_signals_pre_release
Process signals pre release
2 parents: 66ef507 + 20b9c05

14 files changed: +514 -745 lines

setup.py

Lines changed: 1 addition & 1 deletion

@@ -12,7 +12,7 @@
     history = history_file.read()


 install_requires = [
-    'mlblocks>=0.4.0,<0.5',
+    'mlblocks>=0.4.1,<0.5',
     'pandas>=1,<2',
     'numpy>=1.17.4,<1.19',
     'scipy>=1.3.3,<2',

sigpro/__init__.py

Lines changed: 2 additions & 2 deletions

@@ -10,7 +10,7 @@

 from mlblocks import discovery

-from sigpro.process_signals import process_signals
+from sigpro.core import SigPro

 _BASE_PATH = os.path.abspath(os.path.dirname(__file__))
 MLBLOCKS_PRIMITIVES = os.path.join(_BASE_PATH, 'primitives')
@@ -46,4 +46,4 @@ def get_primitives(name=None, primitive_type=None, primitive_subtype=None):
     return discovery.find_primitives(name or 'sigpro', filters)


-__all__ = ('process_signals', )
+__all__ = ('SigPro', )

sigpro/core.py

Lines changed: 244 additions & 0 deletions

# -*- coding: utf-8 -*-
"""Process Signals core functionality."""

from collections import Counter
from copy import deepcopy

import pandas as pd
from mlblocks import MLPipeline, load_primitive

DEFAULT_INPUT = [
    {
        'name': 'readings',
        'keyword': 'data',
        'type': 'pandas.DataFrame'
    },
    {
        'name': 'feature_columns',
        'default': None,
        'type': 'list'
    }
]

DEFAULT_OUTPUT = [
    {
        'name': 'readings',
        'type': 'pandas.DataFrame'
    },
    {
        'name': 'feature_columns',
        'type': 'list'
    }
]


class SigPro:
    """SigPro class applies multiple transformation and aggregation primitives.

    The SigPro class is responsible for applying a collection of primitives specified by the
    user in order to create features for the given data.

    It is given a list of transformations and aggregations, each composed of dictionaries
    with the following specification:

        * ``name``:
            Name of the transformation / aggregation.
        * ``primitive``:
            Name of the primitive to apply.
        * ``init_params``:
            Dictionary containing the initialization parameters for the primitive.

    SigPro will build an ``mlblocks.MLPipeline`` and generate the features by first applying
    the transformations and then computing the aggregations.

    Args:
        data (pandas.DataFrame):
            Dataframe with a column that contains signal values.
        transformations (list):
            List of dictionaries containing the transformation primitives.
        aggregations (list):
            List of dictionaries containing the aggregation primitives.
        values_column_name (str):
            The name of the column that contains the signal values. Defaults to ``values``.
        keep_columns (Union[bool, list]):
            Whether to keep non-feature columns in the output DataFrame or not.
            If a list of column names is passed, those columns are kept.
        input_is_dataframe (bool):
            Whether the input data is a ``pandas.DataFrame``. Defaults to ``True``.
    """

    def _build_pipeline(self):
        """Build Pipeline function.

        Given a list of transformations and aggregations, build a pipeline whose outputs are
        the aggregations, named after the specified transformation and aggregation names.
        These lists are composed of dictionaries with the following specification:

            * ``name``:
                Name of the transformation / aggregation.
            * ``primitive``:
                Name of the primitive to apply.
            * ``init_params``:
                Dictionary containing the initialization parameters for the primitive.

        Args:
            transformations (list):
                List of dictionaries containing the transformation primitives.
            aggregations (list):
                List of dictionaries containing the aggregation primitives.

        Returns:
            mlblocks.MLPipeline:
                An ``MLPipeline`` object that first applies all the transformations
                and then produces as output the aggregations specified.
        """
        primitives = []
        init_params = {}
        prefix = []
        outputs = []
        counter = Counter()

        for transformation in self.transformations:
            name = transformation.get('name')
            if name is None:
                name = transformation['primitive'].split('.')[-1]

            prefix.append(name)
            primitive = transformation['primitive']
            counter[primitive] += 1
            primitive_name = f'{primitive}#{counter[primitive]}'
            primitives.append(primitive)
            params = transformation.get('init_params')
            if params:
                init_params[primitive_name] = params

        prefix = '.'.join(prefix) if prefix else ''

        for aggregation in self.aggregations:
            name = aggregation.get('name')
            if name is None:
                name = aggregation['primitive'].split('.')[-1]

            aggregation_name = f'{prefix}.{name}' if prefix else name

            primitive = aggregation['primitive']
            counter[primitive] += 1
            primitive_name = f'{primitive}#{counter[primitive]}'
            primitives.append(primitive)

            primitive = load_primitive(primitive)
            primitive_outputs = primitive['produce']['output']

            params = aggregation.get('init_params')
            if params:
                init_params[primitive_name] = params

            if name.lower() == 'sigpro':
                primitive = MLPipeline([primitive], init_params={'sigpro.SigPro#1': params})
                primitive_outputs = primitive.get_outputs()

            # primitive_outputs = getattr(self, primitive_outputs)()
            if not isinstance(primitive_outputs, str):
                for output in primitive_outputs:
                    output = output['name']
                    outputs.append({
                        'name': f'{aggregation_name}.{output}',
                        'variable': f'{primitive_name}.{output}'
                    })

        outputs = {'default': outputs} if outputs else None

        return MLPipeline(
            primitives,
            init_params=init_params,
            outputs=outputs
        )

    def __init__(self, transformations, aggregations, values_column_name='values',
                 keep_columns=False, input_is_dataframe=True):

        self.transformations = transformations
        self.aggregations = aggregations
        self.values_column_name = values_column_name
        self.keep_columns = keep_columns
        self.input_is_dataframe = input_is_dataframe
        self.pipeline = self._build_pipeline()

    def _apply_pipeline(self, row):
        """Apply an ``mlblocks.MLPipeline`` to a row.

        Apply an ``MLPipeline`` to a row of a ``pd.DataFrame``. This function can
        be combined with the ``pd.DataFrame.apply`` method to be applied to the
        entire data frame.

        Args:
            row (pd.Series):
                Row to apply the pipeline to.
        """
        context = row.to_dict()
        amplitude_values = context.pop(self.values_column_name)
        output = self.pipeline.predict(
            amplitude_values=amplitude_values,
            **context,
        )
        output_names = self.pipeline.get_output_names()

        # ensure that we can iterate over output
        output = output if isinstance(output, tuple) else (output, )

        return pd.Series(dict(zip(output_names, output)))

    def process_signal(self, data=None, feature_columns=None, **kwargs):
        """Apply multiple transformation and aggregation primitives.

        Args:
            data (pandas.DataFrame):
                Dataframe with a column that contains signal values.
            feature_columns (list):
                List of column names from the input data frame that must be considered as
                features and should not be dropped.

        Returns:
            tuple:
                pandas.DataFrame:
                    A data frame with the new feature columns generated by applying the
                    primitives. If ``keep_columns`` is ``True`` the original columns are
                    kept in the data frame, otherwise they are dropped.
                list:
                    A list with the names of the generated features.
        """
        if data is None:
            row = pd.Series(kwargs)
            values = self._apply_pipeline(row).values
            return values if len(values) > 1 else values[0]

        features = data.apply(
            self._apply_pipeline,
            axis=1
        )
        data = pd.concat([data, features], axis=1)

        if feature_columns:
            feature_columns = feature_columns + list(features.columns)
        else:
            feature_columns = list(features.columns)

        if isinstance(self.keep_columns, list):
            data = data[self.keep_columns + feature_columns]
        elif not self.keep_columns:
            data = data[feature_columns]

        return data, feature_columns

    def get_input_args(self):
        """Return the pipeline input args."""
        if self.input_is_dataframe:
            return deepcopy(DEFAULT_INPUT)

        return self.pipeline.get_predict_args()

    def get_output_args(self):
        """Return the pipeline output args."""
        if self.input_is_dataframe:
            return deepcopy(DEFAULT_OUTPUT)

        return self.pipeline.get_outputs()
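
As a quick illustration of how the new class is meant to be used, here is a minimal sketch; the transformation and aggregation primitive names below are assumed to exist in the sigpro package and are not introduced by this commit, and the exact feature column names depend on the primitives' declared outputs.

import pandas as pd

from sigpro import SigPro

# Hypothetical primitives; any sigpro transformation/aggregation pair would do.
transformations = [
    {'name': 'identity', 'primitive': 'sigpro.transformations.amplitude.identity.identity'}
]
aggregations = [
    {'name': 'mean', 'primitive': 'sigpro.aggregations.amplitude.statistical.mean'}
]

processor = SigPro(transformations, aggregations, values_column_name='values')

# Each row holds one signal as an array-like under the ``values`` column.
readings = pd.DataFrame({
    'turbine_id': ['T001', 'T001'],
    'values': [[1.0, 2.0, 3.0], [4.0, 5.0, 6.0]],
})

# keep_columns=False (the default) drops the non-feature columns, so only the
# generated features are returned. Feature names follow the
# '<transformation>.<aggregation>.<output>' pattern built in _build_pipeline,
# e.g. 'identity.mean.<output_name>'.
features_df, feature_columns = processor.process_signal(readings)
print(feature_columns)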

sigpro/primitives/sigpro.process_signals.json

Lines changed: 0 additions & 47 deletions
This file was deleted.
Lines changed: 35 additions & 0 deletions

{
    "name": "sigpro.SigPro",
    "primitive": "sigpro.SigPro",
    "classifiers": {
        "type": "preprocessor",
        "subtype": "feature_extractor"
    },
    "produce": {
        "method": "process_signal",
        "args": "get_input_args",
        "output": "get_output_args"
    },
    "hyperparameters": {
        "fixed": {
            "keep_columns": {
                "type": "bool or list",
                "default": false
            },
            "values_column_name": {
                "type": "str",
                "default": "values"
            },
            "transformations": {
                "type": "list"
            },
            "aggregations": {
                "type": "list"
            },
            "input_is_dataframe": {
                "type": "bool",
                "default": true
            }
        }
    }
}
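
Because this annotation exposes ``sigpro.SigPro`` as a regular MLBlocks primitive, the ``name.lower() == 'sigpro'`` branch in ``_build_pipeline`` above allows one SigPro to be nested inside another as an aggregation. The sketch below shows what such an entry might look like; the inner primitive names are assumptions, not part of this diff.

# Hypothetical nested configuration: an aggregation whose primitive is the
# sigpro.SigPro annotation itself, carrying its own transformations and
# aggregations through init_params.
nested_aggregation = {
    'name': 'SigPro',  # triggers the name.lower() == 'sigpro' branch
    'primitive': 'sigpro.SigPro',
    'init_params': {
        'input_is_dataframe': False,
        'transformations': [
            {'primitive': 'sigpro.transformations.amplitude.identity.identity'}
        ],
        'aggregations': [
            {'primitive': 'sigpro.aggregations.amplitude.statistical.mean'}
        ],
    },
}
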
Lines changed: 30 additions & 0 deletions

{
    "name": "sigpro.transformations.amplitude.spectrum.power_spectrum",
    "primitive": "sigpro.transformations.amplitude.spectrum.power_spectrum",
    "classifiers": {
        "type": "transformation",
        "subtype": "amplitude"
    },
    "produce": {
        "args": [
            {
                "name": "amplitude_values",
                "type": "numpy.ndarray"
            },
            {
                "name": "sampling_frequency",
                "type": "float"
            }
        ],
        "output": [
            {
                "name": "amplitude_values",
                "type": "numpy.ndarray"
            },
            {
                "name": "frequency_values",
                "type": "numpy.ndarray"
            }
        ]
    }
}
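
The implementation of ``power_spectrum`` itself is not part of this annotation. As a rough illustration only, a function matching the declared args and outputs could look like the NumPy sketch below; this is an assumption, not the code shipped in ``sigpro.transformations.amplitude.spectrum``.

import numpy as np


def power_spectrum(amplitude_values, sampling_frequency):
    # Illustrative sketch matching the annotation's signature: power of the
    # positive-frequency spectrum plus the corresponding frequency bins.
    # The real sigpro implementation may differ.
    amplitude_values = np.asarray(amplitude_values, dtype=float)
    spectrum = np.fft.rfft(amplitude_values)
    frequency_values = np.fft.rfftfreq(
        len(amplitude_values), d=1.0 / sampling_frequency)
    return np.abs(spectrum) ** 2, frequency_values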
