sintel-dev
diff --git a/‎CONTRIBUTING.md
+5-5 b/‎CONTRIBUTING.md
+5-5
diff --git a/‎HISTORY.md
+3-3 b/‎HISTORY.md
+3-3
diff --git a/‎README.md
+3-3 b/‎README.md
+3-3
diff --git a/‎docs/conf.py
+1-1 b/‎docs/conf.py
+1-1
diff --git a/‎setup.cfg
+1-1 b/‎setup.cfg
+1-1
diff --git a/‎setup.py
+3-3 b/‎setup.py
+3-3
diff --git a/‎sigpro/__init__.py
+3-3 b/‎sigpro/__init__.py
+3-3
diff --git a/‎sigpro/core.py
+244 b/‎sigpro/core.py
+244
@@ -7,21 +7,21 @@ update to `SigPro` library.
 
 The first step would be to clone the `SigPro` repository. In order to do so
 make sure that you have access to the repository by accessing it directly
-[https://github.com/signals-dev/SigPro/](
-https://github.com/signals-dev/SigPro/).
+[https://github.com/sintel-dev/SigPro/](
+https://github.com/sintel-dev/SigPro/).
 
 If you have access to the repository and you have your `ssh` keys configured
 in your github account, you can clone it by using the following command
 
 ```bash
-git clone git@github.com:signals-dev/SigPro.git
+git clone git@github.com:sintel-dev/SigPro.git
 ```
 
 If you don't have your `ssh` keys configured you can clone the repository
 using your login name and password running the following command:
 
 ```bash
-git clone https://github.com/signals-dev/SigPro
+git clone https://github.com/sintel-dev/SigPro
 ```
 
 Next, you can enter your repository folder, create a virtualenv and install
@@ -96,4 +96,4 @@ request by doing the following steps:
 1. Add the new files and the updated ones. By running `git status` you will see the modified and `new/untracked` files. Use `git add` to `add` the files that involve your implementation, such as the new primitive `json` file, the new module with the new transformation or aggregation and other changes that you may have done to existing files (such as `setup.py` if you updated or introduce a new dependency).
 2. Commit your changes using `git commit -m "Implement my new transformation"`.
 3. Push your branch: `git push --set-upstream origin <name_of_your_branch>`.
-4. Go to [https://github.com/signals-dev/SigPro/](https://github.com/signals-dev/SigPro/) and create a pull request from this branch to the master branch.
+4. Go to [https://github.com/sintel-dev/SigPro/](https://github.com/sintel-dev/SigPro/) and create a pull request from this branch to the master branch.
@@ -20,11 +20,11 @@ to create new primitives and to test those with the demo data included in this p
 
 This release also includes the following User Guides:
 
-* [PRIMITIVES.md](https://github.com/signals-dev/SigPro/blob/master/PRIMITIVES.md): Information
+* [PRIMITIVES.md](https://github.com/sintel-dev/SigPro/blob/master/PRIMITIVES.md): Information
   about the primitive families, their expected input and output.
-* [USAGE.md](https://github.com/signals-dev/SigPro/blob/master/USAGE.md): Instructions about how
+* [USAGE.md](https://github.com/sintel-dev/SigPro/blob/master/USAGE.md): Instructions about how
   to use the three main functionalities of `SigPro`.
-* [DEVELOPMENT.md](https://github.com/signals-dev/SigPro/blob/master/DEVELOPMENT.md): Step by step
+* [DEVELOPMENT.md](https://github.com/sintel-dev/SigPro/blob/master/DEVELOPMENT.md): Step by step
   guide about how to write a valid `SigPro` primitive and contribute it to either `SigPro` or
   your own library.
 
 
@@ -5,15 +5,15 @@
 
 [![Development Status](https://img.shields.io/badge/Development%20Status-2%20--%20Pre--Alpha-yellow)](https://pypi.org/search/?c=Development+Status+%3A%3A+2+-+Pre-Alpha)
 [![PyPi Shield](https://img.shields.io/pypi/v/SigPro.svg)](https://pypi.python.org/pypi/SigPro)
-[![Tests](https://github.com/signals-dev/SigPro/workflows/Run%20Tests/badge.svg)](https://github.com/signals-dev/SigPro/actions?query=workflow%3A%22Run+Tests%22+branch%3Amaster)
+[![Tests](https://github.com/sintel-dev/SigPro/workflows/Run%20Tests/badge.svg)](https://github.com/sintel-dev/SigPro/actions?query=workflow%3A%22Run+Tests%22+branch%3Amaster)
 [![Downloads](https://pepy.tech/badge/sigpro)](https://pepy.tech/project/sigpro)
 
 
 # SigPro: Signal Processing Tools for Machine Learning
 
-* License: [MIT](https://github.com/signals-dev/SigPro/blob/master/LICENSE)
+* License: [MIT](https://github.com/sintel-dev/SigPro/blob/master/LICENSE)
 * Development Status: [Pre-Alpha](https://pypi.org/search/?c=Development+Status+%3A%3A+2+-+Pre-Alpha)
-* Homepage: https://github.com/signals-dev/SigPro
+* Homepage: https://github.com/sintel-dev/SigPro
 
 ## Overview
 
 
@@ -60,7 +60,7 @@
 copyright = '2020, MIT Data To AI Lab'
 author = 'MIT Data To AI Lab'
 description = 'Signal Processing Tools for Machine Learning'
-user = 'signals-dev'
+user = 'sintel-dev'
 
 # The version info for the project you're documenting, acts as replacement
 # for |version| and |release|, also used in various other places throughout
 
@@ -1,5 +1,5 @@
 [bumpversion]
-current_version = 0.0.3
+current_version = 0.1.0.dev0
 commit = True
 tag = True
 parse = (?P<major>\d+)\.(?P<minor>\d+)\.(?P<patch>\d+)(\.(?P<release>[a-z]+)(?P<candidate>\d+))?
 
@@ -12,7 +12,7 @@
     history = history_file.read()
 
 install_requires = [
-    'mlblocks>=0.4.0,<0.5',
+    'mlblocks>=0.4.1,<0.5',
     'pandas>=1,<2',
     'numpy>=1.17.4,<1.19',
     'scipy>=1.3.3,<2',
@@ -99,7 +99,7 @@
     setup_requires=setup_requires,
     test_suite='tests',
     tests_require=tests_require,
-    url='https://github.com/signals-dev/SigPro',
-    version='0.0.3',
+    url='https://github.com/sintel-dev/SigPro',
+    version='0.1.0.dev0',
     zip_safe=False,
 )
@@ -4,13 +4,13 @@
 
 __author__ = """MIT Data To AI Lab"""
 __email__ = 'dailabmit@gmail.com'
-__version__ = '0.0.3'
+__version__ = '0.1.0.dev0'
 
 import os
 
 from mlblocks import discovery
 
-from sigpro.process_signals import process_signals
+from sigpro.core import SigPro
 
 _BASE_PATH = os.path.abspath(os.path.dirname(__file__))
 MLBLOCKS_PRIMITIVES = os.path.join(_BASE_PATH, 'primitives')
@@ -46,4 +46,4 @@ def get_primitives(name=None, primitive_type=None, primitive_subtype=None):
     return discovery.find_primitives(name or 'sigpro', filters)
 
 
-__all__ = ('process_signals', )
+__all__ = ('SigPro', )
@@ -0,0 +1,244 @@
+# -*- coding: utf-8 -*-
+"""Process Signals core functionality."""
+
+from collections import Counter
+from copy import deepcopy
+
+import pandas as pd
+from mlblocks import MLPipeline, load_primitive
+
+# Input argument specification returned (as a deep copy) by ``SigPro.get_input_args``
+# when ``input_is_dataframe`` is ``True``: a ``readings`` data frame, declared with the
+# ``data`` keyword, and a ``feature_columns`` list that defaults to ``None``.
+DEFAULT_INPUT = [
+    {
+        'name': 'readings',
+        'keyword': 'data',
+        'type': 'pandas.DataFrame'
+    },
+    {
+        'name': 'feature_columns',
+        'default': None,
+        'type': 'list'
+    }
+]
+
+# Output specification returned (as a deep copy) by ``SigPro.get_output_args`` when
+# ``input_is_dataframe`` is ``True``: the ``readings`` data frame and the
+# ``feature_columns`` list.
+DEFAULT_OUTPUT = [
+    {
+        'name': 'readings',
+        'type': 'pandas.DataFrame'
+    },
+    {
+        'name': 'feature_columns',
+        'type': 'list'
+    }
+]
+
+
+class SigPro:
+    """Apply multiple transformation and aggregation primitives to signal data.
+
+    ``SigPro`` is responsible for applying a collection of primitives specified by the
+    user in order to create features for the given data.
+
+    The transformations and aggregations are given as lists of dictionaries with the
+    following specification:
+
+        * ``name`` (optional):
+            Name of the transformation / aggregation. If it is not given, the last
+            component of the dotted primitive name is used.
+        * ``primitive``:
+            Name of the primitive to apply.
+        * ``init_params`` (optional):
+            Dictionary containing the initializing parameters for the primitive.
+
+    On creation, an ``mlblocks.MLPipeline`` is built that lists all the transformations
+    first and the aggregations afterwards, and exposes the aggregation outputs.
+
+    Args:
+        transformations (list):
+            List of dictionaries containing the transformation primitives.
+        aggregations (list):
+            List of dictionaries containing the aggregation primitives.
+        values_column_name (str):
+            The name of the column that contains the signal values. Defaults to ``values``.
+        keep_columns (Union[bool, list]):
+            Whether to keep non-feature columns in the output DataFrame or not.
+            If a list of column names is passed, those columns are kept.
+            Defaults to ``False``.
+        input_is_dataframe (bool):
+            If ``True``, ``get_input_args`` and ``get_output_args`` return copies of
+            ``DEFAULT_INPUT`` and ``DEFAULT_OUTPUT``. Otherwise they return the predict
+            args and the outputs of the underlying pipeline. Defaults to ``True``.
+    """
+
+    def _build_pipeline(self):
+        """Build the ``mlblocks.MLPipeline`` used to compute the features.
+
+        The pipeline is built from ``self.transformations`` and ``self.aggregations``,
+        listing all the transformations first and the aggregations afterwards. These
+        lists are composed by dictionaries with the following specification:
+
+            * ``name`` (optional):
+                Name of the transformation / aggregation. If it is not given, the last
+                component of the dotted primitive name is used.
+            * ``primitive``:
+                Name of the primitive to apply.
+            * ``init_params`` (optional):
+                Dictionary containing the initializing parameters for the primitive.
+
+        The pipeline outputs are taken from the aggregations. Each output is named
+        ``<transformation names joined by dots>.<aggregation name>.<output name>``, or
+        ``<aggregation name>.<output name>`` if there are no transformations.
+
+        Returns:
+            mlblocks.MLPipeline:
+                An ``MLPipeline`` object that first applies all the transformations
+                and then produces as output the aggregations specified.
+        """
+        primitives = []
+        init_params = {}
+        prefix = []
+        outputs = []
+        # Number of times each primitive has been added so far. It is used to build the
+        # ``<primitive>#<count>`` names that key ``init_params`` and the output variables.
+        # NOTE(review): presumably mirrors the block names assigned by ``MLPipeline`` - confirm.
+        counter = Counter()
+
+        for transformation in self.transformations:
+            name = transformation.get('name')
+            if name is None:
+                name = transformation['primitive'].split('.')[-1]
+
+            prefix.append(name)
+            primitive = transformation['primitive']
+            counter[primitive] += 1
+            primitive_name = f'{primitive}#{counter[primitive]}'
+            primitives.append(primitive)
+            params = transformation.get('init_params')
+            if params:
+                init_params[primitive_name] = params
+
+        # From here on ``prefix`` is a single string shared by all the aggregation outputs.
+        prefix = '.'.join(prefix) if prefix else ''
+
+        for aggregation in self.aggregations:
+            name = aggregation.get('name')
+            if name is None:
+                name = aggregation['primitive'].split('.')[-1]
+
+            aggregation_name = f'{prefix}.{name}' if prefix else name
+
+            primitive = aggregation['primitive']
+            counter[primitive] += 1
+            primitive_name = f'{primitive}#{counter[primitive]}'
+            primitives.append(primitive)
+
+            # ``primitive`` is rebound from the primitive name to its loaded annotation,
+            # which is only used to find out which outputs the aggregation produces.
+            primitive = load_primitive(primitive)
+            primitive_outputs = primitive['produce']['output']
+
+            params = aggregation.get('init_params')
+            if params:
+                init_params[primitive_name] = params
+
+            # An aggregation named ``sigpro`` (case-insensitive) is wrapped in its own
+            # pipeline, and the outputs are requested from that pipeline instead.
+            if name.lower() == 'sigpro':
+                primitive = MLPipeline([primitive], init_params={'sigpro.SigPro#1': params})
+                primitive_outputs = primitive.get_outputs()
+
+            # Outputs declared as a plain string are skipped, so nothing is registered
+            # for them. NOTE(review): a string presumably names a method that computes
+            # the outputs dynamically - confirm.
+            if not isinstance(primitive_outputs, str):
+                for output in primitive_outputs:
+                    output = output['name']
+                    outputs.append({
+                        'name': f'{aggregation_name}.{output}',
+                        'variable': f'{primitive_name}.{output}'
+                    })
+
+        # With no registered outputs, ``None`` is passed and ``MLPipeline`` decides.
+        outputs = {'default': outputs} if outputs else None
+
+        return MLPipeline(
+            primitives,
+            init_params=init_params,
+            outputs=outputs
+        )
+
+    def __init__(self, transformations, aggregations, values_column_name='values',
+                 keep_columns=False, input_is_dataframe=True):
+        """Store the configuration and build the pipeline.
+
+        See the class docstring for the description of the arguments.
+        """
+
+        self.transformations = transformations
+        self.aggregations = aggregations
+        self.values_column_name = values_column_name
+        self.keep_columns = keep_columns
+        self.input_is_dataframe = input_is_dataframe
+        # Must come last: ``_build_pipeline`` reads the attributes set above.
+        self.pipeline = self._build_pipeline()
+
+    def _apply_pipeline(self, row):
+        """Apply the ``mlblocks.MLPipeline`` to a row.
+
+        Apply the ``MLPipeline`` to a row of a ``pd.DataFrame``. This function can
+        be combined with the ``pd.DataFrame.apply`` method to be applied to the
+        entire data frame.
+
+        The entry stored under ``self.values_column_name`` is passed to the pipeline
+        as ``amplitude_values`` and the rest of the row entries are passed as additional
+        keyword arguments.
+
+        Args:
+            row (pd.Series):
+                Row used to apply the pipeline to.
+
+        Returns:
+            pd.Series:
+                Series that maps each pipeline output name to the value produced for it.
+        """
+        context = row.to_dict()
+        amplitude_values = context.pop(self.values_column_name)
+        output = self.pipeline.predict(
+            amplitude_values=amplitude_values,
+            **context,
+        )
+        output_names = self.pipeline.get_output_names()
+
+        # Wrap a non-tuple result so that it can be zipped with the output names.
+        output = output if isinstance(output, tuple) else (output, )
+
+        return pd.Series(dict(zip(output_names, output)))
+
+    def process_signal(self, data=None, feature_columns=None, **kwargs):
+        """Apply multiple transformation and aggregation primitives.
+
+        If ``data`` is given, the pipeline is applied to each one of its rows. If ``data``
+        is ``None``, the keyword arguments are treated as a single row instead, so they
+        must include an entry named after ``values_column_name``.
+
+        Args:
+            data (pandas.DataFrame):
+                Dataframe with a column that contains signal values.
+            feature_columns (list):
+                List of column names from the input data frame that must be considered as
+                features and should not be dropped.
+            **kwargs:
+                Entries of the single row to process. Only used if ``data`` is ``None``.
+
+        Returns:
+            tuple:
+                Returned if ``data`` is given.
+
+                pandas.DataFrame:
+                    A data frame with new feature columns by applying the previous primitives.
+                    If ``keep_columns`` is a list, only those columns and the feature columns
+                    are kept. If it is ``False``, only the feature columns are kept. Otherwise
+                    all the original columns are conserved.
+                list:
+                    A list with the given ``feature_columns`` followed by the feature names
+                    generated.
+
+            If ``data`` is ``None``, the computed values are returned instead: the array of
+            values if there is more than one, or the single value otherwise.
+        """
+        if data is None:
+            row = pd.Series(kwargs)
+            values = self._apply_pipeline(row).values
+            return values if len(values) > 1 else values[0]
+
+        features = data.apply(
+            self._apply_pipeline,
+            axis=1
+        )
+        data = pd.concat([data, features], axis=1)
+
+        if feature_columns:
+            feature_columns = feature_columns + list(features.columns)
+        else:
+            feature_columns = list(features.columns)
+
+        # Any other truthy ``keep_columns`` value leaves all the columns in place.
+        if isinstance(self.keep_columns, list):
+            data = data[self.keep_columns + feature_columns]
+        elif not self.keep_columns:
+            data = data[feature_columns]
+
+        return data, feature_columns
+
+    def get_input_args(self):
+        """Return the pipeline input args.
+
+        Returns:
+            list:
+                A copy of ``DEFAULT_INPUT`` if ``input_is_dataframe`` is ``True``,
+                otherwise the predict args reported by the pipeline.
+        """
+        if self.input_is_dataframe:
+            return deepcopy(DEFAULT_INPUT)
+
+        return self.pipeline.get_predict_args()
+
+    def get_output_args(self):
+        """Return the pipeline output args.
+
+        Returns:
+            list:
+                A copy of ``DEFAULT_OUTPUT`` if ``input_is_dataframe`` is ``True``,
+                otherwise the outputs reported by the pipeline.
+        """
+        if self.input_is_dataframe:
+            return deepcopy(DEFAULT_OUTPUT)
+
+        return self.pipeline.get_outputs()