sintel-dev
diff --git a/setup.py b/setup.py
Lines changed: 1 addition & 1 deletion
diff --git a/tests/labeling/test_helpers.py b/tests/labeling/test_helpers.py
Lines changed: 8 additions & 4 deletions
diff --git a/tests/primitives/test_postprocessing.py b/tests/primitives/test_postprocessing.py
Lines changed: 2 additions & 1 deletion
diff --git a/tests/test___init__.py b/tests/test___init__.py
Lines changed: 2 additions & 1 deletion
diff --git a/tests/test_core.py b/tests/test_core.py
Lines changed: 44 additions & 23 deletions
diff --git a/tests/test_feature_engineering.py b/tests/test_feature_engineering.py
Lines changed: 12 additions & 6 deletions
diff --git a/tests/test_metadata.py b/tests/test_metadata.py
Lines changed: 2 additions & 1 deletion
diff --git a/zephyr_ml/__init__.py b/zephyr_ml/__init__.py
Lines changed: 3 additions & 10 deletions
@@ -54,7 +54,7 @@
     'Sphinx>=3,<3.3',
     'sphinx_rtd_theme>=0.2.4,<0.5',
     'autodocsumm>=0.1.10',
-    'mistune>=0.7,<3.1',
+    'mistune>=0.7,<2.0',
     'Jinja2>=2,<3.1',
 
     # fails on Sphinx < v3.4
 
@@ -19,31 +19,35 @@ def test_merge_labeling_and_true():
         lambda df: True,
         lambda df: True
     ]
-    assert 1 == merge_binary_labeling_functions(functions, and_connected=True)(pd.DataFrame())
+    assert 1 == merge_binary_labeling_functions(
+        functions, and_connected=True)(pd.DataFrame())
 
 
 def test_merge_labeling_and_false():
     functions = [
         lambda df: True,
         lambda df: False
     ]
-    assert 0 == merge_binary_labeling_functions(functions, and_connected=True)(pd.DataFrame())
+    assert 0 == merge_binary_labeling_functions(
+        functions, and_connected=True)(pd.DataFrame())
 
 
 def test_merge_labeling_or_true():
     functions = [
         lambda df: False,
         lambda df: True
     ]
-    assert 1 == merge_binary_labeling_functions(functions, and_connected=False)(pd.DataFrame())
+    assert 1 == merge_binary_labeling_functions(
+        functions, and_connected=False)(pd.DataFrame())
 
 
 def test_merge_labeling_or_false():
     functions = [
         lambda df: False,
         lambda df: False
     ]
-    assert 0 == merge_binary_labeling_functions(functions, and_connected=False)(pd.DataFrame())
+    assert 0 == merge_binary_labeling_functions(
+        functions, and_connected=False)(pd.DataFrame())
 
 
 def test_categorical_presence_true():
 
@@ -23,7 +23,8 @@ def _run(self, y, y_hat, value):
         threshold.fit(y, y_hat)
 
         assert threshold._threshold == value
-        binary_y_hat, detected_threshold, scores = threshold.apply_threshold(y_hat)
+        binary_y_hat, detected_threshold, scores = threshold.apply_threshold(
+            y_hat)
         np.testing.assert_allclose(binary_y_hat, y)
 
     def test_1d(self):
 
@@ -96,7 +96,8 @@ def merge_work_orders_notifications_data():
     changed_wo_data['WTG'] = ['A001', 'A001']
     changed_notif_data = NOTIFICATIONS_DATA.copy()
     # matching the output of the merge
-    changed_notif_data['Functional location_y'] = changed_notif_data.pop('Functional location')
+    changed_notif_data['Functional location_y'] = changed_notif_data.pop(
+        'Functional location')
     changed_notif_data['Functional location description_y'] = (
         changed_notif_data.pop('Functional location description'))
     # matching the notifications update
 
@@ -1,6 +1,7 @@
 import numpy as np
 import pandas as pd
 from mlblocks import MLBlock
+
 from zephyr_ml.core import DEFAULT_METRICS, Zephyr
 
 
@@ -10,8 +11,10 @@ class TestZephyr:
     def base_dfs():
         alarms_df = pd.DataFrame({
             'COD_ELEMENT': [0, 0],
-            'DAT_START': [pd.Timestamp('2022-01-01 00:00:00'), pd.Timestamp('2022-03-01 11:12:13')],
-            'DAT_END': [pd.Timestamp('2022-01-01 13:00:00'), pd.Timestamp('2022-03-02 11:12:13')],
+            'DAT_START': [pd.Timestamp('2022-01-01 00:00:00'),
+                          pd.Timestamp('2022-03-01 11:12:13')],
+            'DAT_END': [pd.Timestamp('2022-01-01 13:00:00'),
+                        pd.Timestamp('2022-03-02 11:12:13')],
             'IND_DURATION': [0.5417, 1.0],
             'COD_ALARM': [12345, 98754],
             'COD_ALARM_INT': [12345, 98754],
@@ -20,8 +23,10 @@ def base_dfs():
         })
         stoppages_df = pd.DataFrame({
             'COD_ELEMENT': [0, 0],
-            'DAT_START': [pd.Timestamp('2022-01-01 00:00:00'), pd.Timestamp('2022-03-01 11:12:13')],
-            'DAT_END': [pd.Timestamp('2022-01-08 11:07:17'), pd.Timestamp('2022-03-01 17:00:13')],
+            'DAT_START': [pd.Timestamp('2022-01-01 00:00:00'),
+                          pd.Timestamp('2022-03-01 11:12:13')],
+            'DAT_END': [pd.Timestamp('2022-01-08 11:07:17'),
+                        pd.Timestamp('2022-03-01 17:00:13')],
             'DES_WO_NAME': ['stoppage name 1', 'stoppage name 2'],
             'DES_COMMENTS': ['description of stoppage 1', 'description of stoppage 2'],
             'COD_WO': [12345, 67890],
@@ -40,12 +45,15 @@ def base_dfs():
             'COD_ORDER': [12345, 67890],
             'IND_QUANTITY': [1, -20],
             'COD_MATERIAL_SAP': [36052411, 67890],
-            'DAT_POSTING': [pd.Timestamp('2022-01-01 00:00:00'), pd.Timestamp('2022-03-01 00:00:00')],
+            'DAT_POSTING': [pd.Timestamp('2022-01-01 00:00:00'),
+                            pd.Timestamp('2022-03-01 00:00:00')],
             'COD_MAT_DOC': [77889900, 12345690],
             'DES_MEDIUM': ['Description of notification 1', 'Description of notification 2'],
             'COD_NOTIF': [567890123, 32109877],
-            'DAT_MALF_START': [pd.Timestamp('2021-12-25 18:07:10'), pd.Timestamp('2022-02-28 06:04:00')],
-            'DAT_MALF_END': [pd.Timestamp('2022-01-08 11:07:17'), pd.Timestamp('2022-03-01 17:00:13')],
+            'DAT_MALF_START': [pd.Timestamp('2021-12-25 18:07:10'),
+                               pd.Timestamp('2022-02-28 06:04:00')],
+            'DAT_MALF_END': [pd.Timestamp('2022-01-08 11:07:17'),
+                             pd.Timestamp('2022-03-01 17:00:13')],
             'IND_BREAKDOWN_DUR': [14.1378, 2.4792],
             'FUNCT_LOC_DES': ['location description 1', 'location description 2'],
             'COD_ALARM': [12345, 12345],
@@ -54,15 +62,19 @@ def base_dfs():
         work_orders_df = pd.DataFrame({
             'COD_ELEMENT': [0, 0],
             'COD_ORDER': [12345, 67890],
-            'DAT_BASIC_START': [pd.Timestamp('2022-01-01 00:00:00'), pd.Timestamp('2022-03-01 00:00:00')],
-            'DAT_BASIC_END': [pd.Timestamp('2022-01-09 00:00:00'), pd.Timestamp('2022-03-02 00:00:00')],
+            'DAT_BASIC_START': [pd.Timestamp('2022-01-01 00:00:00'),
+                                pd.Timestamp('2022-03-01 00:00:00')],
+            'DAT_BASIC_END': [pd.Timestamp('2022-01-09 00:00:00'),
+                              pd.Timestamp('2022-03-02 00:00:00')],
             'COD_EQUIPMENT': [98765, 98765],
             'COD_MAINT_PLANT': ['ABC', 'ABC'],
             'COD_MAINT_ACT_TYPE': ['XYZ', 'XYZ'],
             'COD_CREATED_BY': ['A1234', 'B6789'],
             'COD_ORDER_TYPE': ['A', 'B'],
-            'DAT_REFERENCE': [pd.Timestamp('2022-01-01 00:00:00'), pd.Timestamp('2022-03-01 00:00:00')],
-            'DAT_CREATED_ON': [pd.Timestamp('2022-03-01 00:00:00'), pd.Timestamp('2022-04-18 00:00:00')],
+            'DAT_REFERENCE': [pd.Timestamp('2022-01-01 00:00:00'),
+                              pd.Timestamp('2022-03-01 00:00:00')],
+            'DAT_CREATED_ON': [pd.Timestamp('2022-03-01 00:00:00'),
+                               pd.Timestamp('2022-04-18 00:00:00')],
             'DAT_VALID_END': [pd.NaT, pd.NaT],
             'DAT_VALID_START': [pd.NaT, pd.NaT],
             'COD_SYSTEM_STAT': ['ABC XYZ', 'LMN OPQ'],
@@ -86,7 +98,8 @@ def base_dfs():
             'PI_LOCAL_SITE_NAME': ['LOC0']
         })
         pidata_df = pd.DataFrame({
-            'time': [pd.Timestamp('2022-01-02 13:21:01'), pd.Timestamp('2022-03-08 13:21:01')],
+            'time': [pd.Timestamp('2022-01-02 13:21:01'),
+                     pd.Timestamp('2022-03-08 13:21:01')],
             'COD_ELEMENT': [0, 0],
             'val1': [9872.0, 559.0],
             'val2': [10.0, -7.0]
@@ -153,40 +166,47 @@ def setup_class(cls):
 
     def test_initialize_class(self):
         _ = Zephyr()
-        
 
     def test_generate_entityset(self):
         zephyr = Zephyr()
-        zephyr.generate_entityset(**self.__class__.kwargs["generate_entityset"])
+        zephyr.generate_entityset(
+            **self.__class__.kwargs["generate_entityset"])
         es = zephyr.get_entityset()
         assert es is not None
         assert es.id == 'pidata'
 
     def test_generate_label_times(self):
         zephyr = Zephyr()
-        zephyr.generate_entityset(**self.__class__.kwargs["generate_entityset"])
-        zephyr.generate_label_times(**self.__class__.kwargs["generate_label_times"])
+        zephyr.generate_entityset(
+            **self.__class__.kwargs["generate_entityset"])
+        zephyr.generate_label_times(
+            **self.__class__.kwargs["generate_label_times"])
         label_times = zephyr.get_label_times(visualize=False)
         assert label_times is not None
 
     def test_generate_feature_matrix_and_labels(self):
         zephyr = Zephyr()
-        zephyr.generate_entityset(**self.__class__.kwargs["generate_entityset"])
-        zephyr.generate_label_times(**self.__class__.kwargs["generate_label_times"])
+        zephyr.generate_entityset(
+            **self.__class__.kwargs["generate_entityset"])
+        zephyr.generate_label_times(
+            **self.__class__.kwargs["generate_label_times"])
         zephyr.generate_feature_matrix(
             **self.__class__.kwargs["generate_feature_matrix"])
-        feature_matrix, label_col_name, features= zephyr.get_feature_matrix()
+        feature_matrix, label_col_name, features = zephyr.get_feature_matrix()
         assert feature_matrix is not None
         assert label_col_name in feature_matrix.columns
         assert features is not None
 
     def test_generate_train_test_split(self):
         zephyr = Zephyr()
-        zephyr.generate_entityset(**self.__class__.kwargs["generate_entityset"])
-        zephyr.generate_label_times(**self.__class__.kwargs["generate_label_times"])
+        zephyr.generate_entityset(
+            **self.__class__.kwargs["generate_entityset"])
+        zephyr.generate_label_times(
+            **self.__class__.kwargs["generate_label_times"])
         zephyr.generate_feature_matrix(
             **self.__class__.kwargs["generate_feature_matrix"])
-        zephyr.generate_train_test_split(**self.__class__.kwargs["generate_train_test_split"])
+        zephyr.generate_train_test_split(
+            **self.__class__.kwargs["generate_train_test_split"])
         train_test_split = zephyr.get_train_test_split()
         assert train_test_split is not None
         X_train, X_test, y_train, y_test = train_test_split
@@ -217,7 +237,8 @@ def test_fit_pipeline_no_visual(self):
     def test_fit_pipeline_visual(self):
         zephyr = Zephyr()
         zephyr.set_train_test_split(*self.base_train_test_split())
-        output = zephyr.fit_pipeline(visual=True, **self.__class__.kwargs["fit_pipeline"])
+        output = zephyr.fit_pipeline(
+            visual=True, **self.__class__.kwargs["fit_pipeline"])
         assert isinstance(output, dict)
         assert list(output.keys()) == ['threshold', 'scores']
         pipeline = zephyr.get_fitted_pipeline()
 
@@ -170,8 +170,10 @@ def test_process_signals_pidata(pidata_es, transformations, aggregations):
         "fft.mean.mean_value": [9872, None, 559]
     })
     expected['COD_ELEMENT'] = expected['COD_ELEMENT'].astype('category')
-    expected['fft.mean.mean_value'] = expected['fft.mean.mean_value'].astype('float64')
-    processed['fft.mean.mean_value'] = processed['fft.mean.mean_value'].astype('float64')
+    expected['fft.mean.mean_value'] = expected['fft.mean.mean_value'].astype(
+        'float64')
+    processed['fft.mean.mean_value'] = processed['fft.mean.mean_value'].astype(
+        'float64')
 
     assert pidata_es['pidata_processed'].shape[0] == 3
     assert pidata_es['pidata_processed'].shape[1] == 4
@@ -202,8 +204,10 @@ def test_process_signals_pidata_replace(pidata_es, transformations, aggregations
         "fft.mean.mean_value": [9872, None, 559]
     })
     expected['COD_ELEMENT'] = expected['COD_ELEMENT'].astype('category')
-    expected['fft.mean.mean_value'] = expected['fft.mean.mean_value'].astype('float64')
-    processed['fft.mean.mean_value'] = processed['fft.mean.mean_value'].astype('float64')
+    expected['fft.mean.mean_value'] = expected['fft.mean.mean_value'].astype(
+        'float64')
+    processed['fft.mean.mean_value'] = processed['fft.mean.mean_value'].astype(
+        'float64')
 
     assert pidata_es['pidata'].shape[0] == 3
     assert pidata_es['pidata'].shape[1] == 4
@@ -233,7 +237,8 @@ def test_process_signals_scada(scada_es, transformations, aggregations):
         "fft.mean.mean_value": [1002, None, 56.8]
     })
     expected['COD_ELEMENT'] = expected['COD_ELEMENT'].astype('category')
-    expected['fft.mean.mean_value'] = expected['fft.mean.mean_value'].astype('float64')
+    expected['fft.mean.mean_value'] = expected['fft.mean.mean_value'].astype(
+        'float64')
     after = scada_es['scada'].copy()
 
     assert scada_es['scada_processed'].shape[0] == 3
@@ -263,7 +268,8 @@ def test_process_signals_scada_replace(scada_es, transformations, aggregations):
         "fft.mean.mean_value": [1002, None, 56.8]
     })
     expected['COD_ELEMENT'] = expected['COD_ELEMENT'].astype('category')
-    expected['fft.mean.mean_value'] = expected['fft.mean.mean_value'].astype('float64')
+    expected['fft.mean.mean_value'] = expected['fft.mean.mean_value'].astype(
+        'float64')
 
     assert scada_es['scada'].shape[0] == 3
     assert scada_es['scada'].shape[1] == 4
 
@@ -10,7 +10,8 @@ def test_default_scada_mapped_kwargs():
 
 
 def test_default_pidata_mapped_kwargs():
-    expected = {**DEFAULT_ES_KWARGS, 'pidata': DEFAULT_ES_TYPE_KWARGS['pidata']}
+    expected = {**DEFAULT_ES_KWARGS,
+                'pidata': DEFAULT_ES_TYPE_KWARGS['pidata']}
     actual = get_mapped_kwargs('pidata')
     assert expected == actual
 
 
@@ -9,16 +9,9 @@
 import os
 
 from zephyr_ml.core import Zephyr
-from zephyr_ml.entityset import (
-    # create_pidata_entityset,
-    # create_scada_entityset,
-    _create_entityset,
-    VALIDATE_DATA_FUNCTIONS,
-)
+from zephyr_ml.entityset import VALIDATE_DATA_FUNCTIONS, _create_entityset
 from zephyr_ml.labeling import DataLabeler
 
-MLBLOCKS_PRIMITIVES = os.path.join(os.path.dirname(__file__), "primitives", "jsons")
+MLBLOCKS_PRIMITIVES = os.path.join(
+    os.path.dirname(__file__), "primitives", "jsons")
 MLBLOCKS_PIPELINES = os.path.join(os.path.dirname(__file__), "pipelines")
-# import os, sys
-
-# sys.path.append(os.path.dirname(os.path.realpath(__file__)))