snipsco
diff --git a/.travis.yml
Lines changed: 4 additions & 6 deletions b/.travis.yml
Lines changed: 4 additions & 6 deletions
diff --git a/CHANGELOG.md
Lines changed: 5 additions & 0 deletions b/CHANGELOG.md
Lines changed: 5 additions & 0 deletions
diff --git a/MANIFEST.in
Lines changed: 2 additions & 1 deletion b/MANIFEST.in
Lines changed: 2 additions & 1 deletion
diff --git a/README.rst
Lines changed: 1 addition & 3 deletions b/README.rst
Lines changed: 1 addition & 3 deletions
diff --git a/setup.py
Lines changed: 3 additions & 1 deletion b/setup.py
Lines changed: 3 additions & 1 deletion
diff --git a/snips_nlu_metrics/__version__
Lines changed: 1 addition & 1 deletion b/snips_nlu_metrics/__version__
Lines changed: 1 addition & 1 deletion
diff --git a/snips_nlu_metrics/metrics.py
Lines changed: 22 additions & 14 deletions b/snips_nlu_metrics/metrics.py
Lines changed: 22 additions & 14 deletions
diff --git a/snips_nlu_metrics/tests/mock_engine.py
Lines changed: 22 additions & 2 deletions b/snips_nlu_metrics/tests/mock_engine.py
Lines changed: 22 additions & 2 deletions
@@ -4,15 +4,13 @@ matrix:
   include:
     - python: 2.7
       env: TOXENV=py27
-    - python: 3.4
-      env: TOXENV=py34
     - python: 3.5
       env: TOXENV=py35
     - python: 3.6
       env: TOXENV=py36
+    - python: 3.7
+      env: TOXENV=py37
 
-install:
-  - pip install --upgrade --pre tox
+install: pip install --upgrade --pre tox
 
-script:
-  - tox
+script: tox
@@ -1,6 +1,10 @@
 # Changelog
 All notable changes to this project will be documented in this file.
 
+## [0.14.3] - 2019-05-10
+### Added
+- Add optional parameter `intents_filter` to metrics APIs [#115](https://github.com/snipsco/snips-nlu-metrics/pull/115)
+
 ## [0.14.2] - 2019-03-21
 ### Added
 - Number of exact parsings
@@ -44,6 +48,7 @@ All notable changes to this project will be documented in this file.
 - Samples
 
 
+[0.14.3]: https://github.com/snipsco/snips-nlu-metrics/compare/0.14.2...0.14.3
 [0.14.2]: https://github.com/snipsco/snips-nlu-metrics/compare/0.14.1...0.14.2
 [0.14.1]: https://github.com/snipsco/snips-nlu-metrics/compare/0.14.0...0.14.1
 [0.14.0]: https://github.com/snipsco/snips-nlu-metrics/compare/0.13.0...0.14.0
 
@@ -1,3 +1,4 @@
+recursive-include samples *
 include snips_nlu_metrics/__version__
-include README.rst LICENSE
+include README.rst LICENSE CHANGELOG.md
 global-exclude __pycache__ *.py[cod]
@@ -94,11 +94,9 @@ API as follows:
 
 .. code-block:: python
 
-    from snips_nlu import load_resources, SnipsNLUEngine
+    from snips_nlu import SnipsNLUEngine
     from snips_nlu_metrics import compute_train_test_metrics, compute_cross_val_metrics
 
-    load_resources("en")
-
     tt_metrics = compute_train_test_metrics(train_dataset="samples/train_dataset.json",
                                             test_dataset="samples/test_dataset.json",
                                             engine_class=SnipsNLUEngine)
 
@@ -38,14 +38,16 @@
       author="Adrien Ball",
       author_email="adrien.ball@snips.ai",
       license="Apache 2.0",
+      url="https://github.com/snipsco/snips-nlu-metrics",
       classifiers=[
           "Programming Language :: Python :: 2",
           "Programming Language :: Python :: 2.7",
           "Programming Language :: Python :: 3",
-          "Programming Language :: Python :: 3.4",
           "Programming Language :: Python :: 3.5",
           "Programming Language :: Python :: 3.6",
+          "Programming Language :: Python :: 3.7",
       ],
+      keywords="metrics nlu nlp intent slots entity parsing",
       extras_require=extras_require,
       install_requires=install_requires,
       packages=packages,
 
@@ -1 +1 @@
-0.14.2
+0.14.3
@@ -3,7 +3,6 @@
 import io
 import json
 import logging
-from builtins import map
 
 from future.utils import iteritems
 from joblib import Parallel, delayed
@@ -25,20 +24,20 @@ def compute_cross_val_metrics(
         dataset, engine_class, nb_folds=5, train_size_ratio=1.0,
         drop_entities=False, include_slot_metrics=True,
         slot_matching_lambda=None, progression_handler=None, num_workers=1,
-        seed=None, out_of_domain_utterances=None):
+        seed=None, out_of_domain_utterances=None, intents_filter=None):
     """Compute end-to-end metrics on the dataset using cross validation
 
     Args:
-        dataset (dict or str): Dataset or path to dataset
-        engine_class: Python class to use for training and inference, this
+        dataset (dict or str): dataset or path to dataset
+        engine_class: python class to use for training and inference, this
             class must inherit from `Engine`
-        nb_folds (int, optional): Number of folds to use for cross validation
+        nb_folds (int, optional): number of folds to use for cross validation
             (default=5)
         train_size_ratio (float, optional): ratio of intent utterances to use
             for training (default=1.0)
-        drop_entities (bool, optional): Specify whether or not all entity
+        drop_entities (bool, optional): specify whether or not all entity
             values should be removed from training data (default=False)
-        include_slot_metrics (bool, optional): If false, the slots metrics and
+        include_slot_metrics (bool, optional): if false, the slots metrics and
             the slots parsing errors will not be reported (default=True)
         slot_matching_lambda (lambda, optional):
             lambda expected_slot, actual_slot -> bool,
@@ -52,9 +51,13 @@ class must inherit from `Engine`
         num_workers (int, optional): number of workers to use. Each worker
             is assigned a certain number of splits (default=1)
         seed (int, optional): seed for the split creation
-        out_of_domain_utterances (list, optional): If defined, list of 
-            out-of-domain utterances to be added to the pool of test utterances 
+        out_of_domain_utterances (list, optional): if defined, list of
+            out-of-domain utterances to be added to the pool of test utterances
             in each split
+        intents_filter (list of str, optional): if defined, at inference time
+            test utterances will be restricted to the ones belonging to this
+            filter. Moreover, if the parsing API allows it, the inference will
+            be made using this intents filter.
 
     Returns:
         dict: Metrics results containing the following data
@@ -72,7 +75,7 @@ class must inherit from `Engine`
     try:
         splits = create_shuffle_stratified_splits(
             dataset, nb_folds, train_size_ratio, drop_entities,
-            seed, out_of_domain_utterances)
+            seed, out_of_domain_utterances, intents_filter)
     except NotEnoughDataError as e:
         logger.warning("Skipping metrics computation because of: %s"
                        % e.message)
@@ -93,14 +96,14 @@ def compute_metrics(split_):
         logger.info("Computing metrics for dataset split ...")
         return compute_split_metrics(
             engine_class, split_, intent_list, include_slot_metrics,
-            slot_matching_lambda)
+            slot_matching_lambda, intents_filter)
 
     effective_num_workers = min(num_workers, len(splits))
     if effective_num_workers > 1:
         parallel = Parallel(n_jobs=effective_num_workers)
         results = parallel(delayed(compute_metrics)(split) for split in splits)
     else:
-        results = map(compute_metrics, splits)
+        results = [compute_metrics(s) for s in splits]
 
     for result in enumerate(results):
         split_index, (split_metrics, errors, confusion_matrix) = result
@@ -137,7 +140,7 @@ def compute_metrics(split_):
 
 def compute_train_test_metrics(
         train_dataset, test_dataset, engine_class, include_slot_metrics=True,
-        slot_matching_lambda=None):
+        slot_matching_lambda=None, intents_filter=None):
     """Compute end-to-end metrics on `test_dataset` after having trained on
     `train_dataset`
 
@@ -155,6 +158,10 @@ class must inherit from `Engine`
             metrics, otherwise exact match will be used.
             `expected_slot` corresponds to the slot as defined in the dataset,
             and `actual_slot` corresponds to the slot as returned by the NLU
+        intents_filter (list of str, optional): if defined, at inference time
+            test utterances will be restricted to the ones belonging to this
+            filter. Moreover, if the parsing API allows it, the inference will
+            be made using this intents filter.
 
     Returns
         dict: Metrics results containing the following data
@@ -184,12 +191,13 @@ class must inherit from `Engine`
         (intent_name, utterance)
         for intent_name, intent_data in iteritems(test_dataset[INTENTS])
         for utterance in intent_data[UTTERANCES]
+        if intents_filter is None or intent_name in intents_filter
     ]
 
     logger.info("Computing metrics...")
     metrics, errors, confusion_matrix = compute_engine_metrics(
         engine, test_utterances, intent_list, include_slot_metrics,
-        slot_matching_lambda)
+        slot_matching_lambda, intents_filter)
     metrics = compute_precision_recall_f1(metrics)
     average_metrics = compute_average_metrics(metrics)
     nb_utterances = {intent: len(data[UTTERANCES])
 
@@ -3,11 +3,11 @@
 from snips_nlu_metrics import Engine
 
 
-def dummy_parsing_result(text):
+def dummy_parsing_result(text, intent_name=None):
     return {
         "input": text,
         "intent": {
-            "intentName": None,
+            "intentName": intent_name,
             "probability": 0.5
         },
         "slots": []
@@ -25,6 +25,26 @@ def parse(self, text):
         return dummy_parsing_result(text)
 
 
+class KeyWordMatchingEngine(Engine):  # test engine: intent by keyword match
+    def __init__(self):
+        self.fitted = False  # set to True by fit()
+        self.intents_list = []  # filled by fit()
+
+    def fit(self, dataset):
+        self.fitted = True
+        self.intents_list = sorted(dataset["intents"])  # presumably names
+
+    def parse(self, text, intents_filter=None):
+        intent = None  # stays None when no known intent name is in text
+        for intent_name in self.intents_list:
+            if intent_name in text:  # plain substring match
+                intent = intent_name
+                break  # first match in sorted order wins
+        if intents_filter is not None and intent not in intents_filter:
+            intent = None  # match rejected by the filter; no other is tried
+        return dummy_parsing_result(text, intent)
+
+
 class MockEngineSegfault(Engine):
     def __init__(self):
         self.fitted = False