cedadev
diff --git a/‎extraction_methods/core/extraction_method.py‎
Lines changed: 3 additions & 0 deletions b/‎extraction_methods/core/extraction_method.py‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎extraction_methods/plugins/extraction_methods/__init__.py‎ renamed to ‎extraction_methods/plugins/__init__.py‎
Lines changed: 2 additions & 2 deletions b/‎extraction_methods/plugins/extraction_methods/__init__.py‎ renamed to ‎extraction_methods/plugins/__init__.py‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎extraction_methods/plugins/asset_aggregator.py‎
Lines changed: 145 additions & 0 deletions b/‎extraction_methods/plugins/asset_aggregator.py‎
Lines changed: 145 additions & 0 deletions
diff --git a/‎extraction_methods/plugins/extraction_methods/basename.py‎ renamed to ‎extraction_methods/plugins/basename.py‎
Lines changed: 2 additions & 2 deletions b/‎extraction_methods/plugins/extraction_methods/basename.py‎ renamed to ‎extraction_methods/plugins/basename.py‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎extraction_methods/plugins/extraction_methods/bbox.py‎ renamed to ‎extraction_methods/plugins/bbox.py‎
Lines changed: 15 additions & 7 deletions b/‎extraction_methods/plugins/extraction_methods/bbox.py‎ renamed to ‎extraction_methods/plugins/bbox.py‎
Lines changed: 15 additions & 7 deletions
diff --git a/‎extraction_methods/plugins/extraction_methods/boto_stats.py‎ renamed to ‎extraction_methods/plugins/boto_stats.py‎
Lines changed: 3 additions & 3 deletions b/‎extraction_methods/plugins/extraction_methods/boto_stats.py‎ renamed to ‎extraction_methods/plugins/boto_stats.py‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎extraction_methods/plugins/extraction_methods/categories.py‎ renamed to ‎extraction_methods/plugins/categories.py‎
Lines changed: 2 additions & 2 deletions b/‎extraction_methods/plugins/extraction_methods/categories.py‎ renamed to ‎extraction_methods/plugins/categories.py‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎extraction_methods/plugins/extraction_methods/ceda_observation.py‎ renamed to ‎extraction_methods/plugins/ceda_observation.py‎
Lines changed: 2 additions & 2 deletions b/‎extraction_methods/plugins/extraction_methods/ceda_observation.py‎ renamed to ‎extraction_methods/plugins/ceda_observation.py‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎extraction_methods/plugins/extraction_methods/ceda_vocabulary.py‎ renamed to ‎extraction_methods/plugins/ceda_vocabulary.py‎
Lines changed: 2 additions & 2 deletions b/‎extraction_methods/plugins/extraction_methods/ceda_vocabulary.py‎ renamed to ‎extraction_methods/plugins/ceda_vocabulary.py‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎extraction_methods/plugins/extraction_methods/controlled_vocabulary.py‎ renamed to ‎extraction_methods/plugins/controlled_vocabulary.py‎ b/‎extraction_methods/plugins/extraction_methods/controlled_vocabulary.py‎ renamed to ‎extraction_methods/plugins/controlled_vocabulary.py‎
@@ -29,6 +29,9 @@ def __init__(self, **kwargs):
         # Override with specific processor settings
         self._set_attrs(kwargs)
 
+        if not hasattr(self, "exists_key"):
+            self.exists_key = "$"
+
     def _set_attrs(self, conf: dict) -> None:
         """
         Set instance attributes
 
@@ -1,8 +1,8 @@
 # encoding: utf-8
 """
 """
-__author__ = "Rhys Evans"
+__author__ = "Richard Smith"
 __date__ = "27 May 2021"
 __copyright__ = "Copyright 2018 United Kingdom Research and Innovation"
 __license__ = "BSD - see LICENSE file in top-level package directory"
-__contact__ = "rhys.r.evans@stfc.ac.uk"
+__contact__ = "richard.d.smith@stfc.ac.uk"
@@ -0,0 +1,145 @@
+# encoding: utf-8
+"""
+..  _asset-aggregator:
+
+Asset Aggregator
+----------------
+"""
+__author__ = "Rhys Evans"
+__date__ = "24 May 2022"
+__copyright__ = "Copyright 2018 United Kingdom Research and Innovation"
+__license__ = "BSD - see LICENSE file in top-level package directory"
+__contact__ = "rhys.r.evans@stfc.ac.uk"
+
+import logging
+
+# Third party imports
+from elasticsearch import Elasticsearch
+
+from extraction_methods.core.extraction_method import ExtractionMethod
+
+LOGGER = logging.getLogger(__name__)
+
+
+class AssetAggregatorExtract(ExtractionMethod):
+    """
+    Description:
+        Summarise values held by the assets in ``body["assets"]`` and write
+        the summaries onto the body itself.
+
+    Configuration Options:
+        Every option is a list of terms. Each term is a mapping with a
+        ``name`` (the key written to the body) and an optional ``key``
+        (the key read from each asset; defaults to ``name``).
+
+        - ``list_terms``: terms whose asset values are collected into a list.
+        - ``sum_terms``: terms whose asset values are added together.
+        - ``avg_terms``: terms whose asset values are added together and
+          divided by the total number of assets.
+        - ``min_terms``: terms for which the smallest asset value is kept.
+        - ``max_terms``: terms for which the largest asset value is kept.
+
+    Configuration Example:
+
+        .. code-block:: yaml
+
+                inputs:
+                    list_terms:
+                      - name: formats
+                        key: format
+                    sum_terms:
+                      - name: size
+                    avg_terms:
+                      - name: mean_size
+                        key: size
+                    min_terms:
+                      - name: start_time
+                    max_terms:
+                      - name: end_time
+    """
+
+    # Attributes holding the configured term lists, one per aggregation.
+    _TERM_ATTRIBUTES = (
+        "list_terms",
+        "sum_terms",
+        "avg_terms",
+        "min_terms",
+        "max_terms",
+    )
+
+    def __init__(self, **kwargs):
+        """
+        Initialise the method, defaulting every unset term list to ``[]``.
+
+        :param kwargs: passed unchanged to ``ExtractionMethod.__init__``
+            (presumably turned into instance attributes there; confirm
+            against the base class).
+        """
+        super().__init__(**kwargs)
+
+        for attribute in self._TERM_ATTRIBUTES:
+            if not hasattr(self, attribute):
+                setattr(self, attribute, [])
+
+    @staticmethod
+    def _term_values(assets: list, term: dict) -> list:
+        """
+        Return the value of ``term`` from every asset that carries it.
+
+        :param assets: asset mappings to read from
+        :param term: mapping with ``name`` and, optionally, ``key``
+        :return: values in asset order; assets without the key are skipped
+        """
+        # Terms are plain dicts, so the optional key has to be looked up as
+        # an item. hasattr() never sees dict items.
+        key = term.get("key", term["name"])
+        return [asset[key] for asset in assets if key in asset]
+
+    def run(self, body: dict, **kwargs) -> dict:
+        """
+        Aggregate the configured terms over ``body["assets"]``.
+
+        List and sum terms are always written (``[]`` and ``0`` when no
+        asset has the key). Average terms are written as ``0`` when there
+        are no assets. Min and max terms are only written when at least one
+        asset has the key.
+
+        :param body: mapping with an ``assets`` mapping of asset mappings
+        :param kwargs: unused
+        :return: the same ``body`` object, updated in place
+        :raises KeyError: if ``body`` has no ``assets`` entry or a term has
+            no ``name``
+        """
+        # Dict views cannot be indexed, so materialise the assets once.
+        assets = list(body["assets"].values())
+
+        for term in self.list_terms:
+            body[term["name"]] = self._term_values(assets, term)
+
+        for term in self.sum_terms:
+            body[term["name"]] = sum(self._term_values(assets, term))
+
+        for term in self.avg_terms:
+            # Totalled locally so the configured sum_terms are not modified
+            # between calls. The divisor counts every asset, including those
+            # without the key, and is applied exactly once.
+            total = sum(self._term_values(assets, term))
+            body[term["name"]] = total / len(assets) if assets else 0
+
+        for term in self.min_terms:
+            values = self._term_values(assets, term)
+            if values:
+                body[term["name"]] = min(values)
+
+        for term in self.max_terms:
+            values = self._term_values(assets, term)
+            if values:
+                body[term["name"]] = max(values)
+
+        return body
@@ -1,9 +1,9 @@
 # encoding: utf-8
-__author__ = "Rhys Evans"
+__author__ = "Richard Smith"
 __date__ = "11 Jun 2021"
 __copyright__ = "Copyright 2018 United Kingdom Research and Innovation"
 __license__ = "BSD - see LICENSE file in top-level package directory"
-__contact__ = "rhys.r.evans@stfc.ac.uk"
+__contact__ = "richard.d.smith@stfc.ac.uk"
 
 import logging
 import os
 
@@ -1,8 +1,8 @@
-__author__ = "Rhys Evans"
+__author__ = "Richard Smith"
 __date__ = "28 May 2021"
 __copyright__ = "Copyright 2018 United Kingdom Research and Innovation"
 __license__ = "BSD - see LICENSE file in top-level package directory"
-__contact__ = "rhys.r.evans@stfc.ac.uk"
+__contact__ = "richard.d.smith@stfc.ac.uk"
 
 
 import logging
@@ -31,7 +31,7 @@ class BboxExtract(ExtractionMethod):
 
         - method: bbox
             inputs:
-            coordinate_keys:
+              coordinate_keys:
                 - west
                 - south
                 - east
@@ -41,14 +41,19 @@ class BboxExtract(ExtractionMethod):
 
     def run(self, body: dict, **kwargs):
         try:
+            west = body[self.coordinate_keys[0]]
+            south = body[self.coordinate_keys[1]]
+            east = body[self.coordinate_keys[2]]
+            north = body[self.coordinate_keys[3]]
+
             coordinates = [
                 [
-                    float(body[self.coordinate_keys[0]]),
-                    float(body[self.coordinate_keys[1]]),
+                    float(west) if west is not None else west,
+                    float(south) if south is not None else south,
                 ],
                 [
-                    float(body[self.coordinate_keys[2]]),
-                    float(body[self.coordinate_keys[3]]),
+                    float(east) if east is not None else east,
+                    float(north) if north is not None else north,
                 ],
             ]
 
@@ -57,6 +62,9 @@ def run(self, body: dict, **kwargs):
                 "coordinates": coordinates,
             }
 
+        except TypeError:
+            LOGGER.warning("Unable to convert bbox.", exc_info=True)
+
         except KeyError:
             LOGGER.warning("Unable to convert bbox.", exc_info=True)
 
 
@@ -5,11 +5,11 @@
 Regex
 ------
 """
-__author__ = "Rhys Evans"
+__author__ = "Richard Smith"
 __date__ = "27 May 2021"
 __copyright__ = "Copyright 2018 United Kingdom Research and Innovation"
 __license__ = "BSD - see LICENSE file in top-level package directory"
-__contact__ = "rhys.r.evans@stfc.ac.uk"
+__contact__ = "richard.d.smith@stfc.ac.uk"
 
 
 import logging
@@ -24,9 +24,9 @@
 from boto3.session import Session as BotoSession
 from botocore import UNSIGNED
 from botocore.config import Config
-from stac_generator.core.utils import Stats
 
 from extraction_methods.core.extraction_method import ExtractionMethod
+from extraction_methods.core.utils import Stats
 
 LOGGER = logging.getLogger(__name__)
 
 
@@ -5,11 +5,11 @@
 Regex
 ------
 """
-__author__ = "Rhys Evans"
+__author__ = "Richard Smith"
 __date__ = "27 May 2021"
 __copyright__ = "Copyright 2018 United Kingdom Research and Innovation"
 __license__ = "BSD - see LICENSE file in top-level package directory"
-__contact__ = "rhys.r.evans@stfc.ac.uk"
+__contact__ = "richard.d.smith@stfc.ac.uk"
 
 
 # Python imports
 
@@ -1,9 +1,9 @@
 # encoding: utf-8
-__author__ = "Rhys Evans"
+__author__ = "Richard Smith"
 __date__ = "11 Jun 2021"
 __copyright__ = "Copyright 2018 United Kingdom Research and Innovation"
 __license__ = "BSD - see LICENSE file in top-level package directory"
-__contact__ = "rhys.r.evans@stfc.ac.uk"
+__contact__ = "richard.d.smith@stfc.ac.uk"
 
 import logging
 from string import Template
 
@@ -5,11 +5,11 @@
 Regex
 ------
 """
-__author__ = "Rhys Evans"
+__author__ = "Richard Smith"
 __date__ = "27 May 2021"
 __copyright__ = "Copyright 2018 United Kingdom Research and Innovation"
 __license__ = "BSD - see LICENSE file in top-level package directory"
-__contact__ = "rhys.r.evans@stfc.ac.uk"
+__contact__ = "richard.d.smith@stfc.ac.uk"
 
 
 # Python imports