EES-TUe
diff --git a/‎.github/pypi-publish.yml‎
Lines changed: 95 additions & 0 deletions b/‎.github/pypi-publish.yml‎
Lines changed: 95 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 18 additions & 3 deletions b/‎README.md‎
Lines changed: 18 additions & 3 deletions
diff --git a/‎pyproject.toml‎
Lines changed: 9 additions & 5 deletions b/‎pyproject.toml‎
Lines changed: 9 additions & 5 deletions
diff --git a/‎src/electricity_network_file_parser/FileParser.py‎
Lines changed: 141 additions & 0 deletions b/‎src/electricity_network_file_parser/FileParser.py‎
Lines changed: 141 additions & 0 deletions
diff --git a/‎src/electricity_network_file_parser/GnfParser.py‎
Lines changed: 47 additions & 0 deletions b/‎src/electricity_network_file_parser/GnfParser.py‎
Lines changed: 47 additions & 0 deletions
diff --git a/‎…ckage_YOUR_PACKAGE_NAME_HERE/__init__.py‎ ‎…ctricity_network_file_parser/__init__.py‎src/example_package_YOUR_PACKAGE_NAME_HERE/__init__.py renamed to src/electricity_network_file_parser/__init__.py b/‎…ckage_YOUR_PACKAGE_NAME_HERE/__init__.py‎ ‎…ctricity_network_file_parser/__init__.py‎src/example_package_YOUR_PACKAGE_NAME_HERE/__init__.py renamed to src/electricity_network_file_parser/__init__.py
diff --git a/‎src/electricity_network_file_parser/dataclasses.py‎
Lines changed: 6 additions & 0 deletions b/‎src/electricity_network_file_parser/dataclasses.py‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎src/example_package_YOUR_PACKAGE_NAME_HERE/example_package_YOUR_PACKAGE_NAME_HERE.py‎
Lines changed: 0 additions & 3 deletions b/‎src/example_package_YOUR_PACKAGE_NAME_HERE/example_package_YOUR_PACKAGE_NAME_HERE.py‎
Lines changed: 0 additions & 3 deletions
diff --git a/‎src/main.py‎
Lines changed: 0 additions & 8 deletions b/‎src/main.py‎
Lines changed: 0 additions & 8 deletions
@@ -0,0 +1,95 @@
+name: Publish Python 🐍 distribution 📦 to PyPI
+
+on: push
+
+jobs:
+  build:
+    name: Build distribution 📦
+    runs-on: ubuntu-latest
+
+    steps:
+    - uses: actions/checkout@v4
+      with:
+        persist-credentials: false
+    - name: Set up Python
+      uses: actions/setup-python@v5
+      with:
+        python-version: "3.x"
+    - name: Install pypa/build
+      run: >-
+        python3 -m
+        pip install
+        build
+        --user
+    - name: Build a binary wheel and a source tarball
+      run: python3 -m build
+    - name: Store the distribution packages
+      uses: actions/upload-artifact@v4
+      with:
+        name: python-package-distributions
+        path: dist/
+
+  publish-to-pypi:
+    name: >-
+      Publish Python 🐍 distribution 📦 to PyPI
+    if: startsWith(github.ref, 'refs/tags/')  # only publish to PyPI on tag pushes
+    needs:
+    - build
+    runs-on: ubuntu-latest
+    environment:
+      name: pypi
+      url: https://pypi.org/project/electricity-network-file-parser/  # PyPI project page of this package
+    permissions:
+      id-token: write  # IMPORTANT: mandatory for trusted publishing
+
+    steps:
+    - name: Download all the dists
+      uses: actions/download-artifact@v4
+      with:
+        name: python-package-distributions
+        path: dist/
+    - name: Publish distribution 📦 to PyPI
+      uses: pypa/gh-action-pypi-publish@release/v1
+
+  github-release:
+    name: >-
+      Sign the Python 🐍 distribution 📦 with Sigstore
+      and upload them to GitHub Release
+    needs:
+    - publish-to-pypi
+    runs-on: ubuntu-latest
+
+    permissions:
+      contents: write  # IMPORTANT: mandatory for making GitHub Releases
+      id-token: write  # IMPORTANT: mandatory for sigstore
+
+    steps:
+    - name: Download all the dists
+      uses: actions/download-artifact@v4
+      with:
+        name: python-package-distributions
+        path: dist/
+    - name: Sign the dists with Sigstore
+      uses: sigstore/gh-action-sigstore-python@v3.0.0
+      with:
+        inputs: >-
+          ./dist/*.tar.gz
+          ./dist/*.whl
+    - name: Create GitHub Release
+      env:
+        GITHUB_TOKEN: ${{ github.token }}
+      run: >-
+        gh release create
+        "$GITHUB_REF_NAME"
+        --repo "$GITHUB_REPOSITORY"
+        --notes ""
+    - name: Upload artifact signatures to GitHub Release
+      env:
+        GITHUB_TOKEN: ${{ github.token }}
+      # Upload to GitHub Release using the `gh` CLI.
+      # `dist/` contains the built packages, and the
+      # sigstore-produced signatures and certificates.
+      run: >-
+        gh release upload
+        "$GITHUB_REF_NAME" dist/**
+        --repo "$GITHUB_REPOSITORY"
@@ -1,8 +1,23 @@
-# Python-project-template
-A template repository for new python projects
+# Network file parser
+A Python package for parsing gaia files. It takes a gaia file as input and parses its data into pandas data frames.
+
+Example usage:
+
+```python
+from electricity_network_file_parser.GnfParser import GnfParser
+
+gnf_parser = GnfParser("test.gnf")
+gnf_parser.parse_file()
+
+# To access the data frame of a single entity type
+gnf_parser.data_frames["CABLE"]
+
+# Write all data to a single Excel file; each sheet in the file represents an entity type from the gaia file
+gnf_parser.write_all_data_frames()
+```
 
 ## Installation
 
 Create a new python environment and run the following command:
 
-`pip install -e . `
+`pip install electricity_network_file_parser`
@@ -3,20 +3,24 @@ requires = ["hatchling"]
 build-backend = "hatchling.build"
 
 [project]
-name = "example_package_YOUR_PACKAGE_NAME_HERE"
+name = "electricity_network_file_parser"
 version = "0.0.1"
 authors = [
-  { name="Example Author", email="author@example.com" },
+  { name="Leo van Schooten", email="l.g.t.v.schooten@tue.nl" },
 ]
-description = "A small example package"
+description = "A Python package for parsing gaia and vision files."
 readme = "README.md"
 requires-python = ">=3.8"
 classifiers = [
     "Programming Language :: Python :: 3",
     "License :: OSI Approved :: MIT License",
     "Operating System :: OS Independent",
 ]
+dependencies = [
+  'pandas==2.2.3',
+  'openpyxl==3.1.5'
+]
 
 [project.urls]
-Homepage = "https://github.com/pypa/sampleproject"
-Issues = "https://github.com/pypa/sampleproject/issues"
+Homepage = "https://github.com/EES-TUe/network-file-parser"
+Issues = "https://github.com/EES-TUe/network-file-parser/issues"
@@ -0,0 +1,141 @@
+from typing import List
+import pandas as pd
+
+from pathlib import Path
+
+from electricity_network_file_parser.dataclasses import PropertyDescription
+
+class FileParser:
+    """Base parser that splits a file into entity sections and turns them into data frames.
+
+    On construction the file is read and indexed by entity name
+    (``entity_dict``). Subclasses fill ``parse_entities_dict`` with a mapping of
+    entity name to the property types that should be read for that entity;
+    ``parse_file`` then stores one data frame per entity in ``data_frames``.
+    """
+
+    def __init__(self, file_path, encoding=None):
+        """Read ``file_path`` and index its entity sections.
+
+        Args:
+            file_path: Path of the file to parse.
+            encoding: Text encoding handed to ``open``. ``None`` (the default)
+                keeps the platform default encoding.
+        """
+        self.file_path = Path(file_path)
+        self.data_frames: dict[str, pd.DataFrame] = {}
+
+        with open(self.file_path, mode='r', encoding=encoding) as file:
+            lines = file.readlines()
+
+        self.entity_dict = self.create_entity_dict(lines)
+        self.parse_entities_dict = {}
+
+    def is_integer(self, s: str):
+        """Return True when ``s`` is an optionally signed run of decimal digits."""
+        unsigned = s[1:] if s.startswith(('-', '+')) else s
+        # isdecimal() instead of isdigit(): isdigit() also accepts characters
+        # such as superscript digits, which int() cannot convert.
+        return unsigned.isdecimal()
+
+    def parse_value(self, value):
+        """Convert a raw attribute token into a bool, int, str or float.
+
+        ``'True'``/``'False'`` become booleans, signed digit runs become ints,
+        single-quoted tokens become strings without the quotes, and anything
+        else is read as a float in which ``,`` is accepted as decimal separator.
+
+        Raises:
+            ValueError: If the token matches none of the above.
+        """
+        if value == 'True':
+            return True
+        if value == 'False':
+            return False
+        if self.is_integer(value):
+            return int(value)
+        if value.startswith("'") and value.endswith("'"):
+            return value[1:-1]
+        return float(value.replace(",", "."))
+
+    def extend_dictionary(self, dict_to_extend: dict, dict_extension: dict):
+        """Copy every item of ``dict_extension`` into ``dict_to_extend`` in place."""
+        dict_to_extend.update(dict_extension)
+
+    def parse_property_line(self, property_line: str):
+        """Parse one property line into a ``PropertyDescription``.
+
+        The first character of the line is skipped, the text up to the first
+        space is the property type, and the remainder is read as
+        ``name:value`` pairs separated by spaces. Spaces inside single-quoted
+        values do not end the value.
+
+        Args:
+            property_line: The line to parse, without surrounding whitespace.
+
+        Returns:
+            A ``PropertyDescription`` holding the property type and a dict of
+            parsed attribute values. A line without attributes yields an empty
+            dict.
+        """
+        head, _, property_attributes = property_line.partition(" ")
+        property_name = head[1:]
+        col_name = ''
+        value = ''
+        reading_value = False
+        reading_string = False
+        property_dict = {}
+        for char in property_attributes:
+            if not reading_value:
+                if char == ':':
+                    reading_value = True
+                else:
+                    col_name += char
+            elif char == ' ' and not reading_string and value != '':
+                # An unquoted space after a non-empty value ends the pair.
+                property_dict[col_name.strip()] = self.parse_value(value)
+                reading_value = False
+                value = ''
+                col_name = ''
+            else:
+                if char == "'":
+                    reading_string = not reading_string
+                value += char
+
+        # Store the last pair; skip it when only trailing whitespace is left,
+        # otherwise an empty name/value would make parse_value raise.
+        if col_name.strip() or value:
+            property_dict[col_name.strip()] = self.parse_value(value)
+        return PropertyDescription(property_name, property_dict)
+
+    def parse_entities(self, lines: List[str], property_attributes_to_parse: List[str]):
+        """Build a data frame with one row per entity found in ``lines``.
+
+        Attributes of all requested property types belonging to one entity are
+        merged into a single row. A row is closed when a second ``General``
+        property is seen or when as many property lines were read as there are
+        requested property types.
+
+        Args:
+            lines: The lines of one entity section.
+            property_attributes_to_parse: Property types to read; other lines
+                are ignored.
+
+        Returns:
+            A ``pd.DataFrame`` with one row per parsed entity.
+        """
+        parsed_property_types = []
+        data_instance = {}
+        data_instances = []
+        for line in lines:
+            line_stripped = line.strip()
+            property_name = ""
+            if " " in line_stripped:
+                property_name = line_stripped[1:line_stripped.index(" ")]
+            started_new_entity = property_name == "General" and property_name in parsed_property_types
+            all_property_types_parsed = len(parsed_property_types) == len(property_attributes_to_parse)
+            if started_new_entity or all_property_types_parsed:
+                if not all_property_types_parsed:
+                    print(f"Not all property types are present for entity {line_stripped}")
+                # Only keep rows that actually hold data; with an empty list of
+                # property types the completeness check is true on every line.
+                if data_instance:
+                    data_instances.append(data_instance)
+                data_instance = {}
+                parsed_property_types = []
+            if property_name in property_attributes_to_parse:
+                parsed_property = self.parse_property_line(line_stripped)
+                self.extend_dictionary(data_instance, parsed_property.property_attributes)
+                parsed_property_types.append(parsed_property.property_type)
+
+        if data_instance:
+            data_instances.append(data_instance)
+
+        return pd.DataFrame(data_instances)
+
+    def create_entity_dict(self, lines):
+        """Map each entity name to the lines of its section.
+
+        Lines that start with ``[`` and end with ``]`` are treated as markers:
+        the 1st, 3rd, ... marker opens a section and provides its name, the
+        2nd, 4th, ... marker closes it. A final section without a closing
+        marker is skipped.
+
+        Args:
+            lines: All lines of the file.
+
+        Returns:
+            Dict of entity name to the list of lines between its markers.
+        """
+        marker_indices = [
+            i for i, line in enumerate(lines)
+            if line.strip().startswith("[") and line.strip().endswith("]")
+        ]
+        entity_dict = {}
+        # zip() pairs opening with closing markers and drops an unpaired opener.
+        for start, end in zip(marker_indices[::2], marker_indices[1::2]):
+            entity_name = lines[start].strip()[1:-1]
+            entity_dict[entity_name] = lines[start + 1:end]
+        return entity_dict
+
+    def group_data_frame_by_columns(self, df: pd.DataFrame, columns_to_group_by: List[str]) -> pd.DataFrame:
+        """Count the rows of ``df`` per unique combination of the given columns.
+
+        Missing values in the grouping columns are replaced by ``-1`` in ``df``
+        itself (the caller's frame is modified), because ``groupby`` would
+        otherwise drop those rows.
+
+        Returns:
+            A data frame with the grouping columns plus a ``count`` column.
+        """
+        for col in columns_to_group_by:
+            df[col] = df[col].fillna(-1)
+        return df.groupby(columns_to_group_by).size().reset_index(name='count')
+
+    def get_records_containing_field_values(self, df: pd.DataFrame, fields: dict) -> pd.DataFrame:
+        """Return the rows of ``df`` whose columns equal the values in ``fields``.
+
+        Args:
+            df: Frame to filter.
+            fields: Mapping of column name to required value. An empty mapping
+                selects every row.
+        """
+        # A boolean mask instead of a generated query string, so string values
+        # and column names that are not valid identifiers work as well.
+        mask = pd.Series(True, index=df.index)
+        for key, value in fields.items():
+            mask = mask & (df[key] == value)
+        return df[mask]
+
+    def parse_cable_types(self, cables_df: pd.DataFrame) -> pd.DataFrame:
+        """Hook for subclasses to derive a cable type frame from the cable frame.
+
+        The base implementation derives nothing and returns ``None``.
+        """
+        return None
+
+    def parse_file(self):
+        """Parse every configured entity present in the file into ``data_frames``.
+
+        Results are appended to frames that already exist for an entity. When a
+        ``CABLE`` frame is available and ``parse_cable_types`` returns a frame,
+        it is stored under ``CABLETYPE``.
+        """
+        for key, property_types in self.parse_entities_dict.items():
+            if key not in self.entity_dict:
+                continue
+            parsed = self.parse_entities(self.entity_dict[key], property_types)
+            if key in self.data_frames:
+                self.data_frames[key] = pd.concat([self.data_frames[key], parsed])
+            else:
+                self.data_frames[key] = parsed
+        if "CABLE" in self.data_frames:
+            cable_types = self.parse_cable_types(self.data_frames["CABLE"])
+            # Do not store None: write_all_data_frames calls to_excel on every entry.
+            if cable_types is not None:
+                self.data_frames["CABLETYPE"] = cable_types
+
+    def write_all_data_frames(self, file_name: str = "data.xlsx"):
+        """Write every frame in ``data_frames`` to its own sheet of one Excel file.
+
+        Args:
+            file_name: Path of the Excel file to create.
+        """
+        with pd.ExcelWriter(file_name) as writer:
+            for name, dataframe in self.data_frames.items():
+                dataframe.to_excel(writer, sheet_name=name, index=False)
@@ -0,0 +1,47 @@
+import pandas as pd
+from electricity_network_file_parser.FileParser import FileParser
+
+class GnfParser(FileParser):
+    """``FileParser`` configured with the entities and property types to read."""
+
+    def __init__(self, file_path):
+        """Read ``file_path`` and register which property types to parse per entity."""
+        super().__init__(file_path)
+        self.parse_entities_dict = {
+            "PROFILE": ["General", "ProfileType"],
+            "GM TYPE": ["General"],
+            "NODE": ["General"],
+            "LINK": ["General"],
+            "CABLE": ["General", "CablePart", "CableType"],
+            "TRANSFORMER": ["General", "VoltageControl", "TransformerType"],
+            "SOURCE": ["General"],
+            "LOAD": ["General"],
+            "HOME": ["General", "ConnectionCableType", "FuseType"],
+            "MEASURE FIELD": ["General"],
+            "FUSE": ["General"],
+        }
+
+    @staticmethod
+    def _join_unique(values: pd.Series) -> str:
+        """Join the distinct non-missing entries of ``values`` with commas."""
+        # str() and dropna() keep the join from raising on numbers or NaN.
+        return ",".join(str(value) for value in values.dropna().unique())
+
+    def parse_cable_types(self, cables_df: pd.DataFrame) -> pd.DataFrame:
+        """Derive the unique cable types from the cable frame.
+
+        Cables are grouped by their parameter columns; every unique parameter
+        combination becomes one row. For each row the distinct ``CableType``
+        and ``ShortName`` values of the matching cables are collected.
+
+        Args:
+            cables_df: Frame of parsed cables. It must contain all grouping
+                columns as well as ``CableType`` and ``ShortName``. The
+                grouping helper replaces missing values in the grouping
+                columns of this frame with ``-1``.
+
+        Returns:
+            One row per unique parameter combination with its ``count`` and the
+            comma-separated ``Longnames`` and ``Shortnames``.
+        """
+        columns_to_group_by = ["Unom", "Price", "C", "C0",
+                               "Inom0", "G1", "Inom1", "G2",
+                               "Inom2", "G3", "Inom3", "Ik1s",
+                               "Tr", "TInom", "TIk1s", "Frequency",
+                               "R_c", "X_c", "R_cc_n", "X_cc_n", "R_cc_o",
+                               "X_cc_o", "R_e", "X_e", "R_ce", "X_ce", "Inom_e", "Ik1s_e",
+                               "R_h", "X_h", "R_ch_n", "X_ch_n", "R_ch_o",
+                               "X_ch_o", "R_hh_n", "X_hh_n", "R_hh_o", "X_hh_o", "R_he", "X_he",
+                               "Inom_h", "Ik1s_h"]
+
+        unique_cable_types = self.group_data_frame_by_columns(cables_df, columns_to_group_by)
+        long_names = []
+        short_names = []
+        for record in unique_cable_types.to_dict('records'):
+            # "count" is not a cable column, so it must not be used as a filter.
+            record.pop("count")
+            matching_cables = self.get_records_containing_field_values(cables_df, record)
+            long_names.append(self._join_unique(matching_cables["CableType"]))
+            short_names.append(self._join_unique(matching_cables["ShortName"]))
+
+        unique_cable_types["Longnames"] = long_names
+        unique_cable_types["Shortnames"] = short_names
+        return unique_cable_types
@@ -0,0 +1,6 @@
+from dataclasses import dataclass
+
+@dataclass
+class PropertyDescription:
+    """A parsed property line: its property type and its attribute values."""
+
+    # Property type name taken from the start of the line (for example "General").
+    property_type: str
+    # Attribute name -> parsed value for every name:value pair on the line.
+    property_attributes: dict