Complete Fibonacci example

mhkarsten · mhkarsten · commit f087f96e5202 · 2025-05-01T17:02:26.000+02:00
diff --git a/.gitignore b/.gitignore
@@ -22,3 +22,5 @@ python
 Session.vim
 Vagrantfile
 scratch.py
+
+__MACOSX/
diff --git a/examples/hello-world-fibonacci/README.md b/examples/hello-world-fibonacci/README.md
@@ -1,16 +1,23 @@
 
-# Hello World
+# Hello World Fibonacci
+
+A simple, platform-independent example that runs three different Fibonacci implementations
+and measures their energy consumption, runtime, and memory usage using [EnergiBridge](https://github.com/tdurieux/EnergiBridge).
+
+Note that admin permissions are needed to make use of EnergiBridge.
 
-A simple example that just prints on each event. This examples serves as an equivalent of a "Hello World" program.
 
 ## Running
 
 From the root directory of the repo, run the following command:
 
 ```bash
-python experiment-runner/ examples/hello-world/RunnerConfig.py
+python experiment-runner/ examples/hello-world-fibonacci/RunnerConfig.py
 ```
 
 ## Results
 
-The results are generated in the `examples/hello-world/experiments` folder.
+The results are generated in the `examples/hello-world-fibonacci/experiments` folder.
+
+**Warning:** the columns in the `energibridge.csv` files can differ across machines.
+Adjust the column names read in `RunnerConfig.py` (e.g. `TOTAL_MEMORY`) accordingly.
diff --git a/examples/hello-world-fibonacci/RunnerConfig.py b/examples/hello-world-fibonacci/RunnerConfig.py
@@ -55,11 +55,11 @@ def create_run_table_model(self) -> RunTableModel:
         """Create and return the run_table model here. A run_table is a List (rows) of tuples (columns),
         representing each run performed"""
         factor1 = FactorModel("fib_type", ['iter', 'mem', 'rec'])
-        factor2 = FactorModel("problem_size", [10, 100, 1000, 10000])
+        factor2 = FactorModel("problem_size", [10, 20, 30])
         self.run_table_model = RunTableModel(
             factors=[factor1, factor2],
             repetitions = 3,
-            data_columns=["total_power", "runtime", "avg_cpu", "avg_mem"]
+            data_columns=["total_power (J)", "runtime (sec)", "avg_mem (bytes)"]
         )
         return self.run_table_model
 
@@ -84,8 +84,10 @@ def start_measurement(self, context: RunnerContext) -> None:
         fib_type = context.run_variation["fib_type"]
         problem_size = context.run_variation["problem_size"]
 
-        self.profiler = EnergiBridge(target_program=f"./fibonacci_{fib_type}.py {problem_size}")
-        
+        EnergiBridge.source_name = "../EnergiBridge/target/release/energibridge"
+        self.profiler = EnergiBridge(target_program=f"python examples/hello-world-fibonacci/fibonacci_{fib_type}.py {problem_size}",
+                                     out_file=context.run_dir / "energibridge.csv")
+
         self.profiler.start()
 
     def interact(self, context: RunnerContext) -> None:
@@ -106,13 +108,12 @@ def populate_run_data(self, context: RunnerContext) -> Optional[Dict[str, Any]]:
         You can also store the raw measurement data under `context.run_dir`
         Returns a dictionary with keys `self.run_table_model.data_columns` and their values populated"""
         
-        eb_log = self.profiler.parse_log(context.run_dir / self.profiler.logfile)
-        eb_summary = self.profiler.parse_log(context.run_dir / self.profiler.summaryfile)
-
-        return {"total_power": 0, 
-                "runtime": 0, 
-                "avg_cpu": 0, 
-                "avg_mem": 0}
+        eb_log, eb_summary = self.profiler.parse_log(self.profiler.logfile, 
+                                                     self.profiler.summary_logfile)
+        
+        return {"total_power (J)": eb_summary["total_joules"], 
+                "runtime (sec)": eb_summary["runtime_seconds"], 
+                "total_mem (bytes)": list(eb_log["TOTAL_MEMORY"].values())[-1]}
 
     def after_experiment(self) -> None:
         """Perform any activity required after stopping the experiment here
diff --git a/examples/hello-world-fibonacci/fibonacci_iter.py b/examples/hello-world-fibonacci/fibonacci_iter.py
@@ -1,10 +1,11 @@
 # Implementation by Mandy Wong (https://realpython.com/fibonacci-sequence-python/)
+import sys
 
 def fib(n):
 	a, b = 0, 1
 	for i in range(0, n):
 		a, b = b, a + b
 	return a
 
-for n in range(10000):
-	print(fib(n))
+for n in range(int(sys.argv[1])):
+	print(fib(n))
diff --git a/examples/hello-world-fibonacci/fibonacci_mem.py b/examples/hello-world-fibonacci/fibonacci_mem.py
@@ -1,4 +1,5 @@
 # Implementation by Mandy Wong (https://realpython.com/fibonacci-sequence-python/)
+import sys
 
 cache = {0: 0, 1: 1}
 
@@ -9,5 +10,5 @@ def fib(n):
 	cache[n] = fib(n - 1) + fib(n - 2)  # Recursive case
 	return cache[n]
 
-for n in range(10000):
-	print(fib(n))
+for n in range(int(sys.argv[1])):
+	print(fib(n))
diff --git a/examples/hello-world-fibonacci/fibonacci_rec.py b/examples/hello-world-fibonacci/fibonacci_rec.py
@@ -1,9 +1,10 @@
 # Implementation by Mandy Wong (https://realpython.com/fibonacci-sequence-python/)
+import sys
 
 def fib(n):
 	if n in {0, 1}:  # Base case
 		return n
 	return fib(n - 1) + fib(n - 2)  # Recursive case
 
-for n in range(10000):
-	print(fib(n))
+for n in range(int(sys.argv[1])):
+	print(fib(n))
diff --git a/experiment-runner/ConfigValidator/Config/Validation/ConfigValidator.py b/experiment-runner/ConfigValidator/Config/Validation/ConfigValidator.py
@@ -24,28 +24,28 @@ def __check_expression(name, value, expected, expression):
     
     # Verifies that an energybridge executable is present, and can be executed without error
     @staticmethod
-    def __validate_energibridge(measure_enabled, eb_path, eb_logfile):
+    def __validate_energibridge(config):
         # Do nothing if its not enabled
-        if not measure_enabled:
+        if not config.self_measure:
             return
 
         if  not platform.system() == "Linux"    \
-            or not os.path.exists(eb_path)      \
-            or not os.access(eb_path, os.X_OK):
+            or not os.path.exists(config.self_measure_bin)      \
+            or not os.access(config.self_measure_bin, os.X_OK):
 
             ConfigValidator.error_found = True
             ConfigValidator \
             .config_values_or_exception_dict["EnergiBridge"] = "EnergiBridge executable was not present or valid"
         
-        if  eb_logfile \
-            and not is_path_exists_or_creatable_portable(eb_logfile):
+        if  config.self_measure_logfile \
+            and not is_path_exists_or_creatable_portable(config.self_measure_logfile):
             ConfigValidator.error_found = True
             ConfigValidator \
-            .config_values_or_exception_dict["EnergiBridge"] = f"EnergiBridge logfile ({eb_logfile}) was not a valid path"
+            .config_values_or_exception_dict["EnergiBridge"] = f"EnergiBridge logfile ({config.self_measure_logfile}) was not a valid path"
         
         # Test run to see if energibridge works
         try:
-            eb_args = [eb_path, "--summary", "-o", "/dev/null", "--", "sleep", "0.5"]
+            eb_args = [config.self_measure_bin, "--summary", "-o", "/dev/null", "--", "sleep", "0.5"]
             p = subprocess.Popen(eb_args, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
 
             stdout, stderr = p.communicate(timeout=5)
@@ -112,10 +112,7 @@ def validate_config(config: RunnerConfig):
                             (lambda a, b: is_path_exists_or_creatable_portable(a))
                         )
         
-        ConfigValidator.__validate_energibridge(config.self_measure, 
-                                                config.self_measure_bin, 
-                                                config.self_measure_logfile
-                        )
+        ConfigValidator.__validate_energibridge(config)
 
         # Display config in user-friendly manner, including potential errors found
         print(
diff --git a/experiment-runner/Plugins/Profilers/DataSource.py b/experiment-runner/Plugins/Profilers/DataSource.py
@@ -7,6 +7,8 @@
 import shlex
 from enum import StrEnum
 import shutil
+import ctypes
+import os
 import subprocess
 
 class ParameterDict(UserDict):
@@ -73,6 +75,12 @@ def _validate_platform(self):
 
         raise RuntimeError(f"One of: {self.supported_platforms} is required for this plugin")
 
+    def is_admin(self):
+        try:
+            return os.getuid() == 0
+        except:
+            return ctypes.windll.shell32.IsUserAdmin() == 1
+
     @property
     @abstractmethod
     def supported_platforms(self) -> list[str]:
@@ -96,7 +104,8 @@ def parse_log(logfile):
 class CLISource(DataSource):
     def __init__(self):
         super().__init__()
-
+        
+        self.requires_admin = False
         self.process = None
         self.args = None
 
@@ -112,7 +121,8 @@ def parameters(self) -> ParameterDict:
     def _validate_platform(self):
         super()._validate_platform()
                 
-        if shutil.which(self.source_name) is None:
+        if shutil.which(self.source_name) is None       \
+            and not os.access(self.source_name, os.X_OK):
             raise RuntimeError(f"The {self.source_name} cli tool is required for this plugin")
     
     def _validate_start(self):
@@ -150,7 +160,11 @@ def _validate_parameters(self, parameters: dict):
 
     def _format_cmd(self):
         self._validate_parameters(self.args)
+
         cmd = self.source_name
+
+        if self.requires_admin:
+            cmd = f"sudo {cmd}"
         
         # Transform the parameter dict into string format to be parsed by shlex
         for p, v in self.args.items():
@@ -195,7 +209,8 @@ def stop(self, wait=False):
         try:
             if not wait:
                 self.process.terminate()
-            stdout, stderr = self.process.communicate(timeout=5)
+            
+            stdout, stderr = self.process.communicate(timeout=None if wait else 5)
 
         except Exception as e:
             self.process.kill()
diff --git a/experiment-runner/Plugins/Profilers/EnergiBridge.py b/experiment-runner/Plugins/Profilers/EnergiBridge.py
@@ -1,5 +1,6 @@
 from pathlib import Path
 import pandas as pd
+import re
 from Plugins.Profilers.DataSource import CLISource, ParameterDict
 
 # Supported Paramters for the PowerJoular metrics plugin
@@ -16,18 +17,19 @@
 class EnergiBridge(CLISource):
     parameters = ParameterDict(ENERGIBRIDGE_PARAMETERS)
     source_name = "energibridge"
-    supported_platforms = ["Linux"]
+    supported_platforms = ["Linux", "Darwin", "Windows"]
 
     """An integration of PowerJoular into experiment-runner as a data source plugin"""
     def __init__(self,
-                 sample_frequency:      int                 = 5000,
+                 sample_frequency:      int                 = 200,
                  out_file:              Path                = "energibridge.csv",
                  summary:               bool                = True,
                  target_program:        str                 = "sleep 1000000",
                  additional_args:       dict                = {}):
         
         super().__init__()
-
+        
+        self.requires_admin = True
         self.target_program = target_program
         self.logfile = out_file
         self.args = {
@@ -39,13 +41,77 @@ def __init__(self,
             self.update_parameters(add={"--summary": None})
 
         self.update_parameters(add=additional_args)
+    
+    @property
+    def summary(self):
+        return "--summary" in self.args.keys()
+                    
+    @property
+    def summary_logfile(self):
+        if  not self.logfile \
+            or not any(map(lambda x: x in self.args.keys(), ["-o", "--output"])):
+            
+            return None
+
+        return self.logfile.parent / Path(self.logfile.name.split(".")[0] + "-summary.txt")
+    
+    def _stat_delta(self, data, stat):
+        return list(data[stat].values())[-1] - list(data[stat].values())[0]
+
+    # Less accurate than the summary from EB, but better than nothing
+    # TODO: EnergiBridge calculates this differently, in a system-dependent way;
+    #       this approximates it from the logged data
+    def generate_summary(self):
+        log_data = self.parse_log(self.logfile)
+        
+        elapsed_time = self._stat_delta(log_data, "Time") / 1000
+        total_joules = self._stat_delta(log_data, "PACKAGE_ENERGY (J)")
+
+        return f"Energy consumption in joules: {total_joules} for {elapsed_time} sec of execution"
+
+    # We also want to save the summary of EnergiBridge if present
+    def stop(self, wait=False):
+
+        stdout = super().stop(wait)
+
+        if self.summary and self.summary_logfile:
+            with open(self.summary_logfile, "w") as f:
+                # The last line is the summary, if present
+                last_line = stdout.splitlines()[-1]
+                
+                # If the runtime was too short, EnergiBridge doesn't provide a summary;
+                # approximate it from the log instead
+                if not last_line.startswith("Energy consumption"):
+                    last_line = self.generate_summary()
+
+                f.write(last_line)
+
+        return stdout
 
     def _format_cmd(self):
         cmd = super()._format_cmd()
 
         return cmd + f" -- {self.target_program}"
 
     @staticmethod
-    def parse_log(logfile: Path):
+    def parse_log(logfile: Path, summary_logfile: Path|None=None):
         # Things are already in csv format here, no checks needed
-        return pd.read_csv(logfile).to_dict()
+        log_data = pd.read_csv(logfile).to_dict()
+
+        if not summary_logfile:
+            return log_data
+
+        with open(summary_logfile, "r") as f:
+            summary_data = f.read()
+            
+            # Extract the floats from the string; we always expect positive X.X values
+            values = re.findall("[0-9]+[.]?[0-9]*", summary_data)
+
+            if len(values) == 2:
+                summary_data = {
+                    "total_joules": float(values[0]), 
+                    "runtime_seconds": float(values[1])
+                }
+
+        return (log_data, summary_data)
+