formulaslug
diff --git a/‎.clang-format
Lines changed: 2 additions & 0 deletions b/‎.clang-format
Lines changed: 2 additions & 0 deletions
diff --git a/‎Telemetry-SD-Card/CMakeLists.txt
Lines changed: 41 additions & 0 deletions b/‎Telemetry-SD-Card/CMakeLists.txt
Lines changed: 41 additions & 0 deletions
diff --git a/‎Telemetry-SD-Card/arrowStream.py
Lines changed: 90 additions & 0 deletions b/‎Telemetry-SD-Card/arrowStream.py
Lines changed: 90 additions & 0 deletions
diff --git a/‎Telemetry-SD-Card/dbc_to_cpp.py
Lines changed: 245 additions & 0 deletions b/‎Telemetry-SD-Card/dbc_to_cpp.py
Lines changed: 245 additions & 0 deletions
@@ -0,0 +1,2 @@
+IndentWidth: 4
+BasedOnStyle: LLVM
@@ -0,0 +1,41 @@
+cmake_minimum_required(VERSION 3.19)
+cmake_policy(VERSION 3.19...3.22)
+
+set(MBED_APP_JSON_PATH mbed_app.json5)
+set(CMAKE_EXPORT_COMPILE_COMMANDS 1)
+
+
+# Main project definition
+include(../mbed-os/tools/cmake/mbed_toolchain_setup.cmake)
+project(SDCard LANGUAGES C CXX ASM)
+include(mbed_project_setup)
+
+# Include MBED OS
+add_subdirectory(../mbed-os ../mbed-os-build)
+
+# Fetch Nanoarrow - a minimal implementation of Apache Arrow
+include(FetchContent)
+# This enables the nanoarrow IPC extension (required to use Arrow IPC functions)
+# (note: the nanoarrow_ipc library is created conditionally based on this flag)
+set(NANOARROW_IPC ON CACHE BOOL "Build IPC extension")
+FetchContent_Declare(
+  nanoarrow
+  URL https://github.com/apache/arrow-nanoarrow/releases/download/apache-arrow-nanoarrow-0.6.0/apache-arrow-nanoarrow-0.6.0.tar.gz
+  URL_HASH SHA512=25e81c119c16bfa29a9943d3904acd8f29f225ff4a1c99decde7c8235300232402106a4b5249921df773fb797bb0149a885fa3a4524c34c67c06199edd72250c
+  DOWNLOAD_EXTRACT_TIMESTAMP ON
+)
+FetchContent_MakeAvailable(nanoarrow)
+
+
+# Add our main executable, and link all the above libraries to it
+set(CMAKE_CXX_STANDARD 20)
+add_executable(${PROJECT_NAME} main.cpp)
+
+target_link_libraries(${PROJECT_NAME} mbed-os mbed-storage-sd mbed-storage-fat)
+# "SYSTEM" should remove warnings when compiling the generated flatbuffers code
+# target_include_directories(${PROJECT_NAME} SYSTEM PUBLIC include)
+# target_link_libraries(${PROJECT_NAME} mbed-os mbed-storage-sd mbed-storage-fat nanoarrow nanoarrow_ipc)
+# target_link_libraries(${PROJECT_NAME} mbed-baremetal mbed-storage-sd mbed-storage-fat)
+# target_link_libraries(${PROJECT_NAME} mbed-baremetal mbed-storage-sd mbed-storage-fat nanoarrow nanoarrow_ipc)
+
+mbed_set_post_build(${PROJECT_NAME})
@@ -0,0 +1,90 @@
+import argparse
+import numpy as np
+import polars as pl
+import serial
+
+parser = argparse.ArgumentParser()
+parser.add_argument('--input_file','-i',type=str, action='store', help='input file name', required=True)
+parser.add_argument('--port','-P',type=str, action='store', help='serial_port', required=True)
+parser.add_argument('--log','-l',type=str, action='store', help='serial_port', required=True)
+parser.add_argument('--output_file','-o',type=str, action='store', help='output file name', default='out.arrow')
+args = parser.parse_args()
+
+# Conversion from ASCII defined types in custom binary to numpy types.
+# [type, n] where size is 2**n bits
+types_dict = {
+    "i3": np.int8,
+    "i4": np.int16,
+    "i5": np.int32,
+    "i6": np.int64,
+    "u3": np.uint8,
+    "u4": np.uint16,
+    "u5": np.uint32,
+    "u6": np.uint64,
+    "f4": np.float16,
+    "f5": np.float32,
+    "f6": np.float64,
+    "b0": bool
+    }
+
+# Initialize dataframe
+df = pl.DataFrame()
+
+# Open serial port. Intentionall have no timeout so that we can read until we get the expected header/schema.
+s = serial.Serial(args.port, baudrate=115200)
+s.set_buffer_size(rx_size=1000000)
+s.reset_input_buffer()
+s.reset_output_buffer()
+s.write(b'QS') # Query Schema
+
+# Attempts to read the schema from the serial port.
+# Requests by sending 'QS' 
+for i in range(1000):
+    header = ascii(s.read(8))
+    m = np.frombuffer(s.read(4), dtype=np.uint32, count=1)[0]
+    n = np.frombuffer(s.read(4), dtype=np.uint32, count=1)[0]
+
+    ## Expects to receive record bathes in some multiple of bytes therefore it will not work if n is not a multiple of 8.
+    if ((n%8 != 0) or (n <= 0) or (m <= 0) or (header[:5] != "FSDAQ")):
+        s.write(b'QS') # Query Schema again if n is not a multiple of 8 - Indicates failed attempt to receive schema to the NUCLEO
+    else:
+        s.write(b'RS') # Received Schema - Indicates to NUCLEO to start sending data
+        break
+    if i == 999:
+        s.write(b'SE') # Schema Error - Indicates to the NUCLEO that it failed to get the schema and will exit the program.
+        s.close()
+        raise Exception("Schema Error: Failed to receive valid schema after 1000 attempts.")
+
+# print(f"Header: {header}, m: {m}, n: {n}")
+
+# Reading in the colum titles. They are specified as 
+colTitles = []
+for i in range(m):
+    length = s.read() # uint8 length of title
+    title = s.read(length).decode('ascii') # ascii string of title
+    colTitles.append(title) # Add title to list of titles
+
+# Reading in the column types. They are specified as 2 byte ascii strings where 
+# the first character is type of type (int, uint, float, bool)
+# and the second character is log2() the size of the type in bits (3, 4, 5, 6). Ex. f5 = float32, b0 = bool, u4 = uint16
+colTypes = []
+for i in range(m):
+    colType = s.read(2).decode('ascii') # 2 byte ascii string of type
+    if colType not in types_dict:
+        s.write(b'SE') # Schema Error - Indicates to the NUCLEO that it failed to get the schema and will exit the program.
+        s.close()
+        raise Exception(f"Schema Error: Invalid column type {colType} received.")
+    colTypes.append((types_dict[colType], int((2**int(colType[1]))/8*n)))
+
+
+while (True):
+    frame_pieces = []
+    for i in range(m):
+        col_byte_len = colTypes[i][1]
+        col_type = colTypes[i][0]
+        col_bit = np.frombuffer(s.read(col_byte_len), dtype=col_type, count=n)
+        frame_piece_series = pl.Series(colTitles[i], col_bit)
+        frame_pieces.append(frame_piece_series)
+        pos += col_byte_len
+    frame_piece = pl.DataFrame(frame_pieces)
+    df.to_arrow()
@@ -0,0 +1,245 @@
+import os
+import cantools
+import pyarrow as pa
+import numpy as np
+
+# See choose_float_type() for explanation
+DEFAULT_FLOAT_TOLERANCE = 0.1
+
+FSDAQ_TYPE_TO_C_TYPE = {
+    "b0": "bool",
+    "u3": "uint8_t",
+    "i3": "int8_t",
+    "u4": "uint16_t",
+    "i4": "int16_t",
+    "u5": "uint32_t",
+    "i5": "int32_t",
+    "u6": "uint64_t",
+    "i6": "int64_t",
+    "f5": "float",
+    "f6": "double",
+}
+
+# Find the appropriate type to represent a given signal.
+# - If length==1, bool is used
+# - If scale==1, the correctly sized integer type is used
+# - Otherwise, choose_float_type() is used
+# See choose_float_type() for a description of float_tolerance
+def get_fsdaq_type_for_signal(
+    s: cantools.db.Signal, float_tolerance: float = DEFAULT_FLOAT_TOLERANCE
+) -> str:
+    if s.length == 1 and s.scale == 1 and s.offset == 0:
+        return "b0"
+
+    raw_min = -(1 << (s.length - 1)) if s.is_signed else 0
+    raw_max = (1 << (s.length - 1)) - 1 if s.is_signed else (1 << s.length) - 1
+
+    if s.scale == 1:
+        decoded_min = raw_min
+        decoded_max = raw_max
+        candidates = [
+            ("u3", 0, 255),
+            ("i3", -128, 127),
+            ("u4", 0, 65535),
+            ("i4", -32768, 32767),
+            ("u5", 0, 2**32 - 1),
+            ("i5", -(2**31), 2**31 - 1),
+        ]
+        for arrow_type, min_val, max_val in candidates:
+            if decoded_min >= min_val and decoded_max <= max_val:
+                return arrow_type
+        return "i5" if s.is_signed else "u5"
+
+    return choose_float_type(s, float_tolerance)
+
+
+# Find the appropriate float type to represent the signal within the given
+# tolerance to the signal's scale. Determined by testing if every possible real
+# (scaled) value is representable within tolerance. Eg: if tolerance is 0.5
+# (50%), then any float whose value is within 50%*(signal's scale) of the actual
+# value is considered close enough
+def choose_float_type(s: cantools.db.Signal, tolerance: float):
+    raw_min = -(1 << (s.length - 1)) if s.is_signed else 0
+    raw_max = (1 << (s.length - 1)) - 1 if s.is_signed else (1 << s.length) - 1
+
+    # Interpret min/max as integers, create a range of every integer in between
+    possible_raw_values = np.arange(raw_min, raw_max + 1)
+    # Scale that range of integers to get every possible decimal value
+    possible_decoded_values = possible_raw_values * s.scale + s.offset
+
+    # Make sure every possible decimal value is representable by some float
+    # type, up to a precision of 10% of the signal's scale
+    atol = abs(s.scale) * tolerance
+    for dtype, fsdaq_type in [
+        # (np.float16, "f?"),
+        (np.float32, "f5"),
+        (np.float64, "f6"),
+    ]:
+        # If every possibel real value is close enough using a certain float
+        # type, choose that float type. rtol is 0 as we don't care about
+        # relative tolerance, only tolerance based on the signal's scale
+        if np.allclose(
+            possible_decoded_values,
+            possible_decoded_values.astype(dtype),
+            rtol=0,
+            atol=atol,
+        ):
+            return fsdaq_type
+
+    # Fallback if not exactly representable within 5% tolerance of scale (rare)
+    print(
+        f"Warning: Signal ${s.name} not representable as 64 bit float within 5% tolerance; ignoring!"
+    )
+    return pa.float64()
+
+
+def generate_cpp_code(signal_to_fsdaq_datatype: dict[str, str], rows: int = 8):
+    assert rows % 8 == 0
+
+    out_file = open("./fsdaq_encoder_generated_from_dbc.hpp", "w")
+    template_file = open("./fsdaq_encoder_generated_from_dbc.hpp.in", "r")
+
+    template = template_file.read()
+    template = template.replace("@COLS@", str(len(signal_to_fsdaq_datatype)))
+    template = template.replace("@ROWS@", str(rows))
+
+    col_names = ", ".join(['"' + col + '"' for col in signal_to_fsdaq_datatype.keys()])
+    col_name_sizes = ", ".join([str(len(col_name)) for col_name in signal_to_fsdaq_datatype.keys()])
+    col_name_types = ", ".join(['"' + fsdaq_type + '"' for fsdaq_type in signal_to_fsdaq_datatype.values()])
+    template = template.replace("@COL_NAMES@", col_names)
+    template = template.replace("@COL_NAME_SIZES@", col_name_sizes)
+    template = template.replace("@COL_NAME_TYPES@", col_name_types)
+
+    values_struct_fields = []
+    values_row_struct_fields = []
+    update_fields_from_row = []
+    for col_name, fsdaq_type in signal_to_fsdaq_datatype.items():
+        if fsdaq_type == "b0":
+            values_struct_fields.append(" "*4 + "uint8_t" + " " + col_name + "[ROWS/8];")
+            update_fields_from_row.append(" "*8 + "this->" + col_name + "[idx/8] |= row." + col_name + " << idx;")
+        else:
+            values_struct_fields.append("    " + FSDAQ_TYPE_TO_C_TYPE[fsdaq_type] + " " + col_name + "[ROWS];")
+            update_fields_from_row.append(" "*8 + "this->" + col_name + "[idx] = row." + col_name + ";")
+        values_row_struct_fields.append(" "*4 + FSDAQ_TYPE_TO_C_TYPE[fsdaq_type] + " " + col_name + ";")
+    template = template.replace("@VALUES_STRUCT_FIELDS@", "\n".join(values_struct_fields))
+    template = template.replace("@VALUES_ROW_STRUCT_FIELDS@", "\n".join(values_row_struct_fields))
+
+    template = template.replace("@UPDATE_FIELDS_FROM_ROW@", "\n".join(update_fields_from_row))
+
+    
+    
+    out_file.write(template)
+    out_file.close()
+    template_file.close()
+
+
+if __name__ == "__main__":
+    # for debugging purposes
+    np.set_printoptions(formatter={"float_kind": "{:.8f}".format})
+
+    db = cantools.db.Database()
+
+    db.add_dbc_file("../CANbus.dbc")
+
+    signal_to_datatype: dict[str, pa.DataType] = {}
+
+    for msg in db.messages:
+        for signal in msg.signals:
+            signal_to_datatype[signal.name] = get_fsdaq_type_for_signal(signal)
+
+    # for k, v in signal_to_datatype.items():
+    #     v = str(v).removeprefix("(DataType(")
+    #     v = v.removesuffix("),)")
+    #     print("{:33s} {}".format(k, v))
+
+    # n = 50
+    # generate_nanoarrow_code({k: signal_to_datatype[k] for k in list(signal_to_datatype)[:n]}, 8)
+    generate_cpp_code({k: signal_to_datatype[k] for k in list(signal_to_datatype)}, 80)
+
+
+
+
+# OLD NANOARROW GENERATION CODE:
+#
+# def generate_nanoarrow_code(signal_to_datatype: dict[str, pa.DataType]):
+#     with open("./nanoarrow_generated_from_dbc.hpp", "w") as f:
+#         cols = len(signal_to_datatype)
+#
+#         f.writelines(
+#             [
+#                 f"#include <nanoarrow/nanoarrow.hpp>\n",
+#                 f"#include <nanoarrow/nanoarrow.h>\n",
+#                 f"#include <nanoarrow/nanoarrow_ipc.hpp>\n",
+#                 f"#include <nanoarrow/nanoarrow_ipc.h>\n",
+#                 f"\n"
+#                 f"na::UniqueSchema make_nanoarrow_schema() {{\n"
+#                 f"    na::UniqueSchema schema_root;\n"
+#                 f"    ArrowSchemaInit(schema_root.get());\n"
+#                 f"    ArrowSchemaSetTypeStruct(schema_root.get(), {cols});\n"
+#                 f"\n",
+#             ]
+#         )
+#         for i, (name, datatype) in enumerate(signal_to_datatype.items()):
+#             nanoarrow_type_macro = PYARROW_TO_NANOARROW[datatype]
+#             f.writelines(
+#                 [
+#                     f"    ArrowSchemaInitFromType(schema_root->children[{i}], {nanoarrow_type_macro});\n",
+#                     f'    ArrowSchemaSetName(schema_root->children[{i}], "{name}");\n',
+#                 ]
+#             )
+#         f.writelines(
+#             [
+#                 "    return schema_root;\n"
+#                 "}\n",
+#             ]
+#         )
+#
+#         f.writelines(
+#             [
+#                 f"na::UniqueArray make_nanoarrow_array(ArrowSchema *schema_root, int batch_rows) {{\n",
+#                 f"    ArrowError error;\n",
+#                 f"\n",
+#                 f"    na::UniqueArray array_root;\n",
+#                 f"    ARROW_ERROR_PRINT(ArrowArrayInitFromSchema(array_root.get(), schema_root, &error));\n",
+#                 f"    ArrowArrayAllocateChildren(array_root.get(), {cols});\n",
+#                 f"    for (int i = 0; i < {cols}; i++) {{\n",
+#                 f"        ARROW_ERROR_PRINT(ArrowArrayInitFromSchema(array_root->children[i], schema_root->children[i], &error));\n",
+#                 # f"        ArrowArrayStartAppending(array_root->children[i]);",
+#                 f"        ArrowArrayReserve(array_root->children[i], batch_rows);\n",
+#                 # f"    for (int i = 0; i < ROWS; i++) {{",
+#                 # f"      ArrowArrayAppendInt(array_root->children[i], 12340 + i);",
+#                 # f"    }}",
+#                 # f"    ARROW_ERROR_PRINT(ArrowArrayFinishBuildingDefault(array_root->children[i], &error));",
+#             ]
+#         )
+#         f.writelines(
+#             [
+#                 "    }\n",
+#                 "    return array_root;\n",
+#                 "}\n",
+#             ]
+#         )
+
+# # NOTE: This mapping is NOT exhuastive
+# PYARROW_TO_NANOARROW: dict[pa.DataType, str] = {
+#     pa.null(): "NANOARROW_TYPE_NA",
+#     pa.bool_(): "NANOARROW_TYPE_BOOL",
+#     pa.int8(): "NANOARROW_TYPE_INT8",
+#     pa.uint8(): "NANOARROW_TYPE_UINT8",
+#     pa.int16(): "NANOARROW_TYPE_INT16",
+#     pa.uint16(): "NANOARROW_TYPE_UINT16",
+#     pa.int32(): "NANOARROW_TYPE_INT32",
+#     pa.uint32(): "NANOARROW_TYPE_UINT32",
+#     pa.int64(): "NANOARROW_TYPE_INT64",
+#     pa.uint64(): "NANOARROW_TYPE_UINT64",
+#     pa.float16(): "NANOARROW_TYPE_HALF_FLOAT",
+#     pa.float32(): "NANOARROW_TYPE_FLOAT",
+#     pa.float64(): "NANOARROW_TYPE_DOUBLE",
+#     pa.float64(): "NANOARROW_TYPE_DOUBLE",
+#     pa.date32(): "NANOARROW_TYPE_DATE32",
+#     pa.date64(): "NANOARROW_TYPE_DATE64",
+#     pa.time32("ms"): "NANOARROW_TYPE_TIME32",
+#     pa.time64("ns"): "NANOARROW_TYPE_TIME64",
+#     pa.timestamp("ms"): "NANOARROW_TYPE_TIMESTAMP",
+#     pa.duration("ms"): "NANOARROW_TYPE_DURATION",
+# }
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+IndentWidth: 4`
	`2`	`+BasedOnStyle: LLVM`