pre-commit fixes

jmitrevs · jmitrevs · commit 7e028e608283 · 2025-03-26T14:23:45.000-05:00
diff --git a/hls4ml/backends/oneapi/oneapi_backend.py b/hls4ml/backends/oneapi/oneapi_backend.py
@@ -153,7 +153,7 @@ def create_initial_config(self, part='Arria10', clock_period=5, io_type='io_para
             # TODO:  add namespace
             'WriteTar': write_tar,
         }
-        
+
         if 'use_bsp' in _:
             config['IS_BSP'] = True
 
diff --git a/hls4ml/backends/oneapi/oneapi_types.py b/hls4ml/backends/oneapi/oneapi_types.py
@@ -200,7 +200,7 @@ def definition_cpp(self, name_suffix='', as_reference=True):
         return f'{self.name}{name_suffix}'
 
     def declare_cpp(self, indent=''):
-        streaming_beat_t = f"{self.pipe_name}BeatT";
+        streaming_beat_t = f"{self.pipe_name}BeatT"
         lines = (
             f"{indent}class {self.pipe_id};\n"
             f"{indent}using {streaming_beat_t} = "
diff --git a/hls4ml/templates/oneapi/firmware/myproject.h b/hls4ml/templates/oneapi/firmware/myproject.h
@@ -11,13 +11,9 @@ using PipeProps = decltype(sycl::ext::oneapi::experimental::properties(sycl::ext
 // Pipe properties for host pipes. Host pipes connect to the data source DMA and sink DMA.
 // They are connected to the first and the last layer to stream data into and out from the kernel.
 using HostPipePropertiesT = decltype(sycl::ext::oneapi::experimental::properties(
-    sycl::ext::intel::experimental::ready_latency<0>,
-    sycl::ext::intel::experimental::bits_per_symbol<8>,
-    sycl::ext::intel::experimental::uses_valid<true>,
-    sycl::ext::intel::experimental::first_symbol_in_high_order_bits<true>,
-    sycl::ext::intel::experimental::protocol_avalon_streaming_uses_ready
-));
-
+    sycl::ext::intel::experimental::ready_latency<0>, sycl::ext::intel::experimental::bits_per_symbol<8>,
+    sycl::ext::intel::experimental::uses_valid<true>, sycl::ext::intel::experimental::first_symbol_in_high_order_bits<true>,
+    sycl::ext::intel::experimental::protocol_avalon_streaming_uses_ready));
 
 namespace nnet {
 
@@ -27,30 +23,27 @@ inline constexpr unsigned kInputBufferLocation = 0;
 inline constexpr unsigned kOutputBufferLocation = 1;
 #endif
 
-// Implementation of a direct memory access kernel. Move data from source, convert, 
+// Implementation of a direct memory access kernel. Move data from source, convert,
 // and send to the sink. Adaptive to SYCL HLS and hardware acceleration flow.
-template <class src_T, class dest_pipe> 
-struct DMA_convert_data {
+template <class src_T, class dest_pipe> struct DMA_convert_data {
 #if !defined(IS_BSP)
-    // When targeting a device family, we instantiate an Avalon Memory Mapped Host for 
+    // When targeting a device family, we instantiate an Avalon Memory Mapped Host for
     // data transaction between host and the DMA kernel during emulation and simulation.
-    sycl::ext::oneapi::experimental::annotated_arg<src_T *, 
-      decltype(sycl::ext::oneapi::experimental::properties{
-          sycl::ext::intel::experimental::latency<0>,
-          sycl::ext::intel::experimental::dwidth<16>,
-          sycl::ext::intel::experimental::buffer_location<kInputBufferLocation>,
-          sycl::ext::intel::experimental::read_write_mode_read,
-          sycl::ext::intel::experimental::wait_request_requested})>
+    sycl::ext::oneapi::experimental::annotated_arg<
+        src_T *,
+        decltype(sycl::ext::oneapi::experimental::properties{
+            sycl::ext::intel::experimental::latency<0>, sycl::ext::intel::experimental::dwidth<16>,
+            sycl::ext::intel::experimental::buffer_location<kInputBufferLocation>,
+            sycl::ext::intel::experimental::read_write_mode_read, sycl::ext::intel::experimental::wait_request_requested})>
 #else
     // When targeting oneAPI BSP, we can use USM pointer to access host memory.
     src_T *const
 #endif
         src;
     size_t num_iteration;
 
-    [[intel::kernel_args_restrict]]
-    void operator()() const {
-        
+    [[intel::kernel_args_restrict]] void operator()() const {
+
 #if defined(IS_BSP)
         // Access data using host pointer.
         sycl::ext::intel::host_ptr<src_T> src_ptr(src);
@@ -64,8 +57,7 @@ struct DMA_convert_data {
         using DstDataType = typename nnet::ExtractDataType<PipeDataType>::value_type;
         constexpr auto dstTypeSize = std::tuple_size<DstDataType>{};
 
-        [[intel::fpga_register]]
-        typename nnet::ExtractPipeType<dest_pipe>::value_type packet;
+        [[intel::fpga_register]] typename nnet::ExtractPipeType<dest_pipe>::value_type packet;
 
         // Keep sending data to the input layer and keep the kernels running.
         for (size_t i = 0; i < num_iteration; i++) {
@@ -82,28 +74,25 @@ struct DMA_convert_data {
     }
 };
 
-// Symmetrical to the DMA_convert_data above, this DMA drains the output pipe and 
+// Symmetrical to the DMA_convert_data above, this DMA drains the output pipe and
 // writes result to memory.
-template <class src_pipe, class dst_T> 
-struct DMA_convert_data_back {
+template <class src_pipe, class dst_T> struct DMA_convert_data_back {
 #if !defined(IS_BSP)
     // Without BSP, instantiate an Avalon Memory Mapped Host to write to host.
-    sycl::ext::oneapi::experimental::annotated_arg<dst_T *, 
-      decltype(sycl::ext::oneapi::experimental::properties{
-          sycl::ext::intel::experimental::latency<0>,
-          sycl::ext::intel::experimental::dwidth<16>,
-          sycl::ext::intel::experimental::buffer_location<kOutputBufferLocation>,
-          sycl::ext::intel::experimental::read_write_mode_write,
-          sycl::ext::intel::experimental::wait_request_requested})>
+    sycl::ext::oneapi::experimental::annotated_arg<
+        dst_T *,
+        decltype(sycl::ext::oneapi::experimental::properties{
+            sycl::ext::intel::experimental::latency<0>, sycl::ext::intel::experimental::dwidth<16>,
+            sycl::ext::intel::experimental::buffer_location<kOutputBufferLocation>,
+            sycl::ext::intel::experimental::read_write_mode_write, sycl::ext::intel::experimental::wait_request_requested})>
 #else
     // USM pointer, otherwise.
     dst_T *const
 #endif
         dst;
     size_t num_iteration;
 
-    [[intel::kernel_args_restrict]]
-    void operator()() const {
+    [[intel::kernel_args_restrict]] void operator()() const {
 #if defined(IS_BSP)
         sycl::ext::intel::host_ptr<dst_T> dst_ptr(dst);
 #else
@@ -115,9 +104,8 @@ struct DMA_convert_data_back {
         using SrcDataType = typename nnet::ExtractDataType<PipeDataType>::value_type;
         constexpr auto srcTypeSize = std::tuple_size<SrcDataType>{};
 
-        [[intel::fpga_register]] 
-        typename nnet::ExtractPipeType<src_pipe>::value_type packet;
-        
+        [[intel::fpga_register]] typename nnet::ExtractPipeType<src_pipe>::value_type packet;
+
         // Drain the output pipe and write result to memory.
         for (size_t i = 0; i < num_iteration; i++) {
             packet = src_pipe::read();
@@ -129,7 +117,7 @@ struct DMA_convert_data_back {
     }
 };
 
-}   // namespace nnet
+} // namespace nnet
 
 // Need to declare the input and output pipes
 
diff --git a/hls4ml/templates/oneapi/firmware/nnet_utils/nnet_activation_stream.h b/hls4ml/templates/oneapi/firmware/nnet_utils/nnet_activation_stream.h
@@ -29,19 +29,17 @@ template <class data_pipe, class res_pipe, typename CONFIG_T> void linear_stream
 // *************************************************
 //       ReLU Activation
 // *************************************************
-template <class data_pipe, class res_pipe, typename CONFIG_T> 
-[[intel::use_stall_enable_clusters]] void relu_stream() {
+template <class data_pipe, class res_pipe, typename CONFIG_T> [[intel::use_stall_enable_clusters]] void relu_stream() {
     using namespace nnet;
     using ResT = typename ExtractDataType<typename ExtractPipeType<res_pipe>::value_type>::value_type;
     [[intel::fpga_register]] typename ExtractPipeType<res_pipe>::value_type out_data;
-    
+
     bool keep_going = true;
 ReLUActLoop:
-    [[intel::initiation_interval(1)]]
-    while(keep_going) {
+    [[intel::initiation_interval(1)]] while (keep_going) {
         for (int i = 0; i < CONFIG_T::n_in / std::tuple_size<ResT>{}; i++) {
             [[intel::fpga_register]] auto in_data = data_pipe::read();
-ReLUPackLoop:
+        ReLUPackLoop:
             #pragma unroll
             for (int j = 0; j < std::tuple_size<ResT>{}; j++) {
                 if (in_data.data[j] > 0)
diff --git a/hls4ml/templates/oneapi/firmware/nnet_utils/nnet_dense_stream.h b/hls4ml/templates/oneapi/firmware/nnet_utils/nnet_dense_stream.h
@@ -11,17 +11,17 @@ namespace nnet {
 // Computation is carried out in a while-1 loop as long as there is valid input.
 // The loop breaks when the end-of-packet signal is asserted by upstream task.
 template <class data_pipe, class res_pipe, typename CONFIG_T>
-[[intel::use_stall_enable_clusters]] void dense_resource_stream(const typename CONFIG_T::weight_t weights, const typename CONFIG_T::bias_t biases) {
+[[intel::use_stall_enable_clusters]] void dense_resource_stream(const typename CONFIG_T::weight_t weights,
+                                                                const typename CONFIG_T::bias_t biases) {
     using namespace nnet;
     using DataT = typename ExtractDataType<typename ExtractPipeType<data_pipe>::value_type>::value_type;
     using ResT = typename ExtractDataType<typename ExtractPipeType<res_pipe>::value_type>::value_type;
-    
+
     [[intel::fpga_register]] typename ExtractPipeType<res_pipe>::value_type resbeat;
 
     bool keep_going = true;
     bool did_read_input;
-    [[intel::initiation_interval(1)]]
-    while (keep_going) {
+    [[intel::initiation_interval(1)]] while (keep_going) {
         did_read_input = false;
         [[intel::fpga_register]] auto databeat = data_pipe::read(did_read_input);
 
diff --git a/hls4ml/templates/oneapi/firmware/nnet_utils/nnet_types.h b/hls4ml/templates/oneapi/firmware/nnet_utils/nnet_types.h
@@ -8,7 +8,7 @@
 #include <tuple>
 #include <utility>
 
-#include <sycl/ext/intel/prototype/pipes_ext.hpp>   // Streaming Beat and pipe properties.
+#include <sycl/ext/intel/prototype/pipes_ext.hpp> // Streaming Beat and pipe properties.
 
 namespace nnet {
 
diff --git a/hls4ml/templates/oneapi/myproject_test.cpp b/hls4ml/templates/oneapi/myproject_test.cpp
@@ -28,23 +28,19 @@ using sycl::ext::intel::experimental::property::usm::buffer_location;
 // Functions that reads input and prediction data from files.
 // Returns `true` if files are read successfully and not empty.
 // Returns `false` otherwise.
-bool prepare_data_from_file(
-    std::string &fin_path,
-    std::string &fpr_path,
-    std::vector<std::vector<float>> &inputs,
-    std::vector<std::vector<float>> &predictions
-) {
+bool prepare_data_from_file(std::string &fin_path, std::string &fpr_path, std::vector<std::vector<float>> &inputs,
+                            std::vector<std::vector<float>> &predictions) {
     // load input data from text file
     std::ifstream fin(fin_path.c_str());
     // load predictions from text file
     std::ifstream fpr(fpr_path.c_str());
-    
+
     std::string iline;
     std::string pline;
 
     if (fin.is_open() && fpr.is_open()) {
         size_t num_iterations = 0;
-        
+
         // Prepare input data from file. Load predictions from file.
         for (; std::getline(fin, iline) && std::getline(fpr, pline); num_iterations++) {
             if (num_iterations % CHECKPOINT == 0) {
@@ -106,8 +102,8 @@ int main(int argc, char **argv) {
 
     std::cout << "Running on device: " << device.get_info<sycl::info::device::name>().c_str() << std::endl;
 
-    std::string INPUT_FILE  = "tb_data/tb_input_features.dat";
-    std::string PRED_FILE   = "tb_data/tb_output_predictions.dat";
+    std::string INPUT_FILE = "tb_data/tb_input_features.dat";
+    std::string PRED_FILE = "tb_data/tb_output_predictions.dat";
     std::string RESULTS_LOG = "tb_data/results.log";
     std::ofstream fout(RESULTS_LOG);
 
@@ -138,10 +134,12 @@ int main(int argc, char **argv) {
             std::cerr << "ERROR: host allocation failed for output\n";
             fout.close();
             return 1;
-        }    
+        }
 #else
-        float *vals = sycl::malloc_shared<float>(kInputSz, q, sycl::property_list{buffer_location(nnet::kInputBufferLocation)});
-        float *outputs = sycl::malloc_shared<float>(kOutputSz, q, sycl::property_list{buffer_location(nnet::kOutputBufferLocation)});
+        float *vals =
+            sycl::malloc_shared<float>(kInputSz, q, sycl::property_list{buffer_location(nnet::kInputBufferLocation)});
+        float *outputs =
+            sycl::malloc_shared<float>(kOutputSz, q, sycl::property_list{buffer_location(nnet::kOutputBufferLocation)});
 #endif
 
         if (file_valid) {
@@ -175,7 +173,7 @@ int main(int argc, char **argv) {
             }
         } else {
             std::cout << "INFO: Unable to open input/predictions file, using default input with " << num_iterations
-                    << " invocations." << std::endl;
+                      << " invocations." << std::endl;
             q.single_task(MyProject{});
             // hls-fpga-machine-learning insert top-level-function
             // hls-fpga-machine-learning insert zero
@@ -195,12 +193,10 @@ int main(int argc, char **argv) {
         std::cout << "INFO: Saved inference results to file: " << RESULTS_LOG << std::endl;
     } catch (sycl::exception const &e) {
         // Catches exceptions in the host code.
-        std::cerr << "Caught a SYCL host exception:\n"
-                  << e.what() << "\n";
+        std::cerr << "Caught a SYCL host exception:\n" << e.what() << "\n";
 
         // Most likely the runtime couldn't find FPGA hardware!
-        if (e.code().value() == CL_DEVICE_NOT_FOUND)
-        {
+        if (e.code().value() == CL_DEVICE_NOT_FOUND) {
             std::cerr << "If you are targeting an FPGA, please ensure that your "
                          "system has a correctly configured FPGA board.\n";
             std::cerr << "Run sys_check in the oneAPI root directory to verify.\n";
diff --git a/hls4ml/writer/oneapi_writer.py b/hls4ml/writer/oneapi_writer.py
@@ -137,10 +137,7 @@ def write_project_cpp(self, model):
                 elif '// hls-fpga-machine-learning read in' in line:
                     newline = line
                     if io_type == 'io_parallel':
-                        restartable_kernel_loop = (
-                            f"bool keep_going = true;\n\n"
-                            f"{indent}while (keep_going) {{\n"
-                        )
+                        restartable_kernel_loop = f"bool keep_going = true;\n\n" f"{indent}while (keep_going) {{\n"
                         newline += indent + restartable_kernel_loop
                         for inp in model_inputs:
                             newline += indent * 2 + f'auto {inp.name}_beat = {inp.pipe_name}::read();\n'
@@ -202,7 +199,9 @@ def write_project_cpp(self, model):
                         newline = indent + newline
                         for out in model_outputs:
                             out_beat = f"{out.name}_beat"
-                            newline += indent * 2 + f'typename nnet::ExtractPipeType<{out.pipe_name}>::value_type {out_beat};\n'
+                            newline += (
+                                indent * 2 + f'typename nnet::ExtractPipeType<{out.pipe_name}>::value_type {out_beat};\n'
+                            )
                             newline += indent * 2 + f'{out_beat}.data = {out.name};\n'
                             newline += indent * 2 + f'{out.pipe_name}::write({out_beat});\n'
                         newline += indent * 2 + '// stops the kernel when the last input seen.\n'
@@ -422,7 +421,7 @@ def write_test_bench(self, model):
                         f'{indent}const size_t kInputLayerSize = {model_inputs[0].size_cpp()};\n'
                         f'{indent}const size_t kOutLayerSize = {model_outputs[0].size_cpp()};\n'
                     )
-                    newline += insert_constant_lines;
+                    newline += insert_constant_lines
                 elif '// hls-fpga-machine-learning insert zero' in line:
                     newline = line
                     inp = model_inputs[0]
@@ -445,8 +444,8 @@ def write_test_bench(self, model):
                 elif '// hls-fpga-machine-learning convert output' in line:
                     newline = line
                     out = model_outputs[0]
-                    newline += \
-                        f'{indent}q.single_task(nnet::DMA_convert_data_back<{out.pipe_name}, float>{{outputs, num_iterations}}).wait();\n'
+                    newline += f'{indent}q.single_task(nnet::DMA_convert_data_back<{out.pipe_name}, float>'
+                    newline += '{outputs, num_iterations}).wait();\n'
                 else:
                     newline = line
 

Original file line number	Diff line number	Diff line change
`@@ -153,7 +153,7 @@ def create_initial_config(self, part='Arria10', clock_period=5, io_type='io_para`
`153`	`153`	`# TODO: add namespace`
`154`	`154`	`'WriteTar': write_tar,`
`155`	`155`	`}`
`156`		`-`
	`156`	`+`
`157`	`157`	`if 'use_bsp' in _:`
`158`	`158`	`config['IS_BSP'] = True`
`159`	`159`