1+ #include " higgs_model_dense.hxx"
2+ #include < iostream>
3+ #include " TROOT.h"
4+ #include " TSystem.h"
5+ #include " ROOT/RDataFrame.hxx"
6+
7+ #include < onnxruntime_cxx_api.h>
8+
9+
10+ #include < string>
11+ #include < fstream>
12+ #include < stdlib.h>
13+
14+ #include < benchmark/benchmark.h>
15+
16+ // template <typename Func>
17+ struct ONNXFunctor {
18+
19+ // std::vector<float> input;
20+ // std::vector<std::shared_ptr<Func>> sessions;
21+
22+ std::map<std::string, double > inputs;
23+ std::vector<std::string> names;
24+
25+ std::shared_ptr<Ort::Session> session;
26+
27+ // td::vector<Ort::Value> input_tensors;
28+
29+ // Ort::Value * ort_input = nullptr;
30+
31+ // float *input_arr = nullptr;
32+
33+ std::vector<const char *> input_node_names;
34+ std::vector<const char *> output_node_names;
35+
36+ std::vector<float > input_tensor_values;
37+
38+ std::vector<int64_t > input_node_dims;
39+ std::vector<int64_t > output_node_dims;
40+
41+ ONNXFunctor (unsigned nslots)
42+ {
43+
44+ Ort::Env env (ORT_LOGGING_LEVEL_WARNING, " benchmark" );
45+
46+ std::string model_path = " higgs_model_dense.onnx" ;
47+
48+ Ort::SessionOptions session_options;
49+ session_options.SetIntraOpNumThreads (1 );
50+ session_options.SetGraphOptimizationLevel (GraphOptimizationLevel::ORT_ENABLE_EXTENDED);
51+
52+ // std::cout << "benchmarking model " << model_path << std::endl;
53+ session = std::make_shared<Ort::Session>(env, model_path.c_str (), session_options);
54+
55+
56+
57+ Ort::AllocatorWithDefaultOptions allocator;
58+ input_node_names.push_back (session->GetInputName (0 , allocator));
59+ output_node_names.push_back ( session->GetOutputName (0 , allocator));
60+
61+ // Getting the shapes
62+
63+ input_node_dims = session->GetInputTypeInfo (0 ).GetTensorTypeAndShapeInfo ().GetShape ();
64+ output_node_dims = session->GetOutputTypeInfo (0 ).GetTensorTypeAndShapeInfo ().GetShape ();
65+
66+ // Calculating the dimension of the input tensor
67+
68+ // int bsize = input_node_dims[0];
69+ // std::cout << "Using bsize = " << bsize << std::endl;
70+ // int nbatches = nevt / bsize;
71+
72+ size_t input_tensor_size = std::accumulate (input_node_dims.begin (), input_node_dims.end (), 1 , std::multiplies<int >());
73+ // std::vector<float> input_tensor_values(input_tensor_size );
74+
75+ input_tensor_values.resize (input_tensor_size);
76+
77+ auto memory_info = Ort::MemoryInfo::CreateCpu (OrtArenaAllocator, OrtMemTypeDefault);
78+
79+ // input_tensors.push_back(Ort::Value::CreateTensor<float>(
80+ // memory_info, input_tensor_values.data(), input_tensor_size, input_node_dims.data(), input_node_dims.size()) );
81+
82+
83+ // Ort::Value
84+ // Ort::Value *ort_input = new Ort::Value(nullptr);
85+ // // input_tensor =
86+ // *ort_input = Ort::Value::CreateTensor<float>(memory_info, input_tensor_values.data(), input_tensor_values.size(),
87+ // input_node_dims.data(), input_node_dims.size());
88+
89+ // input_arr = input_tensor.GetTensorMutableData<float>();
90+
91+ // Running the model
92+ // input_arr = input_tensors[0].GetTensorMutableData<float>();
93+
94+ // /////
95+
96+
97+ // // Load inputs from argv
98+ // std::cout << "input size is " << config.inputs.size() << std::endl;
99+ // for (size_t n = 0; n < config.inputs.size(); n++) {
100+ // inputs[config.inputs.at(n).name] = 0.0;
101+ // names.push_back(config.inputs.at(n).name);
102+ // }
103+ }
104+
105+ double operator ()(unsigned nslots, float x0, float x1, float x2, float x3, float x4, float x5, float x6)
106+ {
107+
108+ // not sure how to cache input ort tensor
109+ auto memory_info = Ort::MemoryInfo::CreateCpu (OrtArenaAllocator, OrtMemTypeDefault);
110+ Ort::Value
111+ input_tensor = Ort::Value::CreateTensor<float >(
112+ memory_info, input_tensor_values.data (), input_tensor_values.size (), input_node_dims.data (), input_node_dims.size ());
113+ float * input_arr = input_tensor.GetTensorMutableData <float >();
114+
115+ int off = 0 ;
116+ input_arr[off] = x0;
117+ input_arr[off + 1 ] = x1;
118+ input_arr[off + 2 ] = x2;
119+ input_arr[off + 3 ] = x3;
120+ input_arr[off + 4 ] = x4;
121+ input_arr[off + 5 ] = x5;
122+ input_arr[off + 6 ] = x6;
123+
124+
125+
126+ auto output_tensors = session->Run (Ort::RunOptions{nullptr }, input_node_names.data (), &input_tensor, 1 , output_node_names.data (), 1 );
127+ float * floatarr = output_tensors.front ().GetTensorMutableData <float >();
128+ return floatarr[0 ];
129+ }
130+ };
131+
132+ void BM_RDF_ONNX_Inference (benchmark::State &state)
133+ {
134+
135+ int nslot = 1 ;
136+ if (nslot > 1 )
137+ ROOT::EnableImplicitMT (nslot);
138+
139+ auto fileName = " Higgs_data_full.root" ;
140+ // file is available at "https://cernbox.cern.ch/index.php/s/YuSHwTXBa0UBEhD/download";
141+ // do curl https://cernbox.cern.ch/index.php/s/XaPBtaGrnN38wU0 -o Higgs_data_full.root
142+ if (gSystem ->AccessPathName (fileName)) {
143+ std::string cmd = " curl https://cernbox.cern.ch/index.php/s/YuSHwTXBa0UBEhD/download -o " ;
144+ cmd += fileName;
145+ gSystem ->Exec (cmd.c_str ());
146+ }
147+ auto treeName = " test_tree" ;
148+ ROOT::RDataFrame df (treeName, fileName);
149+
150+ ONNXFunctor functor (nslot);
151+
152+ for (auto _ : state) {
153+
154+ auto h1 = df.DefineSlot (" DNN_Value" , functor, {" m_jj" , " m_jjj" , " m_lv" , " m_jlv" , " m_bb" , " m_wbb" , " m_wwbb" })
155+ .Histo1D (" DNN_Value" );
156+
157+ auto t1 = std::chrono::high_resolution_clock::now ();
158+
159+ auto n = h1->GetEntries ();
160+ auto t2 = std::chrono::high_resolution_clock::now ();
161+ auto duration = std::chrono::duration_cast<std::chrono::microseconds>(t2 - t1).count ();
162+
163+ std::cout << " Processed " << n << " entries "
164+ << " time = " << duration / 1 .E6 << " (sec) time/event = " << duration / double (n) << " musec"
165+ << std::endl;
166+
167+ // h1->DrawClone();
168+ }
169+ }
170+
171+
172+ BENCHMARK (BM_RDF_ONNX_Inference)->Unit(benchmark::kMillisecond );
173+ BENCHMARK_MAIN ();