@@ -16,73 +16,62 @@ using ModelInfo = std::pair<std::string, int64_t>;
 // based on https://github.com/NVIDIA/tensorrt-inference-server/blob/master/src/clients/c++/examples/simple_callback_client.cc
 
 template <typename Client>
-TRTClient<Client>::TRTClient(const edm::ParameterSet &params) : Client(),
-  url_(params.getParameter<std::string>("address") + ":" + std::to_string(params.getParameter<unsigned>("port"))),
-  timeout_(params.getParameter<unsigned>("timeout")),
-  modelName_(params.getParameter<std::string>("modelName")),
-  batchSize_(params.getParameter<unsigned>("batchSize")),
-  ninput_(params.getParameter<unsigned>("ninput")),
-  noutput_(params.getParameter<unsigned>("noutput"))
+TRTClient<Client>::TRTClient(const edm::ParameterSet& params) :
+  Client(),
+  url_(params.getParameter<std::string>("address")+":"+std::to_string(params.getParameter<unsigned>("port"))),
+  timeout_(params.getParameter<unsigned>("timeout")),
+  modelName_(params.getParameter<std::string>("modelName")),
+  batchSize_(params.getParameter<unsigned>("batchSize")),
+  ninput_(params.getParameter<unsigned>("ninput")),
+  noutput_(params.getParameter<unsigned>("noutput"))
 {
 }
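Note: the parameters read in this constructor would typically also be declared for validation in the owning module. A minimal sketch of matching declarations, assuming a standard CMSSW fillDescriptions hook (the producer that wraps this client is not part of this diff):

// sketch only: hypothetical parameter declarations mirroring the
// getParameter calls above; the owning producer is not shown here
edm::ParameterSetDescription desc;
desc.add<std::string>("address");
desc.add<unsigned>("port");
desc.add<unsigned>("timeout");
desc.add<std::string>("modelName");
desc.add<unsigned>("batchSize");
desc.add<unsigned>("ninput");
desc.add<unsigned>("noutput");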
 
 template <typename Client>
-void TRTClient<Client>::setup()
-{
+void TRTClient<Client>::setup() {
   auto err = nic::InferGrpcContext::Create(&context_, url_, modelName_, -1, false);
-  if (!err.IsOk())
-    throw cms::Exception("BadGrpc") << "unable to create inference context: " << err;
-
-  // nic::ServerStatusGrpcContext::Create(&server_ctx_, url_, false);
-  // if (!err.IsOk())
-  //   throw cms::Exception("BadServer") << "unable to create server inference context: " << err;
+  if (!err.IsOk()) throw cms::Exception("BadGrpc") << "unable to create inference context: " << err;
 
   std::unique_ptr<nic::InferContext::Options> options;
   nic::InferContext::Options::Create(&options);
 
   options->SetBatchSize(batchSize_);
-  for (const auto &output : context_->Outputs())
-  {
+  for (const auto& output : context_->Outputs()) {
     options->AddRawResult(output);
   }
   context_->SetRunOptions(*options);
 
-  const std::vector<std::shared_ptr<nic::InferContext::Input>> &nicinputs = context_->Inputs();
+  const std::vector<std::shared_ptr<nic::InferContext::Input>>& nicinputs = context_->Inputs();
   nicinput_ = nicinputs[0];
   nicinput_->Reset();
 
   auto t2 = std::chrono::high_resolution_clock::now();
   std::vector<int64_t> input_shape;
-  for (unsigned i0 = 0; i0 < batchSize_; i0++)
-  {
+  for (unsigned i0 = 0; i0 < batchSize_; i0++) {
     float *arr = &(this->input_.data()[i0 * ninput_]);
     nic::Error err1 = nicinput_->SetRaw(reinterpret_cast<const uint8_t *>(arr), ninput_ * sizeof(float));
   }
   auto t3 = std::chrono::high_resolution_clock::now();
-  edm::LogInfo("TRTClient") << "Image array time: " << std::chrono::duration_cast<std::chrono::microseconds>(t3 - t2).count();
+  edm::LogInfo("TRTClient") << "Image array time: " << std::chrono::duration_cast<std::chrono::microseconds>(t3-t2).count();
 }
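Note: the err1 status returned by SetRaw is assigned but never checked in setup(). A minimal sketch of handling it, mirroring the BadGrpc check above ("BadInput" is a hypothetical exception category, not part of this diff):

// sketch only: check the SetRaw status instead of discarding it
nic::Error err1 = nicinput_->SetRaw(reinterpret_cast<const uint8_t *>(arr), ninput_ * sizeof(float));
if (!err1.IsOk())
  throw cms::Exception("BadInput") << "unable to set input for batch entry " << i0 << ": " << err1;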
 
 template <typename Client>
-void TRTClient<Client>::getResults(const std::unique_ptr<nic::InferContext::Result> &result)
-{
+void TRTClient<Client>::getResults(const std::unique_ptr<nic::InferContext::Result>& result) {
   auto t2 = std::chrono::high_resolution_clock::now();
-  this->output_.resize(noutput_ * batchSize_, 0.f);
-  for (unsigned i0 = 0; i0 < batchSize_; i0++)
-  {
+  this->output_.resize(noutput_*batchSize_, 0.f);
+  for (unsigned i0 = 0; i0 < batchSize_; i0++) {
     const uint8_t *r0;
     size_t content_byte_size;
     result->GetRaw(i0, &r0, &content_byte_size);
-    const float *lVal = reinterpret_cast<const float *>(r0);
-    for (unsigned i1 = 0; i1 < noutput_; i1++)
-      this->output_[i0 * noutput_ + i1] = lVal[i1]; // This should be replaced with a memcpy
+    const float *lVal = reinterpret_cast<const float *>(r0);
+    for (unsigned i1 = 0; i1 < noutput_; i1++) this->output_[i0*noutput_+i1] = lVal[i1]; // This should be replaced with a memcpy
   }
   auto t3 = std::chrono::high_resolution_clock::now();
-  edm::LogInfo("TRTClient") << "Output time: " << std::chrono::duration_cast<std::chrono::microseconds>(t3 - t2).count();
+  edm::LogInfo("TRTClient") << "Output time: " << std::chrono::duration_cast<std::chrono::microseconds>(t3-t2).count();
 }
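As the in-line comment says, the element-wise copy could become a single memcpy per batch entry. A minimal sketch of the loop body, assuming the server returns exactly noutput_ floats per entry (needs #include <cstring>):

// sketch only: bulk copy replacing the per-element loop above,
// assuming content_byte_size == noutput_ * sizeof(float)
result->GetRaw(i0, &r0, &content_byte_size);
std::memcpy(&this->output_[i0 * noutput_], r0, noutput_ * sizeof(float));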
 
 template <typename Client>
-void TRTClient<Client>::predictImpl()
-{
+void TRTClient<Client>::predictImpl() {
   // common operations first
   setup();
 
@@ -91,7 +80,7 @@ void TRTClient<Client>::predictImpl()
   std::map<std::string, std::unique_ptr<nic::InferContext::Result>> results;
   nic::Error err = context_->Run(&results);
   if (!err.IsOk()) {
-    std::cout << "Could not read the result" << ": " << err << std::endl;
+    edm::LogWarning("TRTClient") << "Could not read the result" << ": " << err;
     this->output_.resize(noutput_ * batchSize_, 0.f);
   } else {
     auto t3 = std::chrono::high_resolution_clock::now();
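Note: when the output result is consumed, looking it up by output name is more explicit than relying on map order. A sketch, assuming a single output was registered in setup() and that the tensorrt-inference-server client's Output::Name() accessor is available:

// sketch only: fetch the result by output name rather than map order
const auto& oname = context_->Outputs()[0]->Name();
auto rit = results.find(oname);
if (rit != results.end()) this->getResults(rit->second);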
@@ -102,28 +91,21 @@ void TRTClient<Client>::predictImpl()
 
 // specialization for true async
 template <>
-void TRTClientAsync::predictImpl()
-{
+void TRTClientAsync::predictImpl() {
   // common operations first
-  try
-  {
+  try {
     setup();
   }
-  catch (...)
-  {
+  catch (...) {
     finish(std::current_exception());
     return;
   }
 
   // non-blocking call
 
-  // Get the status of the server prior to the request being made.
-  // std::map<std::string, ni::ModelStatus> start_status;
-  // GetServerSideStatus(&start_status);
-
   auto t2 = std::chrono::high_resolution_clock::now();
   nic::Error erro0 = context_->AsyncRun(
-    [t2, this](nic::InferContext *ctx, const std::shared_ptr<nic::InferContext::Request> &request) {
+    [t2,this](nic::InferContext* ctx, const std::shared_ptr<nic::InferContext::Request>& request) {
       // get results
       std::map<std::string, std::unique_ptr<nic::InferContext::Result>> results;
       // this function interface will change in the next tensorrtis version
@@ -142,16 +124,17 @@ void TRTClientAsync::predictImpl()
 
       edm::LogInfo("TRTClient") << "Remote time: " << std::chrono::duration_cast<std::chrono::microseconds>(t3 - t2).count();
 
-      // check result
-      this->getResults(results.begin()->second);
-
       // ServerSideStats stats;
       // SummarizeServerStats(std::make_pair(modelName_, -1), start_status, end_status, &stats);
       // ReportServerSideState(stats);
+
+      // check result
+      this->getResults(results.begin()->second);
       }
       // finish
       this->finish();
-    });
+    }
+  );
 }
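Note: the AsyncRun status erro0 is not checked anywhere in the code shown. A minimal sketch of reporting a failed submission, mirroring the synchronous Run() handling above (since the callback may never fire if submission fails):

// sketch only: surface a failed async submission the same way as a
// failed synchronous Run()
if (!erro0.IsOk()) {
  edm::LogWarning("TRTClient") << "Could not submit async request: " << erro0;
  this->finish();
}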
 
 template <typename Client>
@@ -162,7 +145,7 @@ TRTClient<Client>::ReportServerSideState(const ServerSideStats& stats)
   const uint64_t cnt = stats.request_count;
   if (cnt == 0)
   {
-    std::cout << "Request count: " << cnt << std::endl;
+    edm::LogInfo("TRTClient") << "Request count: " << cnt;
     return;
   }
 
@@ -178,13 +161,12 @@ TRTClient<Client>::ReportServerSideState(const ServerSideStats& stats)
   const uint64_t overhead = (cumm_avg_us > queue_avg_us + compute_avg_us)
                               ? (cumm_avg_us - queue_avg_us - compute_avg_us)
                               : 0;
-  std::cout << "Request count: " << cnt << std::endl
+  edm::LogInfo("TRTClient") << "Request count: " << cnt << std::endl
             << "Avg request latency: " << cumm_avg_us << " usec";
 
-  std::cout << "(overhead " << overhead << " usec + "
+  edm::LogInfo("TRTClient") << "(overhead " << overhead << " usec + "
             << "queue " << queue_avg_us << " usec + "
-            << "compute " << compute_avg_us << " usec)" << std::endl
-            << std::endl;
+            << "compute " << compute_avg_us << " usec)" << std::endl;
 }
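Note: each edm::LogInfo statement emits its own log record, so this summary is split across two records. A sketch of a single-record variant, using "\n" rather than std::endl (which carries stream-flush semantics):

// sketch only: one LogInfo call keeps the whole summary in a single record
edm::LogInfo("TRTClient") << "Request count: " << cnt
                          << "\nAvg request latency: " << cumm_avg_us << " usec"
                          << "\n(overhead " << overhead << " usec + "
                          << "queue " << queue_avg_us << " usec + "
                          << "compute " << compute_avg_us << " usec)";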
 
 template <typename Client>
@@ -199,24 +181,6 @@ TRTClient<Client>::SummarizeServerStats(
     model_info.first, model_info.second,
     start_status.find(model_info.first)->second,
     end_status.find(model_info.first)->second, server_stats);
-
-  // // Summarize the composing models, if any.
-  // for (const auto& composing_model_info : composing_models_map_[model_info]) {
-  //   auto it = server_stats->composing_models_stat
-  //                 .emplace(composing_model_info, ServerSideStats())
-  //                 .first;
-  //   if (composing_models_map_.find(composing_model_info) !=
-  //       composing_models_map_.end()) {
-  //     RETURN_IF_ERROR(SummarizeServerStats(
-  //         composing_model_info, start_status, end_status, &(it->second)));
-  //   } else {
-  //     RETURN_IF_ERROR(SummarizeServerModelStats(
-  //         composing_model_info.first, composing_model_info.second,
-  //         start_status.find(composing_model_info.first)->second,
-  //         end_status.find(composing_model_info.first)->second, &(it->second)));
-  //   }
-
-  // return nic::Error::Success;
 }
 
 template <typename Client>
@@ -302,25 +266,6 @@ TRTClient<Client>::GetServerSideStatus(
   } else {
     model_status->emplace(model_info.first, itr->second);
   }
-
-  // // Also get status for composing models if any
-  // for (const auto& composing_model_info : composing_models_map_[model_info]) {
-  //   if (composing_models_map_.find(composing_model_info) !=
-  //       composing_models_map_.end()) {
-  //     GetServerSideStatus(
-  //         server_status, composing_model_info, model_status);
-  //   } else {
-  //     const auto& itr =
-  //         server_status.model_status().find(composing_model_info.first);
-  //     if (itr == server_status.model_status().end()) {
-  //       return nic::Error(
-  //           ni::RequestStatusCode::INTERNAL,
-  //           "unable to find status for composing model" +
-  //               composing_model_info.first);
-  //     } else {
-  //       model_status->emplace(composing_model_info.first, itr->second);
-  //     }
-  //   }
 }
 
 // explicit template instantiations