Skip to content

Commit 9a88d19

Browse files
violatingcp authored and kpedro88 committed
small fix to get to large batch
1 parent 9145f09 commit 9a88d19

File tree

2 files changed

+6
-4
lines changed

2 files changed

+6
-4
lines changed

TensorRT/python/HcalTest_mc_cfg_fpga.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -14,7 +14,7 @@
1414
options.register("params", "", VarParsing.multiplicity.singleton, VarParsing.varType.string)
1515
options.register("threads", 1, VarParsing.multiplicity.singleton, VarParsing.varType.int)
1616
options.register("streams", 1, VarParsing.multiplicity.singleton, VarParsing.varType.int)
17-
options.register("batchsize", 15000, VarParsing.multiplicity.singleton, VarParsing.varType.int)
17+
options.register("batchsize", 16000, VarParsing.multiplicity.singleton, VarParsing.varType.int)
1818
options.register("modelname","facile", VarParsing.multiplicity.singleton, VarParsing.varType.string)
1919
options.register("mode", "Async", VarParsing.multiplicity.singleton, VarParsing.varType.string)
2020
options.parseArguments()

TensorRT/src/TRTClientFPGA.cc

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -33,7 +33,7 @@ void TRTClientFPGA<Client>::setup() {
3333
std::unique_ptr<nic::InferContext::Options> options;
3434
nic::InferContext::Options::Create(&options);
3535

36-
options->SetBatchSize(batchSize_);
36+
//options->SetBatchSize(batchSize_);
3737
for (const auto& output : context_->Outputs()) {
3838
options->AddRawResult(output);
3939
}
@@ -46,7 +46,8 @@ void TRTClientFPGA<Client>::setup() {
4646

4747
auto t2 = std::chrono::high_resolution_clock::now();
4848
for(unsigned i0 = 0; i0 < batchSize_; i0++) {
49-
nic::Error err1 = nicinput_->SetRaw(reinterpret_cast<const uint8_t*>(&(this->input_[i0*ninput_])), ninput_ * sizeof(unsigned short));
49+
nic::Error err1 = nicinput_->SetRaw(reinterpret_cast<const uint8_t*>(&(this->input_[i0*ninput_])), ninput_ * sizeof(unsigned short));
50+
//nic::Error err1 = nicinput_->SetRaw(reinterpret_cast<const uint8_t*>(this->input_.data()), ninput_ * sizeof(unsigned short));
5051
}
5152
//nic::Error err1 = nicinput_->SetRaw(reinterpret_cast<const uint8_t*>(this->input_.data()), batchSize_*ninput_ * sizeof(unsigned short));
5253
auto t3 = std::chrono::high_resolution_clock::now();
@@ -56,7 +57,8 @@ void TRTClientFPGA<Client>::setup() {
5657
template <typename Client>
5758
void TRTClientFPGA<Client>::getResults(const std::unique_ptr<nic::InferContext::Result>& result) {
5859
auto t2 = std::chrono::high_resolution_clock::now();
59-
this->output_.resize(noutput_*batchSize_,0.f);
60+
unsigned short tmp=0;
61+
this->output_.resize(noutput_*batchSize_,tmp);
6062
//for(unsigned i0 = 0; i0 < batchSize_; i0++) {
6163
const uint8_t* r0;
6264
size_t content_byte_size;

0 commit comments

Comments
 (0)