@@ -178,7 +178,7 @@ class DaliModelInstance : public ::triton::backend::BackendModelInstance {
178178 }
179179
180180 void Execute (const std::vector<TritonRequest>& requests) {
181- DeviceGuard dg (DetermineDeviceId ());
181+ DeviceGuard dg (GetDaliDeviceId ());
182182 int total_batch_size = 0 ;
183183 TimeInterval batch_compute_interval{};
184184 TimeInterval batch_exec_interval{};
@@ -215,7 +215,7 @@ class DaliModelInstance : public ::triton::backend::BackendModelInstance {
215215 auto serialized_pipeline = dali_model_->GetModelProvider ().GetModel ();
216216 auto max_batch_size = dali_model_->MaxBatchSize ();
217217 auto num_threads = dali_model_->GetModelParamters ().GetNumThreads ();
218- DaliPipeline pipeline (serialized_pipeline, max_batch_size, num_threads, DetermineDeviceId ());
218+ DaliPipeline pipeline (serialized_pipeline, max_batch_size, num_threads, GetDaliDeviceId ());
219219 dali_executor_ = std::make_unique<DaliExecutor>(std::move (pipeline));
220220 }
221221
@@ -261,15 +261,15 @@ class DaliModelInstance : public ::triton::backend::BackendModelInstance {
261261 std::vector<IBufferDescr> buffers;
262262 buffers.reserve (input_buffer_count);
263263 for (uint32_t buffer_idx = 0 ; buffer_idx < input_buffer_count; ++buffer_idx) {
264- auto buffer = input.GetBuffer (buffer_idx, device_type_t ::CPU, DetermineDeviceId ());
264+ auto buffer = input.GetBuffer (buffer_idx, device_type_t ::CPU, GetDaliDeviceId ());
265265 buffers.push_back (buffer);
266266 }
267267 ret.push_back ({input.Meta (), std::move (buffers)});
268268 }
269269 return ret;
270270 }
271271
272- int32_t DetermineDeviceId () {
272+ int32_t GetDaliDeviceId () {
// Selects the device id handed to DALI-facing calls in this class.
// Yields ::dali::CPU_ONLY_DEVICE_ID when CudaStream() evaluates to false,
// and device_id_ otherwise.
// NOTE(review): presumably a null CUDA stream means this instance is CPU-only — confirm.
273273 return !CudaStream () ? ::dali::CPU_ONLY_DEVICE_ID : device_id_;
274274 }
275275
@@ -296,7 +296,7 @@ class DaliModelInstance : public ::triton::backend::BackendModelInstance {
296296 out_meta.type = outputs_info[output_idx].type ;
297297 out_meta.shape = outputs_info[output_idx].shape ;
298298 auto output = response.GetOutput (out_meta);
299- auto buffer = output.AllocateBuffer (outputs_info[output_idx].device , DetermineDeviceId ());
299+ auto buffer = output.AllocateBuffer (outputs_info[output_idx].device , GetDaliDeviceId ());
300300 outputs[output_idx] = {out_meta, {buffer}};
301301 }
302302 return outputs;
0 commit comments