1 file changed: +3 -6 lines changed
Original file line number | Diff line number | Diff line change
@@ -485,6 +485,9 @@ RequestExecutor::Infer(
485485 reinterpret_cast <void *>(infer_payload->ResponseAllocUserp ().get ()),
486486 InferResponseComplete, reinterpret_cast <void *>(infer_payload.get ())));
487487
488+ THROW_IF_TRITON_ERROR (
489+ TRITONSERVER_ServerInferAsync (server_, irequest, trace));
490+
488491 {
489492 std::lock_guard<std::mutex> lk (on_going_request_addresses_mu_);
490493 on_going_request_addresses_.insert (
@@ -493,15 +496,9 @@ RequestExecutor::Infer(
493496 // Store the inference request address submitted to the Triton server for
494497 // retrieval
495498 infer_payload->SetRequestAddress (reinterpret_cast <intptr_t >(irequest));
496-
497- THROW_IF_TRITON_ERROR (
498- TRITONSERVER_ServerInferAsync (server_, irequest, trace));
499499 }
500500 }
501501 catch (const PythonBackendException& pb_exception) {
502- EraseRequestAddress (reinterpret_cast <intptr_t >(irequest));
503- infer_payload->SetRequestAddress (0L );
504-
505502 LOG_IF_ERROR (
506503 TRITONSERVER_InferenceRequestDelete (irequest),
507504 " Failed to delete inference request." );
You can’t perform that action at this time.
0 commit comments