Skip to content

Commit 2028ab2

Browse files
Tabrizian authored and mikeiovine committed
[https://nvbugs/5601682][fix] Fix cacheTransceiver hang (NVIDIA#9311)
Signed-off-by: Iman Tabrizian <10105175+tabrizian@users.noreply.github.com>
Signed-off-by: Mike Iovine <6158008+mikeiovine@users.noreply.github.com>
Signed-off-by: Mike Iovine <miovine@nvidia.com>
1 parent 31ab367 commit 2028ab2

File tree

2 files changed

+8
-4
lines changed

2 files changed

+8
-4
lines changed

cpp/tensorrt_llm/nanobind/batch_manager/cacheTransceiver.cpp

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -88,8 +88,10 @@ void tb::CacheTransceiverBindings::initBindings(nb::module_& m)
8888
.def("respond_and_send_async", &BaseCacheTransceiver::respondAndSendAsync)
8989
.def("request_and_receive_sync", &BaseCacheTransceiver::requestAndReceiveSync)
9090
.def("request_and_receive_async", &BaseCacheTransceiver::requestAndReceiveAsync)
91-
.def("check_context_transfer_status", &BaseCacheTransceiver::checkContextTransferStatus)
92-
.def("check_gen_transfer_status", &BaseCacheTransceiver::checkGenTransferStatus)
91+
.def("check_context_transfer_status", &BaseCacheTransceiver::checkContextTransferStatus,
92+
nb::call_guard<nb::gil_scoped_release>())
93+
.def("check_gen_transfer_status", &BaseCacheTransceiver::checkGenTransferStatus,
94+
nb::call_guard<nb::gil_scoped_release>())
9395
.def("check_gen_transfer_complete", &BaseCacheTransceiver::checkGenTransferComplete)
9496
.def("cancel_request", &BaseCacheTransceiver::cancelRequest);
9597

cpp/tensorrt_llm/pybind/batch_manager/cacheTransceiver.cpp

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -84,8 +84,10 @@ void tb::CacheTransceiverBindings::initBindings(py::module_& m)
8484
.def("respond_and_send_async", &BaseCacheTransceiver::respondAndSendAsync)
8585
.def("request_and_receive_sync", &BaseCacheTransceiver::requestAndReceiveSync)
8686
.def("request_and_receive_async", &BaseCacheTransceiver::requestAndReceiveAsync)
87-
.def("check_context_transfer_status", &BaseCacheTransceiver::checkContextTransferStatus)
88-
.def("check_gen_transfer_status", &BaseCacheTransceiver::checkGenTransferStatus)
87+
.def("check_context_transfer_status", &BaseCacheTransceiver::checkContextTransferStatus,
88+
py::call_guard<py::gil_scoped_release>())
89+
.def("check_gen_transfer_status", &BaseCacheTransceiver::checkGenTransferStatus,
90+
py::call_guard<py::gil_scoped_release>())
8991
.def("check_gen_transfer_complete", &BaseCacheTransceiver::checkGenTransferComplete)
9092
.def("cancel_request", &BaseCacheTransceiver::cancelRequest);
9193

0 commit comments

Comments
 (0)