NVIDIA · rgsl888prabhu · Nov 7, 2025 · Nov 7, 2025 · Nov 7, 2025 · Nov 10, 2025
@@ -25,19 +25,19 @@ namespace cython {
 // aggregate for call_solve() return type
 // to be exposed to cython:
 struct linear_programming_ret_t {
-  std::unique_ptr<rmm::device_buffer> primal_solution_;
-  std::unique_ptr<rmm::device_buffer> dual_solution_;
-  std::unique_ptr<rmm::device_buffer> reduced_cost_;
+  std::vector<double> primal_solution_;
+  std::vector<double> dual_solution_;
+  std::vector<double> reduced_cost_;
   /* -- PDLP Warm Start Data -- */
-  std::unique_ptr<rmm::device_buffer> current_primal_solution_;
-  std::unique_ptr<rmm::device_buffer> current_dual_solution_;
-  std::unique_ptr<rmm::device_buffer> initial_primal_average_;
-  std::unique_ptr<rmm::device_buffer> initial_dual_average_;
-  std::unique_ptr<rmm::device_buffer> current_ATY_;
-  std::unique_ptr<rmm::device_buffer> sum_primal_solutions_;
-  std::unique_ptr<rmm::device_buffer> sum_dual_solutions_;
-  std::unique_ptr<rmm::device_buffer> last_restart_duality_gap_primal_solution_;
-  std::unique_ptr<rmm::device_buffer> last_restart_duality_gap_dual_solution_;
+  std::vector<double> current_primal_solution_;
+  std::vector<double> current_dual_solution_;
+  std::vector<double> initial_primal_average_;
+  std::vector<double> initial_dual_average_;
+  std::vector<double> current_ATY_;
+  std::vector<double> sum_primal_solutions_;
+  std::vector<double> sum_dual_solutions_;
+  std::vector<double> last_restart_duality_gap_primal_solution_;
+  std::vector<double> last_restart_duality_gap_dual_solution_;
   double initial_primal_weight_;
   double initial_step_size_;
   int total_pdlp_iterations_;
@@ -64,7 +64,7 @@ struct linear_programming_ret_t {
 };
 
 struct mip_ret_t {
-  std::unique_ptr<rmm::device_buffer> solution_;
+  std::vector<double> solution_;
 
   linear_programming::mip_termination_status_t termination_status_;
   error_type_t error_status_;

@@ -131,28 +131,21 @@ linear_programming_ret_t call_solve_lp(
   const bool use_pdlp_solver_mode = true;
   auto solution                   = cuopt::linear_programming::solve_lp(
     op_problem, solver_settings, problem_checking, use_pdlp_solver_mode, is_batch_mode);
+
+  // Convert device vectors to host vectors for LP solution
   linear_programming_ret_t lp_ret{
-    std::make_unique<rmm::device_buffer>(solution.get_primal_solution().release()),
-    std::make_unique<rmm::device_buffer>(solution.get_dual_solution().release()),
-    std::make_unique<rmm::device_buffer>(solution.get_reduced_cost().release()),
-    std::make_unique<rmm::device_buffer>(
-      solution.get_pdlp_warm_start_data().current_primal_solution_.release()),
-    std::make_unique<rmm::device_buffer>(
-      solution.get_pdlp_warm_start_data().current_dual_solution_.release()),
-    std::make_unique<rmm::device_buffer>(
-      solution.get_pdlp_warm_start_data().initial_primal_average_.release()),
-    std::make_unique<rmm::device_buffer>(
-      solution.get_pdlp_warm_start_data().initial_dual_average_.release()),
-    std::make_unique<rmm::device_buffer>(
-      solution.get_pdlp_warm_start_data().current_ATY_.release()),
-    std::make_unique<rmm::device_buffer>(
-      solution.get_pdlp_warm_start_data().sum_primal_solutions_.release()),
-    std::make_unique<rmm::device_buffer>(
-      solution.get_pdlp_warm_start_data().sum_dual_solutions_.release()),
-    std::make_unique<rmm::device_buffer>(
-      solution.get_pdlp_warm_start_data().last_restart_duality_gap_primal_solution_.release()),
-    std::make_unique<rmm::device_buffer>(
-      solution.get_pdlp_warm_start_data().last_restart_duality_gap_dual_solution_.release()),
+    cuopt::host_copy(solution.get_primal_solution()),
+    cuopt::host_copy(solution.get_dual_solution()),
+    cuopt::host_copy(solution.get_reduced_cost()),
+    cuopt::host_copy(solution.get_pdlp_warm_start_data().current_primal_solution_),
+    cuopt::host_copy(solution.get_pdlp_warm_start_data().current_dual_solution_),
+    cuopt::host_copy(solution.get_pdlp_warm_start_data().initial_primal_average_),
+    cuopt::host_copy(solution.get_pdlp_warm_start_data().initial_dual_average_),
+    cuopt::host_copy(solution.get_pdlp_warm_start_data().current_ATY_),
+    cuopt::host_copy(solution.get_pdlp_warm_start_data().sum_primal_solutions_),
+    cuopt::host_copy(solution.get_pdlp_warm_start_data().sum_dual_solutions_),
+    cuopt::host_copy(solution.get_pdlp_warm_start_data().last_restart_duality_gap_primal_solution_),
+    cuopt::host_copy(solution.get_pdlp_warm_start_data().last_restart_duality_gap_dual_solution_),
     solution.get_pdlp_warm_start_data().initial_primal_weight_,
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().current_primal_solution_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().current_dual_solution_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().initial_primal_average_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().initial_dual_average_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().current_ATY_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().sum_primal_solutions_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().sum_dual_solutions_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().last_restart_duality_gap_primal_solution_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().last_restart_duality_gap_dual_solution_),
-    solution.get_pdlp_warm_start_data().initial_primal_weight_,
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().current_primal_solution_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().current_dual_solution_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().initial_primal_average_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().initial_dual_average_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().current_ATY_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().sum_primal_solutions_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().sum_dual_solutions_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().last_restart_duality_gap_primal_solution_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().last_restart_duality_gap_dual_solution_),
+    solution.get_pdlp_warm_start_data().initial_primal_weight_,
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().current_primal_solution_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().current_dual_solution_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().initial_primal_average_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().initial_dual_average_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().current_ATY_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().sum_primal_solutions_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().sum_dual_solutions_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().last_restart_duality_gap_primal_solution_),
-    cuopt::host_copy(solution.get_pdlp_warm_start_data().last_restart_duality_gap_dual_solution_),
-    solution.get_pdlp_warm_start_data().initial_primal_weight_,
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().current_primal_solution_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().current_dual_solution_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().initial_primal_average_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().initial_dual_average_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().current_ATY_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().sum_primal_solutions_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().sum_dual_solutions_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().last_restart_duality_gap_primal_solution_),
+    is_batch_mode ? std::vector<double>{}
+                  : cuopt::host_copy(solution.get_pdlp_warm_start_data().last_restart_duality_gap_dual_solution_),
+    solution.get_pdlp_warm_start_data().initial_primal_weight_,
     solution.get_pdlp_warm_start_data().initial_step_size_,
     solution.get_pdlp_warm_start_data().total_pdlp_iterations_,
@@ -194,7 +187,9 @@ mip_ret_t call_solve_mip(
     error_type_t::ValidationError,
     "MIP solve cannot be called on an LP problem!");
   auto solution = cuopt::linear_programming::solve_mip(op_problem, solver_settings);
-  mip_ret_t mip_ret{std::make_unique<rmm::device_buffer>(solution.get_solution().release()),
+
+  // Convert device vector to host vector for MILP solution
+  mip_ret_t mip_ret{cuopt::host_copy(solution.get_solution()),
                     solution.get_termination_status(),
                     solution.get_error_status().get_error_type(),
                     solution.get_error_status().what(),

@@ -120,19 +120,19 @@ cdef extern from "cuopt/linear_programming/pdlp/solver_solution.hpp" namespace "
 
 cdef extern from "cuopt/linear_programming/utilities/cython_solve.hpp" namespace "cuopt::cython": # noqa
     cdef cppclass linear_programming_ret_t:
-        unique_ptr[device_buffer] primal_solution_
-        unique_ptr[device_buffer] dual_solution_
-        unique_ptr[device_buffer] reduced_cost_
+        vector[double] primal_solution_
+        vector[double] dual_solution_
+        vector[double] reduced_cost_
         # PDLP warm start data
-        unique_ptr[device_buffer] current_primal_solution_
-        unique_ptr[device_buffer] current_dual_solution_
-        unique_ptr[device_buffer] initial_primal_average_
-        unique_ptr[device_buffer] initial_dual_average_
-        unique_ptr[device_buffer] current_ATY_
-        unique_ptr[device_buffer] sum_primal_solutions_
-        unique_ptr[device_buffer] sum_dual_solutions_
-        unique_ptr[device_buffer] last_restart_duality_gap_primal_solution_
-        unique_ptr[device_buffer] last_restart_duality_gap_dual_solution_
+        vector[double] current_primal_solution_
+        vector[double] current_dual_solution_
+        vector[double] initial_primal_average_
+        vector[double] initial_dual_average_
+        vector[double] current_ATY_
+        vector[double] sum_primal_solutions_
+        vector[double] sum_dual_solutions_
+        vector[double] last_restart_duality_gap_primal_solution_
+        vector[double] last_restart_duality_gap_dual_solution_
         double initial_primal_weight_
         double initial_step_size_
         int total_pdlp_iterations_
@@ -155,7 +155,7 @@ cdef extern from "cuopt/linear_programming/utilities/cython_solve.hpp" namespace
         bool solved_by_pdlp_
 
     cdef cppclass mip_ret_t:
-        unique_ptr[device_buffer] solution_
+        vector[double] solution_
         mip_termination_status_t termination_status_
         error_type_t error_status_
         string error_message_

@@ -25,7 +25,7 @@ from libcpp.string cimport string
 from libcpp.utility cimport move
 from libcpp.vector cimport vector
 
-from rmm.pylibrmm.device_buffer cimport DeviceBuffer
+# No DeviceBuffer cimport is needed: solution data now arrives from C++ as host-side vector[double]
 
 from cuopt.linear_programming.data_model.data_model cimport data_model_view_t
 from cuopt.linear_programming.data_model.data_model_wrapper cimport DataModel
@@ -46,18 +46,16 @@ import sys
 import warnings
 from enum import IntEnum
 
-import cupy as cp
 import numpy as np
 from numba import cuda
 
 import cudf
-from cudf.core.buffer import as_buffer
 
 from cuopt.linear_programming.solver_settings.solver_settings import (
     PDLPSolverMode,
     SolverSettings,
 )
-from cuopt.utilities import InputValidationError, col_from_buf
+from cuopt.utilities import InputValidationError
 
 
 cdef extern from "cuopt/linear_programming/utilities/internals.hpp" namespace "cuopt::internals": # noqa
@@ -299,9 +297,9 @@ cdef create_solution(unique_ptr[solver_ret_t] sol_ret_ptr,
     sol_ret = move(sol_ret_ptr.get()[0])
 
     if sol_ret.problem_type == ProblemCategory.MIP or sol_ret.problem_type == ProblemCategory.IP: # noqa
-        solution = DeviceBuffer.c_from_unique_ptr(
-            move(sol_ret.mip_ret.solution_)
-        )
+        # Extract and copy host solution vector from C++
+        cdef double[:] solution_view = sol_ret.mip_ret.solution_
+        solution = np.asarray(solution_view).copy()
         termination_status = sol_ret.mip_ret.termination_status_
         error_status = sol_ret.mip_ret.error_status_
         error_message = sol_ret.mip_ret.error_message_
@@ -316,11 +314,6 @@ cdef create_solution(unique_ptr[solver_ret_t] sol_ret_ptr,
         num_nodes = sol_ret.mip_ret.nodes_
         num_simplex_iterations = sol_ret.mip_ret.simplex_iterations_
 
-        solution_buf = as_buffer(solution)
-        solution = cudf.Series._from_column(
-            col_from_buf(solution_buf, np.float64)
-        ).to_numpy()
-
         return Solution(
             ProblemCategory(sol_ret.problem_type),
             dict(zip(data_model_obj.get_variable_names(), solution)),
@@ -341,25 +334,13 @@ cdef create_solution(unique_ptr[solver_ret_t] sol_ret_ptr,
         )
 
     else:
-        primal_solution = DeviceBuffer.c_from_unique_ptr(
-            move(sol_ret.lp_ret.primal_solution_)
-        )
-        dual_solution = DeviceBuffer.c_from_unique_ptr(move(sol_ret.lp_ret.dual_solution_)) # noqa
-        reduced_cost = DeviceBuffer.c_from_unique_ptr(move(sol_ret.lp_ret.reduced_cost_)) # noqa
-
-        primal_solution_buf = as_buffer(primal_solution)
-        dual_solution_buf = as_buffer(dual_solution)
-        reduced_cost_buf = as_buffer(reduced_cost)
-
-        primal_solution = cudf.Series._from_column(
-            col_from_buf(primal_solution_buf, np.float64)
-        ).to_numpy()
-        dual_solution = cudf.Series._from_column(
-            col_from_buf(dual_solution_buf, np.float64)
-        ).to_numpy()
-        reduced_cost = cudf.Series._from_column(
-            col_from_buf(reduced_cost_buf, np.float64)
-        ).to_numpy()
+        # Extract and copy host solution vectors from C++ for LP
+        cdef double[:] primal_view = sol_ret.lp_ret.primal_solution_
+        cdef double[:] dual_view = sol_ret.lp_ret.dual_solution_
+        cdef double[:] reduced_view = sol_ret.lp_ret.reduced_cost_
+        primal_solution = np.asarray(primal_view).copy()
+        dual_solution = np.asarray(dual_view).copy()
+        reduced_cost = np.asarray(reduced_view).copy()
 
         termination_status = sol_ret.lp_ret.termination_status_
         error_status = sol_ret.lp_ret.error_status_
@@ -375,33 +356,26 @@ cdef create_solution(unique_ptr[solver_ret_t] sol_ret_ptr,
 
         # In BatchSolve, we don't get the warm start data
         if not is_batch:
-            current_primal_solution = DeviceBuffer.c_from_unique_ptr(
-                move(sol_ret.lp_ret.current_primal_solution_)
-            )
-            current_dual_solution = DeviceBuffer.c_from_unique_ptr(
-                move(sol_ret.lp_ret.current_dual_solution_)
-            )
-            initial_primal_average = DeviceBuffer.c_from_unique_ptr(
-                move(sol_ret.lp_ret.initial_primal_average_)
-            )
-            initial_dual_average = DeviceBuffer.c_from_unique_ptr(
-                move(sol_ret.lp_ret.initial_dual_average_)
-            )
-            current_ATY = DeviceBuffer.c_from_unique_ptr(
-                move(sol_ret.lp_ret.current_ATY_)
-            )
-            sum_primal_solutions = DeviceBuffer.c_from_unique_ptr(
-                move(sol_ret.lp_ret.sum_primal_solutions_)
-            )
-            sum_dual_solutions = DeviceBuffer.c_from_unique_ptr(
-                move(sol_ret.lp_ret.sum_dual_solutions_)
-            )
-            last_restart_duality_gap_primal_solution = DeviceBuffer.c_from_unique_ptr( # noqa
-                move(sol_ret.lp_ret.last_restart_duality_gap_primal_solution_)
-            )
-            last_restart_duality_gap_dual_solution = DeviceBuffer.c_from_unique_ptr( # noqa
-                move(sol_ret.lp_ret.last_restart_duality_gap_dual_solution_)
-            )
+            # Extract and copy host warm start data vectors from C++
+            cdef double[:] curr_primal_view = sol_ret.lp_ret.current_primal_solution_
+            cdef double[:] curr_dual_view = sol_ret.lp_ret.current_dual_solution_
+            cdef double[:] init_primal_avg_view = sol_ret.lp_ret.initial_primal_average_
+            cdef double[:] init_dual_avg_view = sol_ret.lp_ret.initial_dual_average_
+            cdef double[:] curr_aty_view = sol_ret.lp_ret.current_ATY_
+            cdef double[:] sum_primal_view = sol_ret.lp_ret.sum_primal_solutions_
+            cdef double[:] sum_dual_view = sol_ret.lp_ret.sum_dual_solutions_
+            cdef double[:] last_restart_primal_view = sol_ret.lp_ret.last_restart_duality_gap_primal_solution_
+            cdef double[:] last_restart_dual_view = sol_ret.lp_ret.last_restart_duality_gap_dual_solution_
+
+            current_primal_solution = np.asarray(curr_primal_view).copy()
+            current_dual_solution = np.asarray(curr_dual_view).copy()
+            initial_primal_average = np.asarray(init_primal_avg_view).copy()
+            initial_dual_average = np.asarray(init_dual_avg_view).copy()
+            current_ATY = np.asarray(curr_aty_view).copy()
+            sum_primal_solutions = np.asarray(sum_primal_view).copy()
+            sum_dual_solutions = np.asarray(sum_dual_view).copy()
+            last_restart_duality_gap_primal_solution = np.asarray(last_restart_primal_view).copy()
+            last_restart_duality_gap_dual_solution = np.asarray(last_restart_dual_view).copy()
             initial_primal_weight = sol_ret.lp_ret.initial_primal_weight_
             initial_step_size = sol_ret.lp_ret.initial_step_size_
             total_pdlp_iterations = sol_ret.lp_ret.total_pdlp_iterations_
@@ -411,54 +385,6 @@ cdef create_solution(unique_ptr[solver_ret_t] sol_ret_ptr,
             sum_solution_weight = sol_ret.lp_ret.sum_solution_weight_
             iterations_since_last_restart = sol_ret.lp_ret.iterations_since_last_restart_ # noqa
 
-            current_primal_solution_buf = as_buffer(current_primal_solution)
-            current_dual_solution_buf = as_buffer(current_dual_solution)
-            initial_primal_average_buf = as_buffer(initial_primal_average)
-            initial_dual_average_buf = as_buffer(initial_dual_average)
-            current_ATY_buf = as_buffer(current_ATY)
-            sum_primal_solutions_buf = as_buffer(sum_primal_solutions)
-            sum_dual_solutions_buf = as_buffer(sum_dual_solutions)
-            last_restart_duality_gap_primal_solution_buf = as_buffer(
-                last_restart_duality_gap_primal_solution
-            )
-            last_restart_duality_gap_dual_solution_buf = as_buffer(
-                last_restart_duality_gap_dual_solution
-            )
-
-            current_primal_solution = cudf.Series._from_column(
-                col_from_buf(current_primal_solution_buf, np.float64)
-            ).to_numpy()
-            current_dual_solution = cudf.Series._from_column(
-                col_from_buf(current_dual_solution_buf, np.float64)
-            ).to_numpy()
-            initial_primal_average = cudf.Series._from_column(
-                col_from_buf(initial_primal_average_buf, np.float64)
-            ).to_numpy()
-            initial_dual_average = cudf.Series._from_column(
-                col_from_buf(initial_dual_average_buf, np.float64)
-            ).to_numpy()
-            current_ATY = cudf.Series._from_column(
-                col_from_buf(current_ATY_buf, np.float64)
-            ).to_numpy()
-            sum_primal_solutions = cudf.Series._from_column(
-                col_from_buf(sum_primal_solutions_buf, np.float64)
-            ).to_numpy()
-            sum_dual_solutions = cudf.Series._from_column(
-                col_from_buf(sum_dual_solutions_buf, np.float64)
-            ).to_numpy()
-            last_restart_duality_gap_primal_solution = cudf.Series._from_column( # noqa
-                col_from_buf(
-                    last_restart_duality_gap_primal_solution_buf,
-                    np.float64
-                )
-            ).to_numpy()
-            last_restart_duality_gap_dual_solution = cudf.Series._from_column(
-                col_from_buf(
-                    last_restart_duality_gap_dual_solution_buf,
-                    np.float64
-                )
-            ).to_numpy()
-
             return Solution(
                 ProblemCategory(sol_ret.problem_type),
                 dict(zip(data_model_obj.get_variable_names(), primal_solution)), # noqa