Skip to content

Commit 660dcae

Browse files
committed
Added cuda-sandbox
1 parent cb5e09a commit 660dcae

File tree

5 files changed

+92
-49
lines changed

5 files changed

+92
-49
lines changed

check/TestPdlp.cpp

Lines changed: 47 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -6,6 +6,12 @@
66
#include "SpecialLps.h"
77
#include "catch.hpp"
88

9+
#ifdef CUPDLP_GPU
10+
#include <cublas_v2.h>
11+
#include <cuda_runtime.h>
12+
#include <cusparse.h>
13+
#endif
14+
915
const bool dev_run = false;
1016
const double double_equal_tolerance = 1e-3;
1117
const double kkt_tolerance = 1e-4;
@@ -419,5 +425,46 @@ TEST_CASE("hi-pdlp-timer", "[pdlp]") {
419425
kPdlpAdaptiveStepSizeOff;
420426
h.setOptionValue("pdlp_features_off", pdlp_features_off);
421427
HighsStatus run_status = h.run();
428+
422429
h.resetGlobalScheduler(true);
423430
}
431+
432+
#ifdef CUPDLP_GPU
// Sanity-check the CUDA / cuSPARSE runtime: verify at least one device is
// present, optionally print each device's properties, and report the CUDA
// runtime, CUDA driver and cuSPARSE versions. Output is gated on dev_run to
// match the convention used by the other tests in this file.
TEST_CASE("cuda-sandbox", "[pdlp]") {
  if (dev_run) printf("Hello World - cuda-sandbox\n");
  cusparseHandle_t cusparsehandle;
  // Check the creation status so a broken CUDA install fails the test rather
  // than silently handing garbage handles to later calls.
  REQUIRE(cusparseCreate(&cusparsehandle) == CUSPARSE_STATUS_SUCCESS);
  int v_cuda_runtime = 0;
  int v_cuda_driver = 0;
  int v_cusparse = 0;
  int n_devices = 0;
  REQUIRE(cudaGetDeviceCount(&n_devices) == cudaSuccess);
  // At least one device must exist. The previous assert(n_devices == 1)
  // failed spuriously on multi-GPU machines and was compiled out under
  // NDEBUG; REQUIRE is always active and reports through Catch.
  REQUIRE(n_devices >= 1);
  // Report every detected device, not just device 0.
  for (int device = 0; device < n_devices; device++) {
    cudaDeviceProp prop;
    REQUIRE(cudaGetDeviceProperties(&prop, device) == cudaSuccess);
    if (!dev_run) continue;
    printf("Cuda device %d: %s\n", device, prop.name);
    printf("  Clock rate (KHz): %d\n", prop.clockRate);
    printf("  Memory clock rate (KHz): %d\n", prop.memoryClockRate);
    printf("  Memory bus width (bits): %d\n", prop.memoryBusWidth);
    printf("  Peak memory bandwidth (GB/s): %f\n",
           2.0 * prop.memoryClockRate * (prop.memoryBusWidth / 8) / 1.0e6);
    printf("  Global memory available on device (GB): %f\n",
           prop.totalGlobalMem / 1.0e9);
    printf("  Shared memory available per block (B): %zu\n",
           prop.sharedMemPerBlock);
    printf("  Warp size in threads: %d\n", prop.warpSize);
    printf("  Maximum number of threads per block: %d\n",
           prop.maxThreadsPerBlock);
    printf("  Compute capability: %d.%d\n", prop.major, prop.minor);
    printf("  Number of multiprocessors on device: %d\n",
           prop.multiProcessorCount);
  }

  REQUIRE(cudaRuntimeGetVersion(&v_cuda_runtime) == cudaSuccess);
  REQUIRE(cudaDriverGetVersion(&v_cuda_driver) == cudaSuccess);

  REQUIRE(cusparseGetVersion(cusparsehandle, &v_cusparse) ==
          CUSPARSE_STATUS_SUCCESS);
  if (dev_run) {
    printf("Cuda runtime version %d\n", v_cuda_runtime);
    printf("Cuda driver version %d\n", v_cuda_driver);
    printf("cuSparse version %d\n", v_cusparse);
  }
  // Release the cuSPARSE handle: the original leaked it.
  REQUIRE(cusparseDestroy(cusparsehandle) == CUSPARSE_STATUS_SUCCESS);
}
#endif

highs/pdlp/hipdlp/linalg.cc

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -214,7 +214,7 @@ std::vector<double> compute_row_norms(const HighsLp& lp, double p) {
214214
}
215215

216216
std::vector<double> vector_subtrac(const std::vector<double>& a,
217-
const std::vector<double>& b) {
217+
const std::vector<double>& b) {
218218
if (a.size() != b.size()) {
219219
throw std::invalid_argument(
220220
"Vectors must be of the same size for subtraction.");

highs/pdlp/hipdlp/linalg.hpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -54,7 +54,7 @@ std::vector<double> compute_row_norms(
5454
const HighsLp& lp, double p = std::numeric_limits<double>::infinity());
5555

5656
std::vector<double> vector_subtrac(const std::vector<double>& a,
57-
const std::vector<double>& b);
57+
const std::vector<double>& b);
5858

5959
} // namespace linalg
6060

highs/pdlp/hipdlp/pdhg.cc

Lines changed: 28 additions & 33 deletions
Original file line numberDiff line numberDiff line change
@@ -442,19 +442,19 @@ PostSolveRetcode PDLPSolver::postprocess(HighsSolution& solution) {
442442

443443
// Compute Ax using only the original columns (not slack variables)
444444
for (int col = 0; col < original_num_col_; ++col) {
445-
double x_val = x_current_[col]; // Use unscaled x values
446-
447-
for (int el = orig_matrix.start_[col];
448-
el < orig_matrix.start_[col + 1]; ++el) {
449-
int row = orig_matrix.index_[el];
450-
double a_val = orig_matrix.value_[el];
451-
ax_original[row] += a_val * x_val;
452-
}
445+
double x_val = x_current_[col]; // Use unscaled x values
446+
447+
for (int el = orig_matrix.start_[col]; el < orig_matrix.start_[col + 1];
448+
++el) {
449+
int row = orig_matrix.index_[el];
450+
double a_val = orig_matrix.value_[el];
451+
ax_original[row] += a_val * x_val;
452+
}
453453
}
454454

455455
// Now ax_original contains the correct row activity values
456456
for (int orig_row = 0; orig_row < original_lp_->num_row_; ++orig_row) {
457-
solution.row_value[orig_row] = ax_original[orig_row];
457+
solution.row_value[orig_row] = ax_original[orig_row];
458458
}
459459

460460
// 6. Recover Dual Column Values (Reduced Costs)
@@ -566,16 +566,14 @@ void PDLPSolver::solve(std::vector<double>& x, std::vector<double>& y) {
566566

567567
hipdlpTimerStart(kHipdlpClockConvergenceCheck);
568568
// Compute residuals for current iterate
569-
bool current_converged =
570-
checkConvergence(iter, x_current_, y_current_, Ax_cache_, ATy_cache_,
571-
params_.tolerance, current_results, "[L]",
572-
dSlackPos_, dSlackNeg_);
569+
bool current_converged = checkConvergence(
570+
iter, x_current_, y_current_, Ax_cache_, ATy_cache_,
571+
params_.tolerance, current_results, "[L]", dSlackPos_, dSlackNeg_);
573572

574573
// Compute residuals for average iterate
575-
bool average_converged =
576-
checkConvergence(iter, x_avg_, y_avg_, Ax_avg, ATy_avg,
577-
params_.tolerance, average_results, "[A]",
578-
dSlackPosAvg_, dSlackNegAvg_);
574+
bool average_converged = checkConvergence(
575+
iter, x_avg_, y_avg_, Ax_avg, ATy_avg, params_.tolerance,
576+
average_results, "[A]", dSlackPosAvg_, dSlackNegAvg_);
579577
hipdlpTimerStop(kHipdlpClockConvergenceCheck);
580578

581579
debugPdlpIterHeaderLog(debug_pdlp_log_file_);
@@ -907,14 +905,14 @@ void PDLPSolver::computeDualSlacks(const std::vector<double>& dualResidual,
907905
}
908906
}
909907

910-
double PDLPSolver::computeDualFeasibility(
911-
const std::vector<double>& ATy_vector, std::vector<double>& dSlackPos,
912-
std::vector<double>& dSlackNeg) {
908+
double PDLPSolver::computeDualFeasibility(const std::vector<double>& ATy_vector,
909+
std::vector<double>& dSlackPos,
910+
std::vector<double>& dSlackNeg) {
913911
std::vector<double> dualResidual(lp_.num_col_, 0.0);
914912
// dualResidual = c-A'y
915913
dualResidual = linalg::vector_subtrac(lp_.col_cost_, ATy_vector);
916914
double dualResidualNorm = linalg::vector_norm(dualResidual);
917-
915+
918916
// Call the refactored function to populate dSlackPos and dSlackNeg
919917
computeDualSlacks(dualResidual, dSlackPos, dSlackNeg);
920918

@@ -985,9 +983,9 @@ PDLPSolver::computeDualityGap(const std::vector<double>& x,
985983
cTx);
986984
}
987985

988-
double PDLPSolver::computeDualObjective(
989-
const std::vector<double>& y, const std::vector<double>& dSlackPos,
990-
const std::vector<double>& dSlackNeg) {
986+
double PDLPSolver::computeDualObjective(const std::vector<double>& y,
987+
const std::vector<double>& dSlackPos,
988+
const std::vector<double>& dSlackNeg) {
991989
double dual_obj = lp_.offset_;
992990

993991
// Compute b'y (or rhs'y in cuPDLP notation)
@@ -1012,15 +1010,12 @@ double PDLPSolver::computeDualObjective(
10121010
return dual_obj;
10131011
}
10141012

1015-
bool PDLPSolver::checkConvergence(const int iter, const std::vector<double>& x,
1016-
const std::vector<double>& y,
1017-
const std::vector<double>& ax_vector,
1018-
const std::vector<double>& aty_vector,
1019-
double epsilon, SolverResults& results,
1020-
const char* type,
1021-
// Add slack vectors as non-const references
1022-
std::vector<double>& dSlackPos,
1023-
std::vector<double>& dSlackNeg) {
1013+
bool PDLPSolver::checkConvergence(
1014+
const int iter, const std::vector<double>& x, const std::vector<double>& y,
1015+
const std::vector<double>& ax_vector, const std::vector<double>& aty_vector,
1016+
double epsilon, SolverResults& results, const char* type,
1017+
// Add slack vectors as non-const references
1018+
std::vector<double>& dSlackPos, std::vector<double>& dSlackNeg) {
10241019
// computeDualSlacks is now called inside computeDualFeasibility
10251020

10261021
// Compute primal feasibility

highs/pdlp/hipdlp/pdhg.hpp

Lines changed: 15 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -61,14 +61,13 @@ class PDLPSolver {
6161
void initialize();
6262
void printConstraintInfo();
6363
bool checkConvergence(const int iter, const std::vector<double>& x,
64-
const std::vector<double>& y,
65-
const std::vector<double>& ax_vector,
66-
const std::vector<double>& aty_vector,
67-
double epsilon, SolverResults& results,
68-
const char* type,
69-
// Add slack vectors as non-const references
70-
std::vector<double>& dSlackPos,
71-
std::vector<double>& dSlackNeg);
64+
const std::vector<double>& y,
65+
const std::vector<double>& ax_vector,
66+
const std::vector<double>& aty_vector, double epsilon,
67+
SolverResults& results, const char* type,
68+
// Add slack vectors as non-const references
69+
std::vector<double>& dSlackPos,
70+
std::vector<double>& dSlackNeg);
7271
void updateAverageIterates(const std::vector<double>& x,
7372
const std::vector<double>& y,
7473
const PrimalDualParams& params, int inner_iter);
@@ -100,14 +99,16 @@ class PDLPSolver {
10099
// --- Feasibility, Duality, and KKT Checks ---
101100
std::vector<double> computeLambda(const std::vector<double>& y,
102101
const std::vector<double>& ATy_vector);
103-
double computeDualObjective(const std::vector<double>& y, const std::vector<double>& dSlackPos,
104-
const std::vector<double>& dSlackNeg);
102+
double computeDualObjective(const std::vector<double>& y,
103+
const std::vector<double>& dSlackPos,
104+
const std::vector<double>& dSlackNeg);
105105
double computePrimalFeasibility(const std::vector<double>& Ax_vector);
106106
void computeDualSlacks(const std::vector<double>& dualResidual,
107-
std::vector<double>& dSlackPos,
108-
std::vector<double>& dSlackNeg);
109-
double computeDualFeasibility(const std::vector<double>& ATy_vector, std::vector<double>& dSlackPos,
110-
std::vector<double>& dSlackNeg);
107+
std::vector<double>& dSlackPos,
108+
std::vector<double>& dSlackNeg);
109+
double computeDualFeasibility(const std::vector<double>& ATy_vector,
110+
std::vector<double>& dSlackPos,
111+
std::vector<double>& dSlackNeg);
111112
std::tuple<double, double, double, double, double> computeDualityGap(
112113
const std::vector<double>& x, const std::vector<double>& y,
113114
const std::vector<double>& lambda);

0 commit comments

Comments (0)