Test CUDA conv2D type conversion fix

qnixsynapse · qnixsynapse · commit fa3d9d307882 · 2025-08-31T09:16:37.000+05:30
diff --git a/.github/workflows/menlo-build.yml b/.github/workflows/menlo-build.yml
@@ -56,7 +56,6 @@ jobs:
 
   build-and-test:
     runs-on: ${{ matrix.runs-on }}
-    needs: [create-draft-release]
     timeout-minutes: 270
     strategy:
       fail-fast: false
@@ -285,7 +284,7 @@ jobs:
         uses: actions/checkout@v3
         with:
           submodules: recursive
-      
+
       - name: Replace our Makefile
         run: |
           cat menlo/Makefile | tee Makefile
@@ -635,4 +634,4 @@ jobs:
           upload_url: ${{ needs.create-draft-release.outputs.upload_url }}
           asset_path: /tmp/cudart-llama-bin-win-cu11.7-x64.tar.gz
           asset_name: cudart-llama-bin-win-cu11.7-x64.tar.gz
-          asset_content_type: application/gzip
+          asset_content_type: application/gzip
diff --git a/ggml/src/ggml-cuda/conv2d.cu b/ggml/src/ggml-cuda/conv2d.cu
@@ -17,6 +17,15 @@ struct kernel_bounds {
     int64_t x_min, x_max;
 };
 
+template<typename T>
+__device__ __forceinline__ float to_float(const T& val) {  // Returns val as a float
+    if constexpr (std::is_same_v<T, __half>) {  // branch is selected at compile time from T
+        return __half2float(val);
+    } else {
+        return val;  // Not __half: implicit conversion to float (written assuming T is float)
+    }
+}
+
 __device__ __forceinline__ int64_t max64(int64_t a, int64_t b) {
     return (a > b) ? a : b;
 }
@@ -94,8 +103,8 @@ static __global__ void conv2d_kernel(const float * __restrict__ input,
                 const int64_t in_x = calculate_input_coord(out_x, kx, P.ST_X, P.DL_X, P.PD_X);
 
                 const float input_val = input[Layout::input_index(n, c_in, in_y, in_x, P)];
-                const float kernel_val = kernel[Layout::kernel_index(c_out, c_in, ky, kx, P)];
-                acc += (input_val * kernel_val);
+                const T kernel_val = kernel[Layout::kernel_index(c_out, c_in, ky, kx, P)];
+                acc += (input_val * to_float(kernel_val));
             }
         }
     }

Original file line number	Diff line number	Diff line change
`@@ -17,6 +17,15 @@ struct kernel_bounds {`
`17`	`17`	`int64_t x_min, x_max;`
`18`	`18`	`};`
`19`	`19`
	`20`	`+template<typename T>`
	`21`	`+__device__ __forceinline__ float to_float(const T& val) {`
	`22`	`+ if constexpr (std::is_same_v<T, __half>) {`
	`23`	`+ return __half2float(val);`
	`24`	`+ } else {`
	`25`	`+ return val; // Not __half: implicit conversion to float (written assuming T is float)`
	`26`	`+ }`
	`27`	`+}`
	`28`	`+`
`20`	`29`	`__device__ __forceinline__ int64_t max64(int64_t a, int64_t b) {`
`21`	`30`	`return (a > b) ? a : b;`
`22`	`31`	`}`
`@@ -94,8 +103,8 @@ static __global__ void conv2d_kernel(const float * __restrict__ input,`
`94`	`103`	`const int64_t in_x = calculate_input_coord(out_x, kx, P.ST_X, P.DL_X, P.PD_X);`
`95`	`104`
`96`	`105`	`const float input_val = input[Layout::input_index(n, c_in, in_y, in_x, P)];`
`97`		`- const float kernel_val = kernel[Layout::kernel_index(c_out, c_in, ky, kx, P)];`
`98`		`- acc += (input_val * kernel_val);`
	`106`	`+ const T kernel_val = kernel[Layout::kernel_index(c_out, c_in, ky, kx, P)];`
	`107`	`+ acc += (input_val * to_float(kernel_val));`
`99`	`108`	`}`
`100`	`109`	`}`
`101`	`110`	`}`