From e0b5651d2be83bbb02cc8fdd18d9f37d2496ffa0 Mon Sep 17 00:00:00 2001 From: siwasaki Date: Mon, 11 Sep 2023 14:14:09 -0700 Subject: [PATCH 1/2] Use a relative include path in DotOpToLLVM/WGMMA.cpp --- lib/Conversion/TritonGPUToLLVM/DotOpToLLVM/WGMMA.cpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/lib/Conversion/TritonGPUToLLVM/DotOpToLLVM/WGMMA.cpp b/lib/Conversion/TritonGPUToLLVM/DotOpToLLVM/WGMMA.cpp index f03d09788c9d..9f943a615fa1 100644 --- a/lib/Conversion/TritonGPUToLLVM/DotOpToLLVM/WGMMA.cpp +++ b/lib/Conversion/TritonGPUToLLVM/DotOpToLLVM/WGMMA.cpp @@ -21,8 +21,8 @@ * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */ -#include "DotOpToLLVM.h" -#include "Utility.h" +#include "../DotOpToLLVM.h" +#include "../Utility.h" using namespace mlir; using namespace mlir::triton; From dd17f99c297590fc4d64ca3dacba0115c3eb1b80 Mon Sep 17 00:00:00 2001 From: siwasaki Date: Mon, 11 Sep 2023 14:14:37 -0700 Subject: [PATCH 2/2] [backends] Explicitly cast a void pointer type --- python/triton/runtime/backends/cuda.c | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/python/triton/runtime/backends/cuda.c b/python/triton/runtime/backends/cuda.c index 7dd60528f28f..278310473597 100644 --- a/python/triton/runtime/backends/cuda.c +++ b/python/triton/runtime/backends/cuda.c @@ -330,7 +330,7 @@ static PyObject *memFree(PyObject *self, PyObject *args) { // Helper function to convert a Python list to a cuuint64_t array static cuuint64_t *list_to_cuuint64_array(PyObject *listObj) { Py_ssize_t len = PyList_Size(listObj); - cuuint64_t *array = malloc(len * sizeof(cuuint64_t)); + cuuint64_t *array = (cuuint64_t *)malloc(len * sizeof(cuuint64_t)); for (Py_ssize_t i = 0; i < len; i++) { PyObject *item = PyList_GetItem(listObj, i); array[i] = (cuuint64_t)PyLong_AsUnsignedLongLong(item); @@ -341,7 +341,7 @@ static cuuint64_t *list_to_cuuint64_array(PyObject *listObj) { // Helper function to convert a Python list to a cuuint32_t array static cuuint32_t *list_to_cuuint32_array(PyObject *listObj) { Py_ssize_t len = PyList_Size(listObj); - cuuint32_t *array = malloc(len * sizeof(cuuint32_t)); + cuuint32_t *array = (cuuint32_t *)malloc(len * sizeof(cuuint32_t)); for (Py_ssize_t i = 0; i < len; i++) { PyObject *item = PyList_GetItem(listObj, i); array[i] = (cuuint32_t)PyLong_AsUnsignedLong(item);