diff --git a/csrc/kernels.hip b/csrc/kernels.hip
index 6c9c8a5bd..383685888 100644
--- a/csrc/kernels.hip
+++ b/csrc/kernels.hip
@@ -2853,10 +2853,10 @@ template __global__ void kspmm_coo_very_sparse_naive(int *max_count, int *max_idx, int *offset_rowidx, int *rowidx, int *colidx, half *values, T *B, half *out, float * __restrict__ const dequant_stats, int nnz, int rowsA, int rowsB, int colsB)
diff --git a/csrc/ops.hip b/csrc/ops.hip
index 17d350951..3cf36b87c 100644
--- a/csrc/ops.hip
+++ b/csrc/ops.hip
@@ -20,10 +20,10 @@
 
 #define ERR_NOT_IMPLEMENTED 100
 
-#if defined(__GFX9__)
- #define WARP_SIZE 64
+#ifdef __AMDGCN_WAVEFRONT_SIZE
+ #define WARP_SIZE __AMDGCN_WAVEFRONT_SIZE
 #else
- #define WARP_SIZE 32
+ #define WARP_SIZE 64
 #endif
 
 using namespace BinSearch;