[Easy][Building] Fix the warning of int4mm.cu when building (pytorch#151427)

FFFrog · pytorchmergebot · commit 49c91b4be99e · 2025-04-17T08:21:32.000Z
As the title states.

**Before this change:**

```C++
[999/1526] Building CUDA object caffe2/CMakeFiles/torch_cuda.dir/__/aten/src/ATen/native/cuda/int4mm.cu.o
/root/Git.d/pytorch/pytorch/aten/src/ATen/native/cuda/int4mm.cu(142): warning #177-D: variable "at::native::kWarpSize" was declared but never referenced
  constexpr int32_t kWarpSize = 32;
                    ^

Remark: The warnings can be suppressed with "-diag-suppress <warning-number>"
```

Pull Request resolved: pytorch#151427
Approved by: https://github.com/Skylion007, https://github.com/malfet
diff --git a/aten/src/ATen/native/cuda/int4mm.cu b/aten/src/ATen/native/cuda/int4mm.cu
@@ -127,6 +127,14 @@ inline __host__ __device__ uint32_t getAlignmentRoundUp(const void* p) {
   return diff == 0 ? 0 : uint32_t(Align) - diff;
 }
 
+#if defined (__gfx90a__) || defined(__gfx942__)
+#define CDNA2_OR_LATER 1
+#else
+#define CDNA2_OR_LATER 0
+#endif
+
+#if (defined(USE_ROCM) && ROCM_VERSION >= 50700) || ((defined(CUDA_VERSION) && CUDA_VERSION >= 12000) && (!defined(__CUDA_ARCH__) || (__CUDA_ARCH__ >= 800)))
+
 #if defined(USE_ROCM)
 // TODO: Support RDNA
 constexpr int32_t kWarpSize = 64;
@@ -142,14 +150,6 @@ static bool isCDNA2orLater(int index) {
 constexpr int32_t kWarpSize = 32;
 #endif
 
-#if defined (__gfx90a__) || defined(__gfx942__)
-#define CDNA2_OR_LATER 1
-#else
-#define CDNA2_OR_LATER 0
-#endif
-
-#if (defined(USE_ROCM) && ROCM_VERSION >= 50700) || ((defined(CUDA_VERSION) && CUDA_VERSION >= 12000) && (!defined(__CUDA_ARCH__) || (__CUDA_ARCH__ >= 800)))
-
 // f16 vector types
 struct __align__(2) f16x1 {
   __half vals[1];