Skip to content

Commit c9ec96c

Browse files
committed
clean up rebase: fix ne error in half2
1 parent 74d9aea commit c9ec96c

File tree

1 file changed

+1
-10
lines changed

1 file changed

+1
-10
lines changed

ggml/src/ggml-cuda/mma.cuh

Lines changed: 1 addition & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -290,11 +290,8 @@ namespace ggml_cuda_mma {
290 290
}
291 291
}
292 292
#elif defined(AMD_WMMA_AVAILABLE)
293-
#if defined(RDNA3)
294-
static constexpr int ne = (I == 16 && J == 16) ? I * J / 32 : I * J / 16;
295-
#else
293+
296 294
static constexpr int ne = I * J / 32;
297-
#endif // defined(RDNA3)
298 295
half2 x[ne] = {{0.0f, 0.0f}};
299 296

300 297
static constexpr __device__ bool supported() {
@@ -371,12 +368,6 @@ namespace ggml_cuda_mma {
371 368
static constexpr data_layout dl = DATA_LAYOUT_I_MAJOR;
372 369
static constexpr int ne = I * J / WARP_SIZE;
373 370

374-
#if defined(AMD_WMMA_AVAILABLE)
375-
#if defined(RDNA3)
376-
static constexpr int ne = (I == 16 && J == 16) ? I * J / 32 : I * J / 16;
377-
#else
378-
static constexpr int ne = I * J / 32;
379-
#endif // defined(RDNA3)
380 371
nv_bfloat162 x[ne] = {{0.0f, 0.0f}};
381 372

382 373
#if defined(AMD_WMMA_AVAILABLE)

0 commit comments

Comments
 (0)