Skip to content

Commit 3829ae7

Browse files
committed
attempt to debug
1 parent 6529326 commit 3829ae7

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

ggml/src/ggml-cuda/fattn-mma-f16.cuh

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1243,10 +1243,11 @@ static __global__ void flash_attn_ext_f16(
1243 1243
}
1244 1244
#if __CUDA_ARCH__ == GGML_CUDA_CC_TURING
1245 1245
if (ncols1*ncols2 > 32) {
1246 +
printf("\nCUDA_ARCH:%d, DKQ:%d, DV:%d, ncols1:%d, ncols2:%d, nwarps:%d, ntiles:%d, ne00:%d, ne01:%d\n",__CUDA_ARCH__,DKQ, DV, ncols1, ncols2, nwarps, ntiles,ne00,ne01);
1246 1247
NO_DEVICE_CODE;
1247 1248
return;
1248 1249
}
1249 -
#endif __CUDA_ARCH__ == GGML_CUDA_CC_TURING
1250 +
#endif // __CUDA_ARCH__ == GGML_CUDA_CC_TURING
1250 1251

1251 1252
static_assert(!mla || DKQ >= DV, "MLA needs DKQ >= DV");
1252 1253

0 commit comments

Comments
 (0)