@@ -37,16 +37,16 @@ static __global__ void flash_attn_tile_ext_f32(
37
37
#endif // FP16_MMA_AVAILABLE
38
38
if (use_logit_softcap && !(D == 128 || D == 256 )) {
39
39
GGML_UNUSED (Q); GGML_UNUSED (K); GGML_UNUSED (V); GGML_UNUSED (mask);
40
- GGML_UNUSED (dst); GGML_UNUSED (dst_meta); GGML_UNUSED (scale);
41
- GGML_UNUSED (max_bias); GGML_UNUSED (m0); GGML_UNUSED (m1);
40
+ GGML_UNUSED (dst); GGML_UNUSED (dst_meta);
41
+ GGML_UNUSED (scale); GGML_UNUSED ( max_bias); GGML_UNUSED (m0); GGML_UNUSED (m1);
42
42
GGML_UNUSED (n_head_log2); GGML_UNUSED (logit_softcap);
43
- GGML_UNUSED (ne00); GGML_UNUSED (ne01); GGML_UNUSED (ne02);
44
- GGML_UNUSED (ne03 ); GGML_UNUSED (ne10 ); GGML_UNUSED (ne11 );
45
- GGML_UNUSED (ne12 ); GGML_UNUSED (ne13 ); GGML_UNUSED (ne31 ); GGML_UNUSED (ne32 );
46
- GGML_UNUSED (nb31 ); GGML_UNUSED (nb32 ); GGML_UNUSED (nb01); GGML_UNUSED (nb02 );
47
- GGML_UNUSED (nb03 ); GGML_UNUSED (nb11 ); GGML_UNUSED (nb12 );
48
- GGML_UNUSED (nb13 ); GGML_UNUSED (nb21 ); GGML_UNUSED (nb22 );
49
- GGML_UNUSED (nb23 );
43
+ GGML_UNUSED (ne00); GGML_UNUSED (ne01); GGML_UNUSED (ne02); GGML_UNUSED (ne03);
44
+ GGML_UNUSED (nb01 ); GGML_UNUSED (nb02 ); GGML_UNUSED (nb03 );
45
+ GGML_UNUSED (ne10 ); GGML_UNUSED (ne11 ); GGML_UNUSED (ne12 ); GGML_UNUSED (ne13 );
46
+ GGML_UNUSED (nb11 ); GGML_UNUSED (nb12 ); GGML_UNUSED (nb13 );
47
+ GGML_UNUSED (nb21 ); GGML_UNUSED (nb22 ); GGML_UNUSED (nb23 );
48
+ GGML_UNUSED (ne31 ); GGML_UNUSED (ne32 ); GGML_UNUSED (ne33 );
49
+ GGML_UNUSED (nb31); GGML_UNUSED (nb32); GGML_UNUSED (nb33 );
50
50
NO_DEVICE_CODE;
51
51
return ;
52
52
}
@@ -282,16 +282,16 @@ static __global__ void flash_attn_tile_ext_f32(
282
282
}
283
283
#else
284
284
GGML_UNUSED (Q); GGML_UNUSED (K); GGML_UNUSED (V); GGML_UNUSED (mask);
285
- GGML_UNUSED (dst); GGML_UNUSED (dst_meta); GGML_UNUSED (scale);
286
- GGML_UNUSED (max_bias); GGML_UNUSED (m0); GGML_UNUSED (m1);
285
+ GGML_UNUSED (dst); GGML_UNUSED (dst_meta);
286
+ GGML_UNUSED (scale); GGML_UNUSED ( max_bias); GGML_UNUSED (m0); GGML_UNUSED (m1);
287
287
GGML_UNUSED (n_head_log2); GGML_UNUSED (logit_softcap);
288
288
GGML_UNUSED (ne00); GGML_UNUSED (ne01); GGML_UNUSED (ne02); GGML_UNUSED (ne03);
289
- GGML_UNUSED (ne10); GGML_UNUSED (ne11); GGML_UNUSED (ne12); GGML_UNUSED (ne13);
290
- GGML_UNUSED (ne31); GGML_UNUSED (ne32);
291
- GGML_UNUSED (nb31); GGML_UNUSED (nb32);
292
289
GGML_UNUSED (nb01); GGML_UNUSED (nb02); GGML_UNUSED (nb03);
290
+ GGML_UNUSED (ne10); GGML_UNUSED (ne11); GGML_UNUSED (ne12); GGML_UNUSED (ne13);
293
291
GGML_UNUSED (nb11); GGML_UNUSED (nb12); GGML_UNUSED (nb13);
294
292
GGML_UNUSED (nb21); GGML_UNUSED (nb22); GGML_UNUSED (nb23);
293
+ GGML_UNUSED (ne31); GGML_UNUSED (ne32); GGML_UNUSED (ne33);
294
+ GGML_UNUSED (nb31); GGML_UNUSED (nb32); GGML_UNUSED (nb33);
295
295
NO_DEVICE_CODE;
296
296
#endif // FLASH_ATTN_AVAILABLE
297
297
}
0 commit comments