Skip to content

Commit 59792ff

Browse files
committed
cuda : disable BF16 FA
ggml-ci
1 parent 3cf5d1c commit 59792ff

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

ggml/src/ggml-cuda.cu

+3
Original file line number | Diff line number | Diff line change
@@ -3159,6 +3159,9 @@ static bool ggml_backend_cuda_device_supports_op(ggml_backend_dev_t dev, const g
3159 3159
#ifndef FLASH_ATTN_AVAILABLE
3160 3160
return false;
3161 3161
#endif
3162+
if (op->src[1]->type == GGML_TYPE_BF16 || op->src[2]->type == GGML_TYPE_BF16) {
3163+
return false;
3164+
}
3162 3165
if (op->src[0]->ne[0] == 64 && op->src[1]->type == GGML_TYPE_F16) {
3163 3166
return true;
3164 3167
}

0 commit comments

Comments
 (0)