Skip to content

Commit 80a9082

Browse files
committed
q5_1 kv in cuda
1 parent 9be8106 commit 80a9082

1 file changed

Lines changed: 1 addition & 1 deletion

File tree

ggml/src/ggml-cuda/fattn.cu

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -409,11 +409,11 @@ static best_fattn_kernel ggml_cuda_get_best_fattn_kernel(const int device, const
409409
break;
410410
case GGML_TYPE_Q4_1:
411411
case GGML_TYPE_Q5_0:
412-
case GGML_TYPE_Q5_1:
413412
#ifndef GGML_CUDA_FA_ALL_QUANTS
414413
return BEST_FATTN_KERNEL_NONE;
415414
#endif // GGML_CUDA_FA_ALL_QUANTS
416415
case GGML_TYPE_Q4_0:
416+
case GGML_TYPE_Q5_1: //kcpp: support q5_1 kv
417417
case GGML_TYPE_Q8_0:
418418
case GGML_TYPE_BF16:
419419
break;

0 commit comments

Comments
 (0)