cuda : fix LLAMA_CUDA_F16 build (#6298)

This commit is contained in:
slaren
2024-03-25 15:43:22 +01:00
committed by GitHub
parent ae1f211ce2
commit 2f34b865b6

View File

@@ -1,5 +1,6 @@
#include "dmmv.cuh" #include "dmmv.cuh"
#include "dequantize.cuh" #include "dequantize.cuh"
#include "convert.cuh"
// dmmv = dequantize_mul_mat_vec // dmmv = dequantize_mul_mat_vec
#ifndef GGML_CUDA_DMMV_X #ifndef GGML_CUDA_DMMV_X