From 1e6ebb2b1b8d27c597f8c9c44f75a780543496f2 Mon Sep 17 00:00:00 2001
From: Aaron Teo
Date: Tue, 24 Jun 2025 22:56:05 +0800
Subject: [PATCH] ggml-cpu: fix wrong refactor of ggml-base

ref: https://github.com/ggml-org/llama.cpp/pull/14317#discussion_r2164176555

Signed-off-by: Aaron Teo
---
 ggml/src/ggml-impl.h   | 3 +++
 ggml/src/ggml-quants.c | 1 -
 2 files changed, 3 insertions(+), 1 deletion(-)

diff --git a/ggml/src/ggml-impl.h b/ggml/src/ggml-impl.h
index 59bae840f..8d9bdc74c 100644
--- a/ggml/src/ggml-impl.h
+++ b/ggml/src/ggml-impl.h
@@ -390,6 +390,9 @@ static inline ggml_fp16_t ggml_compute_fp32_to_fp16(float f) {
 #define GGML_COMPUTE_FP16_TO_FP32(x) ggml_compute_fp16_to_fp32(x)
 #define GGML_COMPUTE_FP32_TO_FP16(x) ggml_compute_fp32_to_fp16(x)
 
+#define GGML_FP16_TO_FP32(x) GGML_COMPUTE_FP16_TO_FP32(x)
+#define GGML_FP32_TO_FP16(x) GGML_COMPUTE_FP32_TO_FP16(x)
+
 // precomputed f32 table for f16 (256 KB)
 // defined in ggml.c, initialized in ggml_init()
 GGML_API float ggml_table_f32_f16[1 << 16];
diff --git a/ggml/src/ggml-quants.c b/ggml/src/ggml-quants.c
index 5bd027159..e389a46db 100644
--- a/ggml/src/ggml-quants.c
+++ b/ggml/src/ggml-quants.c
@@ -4,7 +4,6 @@
 #include "ggml-quants.h"
 #include "ggml-impl.h"
 #include "ggml-cpu/ggml-cpu-impl.h"
-#include "ggml-cpu/simd-mappings.h"
 #include "ggml-cpu.h"
 #include