ggml : introduce structs for the q4 data blocks (#356)

* Introduce structs for the q4 data blocks
* ggml : rename quant struct variables + fix ARM_NEON

---------

Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
2025-08-18 05:56:00 -04:00 · 2023-03-28 15:56:03 +00:00
parent e0670260fb
commit c1f885067c
6 changed files with 150 additions and 235 deletions
--- a/tests/test-quantize.c
+++ b/tests/test-quantize.c
@@ -13,7 +13,7 @@ int main(void) {
        src[i] = (float)(i + 1);
    }

-    size_t size = ggml_quantize_q4_0(src, dst, QK, QK, QK, hist);
+    size_t size = ggml_quantize_q4_0(src, dst, QK, QK, hist);
    assert(size == 20);
    float max_result = ((float *)dst)[0];
    float max_expected = src[31] / ((1 << 3) - 1);
@@ -24,7 +24,7 @@ int main(void) {
        assert(q4_result == q4_expected);
    }

-    size = ggml_quantize_q4_1(src, dst, QK, QK, QK, hist);
+    size = ggml_quantize_q4_1(src, dst, QK, QK, hist);
    assert(size == 24);
    float delta_result = ((float *)dst)[0];
    float delta_expected = (src[31] - src[0]) / ((1 << 4) - 1);