Mirror of https://github.com/ggml-org/llama.cpp.git (synced 2025-08-15 04:33:06 -04:00)
k-quants : fix zero-weight guard in Q6_K (ref #3040)
This commit is contained in:
@@ -1089,6 +1089,7 @@ void quantize_row_q6_K_reference(const float * restrict x, block_q6_K * restrict
         if (!max_abs_scale) {
             memset(&y[i], 0, sizeof(block_q6_K));
             y[i].d = ggml_fp32_to_fp16(0.f);
+            x += QK_K;
             continue;
         }
 
Reference in New Issue
Block a user