mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-08-15 20:53:00 -04:00
metal : fix warnings (skipme) (#0)
This commit is contained in:
@@ -2217,7 +2217,7 @@ kernel void kernel_flash_attn_ext_f16(
|
|||||||
|
|
||||||
// ALiBi
|
// ALiBi
|
||||||
if (max_bias > 0.0f) {
|
if (max_bias > 0.0f) {
|
||||||
const short h = iq2;
|
const uint32_t h = iq2;
|
||||||
|
|
||||||
const float base = h < n_head_log2 ? m0 : m1;
|
const float base = h < n_head_log2 ? m0 : m1;
|
||||||
const int exph = h < n_head_log2 ? h + 1 : 2*(h - n_head_log2) + 1;
|
const int exph = h < n_head_log2 ? h + 1 : 2*(h - n_head_log2) + 1;
|
||||||
@@ -2473,7 +2473,7 @@ kernel void kernel_flash_attn_ext_vec_f16(
|
|||||||
|
|
||||||
// ALiBi
|
// ALiBi
|
||||||
if (max_bias > 0.0f) {
|
if (max_bias > 0.0f) {
|
||||||
const short h = iq2;
|
const uint32_t h = iq2;
|
||||||
|
|
||||||
const float base = h < n_head_log2 ? m0 : m1;
|
const float base = h < n_head_log2 ? m0 : m1;
|
||||||
const int exp = h < n_head_log2 ? h + 1 : 2*(h - n_head_log2) + 1;
|
const int exp = h < n_head_log2 ? h + 1 : 2*(h - n_head_log2) + 1;
|
||||||
|
@@ -1 +1 @@
|
|||||||
d2ad1793f45922665c99f5cf4244dcab77e16c00
|
30f54cbb3ada3e4c5bc6924de3e5918e5be4ff11
|
||||||
|
Reference in New Issue
Block a user