cann: fix buffer_num and runtime speed slowly error (#8865)

2025-07-06 03:53:29 +00:00 · 2024-08-05 21:10:37 +08:00
parent b42978e7e4
commit bc0f887e15
2 changed files with 15 additions and 14 deletions
--- a/ggml/src/ggml-cann.cpp
+++ b/ggml/src/ggml-cann.cpp
@ -1670,10 +1670,6 @@ GGML_CALL static bool ggml_backend_cann_supports_op(ggml_backend_t backend,
                    // TODO: fix me
                    // Current groupsize should not be greater than k-1 in
                    // aclnnWeightQuantBatchMatmulV2GetWorkspaceSize().
-                    if (op->src[0]->ne[0]-1 > QK8_0) {
-                        return true;
-                    }
-                    return false;
                case GGML_TYPE_Q4_0:
                    return true;
                default: