CUDA: add mean operation (#14313)

* CUDA: add mean operation
* add back sum_rows_f32_cuda
* Review: early exit if col!=0
2025-06-26 11:45:21 +00:00 · 2025-06-22 12:39:54 +08:00
parent aa0ef5c578
commit aa064b2eb7
7 changed files with 54 additions and 19 deletions
--- a/tests/test-backend-ops.cpp
+++ b/tests/test-backend-ops.cpp
@@ -4652,6 +4652,8 @@ static std::vector<std::unique_ptr<test_case>> make_test_cases_perf() {

    test_cases.emplace_back(new test_conv_transpose_2d({256, 256, 256, 1}, {3, 3, 16, 256}, 1));

+    test_cases.emplace_back(new test_mean(GGML_TYPE_F32, {256, 256, 3, 1}));
+
    return test_cases;
 }