From: Jeff Bolz Date: Fri, 6 Feb 2026 14:50:30 +0000 (-0600) Subject: tests: reduce number of FA test permutations (#19381) X-Git-Tag: upstream/0.0.8067~107 X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=db6adb3c88a96845b7d6863f451a54484a9f5a7e;p=pkg%2Fggml%2Fsources%2Fllama.cpp tests: reduce number of FA test permutations (#19381) Only test non-F16 for head size 64 and 72 (one a multiple of QK, one not). --- diff --git a/tests/test-backend-ops.cpp b/tests/test-backend-ops.cpp index fbe23037c..6fe1780f3 100644 --- a/tests/test-backend-ops.cpp +++ b/tests/test-backend-ops.cpp @@ -8231,6 +8231,7 @@ static std::vector<std::unique_ptr<test_case>> make_test_cases_eval() { for (ggml_prec prec : {GGML_PREC_F32, GGML_PREC_DEFAULT}) { if (hsk != 128 && prec == GGML_PREC_DEFAULT) continue; for (ggml_type type_KV : {GGML_TYPE_F32, GGML_TYPE_F16, GGML_TYPE_BF16, GGML_TYPE_Q8_0, GGML_TYPE_Q4_0}) { + if (type_KV != GGML_TYPE_F16 && hsk != 64 && hsk != 72) continue; test_cases.emplace_back(new test_flash_attn_ext( hsk, hsv, nh, {nr2, nr3}, kv, nb, mask, sinks, max_bias, logit_softcap, prec, type_KV)); // run fewer test cases permuted