git.djapps.eu Git - pkg/ggml/sources/whisper.cpp/commit
support Flash Attention for fp32/fp16/Q4/Q5/Q8 (llama/20190)
author Neo Zhang <redacted>
Sun, 8 Mar 2026 04:00:07 +0000 (12:00 +0800)
committer Georgi Gerganov <redacted>
Mon, 16 Mar 2026 11:10:15 +0000 (13:10 +0200)
commit 8a9b0ba1dff0d73c132a89a047320a5718e71f85
tree d3b384fc8ba0937a6281d0fb9e7c216e584130f4
parent 49489bfbd1704bf8e222ea7bef49153da23d45d2
support Flash Attention for fp32/fp16/Q4/Q5/Q8 (llama/20190)

* support flash-attention for fp32/fp16/Q4/Q5/Q8

* rm warning

* update for JIT
62 files changed:
ggml/src/ggml-sycl/CMakeLists.txt
ggml/src/ggml-sycl/backend.hpp
ggml/src/ggml-sycl/common.hpp
ggml/src/ggml-sycl/convert.cpp
ggml/src/ggml-sycl/convert.hpp
ggml/src/ggml-sycl/count-equal.cpp
ggml/src/ggml-sycl/dpct/helper.hpp
ggml/src/ggml-sycl/fattn-common.hpp [new file with mode: 0644]
ggml/src/ggml-sycl/fattn-tile.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/fattn-tile.hpp [new file with mode: 0644]
ggml/src/ggml-sycl/fattn-vec.hpp [new file with mode: 0644]
ggml/src/ggml-sycl/fattn.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/fattn.hpp [new file with mode: 0644]
ggml/src/ggml-sycl/ggml-sycl.cpp
ggml/src/ggml-sycl/presets.hpp
ggml/src/ggml-sycl/softmax.cpp
ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq112-dv112.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq128-dv128.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq256-dv256.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq40-dv40.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq576-dv512.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq64-dv64.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq72-dv72.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq80-dv80.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq96-dv96.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-f16.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q4_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q4_1.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q5_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q5_1.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q8_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-f16.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q4_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q4_1.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q5_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q5_1.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q8_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-f16.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q4_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q4_1.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q5_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q5_1.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q8_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-f16.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q4_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q4_1.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q5_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q5_1.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q8_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-f16.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q4_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q4_1.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q5_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q5_1.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q8_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-f16.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q4_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q4_1.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q5_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q5_1.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q8_0.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/vecdotq.hpp