git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commit
ggml : reduce hash table reset cost (#8698)
author slaren <redacted>
Sat, 27 Jul 2024 02:41:55 +0000 (04:41 +0200)
committer GitHub <redacted>
Sat, 27 Jul 2024 02:41:55 +0000 (04:41 +0200)
commit 2b1f616b208a4a21c4ee7a7eb85d822ff1d787af
tree c1fab2623895ee6d239936669cbdcebedff76998
parent 01245f5b1629075543bc4478418c7d72a0b4b3c7
ggml : reduce hash table reset cost (#8698)

* ggml : reduce hash table reset cost

* fix unreachable code warnings after GGML_ASSERT(false)

* GGML_ASSERT(false) -> GGML_ABORT("fatal error")

* GGML_ABORT use format string
46 files changed:
Makefile
examples/eval-callback/eval-callback.cpp
examples/imatrix/imatrix.cpp
examples/llama-bench/llama-bench.cpp
examples/llava/clip.cpp
examples/tokenize/tokenize.cpp
ggml/include/ggml.h
ggml/src/ggml-alloc.c
ggml/src/ggml-backend.c
ggml/src/ggml-blas.cpp
ggml/src/ggml-cann.cpp
ggml/src/ggml-cann/aclnn_ops.cpp
ggml/src/ggml-cuda.cu
ggml/src/ggml-cuda/argsort.cu
ggml/src/ggml-cuda/binbcast.cu
ggml/src/ggml-cuda/common.cuh
ggml/src/ggml-cuda/cpy.cu
ggml/src/ggml-cuda/dmmv.cu
ggml/src/ggml-cuda/fattn-common.cuh
ggml/src/ggml-cuda/fattn-tile-f16.cu
ggml/src/ggml-cuda/fattn-tile-f32.cu
ggml/src/ggml-cuda/fattn.cu
ggml/src/ggml-cuda/getrows.cu
ggml/src/ggml-cuda/mmq.cu
ggml/src/ggml-cuda/mmq.cuh
ggml/src/ggml-cuda/mmvq.cu
ggml/src/ggml-cuda/quantize.cu
ggml/src/ggml-cuda/rope.cu
ggml/src/ggml-impl.h
ggml/src/ggml-kompute.cpp
ggml/src/ggml-metal.m
ggml/src/ggml-quants.c
ggml/src/ggml-sycl.cpp
ggml/src/ggml-sycl/common.hpp
ggml/src/ggml-sycl/dmmv.cpp
ggml/src/ggml-sycl/dpct/helper.hpp
ggml/src/ggml-sycl/mmq.cpp
ggml/src/ggml-sycl/mmvq.cpp
ggml/src/ggml-sycl/rope.cpp
ggml/src/ggml-vulkan.cpp
ggml/src/ggml.c
src/llama-grammar.cpp
src/llama-vocab.cpp
src/llama.cpp
tests/test-backend-ops.cpp
tests/test-sampling.cpp