git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commit
llama : reorganize source code + improve CMake (#8006)
author Georgi Gerganov <redacted>
Wed, 26 Jun 2024 15:33:02 +0000 (18:33 +0300)
committer GitHub <redacted>
Wed, 26 Jun 2024 15:33:02 +0000 (18:33 +0300)
commit f3f65429c44bb195a9195bfdc19a30a79709db7b
tree 3d44ce270dd666d8343013fb2f363eb90e9abcbf
parent 88540445615e77a0177fcca43aaa8e9d8eea6864
llama : reorganize source code + improve CMake (#8006)

* scripts : update sync [no ci]

* files : relocate [no ci]

* ci : disable kompute build [no ci]

* cmake : fixes [no ci]

* server : fix mingw build

ggml-ci

* cmake : minor [no ci]

* cmake : link math library [no ci]

* cmake : build normal ggml library (not object library) [no ci]

* cmake : fix kompute build

ggml-ci

* make,cmake : fix LLAMA_CUDA + replace GGML_CDEF_PRIVATE

ggml-ci

* move public backend headers to the public include directory (#8122)

* move public backend headers to the public include directory

* nix test

* spm : fix metal header

---------

Co-authored-by: Georgi Gerganov <redacted>

* scripts : fix sync paths [no ci]

* scripts : sync ggml-blas.h [no ci]

---------

Co-authored-by: slaren <redacted>

650 files changed:
.devops/nix/package.nix
.github/labeler.yml
.github/workflows/bench.yml
.github/workflows/build.yml
.github/workflows/server.yml
.gitignore
.gitmodules
CMakeLists.txt
CMakePresets.json
Makefile
Package.swift
README-sycl.md
README.md
ci/run.sh
cmake/FindSIMD.cmake [deleted file]
cmake/build-info.cmake [new file with mode: 0644]
cmake/git-vars.cmake [new file with mode: 0644]
cmake/llama-config.cmake.in [new file with mode: 0644]
common/CMakeLists.txt
common/cmake/build-info-gen-cpp.cmake [new file with mode: 0644]
docs/BLIS.md
examples/CMakeLists.txt
examples/imatrix/README.md
examples/llava/MobileVLM-README.md
examples/rpc/README.md
examples/server/CMakeLists.txt
examples/sycl/build.sh
examples/sycl/win-build-sycl.bat
ggml-alloc.c [deleted file]
ggml-alloc.h [deleted file]
ggml-backend-impl.h [deleted file]
ggml-backend.c [deleted file]
ggml-backend.h [deleted file]
ggml-blas.cpp [deleted file]
ggml-blas.h [deleted file]
ggml-common.h [deleted file]
ggml-cuda.cu [deleted file]
ggml-cuda.h [deleted file]
ggml-cuda/acc.cu [deleted file]
ggml-cuda/acc.cuh [deleted file]
ggml-cuda/arange.cu [deleted file]
ggml-cuda/arange.cuh [deleted file]
ggml-cuda/argsort.cu [deleted file]
ggml-cuda/argsort.cuh [deleted file]
ggml-cuda/binbcast.cu [deleted file]
ggml-cuda/binbcast.cuh [deleted file]
ggml-cuda/clamp.cu [deleted file]
ggml-cuda/clamp.cuh [deleted file]
ggml-cuda/common.cuh [deleted file]
ggml-cuda/concat.cu [deleted file]
ggml-cuda/concat.cuh [deleted file]
ggml-cuda/convert.cu [deleted file]
ggml-cuda/convert.cuh [deleted file]
ggml-cuda/cpy.cu [deleted file]
ggml-cuda/cpy.cuh [deleted file]
ggml-cuda/dequantize.cuh [deleted file]
ggml-cuda/diagmask.cu [deleted file]
ggml-cuda/diagmask.cuh [deleted file]
ggml-cuda/dmmv.cu [deleted file]
ggml-cuda/dmmv.cuh [deleted file]
ggml-cuda/fattn-common.cuh [deleted file]
ggml-cuda/fattn-tile-f16.cu [deleted file]
ggml-cuda/fattn-tile-f16.cuh [deleted file]
ggml-cuda/fattn-tile-f32.cu [deleted file]
ggml-cuda/fattn-tile-f32.cuh [deleted file]
ggml-cuda/fattn-vec-f16.cuh [deleted file]
ggml-cuda/fattn-vec-f32.cuh [deleted file]
ggml-cuda/fattn-wmma-f16.cuh [deleted file]
ggml-cuda/fattn.cu [deleted file]
ggml-cuda/fattn.cuh [deleted file]
ggml-cuda/getrows.cu [deleted file]
ggml-cuda/getrows.cuh [deleted file]
ggml-cuda/im2col.cu [deleted file]
ggml-cuda/im2col.cuh [deleted file]
ggml-cuda/mma.cuh [deleted file]
ggml-cuda/mmq.cu [deleted file]
ggml-cuda/mmq.cuh [deleted file]
ggml-cuda/mmvq.cu [deleted file]
ggml-cuda/mmvq.cuh [deleted file]
ggml-cuda/norm.cu [deleted file]
ggml-cuda/norm.cuh [deleted file]
ggml-cuda/pad.cu [deleted file]
ggml-cuda/pad.cuh [deleted file]
ggml-cuda/pool2d.cu [deleted file]
ggml-cuda/pool2d.cuh [deleted file]
ggml-cuda/quantize.cu [deleted file]
ggml-cuda/quantize.cuh [deleted file]
ggml-cuda/rope.cu [deleted file]
ggml-cuda/rope.cuh [deleted file]
ggml-cuda/scale.cu [deleted file]
ggml-cuda/scale.cuh [deleted file]
ggml-cuda/softmax.cu [deleted file]
ggml-cuda/softmax.cuh [deleted file]
ggml-cuda/sumrows.cu [deleted file]
ggml-cuda/sumrows.cuh [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q4_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q4_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q5_0.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q5_1.cu [deleted file]
ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q8_0.cu [deleted file]
ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu [deleted file]
ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu [deleted file]
ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu [deleted file]
ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu [deleted file]
ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu [deleted file]
ggml-cuda/template-instances/generate_cu_files.py [deleted file]
ggml-cuda/template-instances/mmq-instance-q2_k.cu [deleted file]
ggml-cuda/template-instances/mmq-instance-q3_k.cu [deleted file]
ggml-cuda/template-instances/mmq-instance-q4_0.cu [deleted file]
ggml-cuda/template-instances/mmq-instance-q4_1.cu [deleted file]
ggml-cuda/template-instances/mmq-instance-q4_k.cu [deleted file]
ggml-cuda/template-instances/mmq-instance-q5_0.cu [deleted file]
ggml-cuda/template-instances/mmq-instance-q5_1.cu [deleted file]
ggml-cuda/template-instances/mmq-instance-q5_k.cu [deleted file]
ggml-cuda/template-instances/mmq-instance-q6_k.cu [deleted file]
ggml-cuda/template-instances/mmq-instance-q8_0.cu [deleted file]
ggml-cuda/tsembd.cu [deleted file]
ggml-cuda/tsembd.cuh [deleted file]
ggml-cuda/unary.cu [deleted file]
ggml-cuda/unary.cuh [deleted file]
ggml-cuda/upscale.cu [deleted file]
ggml-cuda/upscale.cuh [deleted file]
ggml-cuda/vecdotq.cuh [deleted file]
ggml-impl.h [deleted file]
ggml-kompute.cpp [deleted file]
ggml-kompute.h [deleted file]
ggml-metal.h [deleted file]
ggml-metal.m [deleted file]
ggml-metal.metal [deleted file]
ggml-quants.c [deleted file]
ggml-quants.h [deleted file]
ggml-rpc.cpp [deleted file]
ggml-rpc.h [deleted file]
ggml-sycl.cpp [deleted file]
ggml-sycl.h [deleted file]
ggml-sycl/backend.hpp [deleted file]
ggml-sycl/common.cpp [deleted file]
ggml-sycl/common.hpp [deleted file]
ggml-sycl/convert.cpp [deleted file]
ggml-sycl/convert.hpp [deleted file]
ggml-sycl/dequantize.hpp [deleted file]
ggml-sycl/dmmv.cpp [deleted file]
ggml-sycl/dmmv.hpp [deleted file]
ggml-sycl/dpct/helper.hpp [deleted file]
ggml-sycl/mmq.cpp [deleted file]
ggml-sycl/mmq.hpp [deleted file]
ggml-sycl/mmvq.cpp [deleted file]
ggml-sycl/mmvq.hpp [deleted file]
ggml-sycl/presets.hpp [deleted file]
ggml-sycl/vecdotq.hpp [deleted file]
ggml-vulkan-shaders.hpp [deleted file]
ggml-vulkan.cpp [deleted file]
ggml-vulkan.h [deleted file]
ggml.c [deleted file]
ggml.h [deleted file]
ggml/CMakeLists.txt [new file with mode: 0644]
ggml/cmake/FindSIMD.cmake [new file with mode: 0644]
ggml/ggml_vk_generate_shaders.py [new file with mode: 0644]
ggml/include/ggml-alloc.h [new file with mode: 0644]
ggml/include/ggml-backend.h [new file with mode: 0644]
ggml/include/ggml-blas.h [new file with mode: 0644]
ggml/include/ggml-cuda.h [new file with mode: 0644]
ggml/include/ggml-kompute.h [new file with mode: 0644]
ggml/include/ggml-metal.h [new file with mode: 0644]
ggml/include/ggml-rpc.h [new file with mode: 0644]
ggml/include/ggml-sycl.h [new file with mode: 0644]
ggml/include/ggml-vulkan.h [new file with mode: 0644]
ggml/include/ggml.h [new file with mode: 0644]
ggml/src/CMakeLists.txt [new file with mode: 0644]
ggml/src/ggml-alloc.c [new file with mode: 0644]
ggml/src/ggml-backend-impl.h [new file with mode: 0644]
ggml/src/ggml-backend.c [new file with mode: 0644]
ggml/src/ggml-blas.cpp [new file with mode: 0644]
ggml/src/ggml-common.h [new file with mode: 0644]
ggml/src/ggml-cuda.cu [new file with mode: 0644]
ggml/src/ggml-cuda/acc.cu [new file with mode: 0644]
ggml/src/ggml-cuda/acc.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/arange.cu [new file with mode: 0644]
ggml/src/ggml-cuda/arange.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/argsort.cu [new file with mode: 0644]
ggml/src/ggml-cuda/argsort.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/binbcast.cu [new file with mode: 0644]
ggml/src/ggml-cuda/binbcast.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/clamp.cu [new file with mode: 0644]
ggml/src/ggml-cuda/clamp.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/common.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/concat.cu [new file with mode: 0644]
ggml/src/ggml-cuda/concat.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/convert.cu [new file with mode: 0644]
ggml/src/ggml-cuda/convert.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/cpy.cu [new file with mode: 0644]
ggml/src/ggml-cuda/cpy.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/dequantize.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/diagmask.cu [new file with mode: 0644]
ggml/src/ggml-cuda/diagmask.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/dmmv.cu [new file with mode: 0644]
ggml/src/ggml-cuda/dmmv.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/fattn-common.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/fattn-tile-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/fattn-tile-f16.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/fattn-tile-f32.cu [new file with mode: 0644]
ggml/src/ggml-cuda/fattn-tile-f32.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/fattn-vec-f16.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/fattn-vec-f32.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/fattn-wmma-f16.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/fattn.cu [new file with mode: 0644]
ggml/src/ggml-cuda/fattn.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/getrows.cu [new file with mode: 0644]
ggml/src/ggml-cuda/getrows.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/im2col.cu [new file with mode: 0644]
ggml/src/ggml-cuda/im2col.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/mma.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/mmq.cu [new file with mode: 0644]
ggml/src/ggml-cuda/mmq.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/mmvq.cu [new file with mode: 0644]
ggml/src/ggml-cuda/mmvq.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/norm.cu [new file with mode: 0644]
ggml/src/ggml-cuda/norm.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/pad.cu [new file with mode: 0644]
ggml/src/ggml-cuda/pad.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/pool2d.cu [new file with mode: 0644]
ggml/src/ggml-cuda/pool2d.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/quantize.cu [new file with mode: 0644]
ggml/src/ggml-cuda/quantize.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/rope.cu [new file with mode: 0644]
ggml/src/ggml-cuda/rope.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/scale.cu [new file with mode: 0644]
ggml/src/ggml-cuda/scale.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/softmax.cu [new file with mode: 0644]
ggml/src/ggml-cuda/softmax.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/sumrows.cu [new file with mode: 0644]
ggml/src/ggml-cuda/sumrows.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_1-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_0-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q5_1-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_1-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_0-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q5_1-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/generate_cu_files.py [new file with mode: 0755]
ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu [new file with mode: 0644]
ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu [new file with mode: 0644]
ggml/src/ggml-cuda/tsembd.cu [new file with mode: 0644]
ggml/src/ggml-cuda/tsembd.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/unary.cu [new file with mode: 0644]
ggml/src/ggml-cuda/unary.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/upscale.cu [new file with mode: 0644]
ggml/src/ggml-cuda/upscale.cuh [new file with mode: 0644]
ggml/src/ggml-cuda/vecdotq.cuh [new file with mode: 0644]
ggml/src/ggml-impl.h [new file with mode: 0644]
ggml/src/ggml-kompute.cpp [new file with mode: 0644]
ggml/src/ggml-metal.m [new file with mode: 0644]
ggml/src/ggml-metal.metal [new file with mode: 0644]
ggml/src/ggml-quants.c [new file with mode: 0644]
ggml/src/ggml-quants.h [new file with mode: 0644]
ggml/src/ggml-rpc.cpp [new file with mode: 0644]
ggml/src/ggml-sycl.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/backend.hpp [new file with mode: 0644]
ggml/src/ggml-sycl/common.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/common.hpp [new file with mode: 0644]
ggml/src/ggml-sycl/convert.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/convert.hpp [new file with mode: 0644]
ggml/src/ggml-sycl/dequantize.hpp [new file with mode: 0644]
ggml/src/ggml-sycl/dmmv.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/dmmv.hpp [new file with mode: 0644]
ggml/src/ggml-sycl/dpct/helper.hpp [new file with mode: 0644]
ggml/src/ggml-sycl/mmq.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/mmq.hpp [new file with mode: 0644]
ggml/src/ggml-sycl/mmvq.cpp [new file with mode: 0644]
ggml/src/ggml-sycl/mmvq.hpp [new file with mode: 0644]
ggml/src/ggml-sycl/presets.hpp [new file with mode: 0644]
ggml/src/ggml-sycl/vecdotq.hpp [new file with mode: 0644]
ggml/src/ggml-vulkan-shaders.hpp [new file with mode: 0644]
ggml/src/ggml-vulkan.cpp [new file with mode: 0644]
ggml/src/ggml.c [new file with mode: 0644]
ggml/src/kompute [new submodule]
ggml/src/kompute-shaders/common.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_add.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_addrow.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_cpy_f16_f16.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_cpy_f16_f32.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_cpy_f32_f16.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_cpy_f32_f32.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_diagmask.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_gelu.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_getrows.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_getrows_f16.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_getrows_f32.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_getrows_q4_0.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_getrows_q4_1.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_getrows_q6_k.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_mul.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_mul_mat_f16.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_mul_mat_mat_f32.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_mul_mat_q4_0.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_mul_mat_q4_1.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_mul_mat_q6_k.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_mul_mat_q8_0.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_mul_mv_q_n.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_mul_mv_q_n_pre.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_norm.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_relu.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_rmsnorm.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_rope_f16.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_rope_f32.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_scale.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_scale_8.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_silu.comp [new file with mode: 0644]
ggml/src/kompute-shaders/op_softmax.comp [new file with mode: 0644]
ggml/src/kompute-shaders/rope_common.comp [new file with mode: 0644]
ggml/src/sgemm.cpp [new file with mode: 0644]
ggml/src/sgemm.h [new file with mode: 0644]
ggml/src/vulkan-shaders/add.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/argsort.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/clamp.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/copy.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/dequant_f32.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/dequant_funcs.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/dequant_head.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/dequant_q2_k.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/dequant_q3_k.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/dequant_q4_0.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/dequant_q4_1.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/dequant_q4_k.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/dequant_q5_0.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/dequant_q5_1.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/dequant_q5_k.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/dequant_q6_k.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/dequant_q8_0.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/diag_mask_inf.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/div.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/gelu.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/generic_binary_head.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/generic_head.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/generic_unary_head.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/get_rows.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/get_rows_quant.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/mul.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/mul_mat_split_k_reduce.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/mul_mat_vec.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/mul_mat_vec_base.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/mul_mat_vec_nc.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/mul_mat_vec_p021.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/mul_mat_vec_q2_k.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/mul_mat_vec_q3_k.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/mul_mat_vec_q4_k.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/mul_mat_vec_q5_k.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/mul_mat_vec_q6_k.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/mul_mm.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/norm.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/relu.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/rms_norm.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/rope_head.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/rope_neox.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/rope_norm.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/scale.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/silu.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/soft_max.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/square.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/sum_rows.comp [new file with mode: 0644]
ggml/src/vulkan-shaders/types.comp [new file with mode: 0644]
ggml_vk_generate_shaders.py [deleted file]
include/llama.h [new file with mode: 0644]
kompute [deleted submodule]
kompute-shaders/common.comp [deleted file]
kompute-shaders/op_add.comp [deleted file]
kompute-shaders/op_addrow.comp [deleted file]
kompute-shaders/op_cpy_f16_f16.comp [deleted file]
kompute-shaders/op_cpy_f16_f32.comp [deleted file]
kompute-shaders/op_cpy_f32_f16.comp [deleted file]
kompute-shaders/op_cpy_f32_f32.comp [deleted file]
kompute-shaders/op_diagmask.comp [deleted file]
kompute-shaders/op_gelu.comp [deleted file]
kompute-shaders/op_getrows.comp [deleted file]
kompute-shaders/op_getrows_f16.comp [deleted file]
kompute-shaders/op_getrows_f32.comp [deleted file]
kompute-shaders/op_getrows_q4_0.comp [deleted file]
kompute-shaders/op_getrows_q4_1.comp [deleted file]
kompute-shaders/op_getrows_q6_k.comp [deleted file]
kompute-shaders/op_mul.comp [deleted file]
kompute-shaders/op_mul_mat_f16.comp [deleted file]
kompute-shaders/op_mul_mat_mat_f32.comp [deleted file]
kompute-shaders/op_mul_mat_q4_0.comp [deleted file]
kompute-shaders/op_mul_mat_q4_1.comp [deleted file]
kompute-shaders/op_mul_mat_q6_k.comp [deleted file]
kompute-shaders/op_mul_mat_q8_0.comp [deleted file]
kompute-shaders/op_mul_mv_q_n.comp [deleted file]
kompute-shaders/op_mul_mv_q_n_pre.comp [deleted file]
kompute-shaders/op_norm.comp [deleted file]
kompute-shaders/op_relu.comp [deleted file]
kompute-shaders/op_rmsnorm.comp [deleted file]
kompute-shaders/op_rope_f16.comp [deleted file]
kompute-shaders/op_rope_f32.comp [deleted file]
kompute-shaders/op_scale.comp [deleted file]
kompute-shaders/op_scale_8.comp [deleted file]
kompute-shaders/op_silu.comp [deleted file]
kompute-shaders/op_softmax.comp [deleted file]
kompute-shaders/rope_common.comp [deleted file]
llama.cpp [deleted file]
llama.h [deleted file]
scripts/LlamaConfig.cmake.in [deleted file]
scripts/build-info.cmake [deleted file]
scripts/build-info.sh
scripts/compare-commits.sh
scripts/debug-test.sh
scripts/gen-build-info-cpp.cmake [deleted file]
scripts/pod-llama.sh
scripts/server-llm.sh
scripts/sync-ggml-am.sh
scripts/sync-ggml.sh
sgemm.cpp [deleted file]
sgemm.h [deleted file]
spm-headers/ggml-alloc.h
spm-headers/ggml-backend.h
spm-headers/ggml-metal.h [new symlink]
spm-headers/ggml.h
spm-headers/llama.h
src/CMakeLists.txt [new file with mode: 0644]
src/llama.cpp [new file with mode: 0644]
src/unicode-data.cpp [new file with mode: 0644]
src/unicode-data.h [new file with mode: 0644]
src/unicode.cpp [new file with mode: 0644]
src/unicode.h [new file with mode: 0644]
tests/test-backend-ops.cpp
unicode-data.cpp [deleted file]
unicode-data.h [deleted file]
unicode.cpp [deleted file]
unicode.h [deleted file]
vulkan-shaders/add.comp [deleted file]
vulkan-shaders/argsort.comp [deleted file]
vulkan-shaders/clamp.comp [deleted file]
vulkan-shaders/copy.comp [deleted file]
vulkan-shaders/dequant_f32.comp [deleted file]
vulkan-shaders/dequant_funcs.comp [deleted file]
vulkan-shaders/dequant_head.comp [deleted file]
vulkan-shaders/dequant_q2_k.comp [deleted file]
vulkan-shaders/dequant_q3_k.comp [deleted file]
vulkan-shaders/dequant_q4_0.comp [deleted file]
vulkan-shaders/dequant_q4_1.comp [deleted file]
vulkan-shaders/dequant_q4_k.comp [deleted file]
vulkan-shaders/dequant_q5_0.comp [deleted file]
vulkan-shaders/dequant_q5_1.comp [deleted file]
vulkan-shaders/dequant_q5_k.comp [deleted file]
vulkan-shaders/dequant_q6_k.comp [deleted file]
vulkan-shaders/dequant_q8_0.comp [deleted file]
vulkan-shaders/diag_mask_inf.comp [deleted file]
vulkan-shaders/div.comp [deleted file]
vulkan-shaders/gelu.comp [deleted file]
vulkan-shaders/generic_binary_head.comp [deleted file]
vulkan-shaders/generic_head.comp [deleted file]
vulkan-shaders/generic_unary_head.comp [deleted file]
vulkan-shaders/get_rows.comp [deleted file]
vulkan-shaders/get_rows_quant.comp [deleted file]
vulkan-shaders/mul.comp [deleted file]
vulkan-shaders/mul_mat_split_k_reduce.comp [deleted file]
vulkan-shaders/mul_mat_vec.comp [deleted file]
vulkan-shaders/mul_mat_vec_base.comp [deleted file]
vulkan-shaders/mul_mat_vec_nc.comp [deleted file]
vulkan-shaders/mul_mat_vec_p021.comp [deleted file]
vulkan-shaders/mul_mat_vec_q2_k.comp [deleted file]
vulkan-shaders/mul_mat_vec_q3_k.comp [deleted file]
vulkan-shaders/mul_mat_vec_q4_k.comp [deleted file]
vulkan-shaders/mul_mat_vec_q5_k.comp [deleted file]
vulkan-shaders/mul_mat_vec_q6_k.comp [deleted file]
vulkan-shaders/mul_mm.comp [deleted file]
vulkan-shaders/norm.comp [deleted file]
vulkan-shaders/relu.comp [deleted file]
vulkan-shaders/rms_norm.comp [deleted file]
vulkan-shaders/rope_head.comp [deleted file]
vulkan-shaders/rope_neox.comp [deleted file]
vulkan-shaders/rope_norm.comp [deleted file]
vulkan-shaders/scale.comp [deleted file]
vulkan-shaders/silu.comp [deleted file]
vulkan-shaders/soft_max.comp [deleted file]
vulkan-shaders/square.comp [deleted file]
vulkan-shaders/sum_rows.comp [deleted file]
vulkan-shaders/types.comp [deleted file]