From: Georgi Gerganov Date: Sat, 22 Apr 2023 13:31:56 +0000 (+0300) Subject: ggml : fix Q4_3 cuBLAS X-Git-Tag: gguf-v0.4.0~888 X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=0e018fe008eacebdbcfa2d61b6c988c245c961cd;p=pkg%2Fggml%2Fsources%2Fllama.cpp ggml : fix Q4_3 cuBLAS --- diff --git a/CMakeLists.txt b/CMakeLists.txt index 2d4e30e5..11ebe9eb 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -312,6 +312,7 @@ add_library(ggml OBJECT target_include_directories(ggml PUBLIC .) target_compile_features(ggml PUBLIC c_std_11) # don't bump target_link_libraries(ggml PUBLIC Threads::Threads ${LLAMA_EXTRA_LIBS}) + if (BUILD_SHARED_LIBS) set_target_properties(ggml PROPERTIES POSITION_INDEPENDENT_CODE ON) endif() @@ -324,6 +325,7 @@ add_library(llama target_include_directories(llama PUBLIC .) target_compile_features(llama PUBLIC cxx_std_11) # don't bump target_link_libraries(llama PRIVATE ggml ${LLAMA_EXTRA_LIBS}) + if (BUILD_SHARED_LIBS) set_target_properties(llama PROPERTIES POSITION_INDEPENDENT_CODE ON) target_compile_definitions(llama PRIVATE LLAMA_SHARED LLAMA_BUILD) diff --git a/ggml.c b/ggml.c index d9a95af8..281b2028 100644 --- a/ggml.c +++ b/ggml.c @@ -7992,6 +7992,9 @@ static void ggml_compute_forward_mul_mat_q_f32( else if (type == GGML_TYPE_Q4_2) { dequantize_row_q_cuda = dequantize_row_q4_2_cuda; } + else if (type == GGML_TYPE_Q4_3) { + dequantize_row_q_cuda = dequantize_row_q4_3_cuda; + } else { GGML_ASSERT(false); }