git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
make: fix nvcc optimization flags for host code (#5309)
author Johannes Gäßler <redacted>
Sat, 3 Feb 2024 19:14:59 +0000 (20:14 +0100)
committer GitHub <redacted>
Sat, 3 Feb 2024 19:14:59 +0000 (20:14 +0100)
Makefile

index a55d15888f53b98a570cda6d41b9174616ae2899..40b16e0ea8c4ed262dc845806070be9f1cdc4f91 100644 (file)
--- a/Makefile
+++ b/Makefile
@@ -109,6 +109,7 @@ MK_NVCCFLAGS  += -O3
 else
 MK_CFLAGS     += -O3
 MK_CXXFLAGS   += -O3
+MK_NVCCFLAGS  += -O3
 endif
 
 # clock_gettime came in POSIX.1b (1993)
@@ -365,7 +366,7 @@ ifdef LLAMA_CUBLAS
        MK_CPPFLAGS  += -DGGML_USE_CUBLAS -I/usr/local/cuda/include -I/opt/cuda/include -I$(CUDA_PATH)/targets/x86_64-linux/include -I/usr/local/cuda/targets/aarch64-linux/include
        MK_LDFLAGS   += -lcuda -lcublas -lculibos -lcudart -lcublasLt -lpthread -ldl -lrt -L/usr/local/cuda/lib64 -L/opt/cuda/lib64 -L$(CUDA_PATH)/targets/x86_64-linux/lib -L/usr/local/cuda/targets/aarch64-linux/lib -L/usr/lib/wsl/lib
        OBJS         += ggml-cuda.o
-       MK_NVCCFLAGS  = -use_fast_math
+       MK_NVCCFLAGS += -use_fast_math
 ifndef JETSON_EOL_MODULE_DETECT
        MK_NVCCFLAGS += --forward-unknown-to-host-compiler
 endif # JETSON_EOL_MODULE_DETECT