llama: update vendored code to commit 40c6d79f (#7875)

2025-12-11 08:17:03 +00:00 · 2024-12-10 19:21:34 -08:00
parent a37f4a86a7
commit 527cc97899
289 changed files with 58552 additions and 41806 deletions
--- a/make/cuda.make
+++ b/make/cuda.make
@@ -41,7 +41,9 @@ GPU_COMPILER_CUFLAGS = \
 	-DGGML_CUDA_PEER_MAX_BATCH_SIZE=128 \
 	-DGGML_USE_CUDA=1 \
 	-DGGML_SHARED=1 \
+	-DGGML_BACKEND_SHARED=1 \
 	-DGGML_BUILD=1 \
+	-DGGML_BACKEND_BUILD=1 \
 	-DGGML_USE_LLAMAFILE \
 	-DK_QUANTS_PER_ITERATION=2 \
 	-DNDEBUG \