Add cgo implementation for llama.cpp

Run server.cpp directly inside the Go runtime via cgo,
while retaining the LLM Go abstractions.
Author: Daniel Hiltgen
Date: 2023-11-13 17:20:34 -08:00
Parent: 5e7fd6906f
Commit: d4cd695759

27 changed files with 1189 additions and 765 deletions
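To illustrate the approach the commit message describes, here is a minimal cgo sketch of calling a C++ server entry point from Go. This is not code from this commit: the header name server.h, the function llama_server_start, and the build flags are illustrative assumptions.

package llm

/*
#cgo CXXFLAGS: -std=c++11
#cgo LDFLAGS: -lstdc++
#include "server.h" // hypothetical C-linkage wrapper around server.cpp
*/
import "C"

import "fmt"

// startServer sketches starting the embedded llama.cpp server in-process.
// The symbol name and return convention are assumptions for illustration.
func startServer() error {
	if rc := C.llama_server_start(); rc != 0 {
		return fmt.Errorf("llama server start failed: %d", rc)
	}
	return nil
}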

llm/llama.cpp/gen_linux.sh (new executable file, 17 lines)

@@ -0,0 +1,17 @@
#!/bin/bash
# This script is intended to run inside go generate;
# the working directory must be ../llm/llama.cpp.
set -ex
set -o pipefail
# TODO - stopped here - map the variables from above over and refine the case statement below
echo "Starting linux generate script"
source "$(dirname "$0")/gen_common.sh"
init_vars
CMAKE_DEFS="-DLLAMA_CUBLAS=on -DLLAMA_NATIVE=off -DLLAMA_AVX=on -DLLAMA_AVX2=off -DLLAMA_AVX512=off -DLLAMA_FMA=off -DLLAMA_F16C=off ${CMAKE_DEFS}"
BUILD_DIR="gguf/build/cuda"
git_module_setup
apply_patches
build
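Assuming the script is wired into the build through go generate in the usual way, a hook file placed next to it might look like the following. The file placement and package name are assumptions, not part of this diff.

//go:build linux

package llm

// `go generate` runs this from the directory containing the hook file,
// which satisfies the working-directory note at the top of gen_linux.sh.
//go:generate bash ./gen_linux.sh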