update llama.cpp submodule to 66c1968f7 (#2618)

2025-12-14 01:37:04 +00:00 · 2024-02-20 17:42:31 -05:00
parent ace2cdf1c6
commit 4613a080e7
6 changed files with 39 additions and 130 deletions
--- a/llm/ext_server/ext_server.h
+++ b/llm/ext_server/ext_server.h
@@ -41,7 +41,7 @@ typedef struct ext_server_params {
  int32_t main_gpu;      // the GPU that is used for scratch and small tensors
  bool use_mlock;        // force system to keep model in RAM
  bool use_mmap;         // use mmap if possible
-  bool numa;             // attempt optimizations that help on some NUMA systems
+  int numa;              // NUMA optimization mode for some NUMA systems (integer, not an on/off flag; presumably 0 = disabled - TODO confirm values against llama.cpp)
  bool embedding;        // get only sentence embedding
  ext_server_lora_adapter_t *lora_adapters;
  char *mmproj;