update llama.cpp submodule to 66c1968f7 (#2618)

This commit is contained in:
Jeffrey Morgan
2024-02-20 17:42:31 -05:00
committed by GitHub
parent ace2cdf1c6
commit 4613a080e7
6 changed files with 39 additions and 130 deletions

View File

@@ -41,7 +41,7 @@ typedef struct ext_server_params {
int32_t main_gpu; // the GPU that is used for scratch and small tensors
bool use_mlock; // force system to keep model in RAM
bool use_mmap; // use mmap if possible
-bool numa; // attempt optimizations that help on some NUMA systems
+int numa; // attempt optimizations that help on some NUMA systems
bool embedding; // get only sentence embedding
ext_server_lora_adapter_t *lora_adapters;
char *mmproj;