Bump llama.cpp to b2474

This is the last release before the ggml-cuda.cu refactoring.
This commit is contained in:
Daniel Hiltgen
2024-03-23 09:54:56 +01:00
parent a5ba0fcf78
commit 43799532c1
5 changed files with 7 additions and 184 deletions

View File

@@ -343,6 +343,12 @@ struct llama_server_context
~llama_server_context()
{
if (clp_ctx)
{
LOG_INFO("freeing clip model", {});
clip_free(clp_ctx);
clp_ctx = nullptr;
}
if (ctx)
{
llama_free(ctx);