no gpu for 70B model

2025-12-13 17:27:05 +00:00 · 2023-08-01 16:57:14 -07:00
parent 7a1c3e62dc
commit 74a5f7e698
1 changed file with 5 additions and 0 deletions
--- a/llama/llama.go
+++ b/llama/llama.go
@@ -128,6 +128,11 @@ func New(model string, opts api.Options) (*LLM, error) {
 	C.llama_backend_init(C.bool(llm.UseNUMA))
 	// TODO: NumGQA == 8 suggests a 70B model, which doesn't support Metal yet, so force NumGPU to 0 for now.
 	if llm.NumGQA == 8 {
 		llm.NumGPU = 0
 	}
 	params := C.llama_context_default_params()
 	params.seed = C.uint(llm.Seed)
 	params.n_ctx = C.int(llm.NumCtx)