Enable Metal GPU acceleration

ggml-metal.metal must be in the same directory as the ollama binary; otherwise, llama.cpp will not be able to find and load it. To build and run:
1. go generate llama/llama_metal.go
2. go build .
3. ./ollama serve
2025-12-10 07:46:59 +00:00 · 2023-07-05 17:45:11 -07:00
parent b9fb988112
commit 1b7183c5a1
3 changed files with 15 additions and 15 deletions
--- a/server/routes.go
+++ b/server/routes.go
@@ -22,7 +22,7 @@ func pull(c *gin.Context) {

 func generate(c *gin.Context) {
 	// TODO: these should be request parameters
-	gpulayers := 0
+	gpulayers := 1
 	tokens := 512
 	threads := runtime.NumCPU()
 	// TODO: set prompt from template