ollamarunner: Pass runner performance parameters to backends

Currently the following parameters are in the runner but not used:
 - numGPULayers
 - mainGPU
 - threads
 - tensorSplit

This commit passes them through to the backend, which is where they
would actually be used. However, the GGML backend does not yet act on
them.
This commit is contained in:
Jesse Gross
2025-02-20 11:18:01 -08:00
committed by Jesse Gross
parent 14b5a9a150
commit bd6a7d5e64
4 changed files with 40 additions and 20 deletions

View File

@@ -84,7 +84,7 @@ type Backend struct {
tensors map[string]*Context
}
func New(r *os.File) (ml.Backend, error) {
func New(r *os.File, params ml.BackendParams) (ml.Backend, error) {
meta, n, err := fs.Decode(r, -1)
if err != nil {
return nil, err