mirror of
https://github.com/dogkeeper886/ollama37.git
synced 2025-12-11 00:07:07 +00:00
Reset NumCtx.
This commit is contained in:
@@ -736,6 +736,7 @@ func pickBestFullFitByLibrary(req *LlmRequest, ggml *llm.GGML, gpus gpu.GpuInfoL
|
|||||||
func pickBestPartialFitByLibrary(req *LlmRequest, ggml *llm.GGML, gpus gpu.GpuInfoList, numParallel *int) gpu.GpuInfoList {
|
func pickBestPartialFitByLibrary(req *LlmRequest, ggml *llm.GGML, gpus gpu.GpuInfoList, numParallel *int) gpu.GpuInfoList {
|
||||||
if *numParallel <= 0 {
|
if *numParallel <= 0 {
|
||||||
*numParallel = 1
|
*numParallel = 1
|
||||||
|
req.opts.NumCtx = req.origNumCtx
|
||||||
}
|
}
|
||||||
byLibrary := gpus.ByLibrary()
|
byLibrary := gpus.ByLibrary()
|
||||||
if len(byLibrary) <= 1 {
|
if len(byLibrary) <= 1 {
|
||||||
|
|||||||
Reference in New Issue
Block a user