llm: add minimum based on layer size

This commit is contained in:
Michael Yang
2024-05-06 17:04:19 -07:00
parent 7c5330413b
commit 4736391bfb
3 changed files with 7 additions and 7 deletions

View File

@@ -31,8 +31,8 @@ type handles struct {
}
const (
-	cudaMinimumMemory = 457 * format.MebiByte
-	rocmMinimumMemory = 457 * format.MebiByte
+	cudaMinimumMemory = 256 * format.MebiByte
+	rocmMinimumMemory = 256 * format.MebiByte
)
var gpuMutex sync.Mutex

View File

@@ -15,7 +15,7 @@ import (
)
const (
-	metalMinimumMemory = 512 * format.MebiByte
+	metalMinimumMemory = 384 * format.MebiByte
)
func GetGPUInfo() GpuInfoList {