mirror of
https://github.com/ollama/ollama.git
synced 2025-05-11 02:16:36 +02:00
Bump VRAM buffer back up
Under stress scenarios we're seeing OOMs, so this should help stabilize allocations under heavy concurrency.
This commit is contained in:
parent
200a18820e
commit
30a7d7096c
2 changed files with 3 additions and 3 deletions
|
@@ -15,7 +15,7 @@ import (
|
|||
)
|
||||
|
||||
const (
|
||||
metalMinimumMemory = 384 * format.MebiByte
|
||||
metalMinimumMemory = 512 * format.MebiByte
|
||||
)
|
||||
|
||||
func GetGPUInfo() GpuInfoList {
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue