Bump VRAM buffer back up

Under stress scenarios we're seeing OOMs, so this should help stabilize
allocations under heavy concurrency.
This commit is contained in:
Daniel Hiltgen 2024-05-10 09:15:28 -07:00
parent 200a18820e
commit 30a7d7096c
2 changed files with 3 additions and 3 deletions

View file

@@ -31,8 +31,8 @@ type handles struct {
}
const (
-cudaMinimumMemory = 256 * format.MebiByte
-rocmMinimumMemory = 256 * format.MebiByte
+cudaMinimumMemory = 457 * format.MebiByte
+rocmMinimumMemory = 457 * format.MebiByte
)
var gpuMutex sync.Mutex