mirror of
https://github.com/ollama/ollama.git
synced 2025-05-10 18:06:33 +02:00
Merge pull request #10468 from ollama/drifkin/num-parallel-1
This commit is contained in:
commit
db428adbb8
1 changed file with 1 addition and 1 deletion
|
@@ -58,7 +58,7 @@ var defaultModelsPerGPU = 3
|
|||
// Default automatic value for parallel setting
|
||||
// Model will still need to fit in VRAM. If this setting won't fit
|
||||
// we'll back off down to 1 to try to get it to fit
|
||||
var defaultParallel = 4
|
||||
var defaultParallel = 2
|
||||
|
||||
var ErrMaxQueue = errors.New("server busy, please try again. maximum pending requests exceeded")
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue