api: return model capabilities from the show endpoint (#10066)

With support for multimodal models becoming more varied and common, it is important for clients to be able to easily see what capabilities a model has. Returning these from the show endpoint will allow clients to easily see what a model can do.
2025-05-11 02:16:36 +02:00 · 2025-04-01 15:21:46 -07:00 · 2025-04-01 15:21:46 -07:00 · e172f095ba
commit e172f095ba
parent c001b98087
9 changed files with 521 additions and 69 deletions
--- a/server/sched.go
+++ b/server/sched.go
@ -20,6 +20,7 @@ import (
 	"github.com/ollama/ollama/format"
 	"github.com/ollama/ollama/fs/ggml"
 	"github.com/ollama/ollama/llm"
+	"github.com/ollama/ollama/types/model"
 )

 type LlmRequest struct {
@ -195,7 +196,7 @@ func (s *Scheduler) processPending(ctx context.Context) {
 					}

 					// Embedding models should always be loaded with parallel=1
-					if pending.model.CheckCapabilities(CapabilityCompletion) != nil {
+					if pending.model.CheckCapabilities(model.CapabilityCompletion) != nil {
 						numParallel = 1
 					}