Skip to content

Commit b29c82c

Browse files
cache: group models by provider and fix slash-in-model-ID lookups
Restructure ModelCache to group models by provider, eliminating per-model repetition of the provider_type, owned_by, and object fields. Drop the always-"model" Object field entirely. Fix the qualified-lookup fallthrough in splitModelSelector's callers: when a qualified lookup fails (e.g. "meta-llama/Meta-Llama-3-70B", where "meta-llama" is not a configured provider name), fall through to an unqualified lookup using the original model string instead of returning nil. Applied to GetProvider, GetModel, Supports, and GetProviderType. Harden cache tests with fatal guards before slice indexing. Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
1 parent edf2753 commit b29c82c

4 files changed

Lines changed: 172 additions & 145 deletions

File tree

internal/cache/cache.go

Lines changed: 14 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -9,23 +9,27 @@ import (
99
)
1010

1111
// ModelCache represents the cached model data structure.
12-
// This is the data that gets stored and retrieved from the cache.
12+
// Models are grouped by provider to avoid repeating shared fields (provider_type, owned_by)
13+
// on every model entry.
1314
type ModelCache struct {
14-
UpdatedAt time.Time `json:"updated_at"`
15-
Models []CachedModel `json:"models"`
15+
UpdatedAt time.Time `json:"updated_at"`
16+
Providers map[string]CachedProvider `json:"providers"`
1617
// ModelListData holds the raw JSON model registry bytes for cache persistence,
1718
// allowing the registry to restore its full model list without re-fetching.
1819
ModelListData json.RawMessage `json:"model_list_data,omitempty"`
1920
}
2021

21-
// CachedModel represents a single cached model entry.
22+
// CachedProvider holds shared fields for all models from a single provider.
23+
type CachedProvider struct {
24+
ProviderType string `json:"provider_type"`
25+
OwnedBy string `json:"owned_by"`
26+
Models []CachedModel `json:"models"`
27+
}
28+
29+
// CachedModel represents a single cached model entry within a provider group.
2230
type CachedModel struct {
23-
ModelID string `json:"model_id"`
24-
Provider string `json:"provider"`
25-
ProviderType string `json:"provider_type"`
26-
Object string `json:"object"`
27-
OwnedBy string `json:"owned_by"`
28-
Created int64 `json:"created"`
31+
ID string `json:"id"`
32+
Created int64 `json:"created"`
2933
}
3034

3135
// Cache defines the interface for model cache storage.

internal/cache/cache_test.go

Lines changed: 33 additions & 30 deletions
Original file line numberDiff line numberDiff line change
@@ -29,14 +29,13 @@ func TestLocalCache(t *testing.T) {
2929
// Set data
3030
data := &ModelCache{
3131
UpdatedAt: time.Now().UTC(),
32-
Models: []CachedModel{
33-
{
34-
ModelID: "test-model",
35-
Provider: "openai",
32+
Providers: map[string]CachedProvider{
33+
"openai": {
3634
ProviderType: "openai",
37-
Object: "model",
3835
OwnedBy: "openai",
39-
Created: 1234567890,
36+
Models: []CachedModel{
37+
{ID: "test-model", Created: 1234567890},
38+
},
4039
},
4140
},
4241
}
@@ -54,11 +53,12 @@ func TestLocalCache(t *testing.T) {
5453
if result == nil {
5554
t.Fatal("expected result, got nil")
5655
}
57-
if len(result.Models) != 1 {
58-
t.Errorf("expected 1 model, got %d", len(result.Models))
56+
p, ok := result.Providers["openai"]
57+
if !ok || len(p.Models) != 1 {
58+
t.Fatalf("expected 1 model in openai provider, got %v", result.Providers)
5959
}
60-
if result.Models[0].ModelID != "test-model" {
61-
t.Errorf("expected test-model in cache, got %q", result.Models[0].ModelID)
60+
if p.Models[0].ID != "test-model" {
61+
t.Errorf("expected test-model in cache, got %q", p.Models[0].ID)
6262
}
6363
})
6464

@@ -70,7 +70,7 @@ func TestLocalCache(t *testing.T) {
7070
ctx := context.Background()
7171

7272
data := &ModelCache{
73-
Models: []CachedModel{},
73+
Providers: map[string]CachedProvider{},
7474
}
7575

7676
err := cache.Set(ctx, data)
@@ -136,22 +136,20 @@ func TestModelCacheSerialization(t *testing.T) {
136136
t.Run("JSONRoundTrip", func(t *testing.T) {
137137
original := &ModelCache{
138138
UpdatedAt: time.Date(2024, 1, 1, 0, 0, 0, 0, time.UTC),
139-
Models: []CachedModel{
140-
{
141-
ModelID: "gpt-4",
142-
Provider: "openai-main",
139+
Providers: map[string]CachedProvider{
140+
"openai-main": {
143141
ProviderType: "openai",
144-
Object: "model",
145142
OwnedBy: "openai",
146-
Created: 1234567890,
143+
Models: []CachedModel{
144+
{ID: "gpt-4", Created: 1234567890},
145+
},
147146
},
148-
{
149-
ModelID: "claude-3",
150-
Provider: "anthropic-main",
147+
"anthropic-main": {
151148
ProviderType: "anthropic",
152-
Object: "model",
153149
OwnedBy: "anthropic",
154-
Created: 1234567891,
150+
Models: []CachedModel{
151+
{ID: "claude-3", Created: 1234567891},
152+
},
155153
},
156154
},
157155
}
@@ -166,17 +164,22 @@ func TestModelCacheSerialization(t *testing.T) {
166164
t.Fatalf("failed to unmarshal: %v", err)
167165
}
168166

169-
if len(restored.Models) != len(original.Models) {
170-
t.Errorf("model count mismatch: got %d, want %d", len(restored.Models), len(original.Models))
167+
if len(restored.Providers) != len(original.Providers) {
168+
t.Fatalf("provider count mismatch: got %d, want %d", len(restored.Providers), len(original.Providers))
171169
}
172-
if restored.Models[0].ModelID != original.Models[0].ModelID {
173-
t.Errorf("first model ID mismatch: got %q, want %q", restored.Models[0].ModelID, original.Models[0].ModelID)
170+
openai, ok := restored.Providers["openai-main"]
171+
if !ok || len(openai.Models) == 0 {
172+
t.Fatalf("expected openai-main provider with models, got %v", restored.Providers)
174173
}
175-
if restored.Models[0].Provider != original.Models[0].Provider {
176-
t.Errorf("first provider mismatch: got %q, want %q", restored.Models[0].Provider, original.Models[0].Provider)
174+
if openai.Models[0].ID != "gpt-4" {
175+
t.Errorf("openai model ID mismatch: got %q, want %q", openai.Models[0].ID, "gpt-4")
177176
}
178-
if restored.Models[1].ProviderType != original.Models[1].ProviderType {
179-
t.Errorf("second provider type mismatch: got %q, want %q", restored.Models[1].ProviderType, original.Models[1].ProviderType)
177+
if openai.ProviderType != "openai" {
178+
t.Errorf("openai provider type mismatch: got %q, want %q", openai.ProviderType, "openai")
179+
}
180+
anthropic := restored.Providers["anthropic-main"]
181+
if anthropic.ProviderType != "anthropic" {
182+
t.Errorf("anthropic provider type mismatch: got %q, want %q", anthropic.ProviderType, "anthropic")
180183
}
181184
})
182185
}

internal/providers/registry.go

Lines changed: 69 additions & 59 deletions
Original file line numberDiff line numberDiff line change
@@ -247,31 +247,32 @@ func (r *ModelRegistry) LoadFromCache(ctx context.Context) (int, error) {
247247
}
248248
r.mu.RUnlock()
249249

250-
// Populate model maps from cache rows. Unqualified lookups keep "first provider wins".
251-
newModels := make(map[string]*ModelInfo, len(modelCache.Models))
250+
// Populate model maps from grouped cache structure. Unqualified lookups keep "first provider wins".
251+
newModels := make(map[string]*ModelInfo)
252252
newModelsByProvider := make(map[string]map[string]*ModelInfo)
253-
for _, cached := range modelCache.Models {
254-
provider, ok := nameToProvider[cached.Provider]
253+
for providerName, cachedProvider := range modelCache.Providers {
254+
provider, ok := nameToProvider[providerName]
255255
if !ok {
256-
// Provider not configured, skip this model
256+
// Provider not configured, skip all its models
257257
continue
258258
}
259-
info := &ModelInfo{
260-
Model: core.Model{
261-
ID: cached.ModelID,
262-
Object: cached.Object,
263-
OwnedBy: cached.OwnedBy,
264-
Created: cached.Created,
265-
},
266-
Provider: provider,
267-
}
268-
if _, ok := newModelsByProvider[cached.Provider]; !ok {
269-
newModelsByProvider[cached.Provider] = make(map[string]*ModelInfo)
270-
}
271-
newModelsByProvider[cached.Provider][cached.ModelID] = info
272-
if _, exists := newModels[cached.ModelID]; !exists {
273-
newModels[cached.ModelID] = info
259+
providerModels := make(map[string]*ModelInfo, len(cachedProvider.Models))
260+
for _, cached := range cachedProvider.Models {
261+
info := &ModelInfo{
262+
Model: core.Model{
263+
ID: cached.ID,
264+
Object: "model",
265+
OwnedBy: cachedProvider.OwnedBy,
266+
Created: cached.Created,
267+
},
268+
Provider: provider,
269+
}
270+
providerModels[cached.ID] = info
271+
if _, exists := newModels[cached.ID]; !exists {
272+
newModels[cached.ID] = info
273+
}
274274
}
275+
newModelsByProvider[providerName] = providerModels
275276
}
276277

277278
// Load model list data from cache if available
@@ -331,49 +332,58 @@ func (r *ModelRegistry) SaveToCache(ctx context.Context) error {
331332
return nil
332333
}
333334

334-
// Build cache structure as a slice of provider/model rows.
335+
// Build grouped cache structure: one entry per provider with its models.
335336
modelCache := &cache.ModelCache{
336337
UpdatedAt: time.Now().UTC(),
337-
Models: make([]cache.CachedModel, 0),
338+
Providers: make(map[string]cache.CachedProvider, len(modelsByProvider)),
338339
ModelListData: modelListRaw,
339340
}
340341

341-
providerNames := make([]string, 0, len(modelsByProvider))
342-
for providerName := range modelsByProvider {
343-
providerNames = append(providerNames, providerName)
344-
}
345-
sort.Strings(providerNames)
342+
var totalModels int
343+
for providerName, models := range modelsByProvider {
344+
// Determine provider type and owned_by from any model in this provider group.
345+
var pType, ownedBy string
346+
for _, info := range models {
347+
t, ok := providerTypes[info.Provider]
348+
if !ok {
349+
continue
350+
}
351+
pType = t
352+
ownedBy = info.Model.OwnedBy
353+
break
354+
}
355+
if pType == "" {
356+
// No known provider type for this provider, skip entirely.
357+
continue
358+
}
346359

347-
for _, providerName := range providerNames {
348-
modelIDs := make([]string, 0, len(modelsByProvider[providerName]))
349-
for modelID := range modelsByProvider[providerName] {
360+
modelIDs := make([]string, 0, len(models))
361+
for modelID := range models {
350362
modelIDs = append(modelIDs, modelID)
351363
}
352364
sort.Strings(modelIDs)
353365

366+
cachedModels := make([]cache.CachedModel, 0, len(modelIDs))
354367
for _, modelID := range modelIDs {
355-
info := modelsByProvider[providerName][modelID]
356-
pType, ok := providerTypes[info.Provider]
357-
if !ok {
358-
// Skip models without a known provider type.
359-
continue
360-
}
361-
modelCache.Models = append(modelCache.Models, cache.CachedModel{
362-
ModelID: modelID,
363-
Provider: providerName,
364-
ProviderType: pType,
365-
Object: info.Model.Object,
366-
OwnedBy: info.Model.OwnedBy,
367-
Created: info.Model.Created,
368+
info := models[modelID]
369+
cachedModels = append(cachedModels, cache.CachedModel{
370+
ID: modelID,
371+
Created: info.Model.Created,
368372
})
369373
}
374+
modelCache.Providers[providerName] = cache.CachedProvider{
375+
ProviderType: pType,
376+
OwnedBy: ownedBy,
377+
Models: cachedModels,
378+
}
379+
totalModels += len(cachedModels)
370380
}
371381

372382
if err := cacheBackend.Set(ctx, modelCache); err != nil {
373383
return fmt.Errorf("failed to save cache: %w", err)
374384
}
375385

376-
slog.Debug("saved models to cache", "models", len(modelCache.Models))
386+
slog.Debug("saved models to cache", "models", totalModels)
377387
return nil
378388
}
379389

@@ -427,10 +437,10 @@ func (r *ModelRegistry) GetProvider(model string) core.Provider {
427437
return info.Provider
428438
}
429439
}
430-
return nil
440+
// Fall through: the slash may be part of the model ID (e.g. "meta-llama/Meta-Llama-3-70B")
431441
}
432442

433-
if info, ok := r.models[modelID]; ok {
443+
if info, ok := r.models[model]; ok {
434444
return info.Provider
435445
}
436446
return nil
@@ -444,12 +454,14 @@ func (r *ModelRegistry) GetModel(model string) *ModelInfo {
444454
providerName, modelID := splitModelSelector(model)
445455
if providerName != "" {
446456
if providerModels, ok := r.modelsByProvider[providerName]; ok {
447-
return providerModels[modelID]
457+
if info, exists := providerModels[modelID]; exists {
458+
return info
459+
}
448460
}
449-
return nil
461+
// Fall through: the slash may be part of the model ID
450462
}
451463

452-
if info, ok := r.models[modelID]; ok {
464+
if info, ok := r.models[model]; ok {
453465
return info
454466
}
455467
return nil
@@ -462,15 +474,15 @@ func (r *ModelRegistry) Supports(model string) bool {
462474

463475
providerName, modelID := splitModelSelector(model)
464476
if providerName != "" {
465-
providerModels, ok := r.modelsByProvider[providerName]
466-
if !ok {
467-
return false
477+
if providerModels, ok := r.modelsByProvider[providerName]; ok {
478+
if _, exists := providerModels[modelID]; exists {
479+
return true
480+
}
468481
}
469-
_, ok = providerModels[modelID]
470-
return ok
482+
// Fall through: the slash may be part of the model ID
471483
}
472484

473-
_, ok := r.models[modelID]
485+
_, ok := r.models[model]
474486
return ok
475487
}
476488

@@ -522,14 +534,12 @@ func (r *ModelRegistry) GetProviderType(model string) string {
522534
return r.providerTypes[info.Provider]
523535
}
524536
}
525-
return ""
537+
// Fall through: the slash may be part of the model ID
526538
}
527539

528-
info, ok := r.models[modelID]
529-
if ok {
540+
if info, ok := r.models[model]; ok {
530541
return r.providerTypes[info.Provider]
531542
}
532-
533543
return ""
534544
}
535545

0 commit comments

Comments
 (0)