maximhq · Pratham-Mishra04 · Nov 4, 2025 · coderabbitai · Nov 4, 2025 · coderabbitai
diff --git a/core/bifrost.go b/core/bifrost.go
@@ -54,6 +54,7 @@ type Bifrost struct {
 	responseStreamPool  sync.Pool                          // Pool for response stream channels, initial pool size is set in Init
 	pluginPipelinePool  sync.Pool                          // Pool for PluginPipeline objects
 	bifrostRequestPool  sync.Pool                          // Pool for BifrostRequest objects
+	pricingData         sync.Map                           // pricing data for each model
 	logger              schemas.Logger                     // logger instance, default logger is used if not provided
 	mcpManager          *MCPManager                        // MCP integration manager (nil if MCP not configured)
 	dropExcessRequests  atomic.Bool                        // If true, in cases where the queue is full, requests will not wait for the queue to be empty and will be dropped instead.
@@ -98,6 +99,7 @@ func Init(ctx context.Context, config schemas.BifrostConfig) (*Bifrost, error) {
 		plugins:       atomic.Pointer[[]schemas.Plugin]{},
 		requestQueues: sync.Map{},
 		waitGroups:    sync.Map{},
+		pricingData:   sync.Map{},
 		keySelector:   config.KeySelector,
 		logger:        config.Logger,
 	}
@@ -287,6 +289,8 @@ func (bifrost *Bifrost) ListModelsRequest(ctx context.Context, req *schemas.Bifr
 		}
 		return nil, bifrostErr
 	}
+	// Add pricing data to the response
+	response.AddPricing(bifrost.GetPricingDataForModel)
 	return response, nil
 }
 
@@ -369,6 +373,9 @@ func (bifrost *Bifrost) ListAllModels(ctx context.Context, request *schemas.Bifr
 					break
 				}
 
+				// Add pricing data to the response
+				response.AddPricing(bifrost.GetPricingDataForModel)
+
 				providerModels = append(providerModels, response.Data...)
 
 				// Check if there are more pages
@@ -822,6 +829,38 @@ func (bifrost *Bifrost) ReloadPlugin(plugin schemas.Plugin) error {
 	}
 }
 
+// SetPricingData stores every entry of pricingData under the key "<pricing.Provider>/<model>".
+// An existing entry with the same key is overwritten; keys not present in pricingData are kept.
+//
+// Parameters:
+//   - pricingData: A map of model names to pricing data (the model name is used verbatim in the key)
+func (bifrost *Bifrost) SetPricingData(pricingData map[string]schemas.DataSheetPricingEntry) {
+	for model, pricing := range pricingData {
+		bifrost.pricingData.Store(pricing.Provider+"/"+model, pricing)
+	}
+}
-	for model, pricing := range pricingData {
-		bifrost.pricingData.Store(pricing.Provider+"/"+model, pricing)
-	}
-}
+func (bifrost *Bifrost) SetPricingData(pricingData map[string]schemas.DataSheetPricingEntry) {
+	for model, pricing := range pricingData {
+		// Normalize model: strip "<provider>/" if present
+		if strings.HasPrefix(model, pricing.Provider+"/") {
+			model = strings.TrimPrefix(model, pricing.Provider+"/")
+		}
+		bifrost.pricingData.Store(pricing.Provider+"/"+model, pricing)
+	}
+}
-	for model, pricing := range pricingData {
-		bifrost.pricingData.Store(pricing.Provider+"/"+model, pricing)
-	}
-}
+func (bifrost *Bifrost) SetPricingData(pricingData map[string]schemas.DataSheetPricingEntry) {
+	for model, pricing := range pricingData {
+		// Normalize model: strip "<provider>/" if present
+		if strings.HasPrefix(model, pricing.Provider+"/") {
+			model = strings.TrimPrefix(model, pricing.Provider+"/")
+		}
+		bifrost.pricingData.Store(pricing.Provider+"/"+model, pricing)
+	}
+}
+
+// GetPricingDataForModel looks up the pricing entry stored under the key "<provider>/<model>".
+// The returned pointer refers to a copy of the stored entry, not to the stored value itself.
+//
+// Parameters:
+//   - model: The model to get pricing data for
+//   - provider: The provider to get pricing data for
+//
+// Returns:
+//   - pricing: The pricing data for the model, nil if not found or if the stored value has another type
+func (bifrost *Bifrost) GetPricingDataForModel(model string, provider schemas.ModelProvider) *schemas.DataSheetPricingEntry {
+	pricing, ok := bifrost.pricingData.Load(string(provider) + "/" + model)
+	if !ok {
+		return nil
+	}
+	if pricing, ok := pricing.(schemas.DataSheetPricingEntry); ok {
+		return &pricing
+	}
+	return nil
+}
+
+// GetConfiguredProviders returns the list of configured providers.
 func (bifrost *Bifrost) GetConfiguredProviders() ([]schemas.ModelProvider, error) {
 	providers := bifrost.providers.Load()
 	if providers == nil {

diff --git a/core/schemas/models.go b/core/schemas/models.go
@@ -3,6 +3,7 @@ package schemas
 import (
 	"encoding/base64"
 	"fmt"
+	"strings"
 
 	"github.com/bytedance/sonic"
 )
@@ -44,9 +45,95 @@ type BifrostListModelsResponse struct {
 	HasMore *bool   `json:"-"`
 }
 
+// ApplyPagination returns one page of response.Data, selected by an offset cursor decoded from the opaque pageToken.
+// A cursor carrying a LastID that fails validation restarts at offset 0; the page shares its backing array with response.Data.
+// Returns nil for a nil receiver and the response itself when pageSize <= 0; NextPageToken is empty on the last page.
+func (response *BifrostListModelsResponse) ApplyPagination(pageSize int, pageToken string) *BifrostListModelsResponse {
+	if response == nil {
+		return nil
+	}
+
+	totalItems := len(response.Data)
+
+	if pageSize <= 0 {
+		return response
+	}
+
+	cursor := decodePaginationCursor(pageToken)
+	offset := cursor.Offset
+
+	// Validate cursor integrity if LastID is present
+	if cursor.LastID != "" && !validatePaginationCursor(cursor, response.Data) {
+		// Invalid cursor: reset to beginning
+		offset = 0
+	}
+
+	if offset >= totalItems {
+		// Offset is at or past the end: return an empty (non-nil) page with no next token
+		return &BifrostListModelsResponse{
+			Data:          []Model{},
+			ExtraFields:   response.ExtraFields,
+			NextPageToken: "",
+		}
+	}
+
+	endIndex := offset + pageSize
+	if endIndex > totalItems {
+		endIndex = totalItems
+	}
+	// NOTE(review): a negative offset would make the slice expression below panic — confirm decodePaginationCursor never yields one
+	paginatedData := response.Data[offset:endIndex]
+
+	paginatedResponse := &BifrostListModelsResponse{
+		Data:        paginatedData,
+		ExtraFields: response.ExtraFields,
+	}
+
+	if endIndex < totalItems {
+		// More items remain: remember the last returned ID so the next cursor can be validated
+		var lastID string
+		if len(paginatedData) > 0 {
+			lastID = paginatedData[len(paginatedData)-1].ID
+		}
+		// An encoding error is not reported; the token simply stays empty in that case
+		nextToken, err := encodePaginationCursor(endIndex, lastID)
+		if err == nil {
+			paginatedResponse.NextPageToken = nextToken
+		}
+	} else {
+		paginatedResponse.NextPageToken = ""
+	}
+
+	return paginatedResponse
+}
+
+// PricingFetcher returns the pricing entry for a model/provider pair, or nil when none is known.
+type PricingFetcher func(model string, provider ModelProvider) *DataSheetPricingEntry
+
+// AddPricing attaches data-sheet pricing to every model in response.Data, in place.
+// The "<provider>/" prefix (provider taken from ExtraFields.Provider) is trimmed from
+// each model ID before lookup; models the fetcher has no entry for are left unchanged.
+// It returns nothing and is a no-op when the response or the fetcher is nil.
+func (response *BifrostListModelsResponse) AddPricing(fetcher PricingFetcher) {
+	if response == nil || fetcher == nil {
+		return
+	}
+	provider := response.ExtraFields.Provider
+	for i := range response.Data {
+		model := &response.Data[i] // address the element directly; avoids copying each Model
+		if pricing := fetcher(strings.TrimPrefix(model.ID, string(provider)+"/"), provider); pricing != nil {
+			if model.Pricing == nil {
+				model.Pricing = &Pricing{}
+			}
+			model.Pricing.DataSheetPricingEntry = pricing
+		}
+	}
+}
+
 type Model struct {
 	ID                  string             `json:"id"`
 	CanonicalSlug       *string            `json:"canonical_slug,omitempty"`
+	DeploymentName      *string            `json:"deployment_name,omitempty"`
 	Name                *string            `json:"name,omitempty"`
 	Created             *int64             `json:"created,omitempty"`
 	ContextLength       *int               `json:"context_length,omitempty"`
@@ -82,6 +169,8 @@ type Pricing struct {
 	InternalReasoning *string `json:"internal_reasoning,omitempty"`
 	InputCacheRead    *string `json:"input_cache_read,omitempty"`
 	InputCacheWrite   *string `json:"input_cache_write,omitempty"`
+
+	*DataSheetPricingEntry
 }
 
 type TopProvider struct {
@@ -107,6 +196,38 @@ type paginationCursor struct {
 	LastID string `json:"l,omitempty"`
 }
 
+// DataSheetPricingEntry represents a single model's pricing information.
+type DataSheetPricingEntry struct {
+	// Basic pricing
+	InputCostPerToken  float64 `json:"input_cost_per_token"`
+	OutputCostPerToken float64 `json:"output_cost_per_token"`
+	Provider           string  `json:"provider"`
+	Mode               string  `json:"mode"`
+
+	// Additional pricing for media
+	InputCostPerImage          *float64 `json:"input_cost_per_image,omitempty"`
+	InputCostPerVideoPerSecond *float64 `json:"input_cost_per_video_per_second,omitempty"`
+	InputCostPerAudioPerSecond *float64 `json:"input_cost_per_audio_per_second,omitempty"`
+
+	// Character-based pricing
+	InputCostPerCharacter  *float64 `json:"input_cost_per_character,omitempty"`
+	OutputCostPerCharacter *float64 `json:"output_cost_per_character,omitempty"`
+
+	// Pricing above 128k tokens
+	InputCostPerTokenAbove128kTokens          *float64 `json:"input_cost_per_token_above_128k_tokens,omitempty"`
+	InputCostPerCharacterAbove128kTokens      *float64 `json:"input_cost_per_character_above_128k_tokens,omitempty"`
+	InputCostPerImageAbove128kTokens          *float64 `json:"input_cost_per_image_above_128k_tokens,omitempty"`
+	InputCostPerVideoPerSecondAbove128kTokens *float64 `json:"input_cost_per_video_per_second_above_128k_tokens,omitempty"`
+	InputCostPerAudioPerSecondAbove128kTokens *float64 `json:"input_cost_per_audio_per_second_above_128k_tokens,omitempty"`
+	OutputCostPerTokenAbove128kTokens         *float64 `json:"output_cost_per_token_above_128k_tokens,omitempty"`
+	OutputCostPerCharacterAbove128kTokens     *float64 `json:"output_cost_per_character_above_128k_tokens,omitempty"`
+
+	// Cache and batch pricing
+	CacheReadInputTokenCost   *float64 `json:"cache_read_input_token_cost,omitempty"`
+	InputCostPerTokenBatches  *float64 `json:"input_cost_per_token_batches,omitempty"`
+	OutputCostPerTokenBatches *float64 `json:"output_cost_per_token_batches,omitempty"`
+}
+
 // encodePaginationCursor creates an opaque base64-encoded page token from cursor data.
 // Returns empty string if offset is 0 or negative.
 func encodePaginationCursor(offset int, lastID string) (string, error) {
@@ -172,65 +293,3 @@ func validatePaginationCursor(cursor paginationCursor, data []Model) bool {
 
 	return true
 }
-
-// ApplyPagination applies offset-based pagination to a BifrostListModelsResponse.
-// Uses opaque tokens with LastID validation to ensure cursor integrity.
-// Returns the paginated response with properly set NextPageToken.
-func (response *BifrostListModelsResponse) ApplyPagination(pageSize int, pageToken string) *BifrostListModelsResponse {
-	if response == nil {
-		return nil
-	}
-
-	totalItems := len(response.Data)
-
-	if pageSize <= 0 {
-		return response
-	}
-
-	cursor := decodePaginationCursor(pageToken)
-	offset := cursor.Offset
-
-	// Validate cursor integrity if LastID is present
-	if cursor.LastID != "" && !validatePaginationCursor(cursor, response.Data) {
-		// Invalid cursor: reset to beginning
-		offset = 0
-	}
-
-	if offset >= totalItems {
-		// Return empty page, no next token
-		return &BifrostListModelsResponse{
-			Data:          []Model{},
-			ExtraFields:   response.ExtraFields,
-			NextPageToken: "",
-		}
-	}
-
-	endIndex := offset + pageSize
-	if endIndex > totalItems {
-		endIndex = totalItems
-	}
-
-	paginatedData := response.Data[offset:endIndex]
-
-	paginatedResponse := &BifrostListModelsResponse{
-		Data:        paginatedData,
-		ExtraFields: response.ExtraFields,
-	}
-
-	if endIndex < totalItems {
-		// Get the last item ID for cursor validation
-		var lastID string
-		if len(paginatedData) > 0 {
-			lastID = paginatedData[len(paginatedData)-1].ID
-		}
-
-		nextToken, err := encodePaginationCursor(endIndex, lastID)
-		if err == nil {
-			paginatedResponse.NextPageToken = nextToken
-		}
-	} else {
-		paginatedResponse.NextPageToken = ""
-	}
-
-	return paginatedResponse
-}
diff --git a/framework/modelcatalog/main.go b/framework/modelcatalog/main.go
@@ -24,8 +24,9 @@ const (
 
 // Config is the model pricing configuration.
 type Config struct {
-	PricingURL          *string        `json:"pricing_url,omitempty"`
-	PricingSyncInterval *time.Duration `json:"pricing_sync_interval,omitempty"`
+	PricingURL          *string                                        `json:"pricing_url,omitempty"`
+	PricingSyncInterval *time.Duration                                 `json:"pricing_sync_interval,omitempty"`
+	PricingSyncCallback func(map[string]schemas.DataSheetPricingEntry) `json:"-"` // excluded from JSON: encoding/json cannot marshal func values
 }
 
 type ModelCatalog struct {
@@ -49,41 +50,9 @@ type ModelCatalog struct {
 	wg         sync.WaitGroup
 	syncCtx    context.Context
 	syncCancel context.CancelFunc
-}
 
-// PricingData represents the structure of the pricing.json file
-type PricingData map[string]PricingEntry
-
-// PricingEntry represents a single model's pricing information
-type PricingEntry struct {
-	// Basic pricing
-	InputCostPerToken  float64 `json:"input_cost_per_token"`
-	OutputCostPerToken float64 `json:"output_cost_per_token"`
-	Provider           string  `json:"provider"`
-	Mode               string  `json:"mode"`
-
-	// Additional pricing for media
-	InputCostPerImage          *float64 `json:"input_cost_per_image,omitempty"`
-	InputCostPerVideoPerSecond *float64 `json:"input_cost_per_video_per_second,omitempty"`
-	InputCostPerAudioPerSecond *float64 `json:"input_cost_per_audio_per_second,omitempty"`
-
-	// Character-based pricing
-	InputCostPerCharacter  *float64 `json:"input_cost_per_character,omitempty"`
-	OutputCostPerCharacter *float64 `json:"output_cost_per_character,omitempty"`
-
-	// Pricing above 128k tokens
-	InputCostPerTokenAbove128kTokens          *float64 `json:"input_cost_per_token_above_128k_tokens,omitempty"`
-	InputCostPerCharacterAbove128kTokens      *float64 `json:"input_cost_per_character_above_128k_tokens,omitempty"`
-	InputCostPerImageAbove128kTokens          *float64 `json:"input_cost_per_image_above_128k_tokens,omitempty"`
-	InputCostPerVideoPerSecondAbove128kTokens *float64 `json:"input_cost_per_video_per_second_above_128k_tokens,omitempty"`
-	InputCostPerAudioPerSecondAbove128kTokens *float64 `json:"input_cost_per_audio_per_second_above_128k_tokens,omitempty"`
-	OutputCostPerTokenAbove128kTokens         *float64 `json:"output_cost_per_token_above_128k_tokens,omitempty"`
-	OutputCostPerCharacterAbove128kTokens     *float64 `json:"output_cost_per_character_above_128k_tokens,omitempty"`
-
-	// Cache and batch pricing
-	CacheReadInputTokenCost   *float64 `json:"cache_read_input_token_cost,omitempty"`
-	InputCostPerTokenBatches  *float64 `json:"input_cost_per_token_batches,omitempty"`
-	OutputCostPerTokenBatches *float64 `json:"output_cost_per_token_batches,omitempty"`
+	// Callback after pricing data is synced
+	pricingSyncCallback func(map[string]schemas.DataSheetPricingEntry)
 }
 
 // Init initializes the pricing manager
@@ -105,6 +74,7 @@ func Init(ctx context.Context, config *Config, configStore configstore.ConfigSto
 		pricingData:         make(map[string]configstoreTables.TableModelPricing),
 		modelPool:           make(map[schemas.ModelProvider][]string),
 		done:                make(chan struct{}),
+		pricingSyncCallback: config.PricingSyncCallback,
 	}
 
 	logger.Info("initializing pricing manager...")
@@ -189,6 +159,19 @@ func (mc *ModelCatalog) getPricingSyncInterval() time.Duration {
 	return mc.pricingSyncInterval
 }
 
+// GetPricingData returns a freshly built copy of the catalog's pricing data, keyed by model name.
+func (mc *ModelCatalog) GetPricingData() map[string]schemas.DataSheetPricingEntry {
+	mc.mu.RLock()
+	defer mc.mu.RUnlock()
+	// Build a new, pre-sized map so callers never share mc.pricingData
+	pricingData := make(map[string]schemas.DataSheetPricingEntry, len(mc.pricingData))
+	for key, pricing := range mc.pricingData {
+		model, _, _ := splitKey(key) // NOTE(review): only the first key part is kept, so keys sharing it overwrite each other — confirm intended
+		pricingData[model] = convertTableModelPricingToPricingData(pricing)
+	}
+	return pricingData
+}
+
 // GetModelsForProvider returns all available models for a given provider (thread-safe)
 func (mc *ModelCatalog) GetModelsForProvider(provider schemas.ModelProvider) []string {
 	mc.mu.RLock()