// go-llm/v2/pricing.go

package llm

import "sync"

// ModelPricing holds the per-token USD rates used to price a model's usage.
type ModelPricing struct {
	// InputPricePerToken is the USD price of one input token.
	InputPricePerToken float64

	// OutputPricePerToken is the USD price of one output token.
	OutputPricePerToken float64

	// CachedInputPricePerToken is the USD price of one cached input token.
	// Zero means cached input tokens are priced like regular input tokens.
	CachedInputPricePerToken float64
}

// Cost returns the USD price of the token counts recorded in u.
//
// A nil u costs 0. Output tokens are always billed at OutputPricePerToken.
// Input tokens are billed at InputPricePerToken, unless both
// CachedInputPricePerToken and the usage's cached-input detail are positive:
// in that case the cached tokens are billed at the cached rate and only the
// remainder of InputTokens (never less than zero) is billed at the regular
// input rate.
func (mp ModelPricing) Cost(u *Usage) float64 {
	if u == nil {
		return 0
	}

	// Cached-token count as reported in the usage details, 0 when absent.
	var cached int
	if u.Details != nil {
		cached = u.Details[UsageDetailCachedInputTokens]
	}

	var total float64

	if discounted := mp.CachedInputPricePerToken > 0 && cached > 0; !discounted {
		// No cached rate configured, or nothing was cached: every input
		// token is billed at the regular rate.
		total += float64(u.InputTokens) * mp.InputPricePerToken
	} else {
		// Split the input into its uncached and cached parts; clamp so a
		// cached count larger than InputTokens cannot yield a negative charge.
		uncached := u.InputTokens - cached
		if uncached < 0 {
			uncached = 0
		}
		total += float64(uncached) * mp.InputPricePerToken
		total += float64(cached) * mp.CachedInputPricePerToken
	}

	total += float64(u.OutputTokens) * mp.OutputPricePerToken

	return total
}

// PricingRegistry is a lookup table from model name to ModelPricing.
// It ships with no built-in prices: callers register the models and rates
// that matter for their use case.
type PricingRegistry struct {
	// mu guards models.
	mu sync.RWMutex

	// models holds the registered pricing, keyed by model name.
	models map[string]ModelPricing
}

// NewPricingRegistry returns a registry with an allocated, empty model map,
// ready to have pricing registered on it.
func NewPricingRegistry() *PricingRegistry {
	registry := new(PricingRegistry)
	registry.models = map[string]ModelPricing{}
	return registry
}

// Set registers pricing for model, replacing any pricing already registered
// under that name. The update is performed while holding the registry's
// write lock.
//
// The model map is allocated on first use, so Set also works on a
// PricingRegistry that was not created with NewPricingRegistry.
func (pr *PricingRegistry) Set(model string, pricing ModelPricing) {
	pr.mu.Lock()
	defer pr.mu.Unlock()
	if pr.models == nil {
		// Assigning into a nil map panics; a zero-value registry has no map yet.
		pr.models = make(map[string]ModelPricing)
	}
	pr.models[model] = pricing
}

// Has reports whether pricing has been registered for model.
// The lookup is performed while holding the registry's read lock.
func (pr *PricingRegistry) Has(model string) bool {
	pr.mu.RLock()
	_, found := pr.models[model]
	pr.mu.RUnlock()

	return found
}

// Cost returns the USD cost of usage u priced with the rates registered for
// model, or 0 when no pricing is registered for that model.
//
// The read lock is held only for the map lookup; the price computation runs
// on a copy of the pricing entry after the lock has been released.
func (pr *PricingRegistry) Cost(model string, u *Usage) float64 {
	pr.mu.RLock()
	entry, known := pr.models[model]
	pr.mu.RUnlock()

	if known {
		return entry.Cost(u)
	}
	return 0
}