91ed4e196a
- Added support for tiered billing expressions in the billing system. - Introduced new types and functions for handling billing expressions, including caching and execution. - Updated existing billing logic to accommodate tiered billing scenarios. - Enhanced request handling to support incoming billing expression requests. - Added tests for tiered billing functionality to ensure correctness.
275 lines
9.4 KiB
Go
275 lines
9.4 KiB
Go
package helper
|
|
|
|
import (
|
|
"fmt"
|
|
|
|
"github.com/QuantumNous/new-api/common"
|
|
"github.com/QuantumNous/new-api/logger"
|
|
"github.com/QuantumNous/new-api/pkg/billingexpr"
|
|
relaycommon "github.com/QuantumNous/new-api/relay/common"
|
|
"github.com/QuantumNous/new-api/setting/billing_setting"
|
|
"github.com/QuantumNous/new-api/setting/operation_setting"
|
|
"github.com/QuantumNous/new-api/setting/ratio_setting"
|
|
"github.com/QuantumNous/new-api/types"
|
|
|
|
"github.com/gin-gonic/gin"
|
|
)
|
|
|
|
// https://docs.claude.com/en/docs/build-with-claude/prompt-caching#1-hour-cache-duration
|
|
// claudeCacheCreation1hMultiplier is the factor ModelPriceHelper applies to the
// base cache-creation ratio to derive the 1-hour cache-creation ratio; the
// 5-minute ratio uses the base value unchanged. The expression evaluates to 1.6.
// NOTE(review): 6 and 3.75 are presumably the 1h and 5m cache-write prices from
// the Claude prompt-caching documentation — confirm against that page.
const claudeCacheCreation1hMultiplier = 6 / 3.75
|
|
|
|
// HandleGroupRatio checks for "auto_group" in the context and updates the group ratio and relayInfo.UsingGroup if present
|
|
func HandleGroupRatio(ctx *gin.Context, relayInfo *relaycommon.RelayInfo) types.GroupRatioInfo {
|
|
groupRatioInfo := types.GroupRatioInfo{
|
|
GroupRatio: 1.0, // default ratio
|
|
GroupSpecialRatio: -1,
|
|
}
|
|
|
|
// check auto group
|
|
autoGroup, exists := ctx.Get("auto_group")
|
|
if exists {
|
|
logger.LogDebug(ctx, fmt.Sprintf("final group: %s", autoGroup))
|
|
relayInfo.UsingGroup = autoGroup.(string)
|
|
}
|
|
|
|
// check user group special ratio
|
|
userGroupRatio, ok := ratio_setting.GetGroupGroupRatio(relayInfo.UserGroup, relayInfo.UsingGroup)
|
|
if ok {
|
|
// user group special ratio
|
|
groupRatioInfo.GroupSpecialRatio = userGroupRatio
|
|
groupRatioInfo.GroupRatio = userGroupRatio
|
|
groupRatioInfo.HasSpecialRatio = true
|
|
} else {
|
|
// normal group ratio
|
|
groupRatioInfo.GroupRatio = ratio_setting.GetGroupRatio(relayInfo.UsingGroup)
|
|
}
|
|
|
|
return groupRatioInfo
|
|
}
|
|
|
|
func ModelPriceHelper(c *gin.Context, info *relaycommon.RelayInfo, promptTokens int, meta *types.TokenCountMeta) (types.PriceData, error) {
|
|
modelPrice, usePrice := ratio_setting.GetModelPrice(info.OriginModelName, false)
|
|
|
|
groupRatioInfo := HandleGroupRatio(c, info)
|
|
|
|
// Check if this model uses tiered_expr billing
|
|
if billing_setting.GetBillingMode(info.OriginModelName) == billing_setting.BillingModeTieredExpr {
|
|
return modelPriceHelperTiered(c, info, promptTokens, meta, groupRatioInfo)
|
|
}
|
|
|
|
var preConsumedQuota int
|
|
var modelRatio float64
|
|
var completionRatio float64
|
|
var cacheRatio float64
|
|
var imageRatio float64
|
|
var cacheCreationRatio float64
|
|
var cacheCreationRatio5m float64
|
|
var cacheCreationRatio1h float64
|
|
var audioRatio float64
|
|
var audioCompletionRatio float64
|
|
var freeModel bool
|
|
if !usePrice {
|
|
preConsumedTokens := common.Max(promptTokens, common.PreConsumedQuota)
|
|
if meta.MaxTokens != 0 {
|
|
preConsumedTokens += meta.MaxTokens
|
|
}
|
|
var success bool
|
|
var matchName string
|
|
modelRatio, success, matchName = ratio_setting.GetModelRatio(info.OriginModelName)
|
|
if !success {
|
|
acceptUnsetRatio := false
|
|
if info.UserSetting.AcceptUnsetRatioModel {
|
|
acceptUnsetRatio = true
|
|
}
|
|
if !acceptUnsetRatio {
|
|
return types.PriceData{}, fmt.Errorf("模型 %s 倍率或价格未配置,请联系管理员设置或开始自用模式;Model %s ratio or price not set, please set or start self-use mode", matchName, matchName)
|
|
}
|
|
}
|
|
completionRatio = ratio_setting.GetCompletionRatio(info.OriginModelName)
|
|
cacheRatio, _ = ratio_setting.GetCacheRatio(info.OriginModelName)
|
|
cacheCreationRatio, _ = ratio_setting.GetCreateCacheRatio(info.OriginModelName)
|
|
cacheCreationRatio5m = cacheCreationRatio
|
|
// 固定1h和5min缓存写入价格的比例
|
|
cacheCreationRatio1h = cacheCreationRatio * claudeCacheCreation1hMultiplier
|
|
imageRatio, _ = ratio_setting.GetImageRatio(info.OriginModelName)
|
|
audioRatio = ratio_setting.GetAudioRatio(info.OriginModelName)
|
|
audioCompletionRatio = ratio_setting.GetAudioCompletionRatio(info.OriginModelName)
|
|
ratio := modelRatio * groupRatioInfo.GroupRatio
|
|
preConsumedQuota = int(float64(preConsumedTokens) * ratio)
|
|
} else {
|
|
if meta.ImagePriceRatio != 0 {
|
|
modelPrice = modelPrice * meta.ImagePriceRatio
|
|
}
|
|
preConsumedQuota = int(modelPrice * common.QuotaPerUnit * groupRatioInfo.GroupRatio)
|
|
}
|
|
|
|
// check if free model pre-consume is disabled
|
|
if !operation_setting.GetQuotaSetting().EnableFreeModelPreConsume {
|
|
// if model price or ratio is 0, do not pre-consume quota
|
|
if groupRatioInfo.GroupRatio == 0 {
|
|
preConsumedQuota = 0
|
|
freeModel = true
|
|
} else if usePrice {
|
|
if modelPrice == 0 {
|
|
preConsumedQuota = 0
|
|
freeModel = true
|
|
}
|
|
} else {
|
|
if modelRatio == 0 {
|
|
preConsumedQuota = 0
|
|
freeModel = true
|
|
}
|
|
}
|
|
}
|
|
|
|
priceData := types.PriceData{
|
|
FreeModel: freeModel,
|
|
ModelPrice: modelPrice,
|
|
ModelRatio: modelRatio,
|
|
CompletionRatio: completionRatio,
|
|
GroupRatioInfo: groupRatioInfo,
|
|
UsePrice: usePrice,
|
|
CacheRatio: cacheRatio,
|
|
ImageRatio: imageRatio,
|
|
AudioRatio: audioRatio,
|
|
AudioCompletionRatio: audioCompletionRatio,
|
|
CacheCreationRatio: cacheCreationRatio,
|
|
CacheCreation5mRatio: cacheCreationRatio5m,
|
|
CacheCreation1hRatio: cacheCreationRatio1h,
|
|
QuotaToPreConsume: preConsumedQuota,
|
|
}
|
|
|
|
if common.DebugEnabled {
|
|
println(fmt.Sprintf("model_price_helper result: %s", priceData.ToSetting()))
|
|
}
|
|
info.PriceData = priceData
|
|
return priceData, nil
|
|
}
|
|
|
|
// ModelPriceHelperPerCall 按次计费的 PriceHelper (MJ、Task)
|
|
func ModelPriceHelperPerCall(c *gin.Context, info *relaycommon.RelayInfo) (types.PriceData, error) {
|
|
groupRatioInfo := HandleGroupRatio(c, info)
|
|
|
|
modelPrice, success := ratio_setting.GetModelPrice(info.OriginModelName, true)
|
|
// 如果没有配置价格,检查模型倍率配置
|
|
if !success {
|
|
|
|
// 没有配置费用,也要使用默认费用,否则按费率计费模型无法使用
|
|
defaultPrice, ok := ratio_setting.GetDefaultModelPriceMap()[info.OriginModelName]
|
|
if ok {
|
|
modelPrice = defaultPrice
|
|
} else {
|
|
// 没有配置倍率也不接受没配置,那就返回错误
|
|
_, ratioSuccess, matchName := ratio_setting.GetModelRatio(info.OriginModelName)
|
|
acceptUnsetRatio := false
|
|
if info.UserSetting.AcceptUnsetRatioModel {
|
|
acceptUnsetRatio = true
|
|
}
|
|
if !ratioSuccess && !acceptUnsetRatio {
|
|
return types.PriceData{}, fmt.Errorf("模型 %s 倍率或价格未配置,请联系管理员设置或开始自用模式;Model %s ratio or price not set, please set or start self-use mode", matchName, matchName)
|
|
}
|
|
// 未配置价格但配置了倍率,使用默认预扣价格
|
|
modelPrice = float64(common.PreConsumedQuota) / common.QuotaPerUnit
|
|
}
|
|
|
|
}
|
|
quota := int(modelPrice * common.QuotaPerUnit * groupRatioInfo.GroupRatio)
|
|
|
|
// 免费模型检测(与 ModelPriceHelper 对齐)
|
|
freeModel := false
|
|
if !operation_setting.GetQuotaSetting().EnableFreeModelPreConsume {
|
|
if groupRatioInfo.GroupRatio == 0 || modelPrice == 0 {
|
|
quota = 0
|
|
freeModel = true
|
|
}
|
|
}
|
|
|
|
priceData := types.PriceData{
|
|
FreeModel: freeModel,
|
|
ModelPrice: modelPrice,
|
|
Quota: quota,
|
|
GroupRatioInfo: groupRatioInfo,
|
|
}
|
|
return priceData, nil
|
|
}
|
|
|
|
func ContainPriceOrRatio(modelName string) bool {
|
|
_, ok := ratio_setting.GetModelPrice(modelName, false)
|
|
if ok {
|
|
return true
|
|
}
|
|
_, ok, _ = ratio_setting.GetModelRatio(modelName)
|
|
if ok {
|
|
return true
|
|
}
|
|
if billing_setting.GetBillingMode(modelName) == billing_setting.BillingModeTieredExpr {
|
|
_, ok = billing_setting.GetBillingExpr(modelName)
|
|
return ok
|
|
}
|
|
return false
|
|
}
|
|
|
|
func modelPriceHelperTiered(c *gin.Context, info *relaycommon.RelayInfo, promptTokens int, meta *types.TokenCountMeta, groupRatioInfo types.GroupRatioInfo) (types.PriceData, error) {
|
|
exprStr, ok := billing_setting.GetBillingExpr(info.OriginModelName)
|
|
if !ok {
|
|
return types.PriceData{}, fmt.Errorf("model %s is configured as tiered_expr but has no billing expression", info.OriginModelName)
|
|
}
|
|
|
|
estimatedCompletionTokens := 0
|
|
if meta.MaxTokens != 0 {
|
|
estimatedCompletionTokens = meta.MaxTokens
|
|
}
|
|
|
|
requestInput, err := ResolveIncomingBillingExprRequestInput(c, info)
|
|
if err != nil {
|
|
return types.PriceData{}, err
|
|
}
|
|
|
|
rawQuota, trace, err := billingexpr.RunExprWithRequest(exprStr, billingexpr.TokenParams{
|
|
P: float64(promptTokens),
|
|
C: float64(estimatedCompletionTokens),
|
|
}, requestInput)
|
|
if err != nil {
|
|
return types.PriceData{}, fmt.Errorf("model %s tiered expr run failed: %w", info.OriginModelName, err)
|
|
}
|
|
|
|
preConsumedQuota := billingexpr.QuotaRound(rawQuota * groupRatioInfo.GroupRatio)
|
|
|
|
freeModel := false
|
|
if !operation_setting.GetQuotaSetting().EnableFreeModelPreConsume {
|
|
if groupRatioInfo.GroupRatio == 0 || rawQuota == 0 {
|
|
preConsumedQuota = 0
|
|
freeModel = true
|
|
}
|
|
}
|
|
|
|
exprHash := billingexpr.ExprHashString(exprStr)
|
|
snapshot := &billingexpr.BillingSnapshot{
|
|
BillingMode: billing_setting.BillingModeTieredExpr,
|
|
ModelName: info.OriginModelName,
|
|
ExprString: exprStr,
|
|
ExprHash: exprHash,
|
|
GroupRatio: groupRatioInfo.GroupRatio,
|
|
EstimatedPromptTokens: promptTokens,
|
|
EstimatedCompletionTokens: estimatedCompletionTokens,
|
|
EstimatedQuotaBeforeGroup: rawQuota,
|
|
EstimatedQuotaAfterGroup: preConsumedQuota,
|
|
EstimatedTier: trace.MatchedTier,
|
|
}
|
|
info.TieredBillingSnapshot = snapshot
|
|
info.BillingRequestInput = &requestInput
|
|
|
|
priceData := types.PriceData{
|
|
FreeModel: freeModel,
|
|
GroupRatioInfo: groupRatioInfo,
|
|
QuotaToPreConsume: preConsumedQuota,
|
|
}
|
|
|
|
if common.DebugEnabled {
|
|
println(fmt.Sprintf("model_price_helper_tiered result: model=%s preConsume=%d rawQuota=%.2f groupRatio=%.2f tier=%s", info.OriginModelName, preConsumedQuota, rawQuota, groupRatioInfo.GroupRatio, trace.MatchedTier))
|
|
}
|
|
|
|
info.PriceData = priceData
|
|
return priceData, nil
|
|
}
|