| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172 |
- package helper
- import (
- "fmt"
- "github.com/QuantumNous/new-api/common"
- "github.com/QuantumNous/new-api/logger"
- relaycommon "github.com/QuantumNous/new-api/relay/common"
- "github.com/QuantumNous/new-api/setting/operation_setting"
- "github.com/QuantumNous/new-api/setting/ratio_setting"
- "github.com/QuantumNous/new-api/types"
- "github.com/gin-gonic/gin"
- )
- // https://docs.claude.com/en/docs/build-with-claude/prompt-caching#1-hour-cache-duration
- const claudeCacheCreation1hMultiplier = 6 / 3.75
- // HandleGroupRatio checks for "auto_group" in the context and updates the group ratio and relayInfo.UsingGroup if present
- func HandleGroupRatio(ctx *gin.Context, relayInfo *relaycommon.RelayInfo) types.GroupRatioInfo {
- groupRatioInfo := types.GroupRatioInfo{
- GroupRatio: 1.0, // default ratio
- GroupSpecialRatio: -1,
- }
- // check auto group
- autoGroup, exists := ctx.Get("auto_group")
- if exists {
- logger.LogDebug(ctx, fmt.Sprintf("final group: %s", autoGroup))
- relayInfo.UsingGroup = autoGroup.(string)
- }
- // check user group special ratio
- userGroupRatio, ok := ratio_setting.GetGroupGroupRatio(relayInfo.UserGroup, relayInfo.UsingGroup)
- if ok {
- // user group special ratio
- groupRatioInfo.GroupSpecialRatio = userGroupRatio
- groupRatioInfo.GroupRatio = userGroupRatio
- groupRatioInfo.HasSpecialRatio = true
- } else {
- // normal group ratio
- groupRatioInfo.GroupRatio = ratio_setting.GetGroupRatio(relayInfo.UsingGroup)
- }
- return groupRatioInfo
- }
- func ModelPriceHelper(c *gin.Context, info *relaycommon.RelayInfo, promptTokens int, meta *types.TokenCountMeta) (types.PriceData, error) {
- modelPrice, usePrice := ratio_setting.GetModelPrice(info.OriginModelName, false)
- groupRatioInfo := HandleGroupRatio(c, info)
- var preConsumedQuota int
- var modelRatio float64
- var completionRatio float64
- var cacheRatio float64
- var imageRatio float64
- var cacheCreationRatio float64
- var cacheCreationRatio5m float64
- var cacheCreationRatio1h float64
- var audioRatio float64
- var audioCompletionRatio float64
- var freeModel bool
- if !usePrice {
- preConsumedTokens := common.Max(promptTokens, common.PreConsumedQuota)
- if meta.MaxTokens != 0 {
- preConsumedTokens += meta.MaxTokens
- }
- var success bool
- var matchName string
- modelRatio, success, matchName = ratio_setting.GetModelRatio(info.OriginModelName)
- if !success {
- acceptUnsetRatio := false
- if info.UserSetting.AcceptUnsetRatioModel {
- acceptUnsetRatio = true
- }
- if !acceptUnsetRatio {
- return types.PriceData{}, fmt.Errorf("模型 %s 倍率或价格未配置,请联系管理员设置或开始自用模式;Model %s ratio or price not set, please set or start self-use mode", matchName, matchName)
- }
- }
- completionRatio = ratio_setting.GetCompletionRatio(info.OriginModelName)
- cacheRatio, _ = ratio_setting.GetCacheRatio(info.OriginModelName)
- cacheCreationRatio, _ = ratio_setting.GetCreateCacheRatio(info.OriginModelName)
- cacheCreationRatio5m = cacheCreationRatio
- // 固定1h和5min缓存写入价格的比例
- cacheCreationRatio1h = cacheCreationRatio * claudeCacheCreation1hMultiplier
- imageRatio, _ = ratio_setting.GetImageRatio(info.OriginModelName)
- audioRatio = ratio_setting.GetAudioRatio(info.OriginModelName)
- audioCompletionRatio = ratio_setting.GetAudioCompletionRatio(info.OriginModelName)
- ratio := modelRatio * groupRatioInfo.GroupRatio
- preConsumedQuota = int(float64(preConsumedTokens) * ratio)
- } else {
- if meta.ImagePriceRatio != 0 {
- modelPrice = modelPrice * meta.ImagePriceRatio
- }
- preConsumedQuota = int(modelPrice * common.QuotaPerUnit * groupRatioInfo.GroupRatio)
- }
- // check if free model pre-consume is disabled
- if !operation_setting.GetQuotaSetting().EnableFreeModelPreConsume {
- // if model price or ratio is 0, do not pre-consume quota
- if usePrice {
- if modelPrice == 0 {
- preConsumedQuota = 0
- freeModel = true
- }
- } else {
- if modelRatio == 0 {
- preConsumedQuota = 0
- freeModel = true
- }
- }
- }
- priceData := types.PriceData{
- FreeModel: freeModel,
- ModelPrice: modelPrice,
- ModelRatio: modelRatio,
- CompletionRatio: completionRatio,
- GroupRatioInfo: groupRatioInfo,
- UsePrice: usePrice,
- CacheRatio: cacheRatio,
- ImageRatio: imageRatio,
- AudioRatio: audioRatio,
- AudioCompletionRatio: audioCompletionRatio,
- CacheCreationRatio: cacheCreationRatio,
- CacheCreation5mRatio: cacheCreationRatio5m,
- CacheCreation1hRatio: cacheCreationRatio1h,
- QuotaToPreConsume: preConsumedQuota,
- }
- if common.DebugEnabled {
- println(fmt.Sprintf("model_price_helper result: %s", priceData.ToSetting()))
- }
- info.PriceData = priceData
- return priceData, nil
- }
- // ModelPriceHelperPerCall 按次计费的 PriceHelper (MJ、Task)
- func ModelPriceHelperPerCall(c *gin.Context, info *relaycommon.RelayInfo) types.PerCallPriceData {
- groupRatioInfo := HandleGroupRatio(c, info)
- modelPrice, success := ratio_setting.GetModelPrice(info.OriginModelName, true)
- // 如果没有配置价格,则使用默认价格
- if !success {
- defaultPrice, ok := ratio_setting.GetDefaultModelPriceMap()[info.OriginModelName]
- if !ok {
- modelPrice = 0.1
- } else {
- modelPrice = defaultPrice
- }
- }
- quota := int(modelPrice * common.QuotaPerUnit * groupRatioInfo.GroupRatio)
- priceData := types.PerCallPriceData{
- ModelPrice: modelPrice,
- Quota: quota,
- GroupRatioInfo: groupRatioInfo,
- }
- return priceData
- }
- func ContainPriceOrRatio(modelName string) bool {
- _, ok := ratio_setting.GetModelPrice(modelName, false)
- if ok {
- return true
- }
- _, ok, _ = ratio_setting.GetModelRatio(modelName)
- if ok {
- return true
- }
- return false
- }
|