mirror of
https://github.com/QuantumNous/new-api.git
synced 2026-03-30 05:00:06 +00:00
Restructure the task relay system for better separation of concerns: - Extract task billing into service/task_billing.go with unified settlement flow - Move task polling loop from controller to service/task_polling.go (supports Suno + video platforms) - Split RelayTask into fetch/submit paths with dedicated retry logic (taskSubmitWithRetry) - Add TaskDto, TaskResponse generics, and FetchReq to dto/task.go - Add taskcommon/helpers.go for shared task adaptor utilities - Remove controller/task_video.go (logic consolidated into service layer) - Update all task adaptors (ali, doubao, gemini, hailuo, jimeng, kling, sora, suno, vertex, vidu) - Simplify frontend task logs to use new TaskDto response format
187 lines
5.9 KiB
Go
187 lines
5.9 KiB
Go
package helper
|
||
|
||
import (
|
||
"fmt"
|
||
|
||
"github.com/QuantumNous/new-api/common"
|
||
"github.com/QuantumNous/new-api/logger"
|
||
relaycommon "github.com/QuantumNous/new-api/relay/common"
|
||
"github.com/QuantumNous/new-api/setting/operation_setting"
|
||
"github.com/QuantumNous/new-api/setting/ratio_setting"
|
||
"github.com/QuantumNous/new-api/types"
|
||
|
||
"github.com/gin-gonic/gin"
|
||
)
|
||
|
||
// https://docs.claude.com/en/docs/build-with-claude/prompt-caching#1-hour-cache-duration
|
||
const claudeCacheCreation1hMultiplier = 6 / 3.75
|
||
|
||
// HandleGroupRatio checks for "auto_group" in the context and updates the group ratio and relayInfo.UsingGroup if present
|
||
func HandleGroupRatio(ctx *gin.Context, relayInfo *relaycommon.RelayInfo) types.GroupRatioInfo {
|
||
groupRatioInfo := types.GroupRatioInfo{
|
||
GroupRatio: 1.0, // default ratio
|
||
GroupSpecialRatio: -1,
|
||
}
|
||
|
||
// check auto group
|
||
autoGroup, exists := ctx.Get("auto_group")
|
||
if exists {
|
||
logger.LogDebug(ctx, fmt.Sprintf("final group: %s", autoGroup))
|
||
relayInfo.UsingGroup = autoGroup.(string)
|
||
}
|
||
|
||
// check user group special ratio
|
||
userGroupRatio, ok := ratio_setting.GetGroupGroupRatio(relayInfo.UserGroup, relayInfo.UsingGroup)
|
||
if ok {
|
||
// user group special ratio
|
||
groupRatioInfo.GroupSpecialRatio = userGroupRatio
|
||
groupRatioInfo.GroupRatio = userGroupRatio
|
||
groupRatioInfo.HasSpecialRatio = true
|
||
} else {
|
||
// normal group ratio
|
||
groupRatioInfo.GroupRatio = ratio_setting.GetGroupRatio(relayInfo.UsingGroup)
|
||
}
|
||
|
||
return groupRatioInfo
|
||
}
|
||
|
||
func ModelPriceHelper(c *gin.Context, info *relaycommon.RelayInfo, promptTokens int, meta *types.TokenCountMeta) (types.PriceData, error) {
|
||
modelPrice, usePrice := ratio_setting.GetModelPrice(info.OriginModelName, false)
|
||
|
||
groupRatioInfo := HandleGroupRatio(c, info)
|
||
|
||
var preConsumedQuota int
|
||
var modelRatio float64
|
||
var completionRatio float64
|
||
var cacheRatio float64
|
||
var imageRatio float64
|
||
var cacheCreationRatio float64
|
||
var cacheCreationRatio5m float64
|
||
var cacheCreationRatio1h float64
|
||
var audioRatio float64
|
||
var audioCompletionRatio float64
|
||
var freeModel bool
|
||
if !usePrice {
|
||
preConsumedTokens := common.Max(promptTokens, common.PreConsumedQuota)
|
||
if meta.MaxTokens != 0 {
|
||
preConsumedTokens += meta.MaxTokens
|
||
}
|
||
var success bool
|
||
var matchName string
|
||
modelRatio, success, matchName = ratio_setting.GetModelRatio(info.OriginModelName)
|
||
if !success {
|
||
acceptUnsetRatio := false
|
||
if info.UserSetting.AcceptUnsetRatioModel {
|
||
acceptUnsetRatio = true
|
||
}
|
||
if !acceptUnsetRatio {
|
||
return types.PriceData{}, fmt.Errorf("模型 %s 倍率或价格未配置,请联系管理员设置或开始自用模式;Model %s ratio or price not set, please set or start self-use mode", matchName, matchName)
|
||
}
|
||
}
|
||
completionRatio = ratio_setting.GetCompletionRatio(info.OriginModelName)
|
||
cacheRatio, _ = ratio_setting.GetCacheRatio(info.OriginModelName)
|
||
cacheCreationRatio, _ = ratio_setting.GetCreateCacheRatio(info.OriginModelName)
|
||
cacheCreationRatio5m = cacheCreationRatio
|
||
// 固定1h和5min缓存写入价格的比例
|
||
cacheCreationRatio1h = cacheCreationRatio * claudeCacheCreation1hMultiplier
|
||
imageRatio, _ = ratio_setting.GetImageRatio(info.OriginModelName)
|
||
audioRatio = ratio_setting.GetAudioRatio(info.OriginModelName)
|
||
audioCompletionRatio = ratio_setting.GetAudioCompletionRatio(info.OriginModelName)
|
||
ratio := modelRatio * groupRatioInfo.GroupRatio
|
||
preConsumedQuota = int(float64(preConsumedTokens) * ratio)
|
||
} else {
|
||
if meta.ImagePriceRatio != 0 {
|
||
modelPrice = modelPrice * meta.ImagePriceRatio
|
||
}
|
||
preConsumedQuota = int(modelPrice * common.QuotaPerUnit * groupRatioInfo.GroupRatio)
|
||
}
|
||
|
||
// check if free model pre-consume is disabled
|
||
if !operation_setting.GetQuotaSetting().EnableFreeModelPreConsume {
|
||
// if model price or ratio is 0, do not pre-consume quota
|
||
if groupRatioInfo.GroupRatio == 0 {
|
||
preConsumedQuota = 0
|
||
freeModel = true
|
||
} else if usePrice {
|
||
if modelPrice == 0 {
|
||
preConsumedQuota = 0
|
||
freeModel = true
|
||
}
|
||
} else {
|
||
if modelRatio == 0 {
|
||
preConsumedQuota = 0
|
||
freeModel = true
|
||
}
|
||
}
|
||
}
|
||
|
||
priceData := types.PriceData{
|
||
FreeModel: freeModel,
|
||
ModelPrice: modelPrice,
|
||
ModelRatio: modelRatio,
|
||
CompletionRatio: completionRatio,
|
||
GroupRatioInfo: groupRatioInfo,
|
||
UsePrice: usePrice,
|
||
CacheRatio: cacheRatio,
|
||
ImageRatio: imageRatio,
|
||
AudioRatio: audioRatio,
|
||
AudioCompletionRatio: audioCompletionRatio,
|
||
CacheCreationRatio: cacheCreationRatio,
|
||
CacheCreation5mRatio: cacheCreationRatio5m,
|
||
CacheCreation1hRatio: cacheCreationRatio1h,
|
||
QuotaToPreConsume: preConsumedQuota,
|
||
}
|
||
|
||
if common.DebugEnabled {
|
||
println(fmt.Sprintf("model_price_helper result: %s", priceData.ToSetting()))
|
||
}
|
||
info.PriceData = priceData
|
||
return priceData, nil
|
||
}
|
||
|
||
// ModelPriceHelperPerCall 按次计费的 PriceHelper (MJ、Task)
|
||
func ModelPriceHelperPerCall(c *gin.Context, info *relaycommon.RelayInfo) types.PriceData {
|
||
groupRatioInfo := HandleGroupRatio(c, info)
|
||
|
||
modelPrice, success := ratio_setting.GetModelPrice(info.OriginModelName, true)
|
||
// 如果没有配置价格,则使用默认价格
|
||
if !success {
|
||
defaultPrice, ok := ratio_setting.GetDefaultModelPriceMap()[info.OriginModelName]
|
||
if !ok {
|
||
modelPrice = 0.1
|
||
} else {
|
||
modelPrice = defaultPrice
|
||
}
|
||
}
|
||
quota := int(modelPrice * common.QuotaPerUnit * groupRatioInfo.GroupRatio)
|
||
|
||
// 免费模型检测(与 ModelPriceHelper 对齐)
|
||
freeModel := false
|
||
if !operation_setting.GetQuotaSetting().EnableFreeModelPreConsume {
|
||
if groupRatioInfo.GroupRatio == 0 || modelPrice == 0 {
|
||
quota = 0
|
||
freeModel = true
|
||
}
|
||
}
|
||
|
||
priceData := types.PriceData{
|
||
FreeModel: freeModel,
|
||
ModelPrice: modelPrice,
|
||
Quota: quota,
|
||
GroupRatioInfo: groupRatioInfo,
|
||
}
|
||
return priceData
|
||
}
|
||
|
||
func ContainPriceOrRatio(modelName string) bool {
|
||
_, ok := ratio_setting.GetModelPrice(modelName, false)
|
||
if ok {
|
||
return true
|
||
}
|
||
_, ok, _ = ratio_setting.GetModelRatio(modelName)
|
||
if ok {
|
||
return true
|
||
}
|
||
return false
|
||
}
|