mirror of
https://github.com/QuantumNous/new-api.git
synced 2026-03-29 23:28:36 +00:00
198 lines
7.1 KiB
Go
198 lines
7.1 KiB
Go
package relay
|
|
|
|
import (
|
|
"bytes"
|
|
"encoding/json"
|
|
"fmt"
|
|
"io"
|
|
"net/http"
|
|
"strings"
|
|
|
|
"github.com/QuantumNous/new-api/common"
|
|
"github.com/QuantumNous/new-api/constant"
|
|
"github.com/QuantumNous/new-api/dto"
|
|
relaycommon "github.com/QuantumNous/new-api/relay/common"
|
|
"github.com/QuantumNous/new-api/relay/helper"
|
|
"github.com/QuantumNous/new-api/service"
|
|
"github.com/QuantumNous/new-api/setting/model_setting"
|
|
"github.com/QuantumNous/new-api/setting/reasoning"
|
|
"github.com/QuantumNous/new-api/types"
|
|
|
|
"github.com/gin-gonic/gin"
|
|
)
|
|
|
|
func ClaudeHelper(c *gin.Context, info *relaycommon.RelayInfo) (newAPIError *types.NewAPIError) {
|
|
|
|
info.InitChannelMeta(c)
|
|
|
|
claudeReq, ok := info.Request.(*dto.ClaudeRequest)
|
|
|
|
if !ok {
|
|
return types.NewErrorWithStatusCode(fmt.Errorf("invalid request type, expected *dto.ClaudeRequest, got %T", info.Request), types.ErrorCodeInvalidRequest, http.StatusBadRequest, types.ErrOptionWithSkipRetry())
|
|
}
|
|
|
|
request, err := common.DeepCopy(claudeReq)
|
|
if err != nil {
|
|
return types.NewError(fmt.Errorf("failed to copy request to ClaudeRequest: %w", err), types.ErrorCodeInvalidRequest, types.ErrOptionWithSkipRetry())
|
|
}
|
|
|
|
err = helper.ModelMappedHelper(c, info, request)
|
|
if err != nil {
|
|
return types.NewError(err, types.ErrorCodeChannelModelMappedError, types.ErrOptionWithSkipRetry())
|
|
}
|
|
|
|
adaptor := GetAdaptor(info.ApiType)
|
|
if adaptor == nil {
|
|
return types.NewError(fmt.Errorf("invalid api type: %d", info.ApiType), types.ErrorCodeInvalidApiType, types.ErrOptionWithSkipRetry())
|
|
}
|
|
adaptor.Init(info)
|
|
|
|
if request.MaxTokens == nil || *request.MaxTokens == 0 {
|
|
defaultMaxTokens := uint(model_setting.GetClaudeSettings().GetDefaultMaxTokens(request.Model))
|
|
request.MaxTokens = &defaultMaxTokens
|
|
}
|
|
|
|
if baseModel, effortLevel, ok := reasoning.TrimEffortSuffix(request.Model); ok && effortLevel != "" &&
|
|
strings.HasPrefix(request.Model, "claude-opus-4-6") {
|
|
request.Model = baseModel
|
|
request.Thinking = &dto.Thinking{
|
|
Type: "adaptive",
|
|
}
|
|
request.OutputConfig = json.RawMessage(fmt.Sprintf(`{"effort":"%s"}`, effortLevel))
|
|
request.TopP = common.GetPointer[float64](0)
|
|
request.Temperature = common.GetPointer[float64](1.0)
|
|
info.UpstreamModelName = request.Model
|
|
} else if model_setting.GetClaudeSettings().ThinkingAdapterEnabled &&
|
|
strings.HasSuffix(request.Model, "-thinking") {
|
|
if request.Thinking == nil {
|
|
// 因为BudgetTokens 必须大于1024
|
|
if request.MaxTokens == nil || *request.MaxTokens < 1280 {
|
|
request.MaxTokens = common.GetPointer[uint](1280)
|
|
}
|
|
|
|
// BudgetTokens 为 max_tokens 的 80%
|
|
request.Thinking = &dto.Thinking{
|
|
Type: "enabled",
|
|
BudgetTokens: common.GetPointer[int](int(float64(*request.MaxTokens) * model_setting.GetClaudeSettings().ThinkingAdapterBudgetTokensPercentage)),
|
|
}
|
|
// TODO: 临时处理
|
|
// https://docs.anthropic.com/en/docs/build-with-claude/extended-thinking#important-considerations-when-using-extended-thinking
|
|
request.TopP = common.GetPointer[float64](0)
|
|
request.Temperature = common.GetPointer[float64](1.0)
|
|
}
|
|
if !model_setting.ShouldPreserveThinkingSuffix(info.OriginModelName) {
|
|
request.Model = strings.TrimSuffix(request.Model, "-thinking")
|
|
}
|
|
info.UpstreamModelName = request.Model
|
|
}
|
|
|
|
if info.ChannelSetting.SystemPrompt != "" {
|
|
if request.System == nil {
|
|
request.SetStringSystem(info.ChannelSetting.SystemPrompt)
|
|
} else if info.ChannelSetting.SystemPromptOverride {
|
|
common.SetContextKey(c, constant.ContextKeySystemPromptOverride, true)
|
|
if request.IsStringSystem() {
|
|
existing := strings.TrimSpace(request.GetStringSystem())
|
|
if existing == "" {
|
|
request.SetStringSystem(info.ChannelSetting.SystemPrompt)
|
|
} else {
|
|
request.SetStringSystem(info.ChannelSetting.SystemPrompt + "\n" + existing)
|
|
}
|
|
} else {
|
|
systemContents := request.ParseSystem()
|
|
newSystem := dto.ClaudeMediaMessage{Type: dto.ContentTypeText}
|
|
newSystem.SetText(info.ChannelSetting.SystemPrompt)
|
|
if len(systemContents) == 0 {
|
|
request.System = []dto.ClaudeMediaMessage{newSystem}
|
|
} else {
|
|
request.System = append([]dto.ClaudeMediaMessage{newSystem}, systemContents...)
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
if !model_setting.GetGlobalSettings().PassThroughRequestEnabled &&
|
|
!info.ChannelSetting.PassThroughBodyEnabled &&
|
|
service.ShouldChatCompletionsUseResponsesGlobal(info.ChannelId, info.ChannelType, info.OriginModelName) {
|
|
openAIRequest, convErr := service.ClaudeToOpenAIRequest(*request, info)
|
|
if convErr != nil {
|
|
return types.NewError(convErr, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
|
|
}
|
|
|
|
usage, newApiErr := chatCompletionsViaResponses(c, info, adaptor, openAIRequest)
|
|
if newApiErr != nil {
|
|
return newApiErr
|
|
}
|
|
|
|
service.PostClaudeConsumeQuota(c, info, usage)
|
|
return nil
|
|
}
|
|
|
|
var requestBody io.Reader
|
|
if model_setting.GetGlobalSettings().PassThroughRequestEnabled || info.ChannelSetting.PassThroughBodyEnabled {
|
|
storage, err := common.GetBodyStorage(c)
|
|
if err != nil {
|
|
return types.NewErrorWithStatusCode(err, types.ErrorCodeReadRequestBodyFailed, http.StatusBadRequest, types.ErrOptionWithSkipRetry())
|
|
}
|
|
requestBody = common.ReaderOnly(storage)
|
|
} else {
|
|
convertedRequest, err := adaptor.ConvertClaudeRequest(c, info, request)
|
|
if err != nil {
|
|
return types.NewError(err, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
|
|
}
|
|
relaycommon.AppendRequestConversionFromRequest(info, convertedRequest)
|
|
jsonData, err := common.Marshal(convertedRequest)
|
|
if err != nil {
|
|
return types.NewError(err, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
|
|
}
|
|
|
|
// remove disabled fields for Claude API
|
|
jsonData, err = relaycommon.RemoveDisabledFields(jsonData, info.ChannelOtherSettings, info.ChannelSetting.PassThroughBodyEnabled)
|
|
if err != nil {
|
|
return types.NewError(err, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
|
|
}
|
|
|
|
// apply param override
|
|
if len(info.ParamOverride) > 0 {
|
|
jsonData, err = relaycommon.ApplyParamOverrideWithRelayInfo(jsonData, info)
|
|
if err != nil {
|
|
return newAPIErrorFromParamOverride(err)
|
|
}
|
|
}
|
|
|
|
if common.DebugEnabled {
|
|
println("requestBody: ", string(jsonData))
|
|
}
|
|
requestBody = bytes.NewBuffer(jsonData)
|
|
}
|
|
|
|
statusCodeMappingStr := c.GetString("status_code_mapping")
|
|
var httpResp *http.Response
|
|
resp, err := adaptor.DoRequest(c, info, requestBody)
|
|
if err != nil {
|
|
return types.NewOpenAIError(err, types.ErrorCodeDoRequestFailed, http.StatusInternalServerError)
|
|
}
|
|
|
|
if resp != nil {
|
|
httpResp = resp.(*http.Response)
|
|
info.IsStream = info.IsStream || strings.HasPrefix(httpResp.Header.Get("Content-Type"), "text/event-stream")
|
|
if httpResp.StatusCode != http.StatusOK {
|
|
newAPIError = service.RelayErrorHandler(c.Request.Context(), httpResp, false)
|
|
// reset status code 重置状态码
|
|
service.ResetStatusCode(newAPIError, statusCodeMappingStr)
|
|
return newAPIError
|
|
}
|
|
}
|
|
|
|
usage, newAPIError := adaptor.DoResponse(c, httpResp, info)
|
|
//log.Printf("usage: %v", usage)
|
|
if newAPIError != nil {
|
|
// reset status code 重置状态码
|
|
service.ResetStatusCode(newAPIError, statusCodeMappingStr)
|
|
return newAPIError
|
|
}
|
|
|
|
service.PostClaudeConsumeQuota(c, info, usage.(*dto.Usage))
|
|
return nil
|
|
}
|