Merge pull request #1110 from wangr0031/fix_parallel_tool_calls

feat: chat/completion路由透传parallel_tool_calls参数
Update openai_request.go
2026-04-04 18:24:14 +00:00 · 2025-05-28 14:25:43 +08:00 · 2025-05-28 14:25:24 +08:00 · 2025-05-28 14:16:47 +08:00 · 2025-05-28 14:11:17 +08:00 · 2025-05-27 21:50:53 +08:00
8 changed files with 89 additions and 16 deletions
--- a/controller/channel.go
+++ b/controller/channel.go
@@ -119,8 +119,11 @@ func FetchUpstreamModels(c *gin.Context) {
 		baseURL = channel.GetBaseURL()
 	}
 	url := fmt.Sprintf("%s/v1/models", baseURL)
-	if channel.Type == common.ChannelTypeGemini {
+	switch channel.Type {
+	case common.ChannelTypeGemini:
 		url = fmt.Sprintf("%s/v1beta/openai/models", baseURL)
+	case common.ChannelTypeAli:
+		url = fmt.Sprintf("%s/compatible-mode/v1/models", baseURL)
 	}
 	body, err := GetResponseBody("GET", url, channel, GetAuthHeader(channel.Key))
 	if err != nil {
--- a/dto/openai_request.go
+++ b/dto/openai_request.go
@@ -43,6 +43,7 @@ type GeneralOpenAIRequest struct {
 	ResponseFormat   *ResponseFormat   `json:"response_format,omitempty"`
 	EncodingFormat   any               `json:"encoding_format,omitempty"`
 	Seed             float64           `json:"seed,omitempty"`
+	ParallelTooCalls bool              `json:"parallel_tool_calls,omitempty"`
 	Tools            []ToolCallRequest `json:"tools,omitempty"`
 	ToolChoice       any               `json:"tool_choice,omitempty"`
 	User             string            `json:"user,omitempty"`
@@ -53,6 +54,7 @@ type GeneralOpenAIRequest struct {
 	Audio            any               `json:"audio,omitempty"`
 	EnableThinking   any               `json:"enable_thinking,omitempty"` // ali
 	ExtraBody        any               `json:"extra_body,omitempty"`
+	WebSearchOptions *WebSearchOptions `json:"web_search_options,omitempty"`
 }

 type ToolCallRequest struct {
@@ -371,6 +373,11 @@ func (m *Message) ParseContent() []MediaContent {
 	return contentList
 }

+type WebSearchOptions struct {
+	SearchContextSize string          `json:"search_context_size,omitempty"`
+	UserLocation      json.RawMessage `json:"user_location,omitempty"`
+}
+
 type OpenAIResponsesRequest struct {
 	Model              string               `json:"model"`
 	Input              json.RawMessage      `json:"input,omitempty"`
--- a/relay/channel/ali/adaptor.go
+++ b/relay/channel/ali/adaptor.go
@@ -57,6 +57,12 @@ func (a *Adaptor) ConvertOpenAIRequest(c *gin.Context, info *relaycommon.RelayIn
 	if request == nil {
 		return nil, errors.New("request is nil")
 	}
+
+	// fix: ali parameter.enable_thinking must be set to false for non-streaming calls
+	if !info.IsStream {
+		request.EnableThinking = false
+	}
+
 	switch info.RelayMode {
 	default:
 		aliReq := requestOpenAI2Ali(*request)
--- a/relay/channel/vertex/adaptor.go
+++ b/relay/channel/vertex/adaptor.go
@@ -95,14 +95,23 @@ func (a *Adaptor) GetRequestURL(info *relaycommon.RelayInfo) (string, error) {
 		} else {
 			suffix = "generateContent"
 		}
-		return fmt.Sprintf(
-			"https://%s-aiplatform.googleapis.com/v1/projects/%s/locations/%s/publishers/google/models/%s:%s",
-			region,
-			adc.ProjectID,
-			region,
-			info.UpstreamModelName,
-			suffix,
-		), nil
+		if region == "global" {
+			return fmt.Sprintf(
+				"https://aiplatform.googleapis.com/v1/projects/%s/locations/global/publishers/google/models/%s:%s",
+				adc.ProjectID,
+				info.UpstreamModelName,
+				suffix,
+			), nil
+		} else {
+			return fmt.Sprintf(
+				"https://%s-aiplatform.googleapis.com/v1/projects/%s/locations/%s/publishers/google/models/%s:%s",
+				region,
+				adc.ProjectID,
+				region,
+				info.UpstreamModelName,
+				suffix,
+			), nil
+		}
 	} else if a.RequestMode == RequestModeClaude {
 		if info.IsStream {
 			suffix = "streamRawPredict?alt=sse"
--- a/relay/relay-text.go
+++ b/relay/relay-text.go
@@ -47,6 +47,20 @@ func getAndValidateTextRequest(c *gin.Context, relayInfo *relaycommon.RelayInfo)
 	if textRequest.Model == "" {
 		return nil, errors.New("model is required")
 	}
+	if textRequest.WebSearchOptions != nil {
+		if textRequest.WebSearchOptions.SearchContextSize != "" {
+			validSizes := map[string]bool{
+				"high":   true,
+				"medium": true,
+				"low":    true,
+			}
+			if !validSizes[textRequest.WebSearchOptions.SearchContextSize] {
+				return nil, errors.New("invalid search_context_size, must be one of: high, medium, low")
+			}
+		} else {
+			textRequest.WebSearchOptions.SearchContextSize = "medium"
+		}
+	}
 	switch relayInfo.RelayMode {
 	case relayconstant.RelayModeCompletions:
 		if textRequest.Prompt == "" {
@@ -76,6 +90,10 @@ func TextHelper(c *gin.Context) (openaiErr *dto.OpenAIErrorWithStatusCode) {

 	// get & validate textRequest 获取并验证文本请求
 	textRequest, err := getAndValidateTextRequest(c, relayInfo)
+	if textRequest.WebSearchOptions != nil {
+		c.Set("chat_completion_web_search_context_size", textRequest.WebSearchOptions.SearchContextSize)
+	}
+
 	if err != nil {
 		common.LogError(c, fmt.Sprintf("getAndValidateTextRequest failed: %s", err.Error()))
 		return service.OpenAIErrorWrapperLocal(err, "invalid_text_request", http.StatusBadRequest)
@@ -370,9 +388,20 @@ func postConsumeQuota(ctx *gin.Context, relayInfo *relaycommon.RelayInfo,
 			dWebSearchQuota = decimal.NewFromFloat(webSearchPrice).
 				Mul(decimal.NewFromInt(int64(webSearchTool.CallCount))).
 				Div(decimal.NewFromInt(1000)).Mul(dGroupRatio).Mul(dQuotaPerUnit)
-			extraContent += fmt.Sprintf("Web Search 调用 %d 次，上下文大小 %s，调用花费 $%s",
+			extraContent += fmt.Sprintf("Web Search 调用 %d 次，上下文大小 %s，调用花费 %s",
 				webSearchTool.CallCount, webSearchTool.SearchContextSize, dWebSearchQuota.String())
 		}
+	} else if strings.HasSuffix(modelName, "search-preview") {
+		// search-preview 模型不支持 response api
+		searchContextSize := ctx.GetString("chat_completion_web_search_context_size")
+		if searchContextSize == "" {
+			searchContextSize = "medium"
+		}
+		webSearchPrice = operation_setting.GetWebSearchPricePerThousand(modelName, searchContextSize)
+		dWebSearchQuota = decimal.NewFromFloat(webSearchPrice).
+			Div(decimal.NewFromInt(1000)).Mul(dGroupRatio).Mul(dQuotaPerUnit)
+		extraContent += fmt.Sprintf("Web Search 调用 1 次，上下文大小 %s，调用花费 %s",
+			searchContextSize, dWebSearchQuota.String())
 	}
 	// file search tool 计费
 	var dFileSearchQuota decimal.Decimal
@@ -463,10 +492,16 @@ func postConsumeQuota(ctx *gin.Context, relayInfo *relaycommon.RelayInfo,
 		other["image_ratio"] = imageRatio
 		other["image_output"] = imageTokens
 	}
-	if !dWebSearchQuota.IsZero() && relayInfo.ResponsesUsageInfo != nil {
-		if webSearchTool, exists := relayInfo.ResponsesUsageInfo.BuiltInTools[dto.BuildInToolWebSearchPreview]; exists {
+	if !dWebSearchQuota.IsZero() {
+		if relayInfo.ResponsesUsageInfo != nil {
+			if webSearchTool, exists := relayInfo.ResponsesUsageInfo.BuiltInTools[dto.BuildInToolWebSearchPreview]; exists {
+				other["web_search"] = true
+				other["web_search_call_count"] = webSearchTool.CallCount
+				other["web_search_price"] = webSearchPrice
+			}
+		} else if strings.HasSuffix(modelName, "search-preview") {
 			other["web_search"] = true
-			other["web_search_call_count"] = webSearchTool.CallCount
+			other["web_search_call_count"] = 1
 			other["web_search_price"] = webSearchPrice
 		}
 	}
--- a/web/src/components/ChannelsTable.js
+++ b/web/src/components/ChannelsTable.js
@@ -888,9 +888,13 @@ const ChannelsTable = () => {
    const localIdSort = localStorage.getItem('id-sort') === 'true';
    const localPageSize =
      parseInt(localStorage.getItem('page-size')) || ITEMS_PER_PAGE;
+    const localEnableTagMode = localStorage.getItem('enable-tag-mode') === 'true';
+    const localEnableBatchDelete = localStorage.getItem('enable-batch-delete') === 'true';
    setIdSort(localIdSort);
    setPageSize(localPageSize);
-    loadChannels(0, localPageSize, localIdSort, enableTagMode)
+    setEnableTagMode(localEnableTagMode);
+    setEnableBatchDelete(localEnableBatchDelete);
+    loadChannels(0, localPageSize, localIdSort, localEnableTagMode)
      .then()
      .catch((reason) => {
        showError(reason);
@@ -1486,10 +1490,12 @@ const ChannelsTable = () => {
            {t('开启批量操作')}
          </Typography.Text>
          <Switch
+            checked={enableBatchDelete}
            label={t('开启批量操作')}
            uncheckedText={t('关')}
            aria-label={t('是否开启批量操作')}
            onChange={(v) => {
+              localStorage.setItem('enable-batch-delete', v + '');
              setEnableBatchDelete(v);
            }}
          />
@@ -1553,6 +1559,7 @@ const ChannelsTable = () => {
            uncheckedText={t('关')}
            aria-label={t('是否启用标签聚合')}
            onChange={(v) => {
+              localStorage.setItem('enable-tag-mode', v + '');
              setEnableTagMode(v);
              loadChannels(0, pageSize, idSort, v);
            }}
--- a/web/src/pages/Home/index.js
+++ b/web/src/pages/Home/index.js
@@ -158,7 +158,7 @@ const Home = () => {
                  </p>
                  <p>
                    {t('OIDC 身份验证')}：
-                    {statusState?.status?.oidc === true
+                    {statusState?.status?.oidc_enabled === true
                      ? t('已启用')
                      : t('未启用')}
                  </p>
--- a/web/src/pages/Playground/Playground.js
+++ b/web/src/pages/Playground/Playground.js
@@ -64,8 +64,9 @@ const Playground = () => {
    },
  ];

+  const defaultModel = 'gpt-4o-mini';
  const [inputs, setInputs] = useState({
-    model: 'gpt-4o-mini',
+    model: defaultModel,
    group: '',
    max_tokens: 0,
    temperature: 0,
@@ -108,6 +109,11 @@ const Playground = () => {
        value: model,
      }));
      setModels(localModelOptions);
+      // if default model is not in the list, set the first one as default
+      const hasDefault = localModelOptions.some(option => option.value === defaultModel);
+      if (!hasDefault && localModelOptions.length > 0) {
+        setInputs((inputs) => ({ ...inputs, model: localModelOptions[0].value }));
+      }
    } else {
      showError(t(message));
    }
Author	SHA1	Message	Date
IcedTangerine	87540b4f7c	Merge pull request #1110 from wangr0031/fix_parallel_tool_calls feat: chat/completion路由透传parallel_tool_calls参数	2025-05-28 14:25:43 +08:00
IcedTangerine	e3d7b31a49	Update openai_request.go	2025-05-28 14:25:24 +08:00
IcedTangerine	bf016543c3	Merge pull request #1113 from tbphp/tbphp_vertex_gemini_global_region fix: Vertex channel global region format	2025-05-28 14:16:47 +08:00
IcedTangerine	eb94aa13e6	Merge pull request #1111 from feitianbubu/fxm-ali-fetch-models-url fix: ali FetchUpstreamModels url	2025-05-28 14:11:17 +08:00
tbphp	6e72dcd0ba	fix: Vertex channel global region format	2025-05-27 21:50:53 +08:00
skynono	96ab4177ca	fix: ali FetchUpstreamModels url	2025-05-27 11:22:40 +08:00
wang.rong	76824a0337	chat/completion透传parallel_tool_calls参数	2025-05-27 09:32:20 +08:00
IcedTangerine	3cd29a4963	Merge pull request #1109 from feitianbubu/fix-qwen-thinking fix: ali parameter.enable_thinking must be set to false for non-streaming calls	2025-05-26 19:32:34 +08:00
creamlike1024	41120b4d75	Merge branch 'main' of github.com:QuantumNous/new-api	2025-05-26 18:56:14 +08:00
creamlike1024	30d5a11f46	fix: search-preview model web search billing	2025-05-26 18:53:41 +08:00
skynono	368fd75c86	fix: ali parameter.enable_thinking must be set to false for non-streaming calls	2025-05-26 17:41:02 +08:00
IcedTangerine	ee07762611	Merge pull request #1075 from feitianbubu/fix-default-model-not-exist fix: if default model is not exist, set the first one as default	2025-05-26 17:21:14 +08:00
IcedTangerine	a215538b4d	Merge pull request #1081 from feitianbubu/fixTypoOidcEnabledField fix: typo in oidc_enabled field (previously oidc)	2025-05-26 17:20:35 +08:00
IcedTangerine	873e3f3dc8	Merge pull request #1099 from feitianbubu/fixTagModeStatusSave fix: keep BatchDelete and TagMode enabled status	2025-05-26 17:17:34 +08:00
skynono	2cc2d4f652	fix: keep BatchDelete and TagMode enabled status	2025-05-23 20:17:48 +08:00
skynono	e1190f98e9	fix: typo in oidc_enabled field (previously oidc)	2025-05-21 09:33:57 +08:00
skynono	9c12e02cb5	fix: if default model is not exist, set the first one as default	2025-05-19 14:56:39 +08:00