relay.go 21 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653
  1. package controller
  2. import (
  3. "errors"
  4. "fmt"
  5. "io"
  6. "log"
  7. "net/http"
  8. "strings"
  9. "time"
  10. "github.com/QuantumNous/new-api/common"
  11. "github.com/QuantumNous/new-api/constant"
  12. "github.com/QuantumNous/new-api/dto"
  13. "github.com/QuantumNous/new-api/logger"
  14. "github.com/QuantumNous/new-api/middleware"
  15. "github.com/QuantumNous/new-api/model"
  16. perfmetrics "github.com/QuantumNous/new-api/pkg/perf_metrics"
  17. "github.com/QuantumNous/new-api/relay"
  18. relaycommon "github.com/QuantumNous/new-api/relay/common"
  19. relayconstant "github.com/QuantumNous/new-api/relay/constant"
  20. "github.com/QuantumNous/new-api/relay/helper"
  21. "github.com/QuantumNous/new-api/service"
  22. "github.com/QuantumNous/new-api/setting"
  23. "github.com/QuantumNous/new-api/setting/operation_setting"
  24. "github.com/QuantumNous/new-api/types"
  25. "github.com/bytedance/gopkg/util/gopool"
  26. "github.com/samber/lo"
  27. "github.com/gin-gonic/gin"
  28. "github.com/gorilla/websocket"
  29. )
  30. func relayHandler(c *gin.Context, info *relaycommon.RelayInfo) *types.NewAPIError {
  31. var err *types.NewAPIError
  32. switch info.RelayMode {
  33. case relayconstant.RelayModeImagesGenerations, relayconstant.RelayModeImagesEdits:
  34. err = relay.ImageHelper(c, info)
  35. case relayconstant.RelayModeAudioSpeech:
  36. fallthrough
  37. case relayconstant.RelayModeAudioTranslation:
  38. fallthrough
  39. case relayconstant.RelayModeAudioTranscription:
  40. err = relay.AudioHelper(c, info)
  41. case relayconstant.RelayModeRerank:
  42. err = relay.RerankHelper(c, info)
  43. case relayconstant.RelayModeEmbeddings:
  44. err = relay.EmbeddingHelper(c, info)
  45. case relayconstant.RelayModeResponses, relayconstant.RelayModeResponsesCompact:
  46. err = relay.ResponsesHelper(c, info)
  47. default:
  48. err = relay.TextHelper(c, info)
  49. }
  50. return err
  51. }
  52. func geminiRelayHandler(c *gin.Context, info *relaycommon.RelayInfo) *types.NewAPIError {
  53. var err *types.NewAPIError
  54. if strings.Contains(c.Request.URL.Path, "embed") {
  55. err = relay.GeminiEmbeddingHandler(c, info)
  56. } else {
  57. err = relay.GeminiHelper(c, info)
  58. }
  59. return err
  60. }
  61. func Relay(c *gin.Context, relayFormat types.RelayFormat) {
  62. requestId := c.GetString(common.RequestIdKey)
  63. //group := common.GetContextKeyString(c, constant.ContextKeyUsingGroup)
  64. //originalModel := common.GetContextKeyString(c, constant.ContextKeyOriginalModel)
  65. var (
  66. newAPIError *types.NewAPIError
  67. ws *websocket.Conn
  68. )
  69. if relayFormat == types.RelayFormatOpenAIRealtime {
  70. var err error
  71. ws, err = upgrader.Upgrade(c.Writer, c.Request, nil)
  72. if err != nil {
  73. helper.WssError(c, ws, types.NewError(err, types.ErrorCodeGetChannelFailed, types.ErrOptionWithSkipRetry()).ToOpenAIError())
  74. return
  75. }
  76. defer ws.Close()
  77. }
  78. defer func() {
  79. if newAPIError != nil {
  80. logger.LogError(c, fmt.Sprintf("relay error: %s", newAPIError.Error()))
  81. newAPIError.SetMessage(common.MessageWithRequestId(newAPIError.Error(), requestId))
  82. switch relayFormat {
  83. case types.RelayFormatOpenAIRealtime:
  84. helper.WssError(c, ws, newAPIError.ToOpenAIError())
  85. case types.RelayFormatClaude:
  86. c.JSON(newAPIError.StatusCode, gin.H{
  87. "type": "error",
  88. "error": newAPIError.ToClaudeError(),
  89. })
  90. default:
  91. c.JSON(newAPIError.StatusCode, gin.H{
  92. "error": newAPIError.ToOpenAIError(),
  93. })
  94. }
  95. }
  96. }()
  97. request, err := helper.GetAndValidateRequest(c, relayFormat)
  98. if err != nil {
  99. // Map "request body too large" to 413 so clients can handle it correctly
  100. if common.IsRequestBodyTooLargeError(err) || errors.Is(err, common.ErrRequestBodyTooLarge) {
  101. newAPIError = types.NewErrorWithStatusCode(err, types.ErrorCodeReadRequestBodyFailed, http.StatusRequestEntityTooLarge, types.ErrOptionWithSkipRetry())
  102. } else {
  103. newAPIError = types.NewError(err, types.ErrorCodeInvalidRequest)
  104. }
  105. return
  106. }
  107. relayInfo, err := relaycommon.GenRelayInfo(c, relayFormat, request, ws)
  108. if err != nil {
  109. newAPIError = types.NewError(err, types.ErrorCodeGenRelayInfoFailed)
  110. return
  111. }
  112. needSensitiveCheck := setting.ShouldCheckPromptSensitive()
  113. needCountToken := constant.CountToken
  114. // Avoid building huge CombineText (strings.Join) when token counting and sensitive check are both disabled.
  115. var meta *types.TokenCountMeta
  116. if needSensitiveCheck || needCountToken {
  117. meta = request.GetTokenCountMeta()
  118. } else {
  119. meta = fastTokenCountMetaForPricing(request)
  120. }
  121. if needSensitiveCheck && meta != nil {
  122. contains, words := service.CheckSensitiveText(meta.CombineText)
  123. if contains {
  124. logger.LogWarn(c, fmt.Sprintf("user sensitive words detected: %s", strings.Join(words, ", ")))
  125. newAPIError = types.NewError(err, types.ErrorCodeSensitiveWordsDetected)
  126. return
  127. }
  128. }
  129. tokens, err := service.EstimateRequestToken(c, meta, relayInfo)
  130. if err != nil {
  131. newAPIError = types.NewError(err, types.ErrorCodeCountTokenFailed)
  132. return
  133. }
  134. relayInfo.SetEstimatePromptTokens(tokens)
  135. priceData, err := helper.ModelPriceHelper(c, relayInfo, tokens, meta)
  136. if err != nil {
  137. newAPIError = types.NewError(err, types.ErrorCodeModelPriceError, types.ErrOptionWithStatusCode(http.StatusBadRequest))
  138. return
  139. }
  140. // common.SetContextKey(c, constant.ContextKeyTokenCountMeta, meta)
  141. if priceData.FreeModel {
  142. logger.LogInfo(c, fmt.Sprintf("模型 %s 免费,跳过预扣费", relayInfo.OriginModelName))
  143. } else {
  144. newAPIError = service.PreConsumeBilling(c, priceData.QuotaToPreConsume, relayInfo)
  145. if newAPIError != nil {
  146. return
  147. }
  148. }
  149. defer func() {
  150. // Only return quota if downstream failed and quota was actually pre-consumed
  151. if newAPIError != nil {
  152. newAPIError = service.NormalizeViolationFeeError(newAPIError)
  153. if relayInfo.Billing != nil {
  154. relayInfo.Billing.Refund(c)
  155. }
  156. service.ChargeViolationFeeIfNeeded(c, relayInfo, newAPIError)
  157. }
  158. }()
  159. retryParam := &service.RetryParam{
  160. Ctx: c,
  161. TokenGroup: relayInfo.TokenGroup,
  162. ModelName: relayInfo.OriginModelName,
  163. Retry: common.GetPointer(0),
  164. }
  165. relayInfo.RetryIndex = 0
  166. relayInfo.LastError = nil
  167. for ; retryParam.GetRetry() <= common.RetryTimes; retryParam.IncreaseRetry() {
  168. relayInfo.RetryIndex = retryParam.GetRetry()
  169. channel, channelErr := getChannel(c, relayInfo, retryParam)
  170. if channelErr != nil {
  171. logger.LogError(c, channelErr.Error())
  172. newAPIError = channelErr
  173. break
  174. }
  175. addUsedChannel(c, channel.Id)
  176. bodyStorage, bodyErr := common.GetBodyStorage(c)
  177. if bodyErr != nil {
  178. // Ensure consistent 413 for oversized bodies even when error occurs later (e.g., retry path)
  179. if common.IsRequestBodyTooLargeError(bodyErr) || errors.Is(bodyErr, common.ErrRequestBodyTooLarge) {
  180. newAPIError = types.NewErrorWithStatusCode(bodyErr, types.ErrorCodeReadRequestBodyFailed, http.StatusRequestEntityTooLarge, types.ErrOptionWithSkipRetry())
  181. } else {
  182. newAPIError = types.NewErrorWithStatusCode(bodyErr, types.ErrorCodeReadRequestBodyFailed, http.StatusBadRequest, types.ErrOptionWithSkipRetry())
  183. }
  184. break
  185. }
  186. c.Request.Body = io.NopCloser(bodyStorage)
  187. switch relayFormat {
  188. case types.RelayFormatOpenAIRealtime:
  189. newAPIError = relay.WssHelper(c, relayInfo)
  190. case types.RelayFormatClaude:
  191. newAPIError = relay.ClaudeHelper(c, relayInfo)
  192. case types.RelayFormatGemini:
  193. newAPIError = geminiRelayHandler(c, relayInfo)
  194. default:
  195. newAPIError = relayHandler(c, relayInfo)
  196. }
  197. if newAPIError == nil {
  198. relayInfo.LastError = nil
  199. return
  200. }
  201. newAPIError = service.NormalizeViolationFeeError(newAPIError)
  202. relayInfo.LastError = newAPIError
  203. processChannelError(c, *types.NewChannelError(channel.Id, channel.Type, channel.Name, channel.ChannelInfo.IsMultiKey, common.GetContextKeyString(c, constant.ContextKeyChannelKey), channel.GetAutoBan()), newAPIError)
  204. if !shouldRetry(c, newAPIError, common.RetryTimes-retryParam.GetRetry()) {
  205. break
  206. }
  207. }
  208. useChannel := c.GetStringSlice("use_channel")
  209. if len(useChannel) > 1 {
  210. retryLogStr := fmt.Sprintf("重试:%s", strings.Trim(strings.Join(strings.Fields(fmt.Sprint(useChannel)), "->"), "[]"))
  211. logger.LogInfo(c, retryLogStr)
  212. }
  213. if newAPIError != nil {
  214. gopool.Go(func() {
  215. perfmetrics.RecordRelaySample(relayInfo, false)
  216. })
  217. }
  218. }
  219. var upgrader = websocket.Upgrader{
  220. Subprotocols: []string{"realtime"}, // WS 握手支持的协议,如果有使用 Sec-WebSocket-Protocol,则必须在此声明对应的 Protocol TODO add other protocol
  221. CheckOrigin: func(r *http.Request) bool {
  222. return true // 允许跨域
  223. },
  224. }
  225. func addUsedChannel(c *gin.Context, channelId int) {
  226. useChannel := c.GetStringSlice("use_channel")
  227. useChannel = append(useChannel, fmt.Sprintf("%d", channelId))
  228. c.Set("use_channel", useChannel)
  229. }
  230. func fastTokenCountMetaForPricing(request dto.Request) *types.TokenCountMeta {
  231. if request == nil {
  232. return &types.TokenCountMeta{}
  233. }
  234. meta := &types.TokenCountMeta{
  235. TokenType: types.TokenTypeTokenizer,
  236. }
  237. switch r := request.(type) {
  238. case *dto.GeneralOpenAIRequest:
  239. maxCompletionTokens := lo.FromPtrOr(r.MaxCompletionTokens, uint(0))
  240. maxTokens := lo.FromPtrOr(r.MaxTokens, uint(0))
  241. if maxCompletionTokens > maxTokens {
  242. meta.MaxTokens = int(maxCompletionTokens)
  243. } else {
  244. meta.MaxTokens = int(maxTokens)
  245. }
  246. case *dto.OpenAIResponsesRequest:
  247. meta.MaxTokens = int(lo.FromPtrOr(r.MaxOutputTokens, uint(0)))
  248. case *dto.ClaudeRequest:
  249. meta.MaxTokens = int(lo.FromPtr(r.MaxTokens))
  250. case *dto.ImageRequest:
  251. // Pricing for image requests depends on ImagePriceRatio; safe to compute even when CountToken is disabled.
  252. return r.GetTokenCountMeta()
  253. default:
  254. // Best-effort: leave CombineText empty to avoid large allocations.
  255. }
  256. return meta
  257. }
  258. func getChannel(c *gin.Context, info *relaycommon.RelayInfo, retryParam *service.RetryParam) (*model.Channel, *types.NewAPIError) {
  259. if info.ChannelMeta == nil {
  260. autoBan := c.GetBool("auto_ban")
  261. autoBanInt := 1
  262. if !autoBan {
  263. autoBanInt = 0
  264. }
  265. return &model.Channel{
  266. Id: c.GetInt("channel_id"),
  267. Type: c.GetInt("channel_type"),
  268. Name: c.GetString("channel_name"),
  269. AutoBan: &autoBanInt,
  270. }, nil
  271. }
  272. channel, selectGroup, err := service.CacheGetRandomSatisfiedChannel(retryParam)
  273. info.PriceData.GroupRatioInfo = helper.HandleGroupRatio(c, info)
  274. if err != nil {
  275. return nil, types.NewError(fmt.Errorf("获取分组 %s 下模型 %s 的可用渠道失败(retry): %s", selectGroup, info.OriginModelName, err.Error()), types.ErrorCodeGetChannelFailed, types.ErrOptionWithSkipRetry())
  276. }
  277. if channel == nil {
  278. return nil, types.NewError(fmt.Errorf("分组 %s 下模型 %s 的可用渠道不存在(retry)", selectGroup, info.OriginModelName), types.ErrorCodeGetChannelFailed, types.ErrOptionWithSkipRetry())
  279. }
  280. newAPIError := middleware.SetupContextForSelectedChannel(c, channel, info.OriginModelName)
  281. if newAPIError != nil {
  282. return nil, newAPIError
  283. }
  284. return channel, nil
  285. }
  286. func shouldRetry(c *gin.Context, openaiErr *types.NewAPIError, retryTimes int) bool {
  287. if openaiErr == nil {
  288. return false
  289. }
  290. if service.ShouldSkipRetryAfterChannelAffinityFailure(c) {
  291. return false
  292. }
  293. if types.IsChannelError(openaiErr) {
  294. return true
  295. }
  296. if types.IsSkipRetryError(openaiErr) {
  297. return false
  298. }
  299. if retryTimes <= 0 {
  300. return false
  301. }
  302. if _, ok := c.Get("specific_channel_id"); ok {
  303. return false
  304. }
  305. code := openaiErr.StatusCode
  306. if code >= 200 && code < 300 {
  307. return false
  308. }
  309. if code < 100 || code > 599 {
  310. return true
  311. }
  312. if operation_setting.IsAlwaysSkipRetryCode(openaiErr.GetErrorCode()) {
  313. return false
  314. }
  315. return operation_setting.ShouldRetryByStatusCode(code)
  316. }
  317. func processChannelError(c *gin.Context, channelError types.ChannelError, err *types.NewAPIError) {
  318. logger.LogError(c, fmt.Sprintf("channel error (channel #%d, status code: %d): %s", channelError.ChannelId, err.StatusCode, err.Error()))
  319. // 不要使用context获取渠道信息,异步处理时可能会出现渠道信息不一致的情况
  320. // do not use context to get channel info, there may be inconsistent channel info when processing asynchronously
  321. if service.ShouldDisableChannel(err) && channelError.AutoBan {
  322. gopool.Go(func() {
  323. service.DisableChannel(channelError, err.ErrorWithStatusCode())
  324. })
  325. }
  326. if constant.ErrorLogEnabled && types.IsRecordErrorLog(err) {
  327. // 保存错误日志到mysql中
  328. userId := c.GetInt("id")
  329. tokenName := c.GetString("token_name")
  330. modelName := c.GetString("original_model")
  331. tokenId := c.GetInt("token_id")
  332. userGroup := c.GetString("group")
  333. channelId := c.GetInt("channel_id")
  334. other := make(map[string]interface{})
  335. if c.Request != nil && c.Request.URL != nil {
  336. other["request_path"] = c.Request.URL.Path
  337. }
  338. other["error_type"] = err.GetErrorType()
  339. other["error_code"] = err.GetErrorCode()
  340. other["status_code"] = err.StatusCode
  341. other["channel_id"] = channelId
  342. other["channel_name"] = c.GetString("channel_name")
  343. other["channel_type"] = c.GetInt("channel_type")
  344. adminInfo := make(map[string]interface{})
  345. adminInfo["use_channel"] = c.GetStringSlice("use_channel")
  346. isMultiKey := common.GetContextKeyBool(c, constant.ContextKeyChannelIsMultiKey)
  347. if isMultiKey {
  348. adminInfo["is_multi_key"] = true
  349. adminInfo["multi_key_index"] = common.GetContextKeyInt(c, constant.ContextKeyChannelMultiKeyIndex)
  350. }
  351. service.AppendChannelAffinityAdminInfo(c, adminInfo)
  352. other["admin_info"] = adminInfo
  353. startTime := common.GetContextKeyTime(c, constant.ContextKeyRequestStartTime)
  354. if startTime.IsZero() {
  355. startTime = time.Now()
  356. }
  357. useTimeSeconds := int(time.Since(startTime).Seconds())
  358. model.RecordErrorLog(c, userId, channelId, modelName, tokenName, err.MaskSensitiveErrorWithStatusCode(), tokenId, useTimeSeconds, common.GetContextKeyBool(c, constant.ContextKeyIsStream), userGroup, other)
  359. }
  360. }
  361. func RelayMidjourney(c *gin.Context) {
  362. relayInfo, err := relaycommon.GenRelayInfo(c, types.RelayFormatMjProxy, nil, nil)
  363. if err != nil {
  364. c.JSON(http.StatusInternalServerError, gin.H{
  365. "description": fmt.Sprintf("failed to generate relay info: %s", err.Error()),
  366. "type": "upstream_error",
  367. "code": 4,
  368. })
  369. return
  370. }
  371. var mjErr *dto.MidjourneyResponse
  372. switch relayInfo.RelayMode {
  373. case relayconstant.RelayModeMidjourneyNotify:
  374. mjErr = relay.RelayMidjourneyNotify(c)
  375. case relayconstant.RelayModeMidjourneyTaskFetch, relayconstant.RelayModeMidjourneyTaskFetchByCondition:
  376. mjErr = relay.RelayMidjourneyTask(c, relayInfo.RelayMode)
  377. case relayconstant.RelayModeMidjourneyTaskImageSeed:
  378. mjErr = relay.RelayMidjourneyTaskImageSeed(c)
  379. case relayconstant.RelayModeSwapFace:
  380. mjErr = relay.RelaySwapFace(c, relayInfo)
  381. default:
  382. mjErr = relay.RelayMidjourneySubmit(c, relayInfo)
  383. }
  384. //err = relayMidjourneySubmit(c, relayMode)
  385. log.Println(mjErr)
  386. if mjErr != nil {
  387. statusCode := http.StatusBadRequest
  388. if mjErr.Code == 30 {
  389. mjErr.Result = "当前分组负载已饱和,请稍后再试,或升级账户以提升服务质量。"
  390. statusCode = http.StatusTooManyRequests
  391. }
  392. c.JSON(statusCode, gin.H{
  393. "description": fmt.Sprintf("%s %s", mjErr.Description, mjErr.Result),
  394. "type": "upstream_error",
  395. "code": mjErr.Code,
  396. })
  397. channelId := c.GetInt("channel_id")
  398. logger.LogError(c, fmt.Sprintf("relay error (channel #%d, status code %d): %s", channelId, statusCode, fmt.Sprintf("%s %s", mjErr.Description, mjErr.Result)))
  399. }
  400. }
  401. func RelayNotImplemented(c *gin.Context) {
  402. err := types.OpenAIError{
  403. Message: "API not implemented",
  404. Type: "new_api_error",
  405. Param: "",
  406. Code: "api_not_implemented",
  407. }
  408. c.JSON(http.StatusNotImplemented, gin.H{
  409. "error": err,
  410. })
  411. }
  412. func RelayNotFound(c *gin.Context) {
  413. err := types.OpenAIError{
  414. Message: fmt.Sprintf("Invalid URL (%s %s)", c.Request.Method, c.Request.URL.Path),
  415. Type: "invalid_request_error",
  416. Param: "",
  417. Code: "",
  418. }
  419. c.JSON(http.StatusNotFound, gin.H{
  420. "error": err,
  421. })
  422. }
  423. func RelayTaskFetch(c *gin.Context) {
  424. relayInfo, err := relaycommon.GenRelayInfo(c, types.RelayFormatTask, nil, nil)
  425. if err != nil {
  426. c.JSON(http.StatusInternalServerError, &dto.TaskError{
  427. Code: "gen_relay_info_failed",
  428. Message: err.Error(),
  429. StatusCode: http.StatusInternalServerError,
  430. })
  431. return
  432. }
  433. if taskErr := relay.RelayTaskFetch(c, relayInfo.RelayMode); taskErr != nil {
  434. respondTaskError(c, taskErr)
  435. }
  436. }
  437. func RelayTask(c *gin.Context) {
  438. relayInfo, err := relaycommon.GenRelayInfo(c, types.RelayFormatTask, nil, nil)
  439. if err != nil {
  440. c.JSON(http.StatusInternalServerError, &dto.TaskError{
  441. Code: "gen_relay_info_failed",
  442. Message: err.Error(),
  443. StatusCode: http.StatusInternalServerError,
  444. })
  445. return
  446. }
  447. if taskErr := relay.ResolveOriginTask(c, relayInfo); taskErr != nil {
  448. respondTaskError(c, taskErr)
  449. return
  450. }
  451. var result *relay.TaskSubmitResult
  452. var taskErr *dto.TaskError
  453. defer func() {
  454. if taskErr != nil && relayInfo.Billing != nil {
  455. relayInfo.Billing.Refund(c)
  456. }
  457. }()
  458. retryParam := &service.RetryParam{
  459. Ctx: c,
  460. TokenGroup: relayInfo.TokenGroup,
  461. ModelName: relayInfo.OriginModelName,
  462. Retry: common.GetPointer(0),
  463. }
  464. for ; retryParam.GetRetry() <= common.RetryTimes; retryParam.IncreaseRetry() {
  465. var channel *model.Channel
  466. if lockedCh, ok := relayInfo.LockedChannel.(*model.Channel); ok && lockedCh != nil {
  467. channel = lockedCh
  468. if retryParam.GetRetry() > 0 {
  469. if setupErr := middleware.SetupContextForSelectedChannel(c, channel, relayInfo.OriginModelName); setupErr != nil {
  470. taskErr = service.TaskErrorWrapperLocal(setupErr.Err, "setup_locked_channel_failed", http.StatusInternalServerError)
  471. break
  472. }
  473. }
  474. } else {
  475. var channelErr *types.NewAPIError
  476. channel, channelErr = getChannel(c, relayInfo, retryParam)
  477. if channelErr != nil {
  478. logger.LogError(c, channelErr.Error())
  479. taskErr = service.TaskErrorWrapperLocal(channelErr.Err, "get_channel_failed", http.StatusInternalServerError)
  480. break
  481. }
  482. }
  483. addUsedChannel(c, channel.Id)
  484. bodyStorage, bodyErr := common.GetBodyStorage(c)
  485. if bodyErr != nil {
  486. if common.IsRequestBodyTooLargeError(bodyErr) || errors.Is(bodyErr, common.ErrRequestBodyTooLarge) {
  487. taskErr = service.TaskErrorWrapperLocal(bodyErr, "read_request_body_failed", http.StatusRequestEntityTooLarge)
  488. } else {
  489. taskErr = service.TaskErrorWrapperLocal(bodyErr, "read_request_body_failed", http.StatusBadRequest)
  490. }
  491. break
  492. }
  493. c.Request.Body = io.NopCloser(bodyStorage)
  494. result, taskErr = relay.RelayTaskSubmit(c, relayInfo)
  495. if taskErr == nil {
  496. break
  497. }
  498. if !taskErr.LocalError {
  499. processChannelError(c,
  500. *types.NewChannelError(channel.Id, channel.Type, channel.Name, channel.ChannelInfo.IsMultiKey,
  501. common.GetContextKeyString(c, constant.ContextKeyChannelKey), channel.GetAutoBan()),
  502. types.NewOpenAIError(taskErr.Error, types.ErrorCodeBadResponseStatusCode, taskErr.StatusCode))
  503. }
  504. if !shouldRetryTaskRelay(c, channel.Id, taskErr, common.RetryTimes-retryParam.GetRetry()) {
  505. break
  506. }
  507. }
  508. useChannel := c.GetStringSlice("use_channel")
  509. if len(useChannel) > 1 {
  510. retryLogStr := fmt.Sprintf("重试:%s", strings.Trim(strings.Join(strings.Fields(fmt.Sprint(useChannel)), "->"), "[]"))
  511. logger.LogInfo(c, retryLogStr)
  512. }
  513. // ── 成功:结算 + 日志 + 插入任务 ──
  514. if taskErr == nil {
  515. if settleErr := service.SettleBilling(c, relayInfo, result.Quota); settleErr != nil {
  516. common.SysError("settle task billing error: " + settleErr.Error())
  517. }
  518. service.LogTaskConsumption(c, relayInfo)
  519. task := model.InitTask(result.Platform, relayInfo)
  520. task.PrivateData.UpstreamTaskID = result.UpstreamTaskID
  521. task.PrivateData.BillingSource = relayInfo.BillingSource
  522. task.PrivateData.SubscriptionId = relayInfo.SubscriptionId
  523. task.PrivateData.TokenId = relayInfo.TokenId
  524. task.PrivateData.BillingContext = &model.TaskBillingContext{
  525. ModelPrice: relayInfo.PriceData.ModelPrice,
  526. GroupRatio: relayInfo.PriceData.GroupRatioInfo.GroupRatio,
  527. ModelRatio: relayInfo.PriceData.ModelRatio,
  528. OtherRatios: relayInfo.PriceData.OtherRatios,
  529. OriginModelName: relayInfo.OriginModelName,
  530. PerCallBilling: common.StringsContains(constant.TaskPricePatches, relayInfo.OriginModelName) || relayInfo.PriceData.UsePrice,
  531. }
  532. task.Quota = result.Quota
  533. task.Data = result.TaskData
  534. task.Action = relayInfo.Action
  535. if insertErr := task.Insert(); insertErr != nil {
  536. common.SysError("insert task error: " + insertErr.Error())
  537. }
  538. }
  539. if taskErr != nil {
  540. respondTaskError(c, taskErr)
  541. }
  542. }
  543. // respondTaskError 统一输出 Task 错误响应(含 429 限流提示改写)
  544. func respondTaskError(c *gin.Context, taskErr *dto.TaskError) {
  545. if taskErr.StatusCode == http.StatusTooManyRequests {
  546. taskErr.Message = "当前分组上游负载已饱和,请稍后再试"
  547. }
  548. c.JSON(taskErr.StatusCode, taskErr)
  549. }
  550. func shouldRetryTaskRelay(c *gin.Context, channelId int, taskErr *dto.TaskError, retryTimes int) bool {
  551. if taskErr == nil {
  552. return false
  553. }
  554. if service.ShouldSkipRetryAfterChannelAffinityFailure(c) {
  555. return false
  556. }
  557. if retryTimes <= 0 {
  558. return false
  559. }
  560. if _, ok := c.Get("specific_channel_id"); ok {
  561. return false
  562. }
  563. if taskErr.StatusCode == http.StatusTooManyRequests {
  564. return true
  565. }
  566. if taskErr.StatusCode == 307 {
  567. return true
  568. }
  569. if taskErr.StatusCode/100 == 5 {
  570. // 超时不重试
  571. if operation_setting.IsAlwaysSkipRetryStatusCode(taskErr.StatusCode) {
  572. return false
  573. }
  574. return true
  575. }
  576. if taskErr.StatusCode == http.StatusBadRequest {
  577. return false
  578. }
  579. if taskErr.StatusCode == 408 {
  580. // azure处理超时不重试
  581. return false
  582. }
  583. if taskErr.LocalError {
  584. return false
  585. }
  586. if taskErr.StatusCode/100 == 2 {
  587. return false
  588. }
  589. return true
  590. }