relay.go 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473
  1. package controller
  2. import (
  3. "bytes"
  4. "fmt"
  5. "io"
  6. "log"
  7. "net/http"
  8. "one-api/common"
  9. "one-api/constant"
  10. "one-api/dto"
  11. "one-api/logger"
  12. "one-api/middleware"
  13. "one-api/model"
  14. "one-api/relay"
  15. relaycommon "one-api/relay/common"
  16. relayconstant "one-api/relay/constant"
  17. "one-api/relay/helper"
  18. "one-api/service"
  19. "one-api/setting"
  20. "one-api/types"
  21. "strings"
  22. "github.com/gin-gonic/gin"
  23. "github.com/gorilla/websocket"
  24. )
  25. func relayHandler(c *gin.Context, info *relaycommon.RelayInfo) *types.NewAPIError {
  26. var err *types.NewAPIError
  27. switch info.RelayMode {
  28. case relayconstant.RelayModeImagesGenerations, relayconstant.RelayModeImagesEdits:
  29. err = relay.ImageHelper(c, info)
  30. case relayconstant.RelayModeAudioSpeech:
  31. fallthrough
  32. case relayconstant.RelayModeAudioTranslation:
  33. fallthrough
  34. case relayconstant.RelayModeAudioTranscription:
  35. err = relay.AudioHelper(c, info)
  36. case relayconstant.RelayModeRerank:
  37. err = relay.RerankHelper(c, info)
  38. case relayconstant.RelayModeEmbeddings:
  39. err = relay.EmbeddingHelper(c, info)
  40. case relayconstant.RelayModeResponses:
  41. err = relay.ResponsesHelper(c, info)
  42. default:
  43. err = relay.TextHelper(c, info)
  44. }
  45. return err
  46. }
  47. func geminiRelayHandler(c *gin.Context, info *relaycommon.RelayInfo) *types.NewAPIError {
  48. var err *types.NewAPIError
  49. if strings.Contains(c.Request.URL.Path, "embed") {
  50. err = relay.GeminiEmbeddingHandler(c, info)
  51. } else {
  52. err = relay.GeminiHelper(c, info)
  53. }
  54. return err
  55. }
  56. func Relay(c *gin.Context, relayFormat types.RelayFormat) {
  57. requestId := c.GetString(common.RequestIdKey)
  58. group := c.GetString("group")
  59. originalModel := c.GetString("original_model")
  60. var (
  61. newAPIError *types.NewAPIError
  62. ws *websocket.Conn
  63. )
  64. if relayFormat == types.RelayFormatOpenAIRealtime {
  65. var err error
  66. ws, err = upgrader.Upgrade(c.Writer, c.Request, nil)
  67. if err != nil {
  68. helper.WssError(c, ws, types.NewError(err, types.ErrorCodeGetChannelFailed, types.ErrOptionWithSkipRetry()).ToOpenAIError())
  69. return
  70. }
  71. defer ws.Close()
  72. }
  73. defer func() {
  74. if newAPIError != nil {
  75. newAPIError.SetMessage(common.MessageWithRequestId(newAPIError.Error(), requestId))
  76. switch relayFormat {
  77. case types.RelayFormatOpenAIRealtime:
  78. helper.WssError(c, ws, newAPIError.ToOpenAIError())
  79. case types.RelayFormatClaude:
  80. c.JSON(newAPIError.StatusCode, gin.H{
  81. "type": "error",
  82. "error": newAPIError.ToClaudeError(),
  83. })
  84. default:
  85. c.JSON(newAPIError.StatusCode, gin.H{
  86. "error": newAPIError.ToOpenAIError(),
  87. })
  88. }
  89. }
  90. }()
  91. request, err := helper.GetAndValidateRequest(c, relayFormat)
  92. if err != nil {
  93. newAPIError = types.NewError(err, types.ErrorCodeInvalidRequest)
  94. return
  95. }
  96. //includeUsage := true
  97. //// 判断用户是否需要返回使用情况
  98. //if textRequest.StreamOptions != nil {
  99. // includeUsage = textRequest.StreamOptions.IncludeUsage
  100. //}
  101. //
  102. //// 如果不支持StreamOptions,将StreamOptions设置为nil
  103. //if !relayInfo.SupportStreamOptions || !textRequest.Stream {
  104. // textRequest.StreamOptions = nil
  105. //} else {
  106. // // 如果支持StreamOptions,且请求中没有设置StreamOptions,根据配置文件设置StreamOptions
  107. // if constant.ForceStreamOption {
  108. // textRequest.StreamOptions = &dto.StreamOptions{
  109. // IncludeUsage: true,
  110. // }
  111. // }
  112. //}
  113. //
  114. //relayInfo.ShouldIncludeUsage = includeUsage
  115. relayInfo, err := relaycommon.GenRelayInfo(c, relayFormat, request, ws)
  116. if err != nil {
  117. newAPIError = types.NewError(err, types.ErrorCodeGenRelayInfoFailed)
  118. return
  119. }
  120. meta := request.GetTokenCountMeta()
  121. if setting.ShouldCheckPromptSensitive() {
  122. words, err := service.CheckSensitiveText(meta.CombineText)
  123. if err != nil {
  124. logger.LogWarn(c, fmt.Sprintf("user sensitive words detected: %s", strings.Join(words, ", ")))
  125. newAPIError = types.NewError(err, types.ErrorCodeSensitiveWordsDetected)
  126. return
  127. }
  128. }
  129. tokens, err := service.CountRequestToken(c, meta, relayInfo)
  130. if err != nil {
  131. newAPIError = types.NewError(err, types.ErrorCodeCountTokenFailed)
  132. return
  133. }
  134. priceData, err := helper.ModelPriceHelper(c, relayInfo, tokens, meta)
  135. if err != nil {
  136. newAPIError = types.NewError(err, types.ErrorCodeModelPriceError)
  137. return
  138. }
  139. preConsumedQuota, newApiErr := service.PreConsumeQuota(c, priceData.ShouldPreConsumedQuota, relayInfo)
  140. if newApiErr != nil {
  141. return
  142. }
  143. defer func() {
  144. if newApiErr != nil {
  145. service.ReturnPreConsumedQuota(c, relayInfo, preConsumedQuota)
  146. }
  147. }()
  148. for i := 0; i <= common.RetryTimes; i++ {
  149. channel, err := getChannel(c, group, originalModel, i)
  150. if err != nil {
  151. logger.LogError(c, err.Error())
  152. newAPIError = err
  153. break
  154. }
  155. addUsedChannel(c, channel.Id)
  156. requestBody, _ := common.GetRequestBody(c)
  157. c.Request.Body = io.NopCloser(bytes.NewBuffer(requestBody))
  158. switch relayFormat {
  159. case types.RelayFormatOpenAIRealtime:
  160. newAPIError = relay.WssHelper(c, ws)
  161. case types.RelayFormatClaude:
  162. newAPIError = relay.ClaudeHelper(c, relayInfo)
  163. case types.RelayFormatGemini:
  164. newAPIError = geminiRelayHandler(c, relayInfo)
  165. default:
  166. newAPIError = relayHandler(c, relayInfo)
  167. }
  168. if newAPIError == nil {
  169. return
  170. } else {
  171. if constant.ErrorLogEnabled && types.IsRecordErrorLog(newAPIError) {
  172. // 保存错误日志到mysql中
  173. userId := c.GetInt("id")
  174. tokenName := c.GetString("token_name")
  175. modelName := c.GetString("original_model")
  176. tokenId := c.GetInt("token_id")
  177. userGroup := c.GetString("group")
  178. channelId := c.GetInt("channel_id")
  179. other := make(map[string]interface{})
  180. other["error_type"] = newAPIError.GetErrorType()
  181. other["error_code"] = newAPIError.GetErrorCode()
  182. other["status_code"] = newAPIError.StatusCode
  183. other["channel_id"] = channelId
  184. other["channel_name"] = c.GetString("channel_name")
  185. other["channel_type"] = c.GetInt("channel_type")
  186. adminInfo := make(map[string]interface{})
  187. adminInfo["use_channel"] = c.GetStringSlice("use_channel")
  188. isMultiKey := common.GetContextKeyBool(c, constant.ContextKeyChannelIsMultiKey)
  189. if isMultiKey {
  190. adminInfo["is_multi_key"] = true
  191. adminInfo["multi_key_index"] = common.GetContextKeyInt(c, constant.ContextKeyChannelMultiKeyIndex)
  192. }
  193. other["admin_info"] = adminInfo
  194. model.RecordErrorLog(c, userId, channelId, modelName, tokenName, newAPIError.MaskSensitiveError(), tokenId, 0, false, userGroup, other)
  195. }
  196. }
  197. go processChannelError(c, *types.NewChannelError(channel.Id, channel.Type, channel.Name, channel.ChannelInfo.IsMultiKey, common.GetContextKeyString(c, constant.ContextKeyChannelKey), channel.GetAutoBan()), newAPIError)
  198. if !shouldRetry(c, newAPIError, common.RetryTimes-i) {
  199. break
  200. }
  201. }
  202. useChannel := c.GetStringSlice("use_channel")
  203. if len(useChannel) > 1 {
  204. retryLogStr := fmt.Sprintf("重试:%s", strings.Trim(strings.Join(strings.Fields(fmt.Sprint(useChannel)), "->"), "[]"))
  205. logger.LogInfo(c, retryLogStr)
  206. }
  207. }
  208. var upgrader = websocket.Upgrader{
  209. Subprotocols: []string{"realtime"}, // WS 握手支持的协议,如果有使用 Sec-WebSocket-Protocol,则必须在此声明对应的 Protocol TODO add other protocol
  210. CheckOrigin: func(r *http.Request) bool {
  211. return true // 允许跨域
  212. },
  213. }
  214. func addUsedChannel(c *gin.Context, channelId int) {
  215. useChannel := c.GetStringSlice("use_channel")
  216. useChannel = append(useChannel, fmt.Sprintf("%d", channelId))
  217. c.Set("use_channel", useChannel)
  218. }
  219. func getChannel(c *gin.Context, group, originalModel string, retryCount int) (*model.Channel, *types.NewAPIError) {
  220. if retryCount == 0 {
  221. autoBan := c.GetBool("auto_ban")
  222. autoBanInt := 1
  223. if !autoBan {
  224. autoBanInt = 0
  225. }
  226. return &model.Channel{
  227. Id: c.GetInt("channel_id"),
  228. Type: c.GetInt("channel_type"),
  229. Name: c.GetString("channel_name"),
  230. AutoBan: &autoBanInt,
  231. }, nil
  232. }
  233. channel, selectGroup, err := model.CacheGetRandomSatisfiedChannel(c, group, originalModel, retryCount)
  234. if err != nil {
  235. return nil, types.NewError(fmt.Errorf("获取分组 %s 下模型 %s 的可用渠道失败(retry): %s", selectGroup, originalModel, err.Error()), types.ErrorCodeGetChannelFailed, types.ErrOptionWithSkipRetry())
  236. }
  237. if channel == nil {
  238. return nil, types.NewError(fmt.Errorf("分组 %s 下模型 %s 的可用渠道不存在(数据库一致性已被破坏,retry)", selectGroup, originalModel), types.ErrorCodeGetChannelFailed, types.ErrOptionWithSkipRetry())
  239. }
  240. newAPIError := middleware.SetupContextForSelectedChannel(c, channel, originalModel)
  241. if newAPIError != nil {
  242. return nil, newAPIError
  243. }
  244. return channel, nil
  245. }
  246. func shouldRetry(c *gin.Context, openaiErr *types.NewAPIError, retryTimes int) bool {
  247. if openaiErr == nil {
  248. return false
  249. }
  250. if types.IsChannelError(openaiErr) {
  251. return true
  252. }
  253. if types.IsSkipRetryError(openaiErr) {
  254. return false
  255. }
  256. if retryTimes <= 0 {
  257. return false
  258. }
  259. if _, ok := c.Get("specific_channel_id"); ok {
  260. return false
  261. }
  262. if openaiErr.StatusCode == http.StatusTooManyRequests {
  263. return true
  264. }
  265. if openaiErr.StatusCode == 307 {
  266. return true
  267. }
  268. if openaiErr.StatusCode/100 == 5 {
  269. // 超时不重试
  270. if openaiErr.StatusCode == 504 || openaiErr.StatusCode == 524 {
  271. return false
  272. }
  273. return true
  274. }
  275. if openaiErr.StatusCode == http.StatusBadRequest {
  276. return false
  277. }
  278. if openaiErr.StatusCode == 408 {
  279. // azure处理超时不重试
  280. return false
  281. }
  282. if openaiErr.StatusCode/100 == 2 {
  283. return false
  284. }
  285. return true
  286. }
  287. func processChannelError(c *gin.Context, channelError types.ChannelError, err *types.NewAPIError) {
  288. // 不要使用context获取渠道信息,异步处理时可能会出现渠道信息不一致的情况
  289. // do not use context to get channel info, there may be inconsistent channel info when processing asynchronously
  290. logger.LogError(c, fmt.Sprintf("relay error (channel #%d, status code: %d): %s", channelError.ChannelId, err.StatusCode, err.Error()))
  291. if service.ShouldDisableChannel(channelError.ChannelId, err) && channelError.AutoBan {
  292. service.DisableChannel(channelError, err.Error())
  293. }
  294. }
  295. func RelayMidjourney(c *gin.Context) {
  296. relayMode := c.GetInt("relay_mode")
  297. var err *dto.MidjourneyResponse
  298. switch relayMode {
  299. case relayconstant.RelayModeMidjourneyNotify:
  300. err = relay.RelayMidjourneyNotify(c)
  301. case relayconstant.RelayModeMidjourneyTaskFetch, relayconstant.RelayModeMidjourneyTaskFetchByCondition:
  302. err = relay.RelayMidjourneyTask(c, relayMode)
  303. case relayconstant.RelayModeMidjourneyTaskImageSeed:
  304. err = relay.RelayMidjourneyTaskImageSeed(c)
  305. case relayconstant.RelayModeSwapFace:
  306. err = relay.RelaySwapFace(c)
  307. default:
  308. err = relay.RelayMidjourneySubmit(c, relayMode)
  309. }
  310. //err = relayMidjourneySubmit(c, relayMode)
  311. log.Println(err)
  312. if err != nil {
  313. statusCode := http.StatusBadRequest
  314. if err.Code == 30 {
  315. err.Result = "当前分组负载已饱和,请稍后再试,或升级账户以提升服务质量。"
  316. statusCode = http.StatusTooManyRequests
  317. }
  318. c.JSON(statusCode, gin.H{
  319. "description": fmt.Sprintf("%s %s", err.Description, err.Result),
  320. "type": "upstream_error",
  321. "code": err.Code,
  322. })
  323. channelId := c.GetInt("channel_id")
  324. logger.LogError(c, fmt.Sprintf("relay error (channel #%d, status code %d): %s", channelId, statusCode, fmt.Sprintf("%s %s", err.Description, err.Result)))
  325. }
  326. }
  327. func RelayNotImplemented(c *gin.Context) {
  328. err := dto.OpenAIError{
  329. Message: "API not implemented",
  330. Type: "new_api_error",
  331. Param: "",
  332. Code: "api_not_implemented",
  333. }
  334. c.JSON(http.StatusNotImplemented, gin.H{
  335. "error": err,
  336. })
  337. }
  338. func RelayNotFound(c *gin.Context) {
  339. err := dto.OpenAIError{
  340. Message: fmt.Sprintf("Invalid URL (%s %s)", c.Request.Method, c.Request.URL.Path),
  341. Type: "invalid_request_error",
  342. Param: "",
  343. Code: "",
  344. }
  345. c.JSON(http.StatusNotFound, gin.H{
  346. "error": err,
  347. })
  348. }
  349. func RelayTask(c *gin.Context) {
  350. retryTimes := common.RetryTimes
  351. channelId := c.GetInt("channel_id")
  352. relayMode := c.GetInt("relay_mode")
  353. group := c.GetString("group")
  354. originalModel := c.GetString("original_model")
  355. c.Set("use_channel", []string{fmt.Sprintf("%d", channelId)})
  356. taskErr := taskRelayHandler(c, relayMode)
  357. if taskErr == nil {
  358. retryTimes = 0
  359. }
  360. for i := 0; shouldRetryTaskRelay(c, channelId, taskErr, retryTimes) && i < retryTimes; i++ {
  361. channel, newAPIError := getChannel(c, group, originalModel, i)
  362. if newAPIError != nil {
  363. logger.LogError(c, fmt.Sprintf("CacheGetRandomSatisfiedChannel failed: %s", newAPIError.Error()))
  364. taskErr = service.TaskErrorWrapperLocal(newAPIError.Err, "get_channel_failed", http.StatusInternalServerError)
  365. break
  366. }
  367. channelId = channel.Id
  368. useChannel := c.GetStringSlice("use_channel")
  369. useChannel = append(useChannel, fmt.Sprintf("%d", channelId))
  370. c.Set("use_channel", useChannel)
  371. logger.LogInfo(c, fmt.Sprintf("using channel #%d to retry (remain times %d)", channel.Id, i))
  372. //middleware.SetupContextForSelectedChannel(c, channel, originalModel)
  373. requestBody, _ := common.GetRequestBody(c)
  374. c.Request.Body = io.NopCloser(bytes.NewBuffer(requestBody))
  375. taskErr = taskRelayHandler(c, relayMode)
  376. }
  377. useChannel := c.GetStringSlice("use_channel")
  378. if len(useChannel) > 1 {
  379. retryLogStr := fmt.Sprintf("重试:%s", strings.Trim(strings.Join(strings.Fields(fmt.Sprint(useChannel)), "->"), "[]"))
  380. logger.LogInfo(c, retryLogStr)
  381. }
  382. if taskErr != nil {
  383. if taskErr.StatusCode == http.StatusTooManyRequests {
  384. taskErr.Message = "当前分组上游负载已饱和,请稍后再试"
  385. }
  386. c.JSON(taskErr.StatusCode, taskErr)
  387. }
  388. }
  389. func taskRelayHandler(c *gin.Context, relayMode int) *dto.TaskError {
  390. var err *dto.TaskError
  391. switch relayMode {
  392. case relayconstant.RelayModeSunoFetch, relayconstant.RelayModeSunoFetchByID, relayconstant.RelayModeVideoFetchByID:
  393. err = relay.RelayTaskFetch(c, relayMode)
  394. default:
  395. err = relay.RelayTaskSubmit(c, relayMode)
  396. }
  397. return err
  398. }
  399. func shouldRetryTaskRelay(c *gin.Context, channelId int, taskErr *dto.TaskError, retryTimes int) bool {
  400. if taskErr == nil {
  401. return false
  402. }
  403. if retryTimes <= 0 {
  404. return false
  405. }
  406. if _, ok := c.Get("specific_channel_id"); ok {
  407. return false
  408. }
  409. if taskErr.StatusCode == http.StatusTooManyRequests {
  410. return true
  411. }
  412. if taskErr.StatusCode == 307 {
  413. return true
  414. }
  415. if taskErr.StatusCode/100 == 5 {
  416. // 超时不重试
  417. if taskErr.StatusCode == 504 || taskErr.StatusCode == 524 {
  418. return false
  419. }
  420. return true
  421. }
  422. if taskErr.StatusCode == http.StatusBadRequest {
  423. return false
  424. }
  425. if taskErr.StatusCode == 408 {
  426. // azure处理超时不重试
  427. return false
  428. }
  429. if taskErr.LocalError {
  430. return false
  431. }
  432. if taskErr.StatusCode/100 == 2 {
  433. return false
  434. }
  435. return true
  436. }