claude_handler.go 5.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184
  1. package relay
  2. import (
  3. "bytes"
  4. "errors"
  5. "fmt"
  6. "io"
  7. "net/http"
  8. "one-api/common"
  9. "one-api/dto"
  10. relaycommon "one-api/relay/common"
  11. "one-api/relay/helper"
  12. "one-api/service"
  13. "one-api/setting/model_setting"
  14. "one-api/types"
  15. "strings"
  16. "github.com/gin-gonic/gin"
  17. )
  18. func getAndValidateClaudeRequest(c *gin.Context) (textRequest *dto.ClaudeRequest, err error) {
  19. textRequest = &dto.ClaudeRequest{}
  20. err = c.ShouldBindJSON(textRequest)
  21. if err != nil {
  22. return nil, err
  23. }
  24. if textRequest.Messages == nil || len(textRequest.Messages) == 0 {
  25. return nil, errors.New("field messages is required")
  26. }
  27. if textRequest.Model == "" {
  28. return nil, errors.New("field model is required")
  29. }
  30. return textRequest, nil
  31. }
  32. func ClaudeHelper(c *gin.Context) (newAPIError *types.NewAPIError) {
  33. relayInfo := relaycommon.GenRelayInfoClaude(c)
  34. // get & validate textRequest 获取并验证文本请求
  35. textRequest, err := getAndValidateClaudeRequest(c)
  36. if err != nil {
  37. return types.NewError(err, types.ErrorCodeInvalidRequest, types.ErrOptionWithSkipRetry())
  38. }
  39. if textRequest.Stream {
  40. relayInfo.IsStream = true
  41. }
  42. err = helper.ModelMappedHelper(c, relayInfo, textRequest)
  43. if err != nil {
  44. return types.NewError(err, types.ErrorCodeChannelModelMappedError, types.ErrOptionWithSkipRetry())
  45. }
  46. promptTokens, err := getClaudePromptTokens(textRequest, relayInfo)
  47. // count messages token error 计算promptTokens错误
  48. if err != nil {
  49. return types.NewError(err, types.ErrorCodeCountTokenFailed, types.ErrOptionWithSkipRetry())
  50. }
  51. priceData, err := helper.ModelPriceHelper(c, relayInfo, promptTokens, int(textRequest.MaxTokens))
  52. if err != nil {
  53. return types.NewError(err, types.ErrorCodeModelPriceError, types.ErrOptionWithSkipRetry())
  54. }
  55. // pre-consume quota 预消耗配额
  56. preConsumedQuota, userQuota, newAPIError := preConsumeQuota(c, priceData.ShouldPreConsumedQuota, relayInfo)
  57. if newAPIError != nil {
  58. return newAPIError
  59. }
  60. defer func() {
  61. if newAPIError != nil {
  62. returnPreConsumedQuota(c, relayInfo, userQuota, preConsumedQuota)
  63. }
  64. }()
  65. adaptor := GetAdaptor(relayInfo.ApiType)
  66. if adaptor == nil {
  67. return types.NewError(fmt.Errorf("invalid api type: %d", relayInfo.ApiType), types.ErrorCodeInvalidApiType, types.ErrOptionWithSkipRetry())
  68. }
  69. adaptor.Init(relayInfo)
  70. if textRequest.MaxTokens == 0 {
  71. textRequest.MaxTokens = uint(model_setting.GetClaudeSettings().GetDefaultMaxTokens(textRequest.Model))
  72. }
  73. if model_setting.GetClaudeSettings().ThinkingAdapterEnabled &&
  74. strings.HasSuffix(textRequest.Model, "-thinking") {
  75. if textRequest.Thinking == nil {
  76. // 因为BudgetTokens 必须大于1024
  77. if textRequest.MaxTokens < 1280 {
  78. textRequest.MaxTokens = 1280
  79. }
  80. // BudgetTokens 为 max_tokens 的 80%
  81. textRequest.Thinking = &dto.Thinking{
  82. Type: "enabled",
  83. BudgetTokens: common.GetPointer[int](int(float64(textRequest.MaxTokens) * model_setting.GetClaudeSettings().ThinkingAdapterBudgetTokensPercentage)),
  84. }
  85. // TODO: 临时处理
  86. // https://docs.anthropic.com/en/docs/build-with-claude/extended-thinking#important-considerations-when-using-extended-thinking
  87. textRequest.TopP = 0
  88. textRequest.Temperature = common.GetPointer[float64](1.0)
  89. }
  90. textRequest.Model = strings.TrimSuffix(textRequest.Model, "-thinking")
  91. relayInfo.UpstreamModelName = textRequest.Model
  92. }
  93. var requestBody io.Reader
  94. if model_setting.GetGlobalSettings().PassThroughRequestEnabled || relayInfo.ChannelSetting.PassThroughBodyEnabled {
  95. body, err := common.GetRequestBody(c)
  96. if err != nil {
  97. return types.NewErrorWithStatusCode(err, types.ErrorCodeReadRequestBodyFailed, http.StatusBadRequest, types.ErrOptionWithSkipRetry())
  98. }
  99. requestBody = bytes.NewBuffer(body)
  100. } else {
  101. convertedRequest, err := adaptor.ConvertClaudeRequest(c, relayInfo, textRequest)
  102. if err != nil {
  103. return types.NewError(err, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
  104. }
  105. jsonData, err := common.Marshal(convertedRequest)
  106. if err != nil {
  107. return types.NewError(err, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
  108. }
  109. // apply param override
  110. if len(relayInfo.ParamOverride) > 0 {
  111. reqMap := make(map[string]interface{})
  112. _ = common.Unmarshal(jsonData, &reqMap)
  113. for key, value := range relayInfo.ParamOverride {
  114. reqMap[key] = value
  115. }
  116. jsonData, err = common.Marshal(reqMap)
  117. if err != nil {
  118. return types.NewError(err, types.ErrorCodeChannelParamOverrideInvalid, types.ErrOptionWithSkipRetry())
  119. }
  120. }
  121. if common.DebugEnabled {
  122. println("requestBody: ", string(jsonData))
  123. }
  124. requestBody = bytes.NewBuffer(jsonData)
  125. }
  126. statusCodeMappingStr := c.GetString("status_code_mapping")
  127. var httpResp *http.Response
  128. resp, err := adaptor.DoRequest(c, relayInfo, requestBody)
  129. if err != nil {
  130. return types.NewOpenAIError(err, types.ErrorCodeDoRequestFailed, http.StatusInternalServerError)
  131. }
  132. if resp != nil {
  133. httpResp = resp.(*http.Response)
  134. relayInfo.IsStream = relayInfo.IsStream || strings.HasPrefix(httpResp.Header.Get("Content-Type"), "text/event-stream")
  135. if httpResp.StatusCode != http.StatusOK {
  136. newAPIError = service.RelayErrorHandler(httpResp, false)
  137. // reset status code 重置状态码
  138. service.ResetStatusCode(newAPIError, statusCodeMappingStr)
  139. return newAPIError
  140. }
  141. }
  142. usage, newAPIError := adaptor.DoResponse(c, httpResp, relayInfo)
  143. //log.Printf("usage: %v", usage)
  144. if newAPIError != nil {
  145. // reset status code 重置状态码
  146. service.ResetStatusCode(newAPIError, statusCodeMappingStr)
  147. return newAPIError
  148. }
  149. service.PostClaudeConsumeQuota(c, relayInfo, usage.(*dto.Usage), preConsumedQuota, userQuota, priceData, "")
  150. return nil
  151. }
  152. func getClaudePromptTokens(textRequest *dto.ClaudeRequest, info *relaycommon.RelayInfo) (int, error) {
  153. var promptTokens int
  154. var err error
  155. switch info.RelayMode {
  156. default:
  157. promptTokens, err = service.CountTokenClaudeRequest(*textRequest, info.UpstreamModelName)
  158. }
  159. info.PromptTokens = promptTokens
  160. return promptTokens, err
  161. }