claude_handler.go 6.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184
  1. package relay
  2. import (
  3. "bytes"
  4. "fmt"
  5. "io"
  6. "net/http"
  7. "strings"
  8. "github.com/QuantumNous/new-api/common"
  9. "github.com/QuantumNous/new-api/constant"
  10. "github.com/QuantumNous/new-api/dto"
  11. relaycommon "github.com/QuantumNous/new-api/relay/common"
  12. "github.com/QuantumNous/new-api/relay/helper"
  13. "github.com/QuantumNous/new-api/service"
  14. "github.com/QuantumNous/new-api/setting/model_setting"
  15. "github.com/QuantumNous/new-api/types"
  16. "github.com/gin-gonic/gin"
  17. )
  18. func ClaudeHelper(c *gin.Context, info *relaycommon.RelayInfo) (newAPIError *types.NewAPIError) {
  19. info.InitChannelMeta(c)
  20. claudeReq, ok := info.Request.(*dto.ClaudeRequest)
  21. if !ok {
  22. return types.NewErrorWithStatusCode(fmt.Errorf("invalid request type, expected *dto.ClaudeRequest, got %T", info.Request), types.ErrorCodeInvalidRequest, http.StatusBadRequest, types.ErrOptionWithSkipRetry())
  23. }
  24. request, err := common.DeepCopy(claudeReq)
  25. if err != nil {
  26. return types.NewError(fmt.Errorf("failed to copy request to ClaudeRequest: %w", err), types.ErrorCodeInvalidRequest, types.ErrOptionWithSkipRetry())
  27. }
  28. err = helper.ModelMappedHelper(c, info, request)
  29. if err != nil {
  30. return types.NewError(err, types.ErrorCodeChannelModelMappedError, types.ErrOptionWithSkipRetry())
  31. }
  32. adaptor := GetAdaptor(info.ApiType)
  33. if adaptor == nil {
  34. return types.NewError(fmt.Errorf("invalid api type: %d", info.ApiType), types.ErrorCodeInvalidApiType, types.ErrOptionWithSkipRetry())
  35. }
  36. adaptor.Init(info)
  37. if request.MaxTokens == 0 {
  38. request.MaxTokens = uint(model_setting.GetClaudeSettings().GetDefaultMaxTokens(request.Model))
  39. }
  40. if model_setting.GetClaudeSettings().ThinkingAdapterEnabled &&
  41. strings.HasSuffix(request.Model, "-thinking") {
  42. if request.Thinking == nil {
  43. // 因为BudgetTokens 必须大于1024
  44. if request.MaxTokens < 1280 {
  45. request.MaxTokens = 1280
  46. }
  47. // BudgetTokens 为 max_tokens 的 80%
  48. request.Thinking = &dto.Thinking{
  49. Type: "enabled",
  50. BudgetTokens: common.GetPointer[int](int(float64(request.MaxTokens) * model_setting.GetClaudeSettings().ThinkingAdapterBudgetTokensPercentage)),
  51. }
  52. // TODO: 临时处理
  53. // https://docs.anthropic.com/en/docs/build-with-claude/extended-thinking#important-considerations-when-using-extended-thinking
  54. request.TopP = 0
  55. request.Temperature = common.GetPointer[float64](1.0)
  56. }
  57. if !model_setting.ShouldPreserveThinkingSuffix(info.OriginModelName) {
  58. request.Model = strings.TrimSuffix(request.Model, "-thinking")
  59. }
  60. info.UpstreamModelName = request.Model
  61. }
  62. if info.ChannelSetting.SystemPrompt != "" {
  63. if request.System == nil {
  64. request.SetStringSystem(info.ChannelSetting.SystemPrompt)
  65. } else if info.ChannelSetting.SystemPromptOverride {
  66. common.SetContextKey(c, constant.ContextKeySystemPromptOverride, true)
  67. if request.IsStringSystem() {
  68. existing := strings.TrimSpace(request.GetStringSystem())
  69. if existing == "" {
  70. request.SetStringSystem(info.ChannelSetting.SystemPrompt)
  71. } else {
  72. request.SetStringSystem(info.ChannelSetting.SystemPrompt + "\n" + existing)
  73. }
  74. } else {
  75. systemContents := request.ParseSystem()
  76. newSystem := dto.ClaudeMediaMessage{Type: dto.ContentTypeText}
  77. newSystem.SetText(info.ChannelSetting.SystemPrompt)
  78. if len(systemContents) == 0 {
  79. request.System = []dto.ClaudeMediaMessage{newSystem}
  80. } else {
  81. request.System = append([]dto.ClaudeMediaMessage{newSystem}, systemContents...)
  82. }
  83. }
  84. }
  85. }
  86. if !model_setting.GetGlobalSettings().PassThroughRequestEnabled &&
  87. !info.ChannelSetting.PassThroughBodyEnabled &&
  88. service.ShouldChatCompletionsUseResponsesGlobal(info.ChannelId, info.ChannelType, info.OriginModelName) {
  89. openAIRequest, convErr := service.ClaudeToOpenAIRequest(*request, info)
  90. if convErr != nil {
  91. return types.NewError(convErr, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
  92. }
  93. usage, newApiErr := chatCompletionsViaResponses(c, info, adaptor, openAIRequest)
  94. if newApiErr != nil {
  95. return newApiErr
  96. }
  97. service.PostClaudeConsumeQuota(c, info, usage)
  98. return nil
  99. }
  100. var requestBody io.Reader
  101. if model_setting.GetGlobalSettings().PassThroughRequestEnabled || info.ChannelSetting.PassThroughBodyEnabled {
  102. body, err := common.GetRequestBody(c)
  103. if err != nil {
  104. return types.NewErrorWithStatusCode(err, types.ErrorCodeReadRequestBodyFailed, http.StatusBadRequest, types.ErrOptionWithSkipRetry())
  105. }
  106. requestBody = bytes.NewBuffer(body)
  107. } else {
  108. convertedRequest, err := adaptor.ConvertClaudeRequest(c, info, request)
  109. if err != nil {
  110. return types.NewError(err, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
  111. }
  112. relaycommon.AppendRequestConversionFromRequest(info, convertedRequest)
  113. jsonData, err := common.Marshal(convertedRequest)
  114. if err != nil {
  115. return types.NewError(err, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
  116. }
  117. // remove disabled fields for Claude API
  118. jsonData, err = relaycommon.RemoveDisabledFields(jsonData, info.ChannelOtherSettings)
  119. if err != nil {
  120. return types.NewError(err, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
  121. }
  122. // apply param override
  123. if len(info.ParamOverride) > 0 {
  124. jsonData, err = relaycommon.ApplyParamOverride(jsonData, info.ParamOverride, relaycommon.BuildParamOverrideContext(info))
  125. if err != nil {
  126. return types.NewError(err, types.ErrorCodeChannelParamOverrideInvalid, types.ErrOptionWithSkipRetry())
  127. }
  128. }
  129. if common.DebugEnabled {
  130. println("requestBody: ", string(jsonData))
  131. }
  132. requestBody = bytes.NewBuffer(jsonData)
  133. }
  134. statusCodeMappingStr := c.GetString("status_code_mapping")
  135. var httpResp *http.Response
  136. resp, err := adaptor.DoRequest(c, info, requestBody)
  137. if err != nil {
  138. return types.NewOpenAIError(err, types.ErrorCodeDoRequestFailed, http.StatusInternalServerError)
  139. }
  140. if resp != nil {
  141. httpResp = resp.(*http.Response)
  142. info.IsStream = info.IsStream || strings.HasPrefix(httpResp.Header.Get("Content-Type"), "text/event-stream")
  143. if httpResp.StatusCode != http.StatusOK {
  144. newAPIError = service.RelayErrorHandler(c.Request.Context(), httpResp, false)
  145. // reset status code 重置状态码
  146. service.ResetStatusCode(newAPIError, statusCodeMappingStr)
  147. return newAPIError
  148. }
  149. }
  150. usage, newAPIError := adaptor.DoResponse(c, httpResp, info)
  151. //log.Printf("usage: %v", usage)
  152. if newAPIError != nil {
  153. // reset status code 重置状态码
  154. service.ResetStatusCode(newAPIError, statusCodeMappingStr)
  155. return newAPIError
  156. }
  157. service.PostClaudeConsumeQuota(c, info, usage.(*dto.Usage))
  158. return nil
  159. }