relay-aws.go 9.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295
  1. package aws
  2. import (
  3. "encoding/json"
  4. "fmt"
  5. "net/http"
  6. "one-api/common"
  7. "one-api/dto"
  8. "one-api/relay/channel/claude"
  9. relaycommon "one-api/relay/common"
  10. "one-api/relay/helper"
  11. "one-api/types"
  12. "strings"
  13. "github.com/gin-gonic/gin"
  14. "github.com/pkg/errors"
  15. "github.com/aws/aws-sdk-go-v2/aws"
  16. "github.com/aws/aws-sdk-go-v2/credentials"
  17. "github.com/aws/aws-sdk-go-v2/service/bedrockruntime"
  18. bedrockruntimeTypes "github.com/aws/aws-sdk-go-v2/service/bedrockruntime/types"
  19. "github.com/aws/smithy-go/auth/bearer"
  20. )
  21. func newAwsClient(c *gin.Context, info *relaycommon.RelayInfo) (*bedrockruntime.Client, error) {
  22. awsSecret := strings.Split(info.ApiKey, "|")
  23. var client *bedrockruntime.Client
  24. switch len(awsSecret) {
  25. case 2:
  26. apiKey := awsSecret[0]
  27. region := awsSecret[1]
  28. client = bedrockruntime.New(bedrockruntime.Options{
  29. Region: region,
  30. BearerAuthTokenProvider: bearer.StaticTokenProvider{Token: bearer.Token{Value: apiKey}},
  31. })
  32. case 3:
  33. ak := awsSecret[0]
  34. sk := awsSecret[1]
  35. region := awsSecret[2]
  36. client = bedrockruntime.New(bedrockruntime.Options{
  37. Region: region,
  38. Credentials: aws.NewCredentialsCache(credentials.NewStaticCredentialsProvider(ak, sk, "")),
  39. })
  40. default:
  41. return nil, errors.New("invalid aws secret key")
  42. }
  43. return client, nil
  44. }
  45. func wrapErr(err error) *dto.OpenAIErrorWithStatusCode {
  46. return &dto.OpenAIErrorWithStatusCode{
  47. StatusCode: http.StatusInternalServerError,
  48. Error: dto.OpenAIError{
  49. Message: fmt.Sprintf("%s", err.Error()),
  50. },
  51. }
  52. }
  // awsRegionPrefix returns the part of an AWS region ID that precedes the
  // first "-", e.g. "us" for "us-east-1". An ID that contains no "-" is
  // returned unchanged, and an empty ID yields an empty prefix.
  func awsRegionPrefix(awsRegionId string) string {
  	prefix, _, _ := strings.Cut(awsRegionId, "-")
  	return prefix
  }
  61. func awsModelCanCrossRegion(awsModelId, awsRegionPrefix string) bool {
  62. regionSet, exists := awsModelCanCrossRegionMap[awsModelId]
  63. return exists && regionSet[awsRegionPrefix]
  64. }
  65. func awsModelCrossRegion(awsModelId, awsRegionPrefix string) string {
  66. modelPrefix, find := awsRegionCrossModelPrefixMap[awsRegionPrefix]
  67. if !find {
  68. return awsModelId
  69. }
  70. return modelPrefix + "." + awsModelId
  71. }
  72. func awsModelID(requestModel string) string {
  73. if awsModelID, ok := awsModelIDMap[requestModel]; ok {
  74. return awsModelID
  75. }
  76. return requestModel
  77. }
  78. func awsHandler(c *gin.Context, info *relaycommon.RelayInfo, requestMode int) (*types.NewAPIError, *dto.Usage) {
  79. awsCli, err := newAwsClient(c, info)
  80. if err != nil {
  81. return types.NewError(err, types.ErrorCodeChannelAwsClientError), nil
  82. }
  83. awsModelId := awsModelID(c.GetString("request_model"))
  84. // 检查是否为Nova模型
  85. isNova, _ := c.Get("is_nova_model")
  86. if isNova == true {
  87. // Nova模型也支持跨区域
  88. awsRegionPrefix := awsRegionPrefix(awsCli.Options().Region)
  89. canCrossRegion := awsModelCanCrossRegion(awsModelId, awsRegionPrefix)
  90. if canCrossRegion {
  91. awsModelId = awsModelCrossRegion(awsModelId, awsRegionPrefix)
  92. }
  93. return handleNovaRequest(c, awsCli, info, awsModelId)
  94. }
  95. // 原有的Claude处理逻辑
  96. awsRegionPrefix := awsRegionPrefix(awsCli.Options().Region)
  97. canCrossRegion := awsModelCanCrossRegion(awsModelId, awsRegionPrefix)
  98. if canCrossRegion {
  99. awsModelId = awsModelCrossRegion(awsModelId, awsRegionPrefix)
  100. }
  101. awsReq := &bedrockruntime.InvokeModelInput{
  102. ModelId: aws.String(awsModelId),
  103. Accept: aws.String("application/json"),
  104. ContentType: aws.String("application/json"),
  105. }
  106. claudeReq_, ok := c.Get("converted_request")
  107. if !ok {
  108. return types.NewError(errors.New("aws claude request not found"), types.ErrorCodeInvalidRequest), nil
  109. }
  110. claudeReq := claudeReq_.(*dto.ClaudeRequest)
  111. awsClaudeReq := copyRequest(claudeReq)
  112. awsReq.Body, err = common.Marshal(awsClaudeReq)
  113. if err != nil {
  114. return types.NewError(errors.Wrap(err, "marshal request"), types.ErrorCodeBadResponseBody), nil
  115. }
  116. awsResp, err := awsCli.InvokeModel(c.Request.Context(), awsReq)
  117. if err != nil {
  118. return types.NewOpenAIError(errors.Wrap(err, "InvokeModel"), types.ErrorCodeAwsInvokeError, http.StatusInternalServerError), nil
  119. }
  120. claudeInfo := &claude.ClaudeResponseInfo{
  121. ResponseId: helper.GetResponseID(c),
  122. Created: common.GetTimestamp(),
  123. Model: info.UpstreamModelName,
  124. ResponseText: strings.Builder{},
  125. Usage: &dto.Usage{},
  126. }
  127. // 复制上游 Content-Type 到客户端响应头
  128. if awsResp.ContentType != nil && *awsResp.ContentType != "" {
  129. c.Writer.Header().Set("Content-Type", *awsResp.ContentType)
  130. }
  131. handlerErr := claude.HandleClaudeResponseData(c, info, claudeInfo, nil, awsResp.Body, RequestModeMessage)
  132. if handlerErr != nil {
  133. return handlerErr, nil
  134. }
  135. return nil, claudeInfo.Usage
  136. }
  137. func awsStreamHandler(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo, requestMode int) (*types.NewAPIError, *dto.Usage) {
  138. awsCli, err := newAwsClient(c, info)
  139. if err != nil {
  140. return types.NewError(err, types.ErrorCodeChannelAwsClientError), nil
  141. }
  142. awsModelId := awsModelID(c.GetString("request_model"))
  143. awsRegionPrefix := awsRegionPrefix(awsCli.Options().Region)
  144. canCrossRegion := awsModelCanCrossRegion(awsModelId, awsRegionPrefix)
  145. if canCrossRegion {
  146. awsModelId = awsModelCrossRegion(awsModelId, awsRegionPrefix)
  147. }
  148. awsReq := &bedrockruntime.InvokeModelWithResponseStreamInput{
  149. ModelId: aws.String(awsModelId),
  150. Accept: aws.String("application/json"),
  151. ContentType: aws.String("application/json"),
  152. }
  153. claudeReq_, ok := c.Get("converted_request")
  154. if !ok {
  155. return types.NewError(errors.New("aws claude request not found"), types.ErrorCodeInvalidRequest), nil
  156. }
  157. claudeReq := claudeReq_.(*dto.ClaudeRequest)
  158. awsClaudeReq := copyRequest(claudeReq)
  159. awsReq.Body, err = common.Marshal(awsClaudeReq)
  160. if err != nil {
  161. return types.NewError(errors.Wrap(err, "marshal request"), types.ErrorCodeBadResponseBody), nil
  162. }
  163. awsResp, err := awsCli.InvokeModelWithResponseStream(c.Request.Context(), awsReq)
  164. if err != nil {
  165. return types.NewOpenAIError(errors.Wrap(err, "InvokeModelWithResponseStream"), types.ErrorCodeAwsInvokeError, http.StatusInternalServerError), nil
  166. }
  167. stream := awsResp.GetStream()
  168. defer stream.Close()
  169. claudeInfo := &claude.ClaudeResponseInfo{
  170. ResponseId: helper.GetResponseID(c),
  171. Created: common.GetTimestamp(),
  172. Model: info.UpstreamModelName,
  173. ResponseText: strings.Builder{},
  174. Usage: &dto.Usage{},
  175. }
  176. for event := range stream.Events() {
  177. switch v := event.(type) {
  178. case *bedrockruntimeTypes.ResponseStreamMemberChunk:
  179. info.SetFirstResponseTime()
  180. respErr := claude.HandleStreamResponseData(c, info, claudeInfo, string(v.Value.Bytes), RequestModeMessage)
  181. if respErr != nil {
  182. return respErr, nil
  183. }
  184. case *bedrockruntimeTypes.UnknownUnionMember:
  185. fmt.Println("unknown tag:", v.Tag)
  186. return types.NewError(errors.New("unknown response type"), types.ErrorCodeInvalidRequest), nil
  187. default:
  188. fmt.Println("union is nil or unknown type")
  189. return types.NewError(errors.New("nil or unknown response type"), types.ErrorCodeInvalidRequest), nil
  190. }
  191. }
  192. claude.HandleStreamFinalResponse(c, info, claudeInfo, RequestModeMessage)
  193. return nil, claudeInfo.Usage
  194. }
  195. // Nova模型处理函数
  196. func handleNovaRequest(c *gin.Context, awsCli *bedrockruntime.Client, info *relaycommon.RelayInfo, awsModelId string) (*types.NewAPIError, *dto.Usage) {
  197. novaReq_, ok := c.Get("converted_request")
  198. if !ok {
  199. return types.NewError(errors.New("nova request not found"), types.ErrorCodeInvalidRequest), nil
  200. }
  201. novaReq := novaReq_.(*NovaRequest)
  202. // 使用InvokeModel API,但使用Nova格式的请求体
  203. awsReq := &bedrockruntime.InvokeModelInput{
  204. ModelId: aws.String(awsModelId),
  205. Accept: aws.String("application/json"),
  206. ContentType: aws.String("application/json"),
  207. }
  208. reqBody, err := json.Marshal(novaReq)
  209. if err != nil {
  210. return types.NewError(errors.Wrap(err, "marshal nova request"), types.ErrorCodeBadResponseBody), nil
  211. }
  212. awsReq.Body = reqBody
  213. awsResp, err := awsCli.InvokeModel(c.Request.Context(), awsReq)
  214. if err != nil {
  215. return types.NewError(errors.Wrap(err, "InvokeModel"), types.ErrorCodeChannelAwsClientError), nil
  216. }
  217. // 解析Nova响应
  218. var novaResp struct {
  219. Output struct {
  220. Message struct {
  221. Content []struct {
  222. Text string `json:"text"`
  223. } `json:"content"`
  224. } `json:"message"`
  225. } `json:"output"`
  226. Usage struct {
  227. InputTokens int `json:"inputTokens"`
  228. OutputTokens int `json:"outputTokens"`
  229. TotalTokens int `json:"totalTokens"`
  230. } `json:"usage"`
  231. }
  232. if err := json.Unmarshal(awsResp.Body, &novaResp); err != nil {
  233. return types.NewError(errors.Wrap(err, "unmarshal nova response"), types.ErrorCodeBadResponseBody), nil
  234. }
  235. // 构造OpenAI格式响应
  236. response := dto.OpenAITextResponse{
  237. Id: helper.GetResponseID(c),
  238. Object: "chat.completion",
  239. Created: common.GetTimestamp(),
  240. Model: info.UpstreamModelName,
  241. Choices: []dto.OpenAITextResponseChoice{{
  242. Index: 0,
  243. Message: dto.Message{
  244. Role: "assistant",
  245. Content: novaResp.Output.Message.Content[0].Text,
  246. },
  247. FinishReason: "stop",
  248. }},
  249. Usage: dto.Usage{
  250. PromptTokens: novaResp.Usage.InputTokens,
  251. CompletionTokens: novaResp.Usage.OutputTokens,
  252. TotalTokens: novaResp.Usage.TotalTokens,
  253. },
  254. }
  255. c.JSON(http.StatusOK, response)
  256. return nil, &response.Usage
  257. }