adaptor.go 7.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240
  1. package vertex
  2. import (
  3. "encoding/json"
  4. "errors"
  5. "fmt"
  6. "io"
  7. "net/http"
  8. "one-api/dto"
  9. "one-api/relay/channel"
  10. "one-api/relay/channel/claude"
  11. "one-api/relay/channel/gemini"
  12. "one-api/relay/channel/openai"
  13. relaycommon "one-api/relay/common"
  14. "one-api/setting/model_setting"
  15. "strings"
  16. "github.com/gin-gonic/gin"
  17. )
  18. const (
  19. RequestModeClaude = 1
  20. RequestModeGemini = 2
  21. RequestModeLlama = 3
  22. )
  23. var claudeModelMap = map[string]string{
  24. "claude-3-sonnet-20240229": "claude-3-sonnet@20240229",
  25. "claude-3-opus-20240229": "claude-3-opus@20240229",
  26. "claude-3-haiku-20240307": "claude-3-haiku@20240307",
  27. "claude-3-5-sonnet-20240620": "claude-3-5-sonnet@20240620",
  28. "claude-3-5-sonnet-20241022": "claude-3-5-sonnet-v2@20241022",
  29. "claude-3-7-sonnet-20250219": "claude-3-7-sonnet@20250219",
  30. "claude-sonnet-4-20250514": "claude-sonnet-4@20250514",
  31. "claude-opus-4-20250514": "claude-opus-4@20250514",
  32. }
  33. const anthropicVersion = "vertex-2023-10-16"
  34. type Adaptor struct {
  35. RequestMode int
  36. AccountCredentials Credentials
  37. }
  38. func (a *Adaptor) ConvertClaudeRequest(c *gin.Context, info *relaycommon.RelayInfo, request *dto.ClaudeRequest) (any, error) {
  39. if v, ok := claudeModelMap[info.UpstreamModelName]; ok {
  40. c.Set("request_model", v)
  41. } else {
  42. c.Set("request_model", request.Model)
  43. }
  44. vertexClaudeReq := copyRequest(request, anthropicVersion)
  45. return vertexClaudeReq, nil
  46. }
  47. func (a *Adaptor) ConvertAudioRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.AudioRequest) (io.Reader, error) {
  48. //TODO implement me
  49. return nil, errors.New("not implemented")
  50. }
  51. func (a *Adaptor) ConvertImageRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.ImageRequest) (any, error) {
  52. //TODO implement me
  53. return nil, errors.New("not implemented")
  54. }
  55. func (a *Adaptor) Init(info *relaycommon.RelayInfo) {
  56. if strings.HasPrefix(info.UpstreamModelName, "claude") {
  57. a.RequestMode = RequestModeClaude
  58. } else if strings.HasPrefix(info.UpstreamModelName, "gemini") {
  59. a.RequestMode = RequestModeGemini
  60. } else if strings.Contains(info.UpstreamModelName, "llama") {
  61. a.RequestMode = RequestModeLlama
  62. }
  63. }
  64. func (a *Adaptor) GetRequestURL(info *relaycommon.RelayInfo) (string, error) {
  65. adc := &Credentials{}
  66. if err := json.Unmarshal([]byte(info.ApiKey), adc); err != nil {
  67. return "", fmt.Errorf("failed to decode credentials file: %w", err)
  68. }
  69. region := GetModelRegion(info.ApiVersion, info.OriginModelName)
  70. a.AccountCredentials = *adc
  71. suffix := ""
  72. if a.RequestMode == RequestModeGemini {
  73. if model_setting.GetGeminiSettings().ThinkingAdapterEnabled {
  74. // suffix -thinking and -nothinking
  75. if strings.HasSuffix(info.OriginModelName, "-thinking") {
  76. info.UpstreamModelName = strings.TrimSuffix(info.UpstreamModelName, "-thinking")
  77. } else if strings.HasSuffix(info.OriginModelName, "-nothinking") {
  78. info.UpstreamModelName = strings.TrimSuffix(info.UpstreamModelName, "-nothinking")
  79. }
  80. }
  81. if info.IsStream {
  82. suffix = "streamGenerateContent?alt=sse"
  83. } else {
  84. suffix = "generateContent"
  85. }
  86. if region == "global" {
  87. return fmt.Sprintf(
  88. "https://aiplatform.googleapis.com/v1/projects/%s/locations/global/publishers/google/models/%s:%s",
  89. adc.ProjectID,
  90. info.UpstreamModelName,
  91. suffix,
  92. ), nil
  93. } else {
  94. return fmt.Sprintf(
  95. "https://%s-aiplatform.googleapis.com/v1/projects/%s/locations/%s/publishers/google/models/%s:%s",
  96. region,
  97. adc.ProjectID,
  98. region,
  99. info.UpstreamModelName,
  100. suffix,
  101. ), nil
  102. }
  103. } else if a.RequestMode == RequestModeClaude {
  104. if info.IsStream {
  105. suffix = "streamRawPredict?alt=sse"
  106. } else {
  107. suffix = "rawPredict"
  108. }
  109. model := info.UpstreamModelName
  110. if v, ok := claudeModelMap[info.UpstreamModelName]; ok {
  111. model = v
  112. }
  113. return fmt.Sprintf(
  114. "https://%s-aiplatform.googleapis.com/v1/projects/%s/locations/%s/publishers/anthropic/models/%s:%s",
  115. region,
  116. adc.ProjectID,
  117. region,
  118. model,
  119. suffix,
  120. ), nil
  121. } else if a.RequestMode == RequestModeLlama {
  122. return fmt.Sprintf(
  123. "https://%s-aiplatform.googleapis.com/v1beta1/projects/%s/locations/%s/endpoints/openapi/chat/completions",
  124. region,
  125. adc.ProjectID,
  126. region,
  127. ), nil
  128. }
  129. return "", errors.New("unsupported request mode")
  130. }
  131. func (a *Adaptor) SetupRequestHeader(c *gin.Context, req *http.Header, info *relaycommon.RelayInfo) error {
  132. channel.SetupApiRequestHeader(info, c, req)
  133. accessToken, err := getAccessToken(a, info)
  134. if err != nil {
  135. return err
  136. }
  137. req.Set("Authorization", "Bearer "+accessToken)
  138. return nil
  139. }
  140. func (a *Adaptor) ConvertOpenAIRequest(c *gin.Context, info *relaycommon.RelayInfo, request *dto.GeneralOpenAIRequest) (any, error) {
  141. if request == nil {
  142. return nil, errors.New("request is nil")
  143. }
  144. if a.RequestMode == RequestModeClaude {
  145. claudeReq, err := claude.RequestOpenAI2ClaudeMessage(*request)
  146. if err != nil {
  147. return nil, err
  148. }
  149. vertexClaudeReq := copyRequest(claudeReq, anthropicVersion)
  150. c.Set("request_model", claudeReq.Model)
  151. info.UpstreamModelName = claudeReq.Model
  152. return vertexClaudeReq, nil
  153. } else if a.RequestMode == RequestModeGemini {
  154. geminiRequest, err := gemini.CovertGemini2OpenAI(*request, info)
  155. if err != nil {
  156. return nil, err
  157. }
  158. c.Set("request_model", request.Model)
  159. return geminiRequest, nil
  160. } else if a.RequestMode == RequestModeLlama {
  161. return request, nil
  162. }
  163. return nil, errors.New("unsupported request mode")
  164. }
  165. func (a *Adaptor) ConvertRerankRequest(c *gin.Context, relayMode int, request dto.RerankRequest) (any, error) {
  166. return nil, nil
  167. }
  168. func (a *Adaptor) ConvertEmbeddingRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.EmbeddingRequest) (any, error) {
  169. //TODO implement me
  170. return nil, errors.New("not implemented")
  171. }
  172. func (a *Adaptor) ConvertOpenAIResponsesRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.OpenAIResponsesRequest) (any, error) {
  173. // TODO implement me
  174. return nil, errors.New("not implemented")
  175. }
  176. func (a *Adaptor) DoRequest(c *gin.Context, info *relaycommon.RelayInfo, requestBody io.Reader) (any, error) {
  177. return channel.DoApiRequest(a, c, info, requestBody)
  178. }
  179. func (a *Adaptor) DoResponse(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo) (usage any, err *dto.OpenAIErrorWithStatusCode) {
  180. if info.IsStream {
  181. switch a.RequestMode {
  182. case RequestModeClaude:
  183. err, usage = claude.ClaudeStreamHandler(c, resp, info, claude.RequestModeMessage)
  184. case RequestModeGemini:
  185. err, usage = gemini.GeminiChatStreamHandler(c, resp, info)
  186. case RequestModeLlama:
  187. err, usage = openai.OaiStreamHandler(c, resp, info)
  188. }
  189. } else {
  190. switch a.RequestMode {
  191. case RequestModeClaude:
  192. err, usage = claude.ClaudeHandler(c, resp, claude.RequestModeMessage, info)
  193. case RequestModeGemini:
  194. err, usage = gemini.GeminiChatHandler(c, resp, info)
  195. case RequestModeLlama:
  196. err, usage = openai.OpenaiHandler(c, resp, info)
  197. }
  198. }
  199. return
  200. }
  201. func (a *Adaptor) GetModelList() []string {
  202. var modelList []string
  203. for i, s := range ModelList {
  204. modelList = append(modelList, s)
  205. ModelList[i] = s
  206. }
  207. for i, s := range claude.ModelList {
  208. modelList = append(modelList, s)
  209. claude.ModelList[i] = s
  210. }
  211. for i, s := range gemini.ModelList {
  212. modelList = append(modelList, s)
  213. gemini.ModelList[i] = s
  214. }
  215. return modelList
  216. }
  217. func (a *Adaptor) GetChannelName() string {
  218. return ChannelName
  219. }