adaptor.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422
  1. package vertex
  2. import (
  3. "encoding/json"
  4. "errors"
  5. "fmt"
  6. "io"
  7. "net/http"
  8. "strings"
  9. "github.com/QuantumNous/new-api/common"
  10. "github.com/QuantumNous/new-api/dto"
  11. "github.com/QuantumNous/new-api/relay/channel"
  12. "github.com/QuantumNous/new-api/relay/channel/claude"
  13. "github.com/QuantumNous/new-api/relay/channel/gemini"
  14. "github.com/QuantumNous/new-api/relay/channel/openai"
  15. relaycommon "github.com/QuantumNous/new-api/relay/common"
  16. "github.com/QuantumNous/new-api/relay/constant"
  17. "github.com/QuantumNous/new-api/setting/model_setting"
  18. "github.com/QuantumNous/new-api/setting/reasoning"
  19. "github.com/QuantumNous/new-api/types"
  20. "github.com/gin-gonic/gin"
  21. "github.com/samber/lo"
  22. )
// Request modes stored in Adaptor.RequestMode. Init picks one of them from the
// upstream model name.
const (
	// RequestModeClaude is selected when the model name starts with "claude".
	RequestModeClaude = 1
	// RequestModeGemini is the fallback for every model name that matches no
	// other mode.
	RequestModeGemini = 2
	// RequestModeOpenSource is selected when the model name contains "llama"
	// or "-maas".
	RequestModeOpenSource = 3
)
// claudeModelMap translates dated Claude model names (keys) into the model
// identifiers placed in the request URL and in the "request_model" context
// value (values). It is looked up by the upstream model name; callers choose
// their own fallback when a name has no entry.
var claudeModelMap = map[string]string{
	"claude-3-sonnet-20240229":   "claude-3-sonnet@20240229",
	"claude-3-opus-20240229":     "claude-3-opus@20240229",
	"claude-3-haiku-20240307":    "claude-3-haiku@20240307",
	"claude-3-5-sonnet-20240620": "claude-3-5-sonnet@20240620",
	"claude-3-5-sonnet-20241022": "claude-3-5-sonnet-v2@20241022",
	"claude-3-7-sonnet-20250219": "claude-3-7-sonnet@20250219",
	"claude-sonnet-4-20250514":   "claude-sonnet-4@20250514",
	"claude-opus-4-20250514":     "claude-opus-4@20250514",
	"claude-opus-4-1-20250805":   "claude-opus-4-1@20250805",
	"claude-sonnet-4-5-20250929": "claude-sonnet-4-5@20250929",
	"claude-haiku-4-5-20251001":  "claude-haiku-4-5@20251001",
	"claude-opus-4-5-20251101":   "claude-opus-4-5@20251101",
	"claude-opus-4-6":            "claude-opus-4-6",
}
// anthropicVersion is the version string passed to copyRequest whenever a
// Claude request body is built for Vertex.
const anthropicVersion = "vertex-2023-10-16"
// Adaptor relays requests to Vertex AI, delegating request and response
// conversion to the Claude, Gemini or OpenAI-compatible handlers depending on
// RequestMode.
type Adaptor struct {
	// RequestMode is one of the RequestMode* constants; it is set by Init.
	RequestMode int
	// AccountCredentials holds the credentials decoded from the channel key
	// while building the request URL (non-API-key channels only); its
	// ProjectID is later used when setting request headers.
	AccountCredentials Credentials
}
  48. func (a *Adaptor) ConvertGeminiRequest(c *gin.Context, info *relaycommon.RelayInfo, request *dto.GeminiChatRequest) (any, error) {
  49. // Vertex AI does not support functionResponse.id; keep it stripped here for consistency.
  50. if model_setting.GetGeminiSettings().RemoveFunctionResponseIdEnabled {
  51. removeFunctionResponseID(request)
  52. }
  53. geminiAdaptor := gemini.Adaptor{}
  54. return geminiAdaptor.ConvertGeminiRequest(c, info, request)
  55. }
  56. func removeFunctionResponseID(request *dto.GeminiChatRequest) {
  57. if request == nil {
  58. return
  59. }
  60. if len(request.Contents) > 0 {
  61. for i := range request.Contents {
  62. if len(request.Contents[i].Parts) == 0 {
  63. continue
  64. }
  65. for j := range request.Contents[i].Parts {
  66. part := &request.Contents[i].Parts[j]
  67. if part.FunctionResponse == nil {
  68. continue
  69. }
  70. if len(part.FunctionResponse.ID) > 0 {
  71. part.FunctionResponse.ID = nil
  72. }
  73. }
  74. }
  75. }
  76. if len(request.Requests) > 0 {
  77. for i := range request.Requests {
  78. removeFunctionResponseID(&request.Requests[i])
  79. }
  80. }
  81. }
  82. func (a *Adaptor) ConvertClaudeRequest(c *gin.Context, info *relaycommon.RelayInfo, request *dto.ClaudeRequest) (any, error) {
  83. if v, ok := claudeModelMap[info.UpstreamModelName]; ok {
  84. c.Set("request_model", v)
  85. } else {
  86. c.Set("request_model", request.Model)
  87. }
  88. vertexClaudeReq := copyRequest(request, anthropicVersion)
  89. return vertexClaudeReq, nil
  90. }
// ConvertAudioRequest is not supported by this adaptor; it always returns a
// "not implemented" error.
func (a *Adaptor) ConvertAudioRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.AudioRequest) (io.Reader, error) {
	// TODO: implement audio request conversion.
	return nil, errors.New("not implemented")
}
  95. func (a *Adaptor) ConvertImageRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.ImageRequest) (any, error) {
  96. geminiAdaptor := gemini.Adaptor{}
  97. return geminiAdaptor.ConvertImageRequest(c, info, request)
  98. }
  99. func (a *Adaptor) Init(info *relaycommon.RelayInfo) {
  100. if strings.HasPrefix(info.UpstreamModelName, "claude") {
  101. a.RequestMode = RequestModeClaude
  102. } else if strings.Contains(info.UpstreamModelName, "llama") ||
  103. // open source models
  104. strings.Contains(info.UpstreamModelName, "-maas") {
  105. a.RequestMode = RequestModeOpenSource
  106. } else {
  107. a.RequestMode = RequestModeGemini
  108. }
  109. }
  110. func (a *Adaptor) getRequestUrl(info *relaycommon.RelayInfo, modelName, suffix string) (string, error) {
  111. region := GetModelRegion(info.ApiVersion, info.OriginModelName)
  112. if info.ChannelOtherSettings.VertexKeyType != dto.VertexKeyTypeAPIKey {
  113. adc := &Credentials{}
  114. if err := common.Unmarshal([]byte(info.ApiKey), adc); err != nil {
  115. return "", fmt.Errorf("failed to decode credentials file: %w", err)
  116. }
  117. a.AccountCredentials = *adc
  118. if a.RequestMode == RequestModeGemini {
  119. if region == "global" {
  120. return fmt.Sprintf(
  121. "https://aiplatform.googleapis.com/v1/projects/%s/locations/global/publishers/google/models/%s:%s",
  122. adc.ProjectID,
  123. modelName,
  124. suffix,
  125. ), nil
  126. } else {
  127. return fmt.Sprintf(
  128. "https://%s-aiplatform.googleapis.com/v1/projects/%s/locations/%s/publishers/google/models/%s:%s",
  129. region,
  130. adc.ProjectID,
  131. region,
  132. modelName,
  133. suffix,
  134. ), nil
  135. }
  136. } else if a.RequestMode == RequestModeClaude {
  137. if region == "global" {
  138. return fmt.Sprintf(
  139. "https://aiplatform.googleapis.com/v1/projects/%s/locations/global/publishers/anthropic/models/%s:%s",
  140. adc.ProjectID,
  141. modelName,
  142. suffix,
  143. ), nil
  144. } else {
  145. return fmt.Sprintf(
  146. "https://%s-aiplatform.googleapis.com/v1/projects/%s/locations/%s/publishers/anthropic/models/%s:%s",
  147. region,
  148. adc.ProjectID,
  149. region,
  150. modelName,
  151. suffix,
  152. ), nil
  153. }
  154. } else if a.RequestMode == RequestModeOpenSource {
  155. return fmt.Sprintf(
  156. "https://aiplatform.googleapis.com/v1beta1/projects/%s/locations/%s/endpoints/openapi/chat/completions",
  157. adc.ProjectID,
  158. region,
  159. ), nil
  160. }
  161. } else {
  162. var keyPrefix string
  163. if strings.HasSuffix(suffix, "?alt=sse") {
  164. keyPrefix = "&"
  165. } else {
  166. keyPrefix = "?"
  167. }
  168. if region == "global" {
  169. return fmt.Sprintf(
  170. "https://aiplatform.googleapis.com/v1/publishers/google/models/%s:%s%skey=%s",
  171. modelName,
  172. suffix,
  173. keyPrefix,
  174. info.ApiKey,
  175. ), nil
  176. } else {
  177. return fmt.Sprintf(
  178. "https://%s-aiplatform.googleapis.com/v1/publishers/google/models/%s:%s%skey=%s",
  179. region,
  180. modelName,
  181. suffix,
  182. keyPrefix,
  183. info.ApiKey,
  184. ), nil
  185. }
  186. }
  187. return "", errors.New("unsupported request mode")
  188. }
  189. func (a *Adaptor) GetRequestURL(info *relaycommon.RelayInfo) (string, error) {
  190. suffix := ""
  191. if a.RequestMode == RequestModeGemini {
  192. if model_setting.GetGeminiSettings().ThinkingAdapterEnabled &&
  193. !model_setting.ShouldPreserveThinkingSuffix(info.OriginModelName) {
  194. // 新增逻辑:处理 -thinking-<budget> 格式
  195. if strings.Contains(info.UpstreamModelName, "-thinking-") {
  196. parts := strings.Split(info.UpstreamModelName, "-thinking-")
  197. info.UpstreamModelName = parts[0]
  198. } else if strings.HasSuffix(info.UpstreamModelName, "-thinking") { // 旧的适配
  199. info.UpstreamModelName = strings.TrimSuffix(info.UpstreamModelName, "-thinking")
  200. } else if strings.HasSuffix(info.UpstreamModelName, "-nothinking") {
  201. info.UpstreamModelName = strings.TrimSuffix(info.UpstreamModelName, "-nothinking")
  202. } else if baseModel, level, ok := reasoning.TrimEffortSuffix(info.UpstreamModelName); ok && level != "" {
  203. info.UpstreamModelName = baseModel
  204. }
  205. }
  206. if info.IsStream {
  207. suffix = "streamGenerateContent?alt=sse"
  208. } else {
  209. suffix = "generateContent"
  210. }
  211. if strings.HasPrefix(info.UpstreamModelName, "imagen") {
  212. suffix = "predict"
  213. }
  214. return a.getRequestUrl(info, info.UpstreamModelName, suffix)
  215. } else if a.RequestMode == RequestModeClaude {
  216. if info.IsStream {
  217. suffix = "streamRawPredict?alt=sse"
  218. } else {
  219. suffix = "rawPredict"
  220. }
  221. model := info.UpstreamModelName
  222. if v, ok := claudeModelMap[info.UpstreamModelName]; ok {
  223. model = v
  224. }
  225. return a.getRequestUrl(info, model, suffix)
  226. } else if a.RequestMode == RequestModeOpenSource {
  227. return a.getRequestUrl(info, "", "")
  228. }
  229. return "", errors.New("unsupported request mode")
  230. }
  231. func (a *Adaptor) SetupRequestHeader(c *gin.Context, req *http.Header, info *relaycommon.RelayInfo) error {
  232. channel.SetupApiRequestHeader(info, c, req)
  233. if info.ChannelOtherSettings.VertexKeyType != dto.VertexKeyTypeAPIKey {
  234. accessToken, err := getAccessToken(a, info)
  235. if err != nil {
  236. return err
  237. }
  238. req.Set("Authorization", "Bearer "+accessToken)
  239. }
  240. if a.AccountCredentials.ProjectID != "" {
  241. req.Set("x-goog-user-project", a.AccountCredentials.ProjectID)
  242. }
  243. if strings.Contains(info.UpstreamModelName, "claude") {
  244. claude.CommonClaudeHeadersOperation(c, req, info)
  245. }
  246. return nil
  247. }
  248. func (a *Adaptor) ConvertOpenAIRequest(c *gin.Context, info *relaycommon.RelayInfo, request *dto.GeneralOpenAIRequest) (any, error) {
  249. if request == nil {
  250. return nil, errors.New("request is nil")
  251. }
  252. if a.RequestMode == RequestModeGemini && strings.HasPrefix(info.UpstreamModelName, "imagen") {
  253. prompt := ""
  254. for _, m := range request.Messages {
  255. if m.Role == "user" {
  256. prompt = m.StringContent()
  257. if prompt != "" {
  258. break
  259. }
  260. }
  261. }
  262. if prompt == "" {
  263. if p, ok := request.Prompt.(string); ok {
  264. prompt = p
  265. }
  266. }
  267. if prompt == "" {
  268. return nil, errors.New("prompt is required for image generation")
  269. }
  270. imgReq := dto.ImageRequest{
  271. Model: request.Model,
  272. Prompt: prompt,
  273. N: lo.ToPtr(uint(1)),
  274. Size: "1024x1024",
  275. }
  276. if request.N != nil && *request.N > 0 {
  277. imgReq.N = lo.ToPtr(uint(*request.N))
  278. }
  279. if request.Size != "" {
  280. imgReq.Size = request.Size
  281. }
  282. if len(request.ExtraBody) > 0 {
  283. var extra map[string]any
  284. if err := json.Unmarshal(request.ExtraBody, &extra); err == nil {
  285. if n, ok := extra["n"].(float64); ok && n > 0 {
  286. imgReq.N = lo.ToPtr(uint(n))
  287. }
  288. if size, ok := extra["size"].(string); ok {
  289. imgReq.Size = size
  290. }
  291. // accept aspectRatio in extra body (top-level or under parameters)
  292. if ar, ok := extra["aspectRatio"].(string); ok && ar != "" {
  293. imgReq.Size = ar
  294. }
  295. if params, ok := extra["parameters"].(map[string]any); ok {
  296. if ar, ok := params["aspectRatio"].(string); ok && ar != "" {
  297. imgReq.Size = ar
  298. }
  299. }
  300. }
  301. }
  302. c.Set("request_model", request.Model)
  303. return a.ConvertImageRequest(c, info, imgReq)
  304. }
  305. if a.RequestMode == RequestModeClaude {
  306. claudeReq, err := claude.RequestOpenAI2ClaudeMessage(c, *request)
  307. if err != nil {
  308. return nil, err
  309. }
  310. vertexClaudeReq := copyRequest(claudeReq, anthropicVersion)
  311. c.Set("request_model", claudeReq.Model)
  312. info.UpstreamModelName = claudeReq.Model
  313. return vertexClaudeReq, nil
  314. } else if a.RequestMode == RequestModeGemini {
  315. geminiRequest, err := gemini.CovertOpenAI2Gemini(c, *request, info)
  316. if err != nil {
  317. return nil, err
  318. }
  319. c.Set("request_model", request.Model)
  320. return geminiRequest, nil
  321. } else if a.RequestMode == RequestModeOpenSource {
  322. return request, nil
  323. }
  324. return nil, errors.New("unsupported request mode")
  325. }
  326. func (a *Adaptor) ConvertRerankRequest(c *gin.Context, relayMode int, request dto.RerankRequest) (any, error) {
  327. return nil, nil
  328. }
// ConvertEmbeddingRequest is not supported by this adaptor; it always returns
// a "not implemented" error.
func (a *Adaptor) ConvertEmbeddingRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.EmbeddingRequest) (any, error) {
	// TODO: implement embedding request conversion.
	return nil, errors.New("not implemented")
}
// ConvertOpenAIResponsesRequest is not supported by this adaptor; it always
// returns a "not implemented" error.
func (a *Adaptor) ConvertOpenAIResponsesRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.OpenAIResponsesRequest) (any, error) {
	// TODO: implement Responses API request conversion.
	return nil, errors.New("not implemented")
}
  337. func (a *Adaptor) DoRequest(c *gin.Context, info *relaycommon.RelayInfo, requestBody io.Reader) (any, error) {
  338. return channel.DoApiRequest(a, c, info, requestBody)
  339. }
  340. func (a *Adaptor) DoResponse(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo) (usage any, err *types.NewAPIError) {
  341. claudeAdaptor := claude.Adaptor{}
  342. if info.IsStream {
  343. switch a.RequestMode {
  344. case RequestModeClaude:
  345. return claudeAdaptor.DoResponse(c, resp, info)
  346. case RequestModeGemini:
  347. if info.RelayMode == constant.RelayModeGemini {
  348. return gemini.GeminiTextGenerationStreamHandler(c, info, resp)
  349. } else {
  350. return gemini.GeminiChatStreamHandler(c, info, resp)
  351. }
  352. case RequestModeOpenSource:
  353. return openai.OaiStreamHandler(c, info, resp)
  354. }
  355. } else {
  356. switch a.RequestMode {
  357. case RequestModeClaude:
  358. return claudeAdaptor.DoResponse(c, resp, info)
  359. case RequestModeGemini:
  360. if info.RelayMode == constant.RelayModeGemini {
  361. return gemini.GeminiTextGenerationHandler(c, info, resp)
  362. } else {
  363. if strings.HasPrefix(info.UpstreamModelName, "imagen") {
  364. return gemini.GeminiImageHandler(c, info, resp)
  365. }
  366. return gemini.GeminiChatHandler(c, info, resp)
  367. }
  368. case RequestModeOpenSource:
  369. return openai.OpenaiHandler(c, info, resp)
  370. }
  371. }
  372. return
  373. }
  374. func (a *Adaptor) GetModelList() []string {
  375. var modelList []string
  376. for i, s := range ModelList {
  377. modelList = append(modelList, s)
  378. ModelList[i] = s
  379. }
  380. for i, s := range claude.ModelList {
  381. modelList = append(modelList, s)
  382. claude.ModelList[i] = s
  383. }
  384. for i, s := range gemini.ModelList {
  385. modelList = append(modelList, s)
  386. gemini.ModelList[i] = s
  387. }
  388. return modelList
  389. }
// GetChannelName returns the package-level ChannelName.
func (a *Adaptor) GetChannelName() string {
	return ChannelName
}