adaptor.go 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368
  1. package doubao
  2. import (
  3. "bytes"
  4. "fmt"
  5. "io"
  6. "net/http"
  7. "strconv"
  8. "time"
  9. "github.com/QuantumNous/new-api/common"
  10. "github.com/QuantumNous/new-api/constant"
  11. "github.com/QuantumNous/new-api/dto"
  12. "github.com/QuantumNous/new-api/model"
  13. "github.com/QuantumNous/new-api/relay/channel"
  14. "github.com/QuantumNous/new-api/relay/channel/task/taskcommon"
  15. relaycommon "github.com/QuantumNous/new-api/relay/common"
  16. "github.com/QuantumNous/new-api/service"
  17. "github.com/gin-gonic/gin"
  18. "github.com/pkg/errors"
  19. "github.com/samber/lo"
  20. )
  21. // ============================
  22. // Request / Response structures
  23. // ============================
  24. type ContentItem struct {
  25. Type string `json:"type,omitempty"`
  26. Text string `json:"text,omitempty"`
  27. ImageURL *MediaURL `json:"image_url,omitempty"`
  28. VideoURL *MediaURL `json:"video_url,omitempty"`
  29. AudioURL *MediaURL `json:"audio_url,omitempty"`
  30. Role string `json:"role,omitempty"`
  31. }
  32. type MediaURL struct {
  33. URL string `json:"url,omitempty"`
  34. }
  35. type requestPayload struct {
  36. Model string `json:"model"`
  37. Content []ContentItem `json:"content,omitempty"`
  38. CallbackURL string `json:"callback_url,omitempty"`
  39. ReturnLastFrame *dto.BoolValue `json:"return_last_frame,omitempty"`
  40. ServiceTier string `json:"service_tier,omitempty"`
  41. ExecutionExpiresAfter *dto.IntValue `json:"execution_expires_after,omitempty"`
  42. GenerateAudio *dto.BoolValue `json:"generate_audio,omitempty"`
  43. Draft *dto.BoolValue `json:"draft,omitempty"`
  44. Tools []struct {
  45. Type string `json:"type,omitempty"`
  46. } `json:"tools,omitempty"`
  47. Resolution string `json:"resolution,omitempty"`
  48. Ratio string `json:"ratio,omitempty"`
  49. Duration *dto.IntValue `json:"duration,omitempty"`
  50. Frames *dto.IntValue `json:"frames,omitempty"`
  51. Seed *dto.IntValue `json:"seed,omitempty"`
  52. CameraFixed *dto.BoolValue `json:"camera_fixed,omitempty"`
  53. Watermark *dto.BoolValue `json:"watermark,omitempty"`
  54. }
  55. type responsePayload struct {
  56. ID string `json:"id"` // task_id
  57. }
  58. type responseTask struct {
  59. ID string `json:"id"`
  60. Model string `json:"model"`
  61. Status string `json:"status"`
  62. Content struct {
  63. VideoURL string `json:"video_url"`
  64. } `json:"content"`
  65. Seed int `json:"seed"`
  66. Resolution string `json:"resolution"`
  67. Duration int `json:"duration"`
  68. Ratio string `json:"ratio"`
  69. FramesPerSecond int `json:"framespersecond"`
  70. ServiceTier string `json:"service_tier"`
  71. Tools []struct {
  72. Type string `json:"type"`
  73. } `json:"tools"`
  74. Usage struct {
  75. CompletionTokens int `json:"completion_tokens"`
  76. TotalTokens int `json:"total_tokens"`
  77. ToolUsage struct {
  78. WebSearch int `json:"web_search"`
  79. } `json:"tool_usage"`
  80. } `json:"usage"`
  81. Error struct {
  82. Code string `json:"code"`
  83. Message string `json:"message"`
  84. } `json:"error"`
  85. CreatedAt int64 `json:"created_at"`
  86. UpdatedAt int64 `json:"updated_at"`
  87. }
  88. // ============================
  89. // Adaptor implementation
  90. // ============================
  91. type TaskAdaptor struct {
  92. taskcommon.BaseBilling
  93. ChannelType int
  94. apiKey string
  95. baseURL string
  96. }
  97. func (a *TaskAdaptor) Init(info *relaycommon.RelayInfo) {
  98. a.ChannelType = info.ChannelType
  99. a.baseURL = info.ChannelBaseUrl
  100. a.apiKey = info.ApiKey
  101. }
  102. // ValidateRequestAndSetAction parses body, validates fields and sets default action.
  103. func (a *TaskAdaptor) ValidateRequestAndSetAction(c *gin.Context, info *relaycommon.RelayInfo) (taskErr *dto.TaskError) {
  104. // Accept only POST /v1/video/generations as "generate" action.
  105. return relaycommon.ValidateBasicTaskRequest(c, info, constant.TaskActionGenerate)
  106. }
  107. // BuildRequestURL constructs the upstream URL.
  108. func (a *TaskAdaptor) BuildRequestURL(_ *relaycommon.RelayInfo) (string, error) {
  109. return fmt.Sprintf("%s/api/v3/contents/generations/tasks", a.baseURL), nil
  110. }
  111. // BuildRequestHeader sets required headers.
  112. func (a *TaskAdaptor) BuildRequestHeader(_ *gin.Context, req *http.Request, _ *relaycommon.RelayInfo) error {
  113. req.Header.Set("Content-Type", "application/json")
  114. req.Header.Set("Accept", "application/json")
  115. req.Header.Set("Authorization", "Bearer "+a.apiKey)
  116. return nil
  117. }
  118. // EstimateBilling 检测请求 metadata 中是否包含视频输入,返回视频折扣 OtherRatio。
  119. func (a *TaskAdaptor) EstimateBilling(c *gin.Context, info *relaycommon.RelayInfo) map[string]float64 {
  120. req, err := relaycommon.GetTaskRequest(c)
  121. if err != nil {
  122. return nil
  123. }
  124. if hasVideoInMetadata(req.Metadata) {
  125. if ratio, ok := GetVideoInputRatio(info.OriginModelName); ok {
  126. return map[string]float64{"video_input": ratio}
  127. }
  128. }
  129. return nil
  130. }
  131. // hasVideoInMetadata 直接检查 metadata 的 content 数组是否包含 video_url 条目,
  132. // 避免构建完整的上游 requestPayload。
  133. func hasVideoInMetadata(metadata map[string]interface{}) bool {
  134. if metadata == nil {
  135. return false
  136. }
  137. contentRaw, ok := metadata["content"]
  138. if !ok {
  139. return false
  140. }
  141. contentSlice, ok := contentRaw.([]interface{})
  142. if !ok {
  143. return false
  144. }
  145. for _, item := range contentSlice {
  146. itemMap, ok := item.(map[string]interface{})
  147. if !ok {
  148. continue
  149. }
  150. if itemMap["type"] == "video_url" {
  151. return true
  152. }
  153. if _, has := itemMap["video_url"]; has {
  154. return true
  155. }
  156. }
  157. return false
  158. }
  159. // BuildRequestBody converts request into Doubao specific format.
  160. func (a *TaskAdaptor) BuildRequestBody(c *gin.Context, info *relaycommon.RelayInfo) (io.Reader, error) {
  161. req, err := relaycommon.GetTaskRequest(c)
  162. if err != nil {
  163. return nil, err
  164. }
  165. body, err := a.convertToRequestPayload(&req)
  166. if err != nil {
  167. return nil, errors.Wrap(err, "convert request payload failed")
  168. }
  169. if info.IsModelMapped {
  170. body.Model = info.UpstreamModelName
  171. } else {
  172. info.UpstreamModelName = body.Model
  173. }
  174. data, err := common.Marshal(body)
  175. if err != nil {
  176. return nil, err
  177. }
  178. return bytes.NewReader(data), nil
  179. }
  180. // DoRequest delegates to common helper.
  181. func (a *TaskAdaptor) DoRequest(c *gin.Context, info *relaycommon.RelayInfo, requestBody io.Reader) (*http.Response, error) {
  182. return channel.DoTaskApiRequest(a, c, info, requestBody)
  183. }
  184. // DoResponse handles upstream response, returns taskID etc.
  185. func (a *TaskAdaptor) DoResponse(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo) (taskID string, taskData []byte, taskErr *dto.TaskError) {
  186. responseBody, err := io.ReadAll(resp.Body)
  187. if err != nil {
  188. taskErr = service.TaskErrorWrapper(err, "read_response_body_failed", http.StatusInternalServerError)
  189. return
  190. }
  191. _ = resp.Body.Close()
  192. // Parse Doubao response
  193. var dResp responsePayload
  194. if err := common.Unmarshal(responseBody, &dResp); err != nil {
  195. taskErr = service.TaskErrorWrapper(errors.Wrapf(err, "body: %s", responseBody), "unmarshal_response_body_failed", http.StatusInternalServerError)
  196. return
  197. }
  198. if dResp.ID == "" {
  199. taskErr = service.TaskErrorWrapper(fmt.Errorf("task_id is empty"), "invalid_response", http.StatusInternalServerError)
  200. return
  201. }
  202. ov := dto.NewOpenAIVideo()
  203. ov.ID = info.PublicTaskID
  204. ov.TaskID = info.PublicTaskID
  205. ov.CreatedAt = time.Now().Unix()
  206. ov.Model = info.OriginModelName
  207. c.JSON(http.StatusOK, ov)
  208. return dResp.ID, responseBody, nil
  209. }
  210. // FetchTask fetch task status
  211. func (a *TaskAdaptor) FetchTask(baseUrl, key string, body map[string]any, proxy string) (*http.Response, error) {
  212. taskID, ok := body["task_id"].(string)
  213. if !ok {
  214. return nil, fmt.Errorf("invalid task_id")
  215. }
  216. uri := fmt.Sprintf("%s/api/v3/contents/generations/tasks/%s", baseUrl, taskID)
  217. req, err := http.NewRequest(http.MethodGet, uri, nil)
  218. if err != nil {
  219. return nil, err
  220. }
  221. req.Header.Set("Accept", "application/json")
  222. req.Header.Set("Content-Type", "application/json")
  223. req.Header.Set("Authorization", "Bearer "+key)
  224. client, err := service.GetHttpClientWithProxy(proxy)
  225. if err != nil {
  226. return nil, fmt.Errorf("new proxy http client failed: %w", err)
  227. }
  228. return client.Do(req)
  229. }
  230. func (a *TaskAdaptor) GetModelList() []string {
  231. return ModelList
  232. }
  233. func (a *TaskAdaptor) GetChannelName() string {
  234. return ChannelName
  235. }
  236. func (a *TaskAdaptor) convertToRequestPayload(req *relaycommon.TaskSubmitReq) (*requestPayload, error) {
  237. r := requestPayload{
  238. Model: req.Model,
  239. Content: []ContentItem{},
  240. }
  241. // Add images if present
  242. if req.HasImage() {
  243. for _, imgURL := range req.Images {
  244. r.Content = append(r.Content, ContentItem{
  245. Type: "image_url",
  246. ImageURL: &MediaURL{
  247. URL: imgURL,
  248. },
  249. })
  250. }
  251. }
  252. metadata := req.Metadata
  253. if err := taskcommon.UnmarshalMetadata(metadata, &r); err != nil {
  254. return nil, errors.Wrap(err, "unmarshal metadata failed")
  255. }
  256. if sec, _ := strconv.Atoi(req.Seconds); sec > 0 {
  257. r.Duration = lo.ToPtr(dto.IntValue(sec))
  258. }
  259. r.Content = lo.Reject(r.Content, func(c ContentItem, _ int) bool { return c.Type == "text" })
  260. r.Content = append(r.Content, ContentItem{
  261. Type: "text",
  262. Text: req.Prompt,
  263. })
  264. return &r, nil
  265. }
  266. func (a *TaskAdaptor) ParseTaskResult(respBody []byte) (*relaycommon.TaskInfo, error) {
  267. resTask := responseTask{}
  268. if err := common.Unmarshal(respBody, &resTask); err != nil {
  269. return nil, errors.Wrap(err, "unmarshal task result failed")
  270. }
  271. taskResult := relaycommon.TaskInfo{
  272. Code: 0,
  273. }
  274. // Map Doubao status to internal status
  275. switch resTask.Status {
  276. case "pending", "queued":
  277. taskResult.Status = model.TaskStatusQueued
  278. taskResult.Progress = "10%"
  279. case "processing", "running":
  280. taskResult.Status = model.TaskStatusInProgress
  281. taskResult.Progress = "50%"
  282. case "succeeded":
  283. taskResult.Status = model.TaskStatusSuccess
  284. taskResult.Progress = "100%"
  285. taskResult.Url = resTask.Content.VideoURL
  286. // 解析 usage 信息用于按倍率计费
  287. taskResult.CompletionTokens = resTask.Usage.CompletionTokens
  288. taskResult.TotalTokens = resTask.Usage.TotalTokens
  289. case "failed":
  290. taskResult.Status = model.TaskStatusFailure
  291. taskResult.Progress = "100%"
  292. taskResult.Reason = resTask.Error.Message
  293. default:
  294. // Unknown status, treat as processing
  295. taskResult.Status = model.TaskStatusInProgress
  296. taskResult.Progress = "30%"
  297. }
  298. return &taskResult, nil
  299. }
  300. func (a *TaskAdaptor) ConvertToOpenAIVideo(originTask *model.Task) ([]byte, error) {
  301. var dResp responseTask
  302. if err := common.Unmarshal(originTask.Data, &dResp); err != nil {
  303. return nil, errors.Wrap(err, "unmarshal doubao task data failed")
  304. }
  305. openAIVideo := dto.NewOpenAIVideo()
  306. openAIVideo.ID = originTask.TaskID
  307. openAIVideo.TaskID = originTask.TaskID
  308. openAIVideo.Status = originTask.Status.ToVideoStatus()
  309. openAIVideo.SetProgressStr(originTask.Progress)
  310. openAIVideo.SetMetadata("url", dResp.Content.VideoURL)
  311. openAIVideo.CreatedAt = originTask.CreatedAt
  312. openAIVideo.CompletedAt = originTask.UpdatedAt
  313. openAIVideo.Model = originTask.Properties.OriginModelName
  314. if dResp.Status == "failed" {
  315. openAIVideo.Error = &dto.OpenAIVideoError{
  316. Message: dResp.Error.Message,
  317. Code: dResp.Error.Code,
  318. }
  319. }
  320. return common.Marshal(openAIVideo)
  321. }