video_proxy_gemini.go 6.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263
  1. package controller
  2. import (
  3. "fmt"
  4. "io"
  5. "strconv"
  6. "strings"
  7. "github.com/QuantumNous/new-api/common"
  8. "github.com/QuantumNous/new-api/constant"
  9. "github.com/QuantumNous/new-api/model"
  10. "github.com/QuantumNous/new-api/relay"
  11. )
  12. func getGeminiVideoURL(channel *model.Channel, task *model.Task, apiKey string) (string, error) {
  13. if channel == nil || task == nil {
  14. return "", fmt.Errorf("invalid channel or task")
  15. }
  16. if url := extractGeminiVideoURLFromTaskData(task); url != "" {
  17. return ensureAPIKey(url, apiKey), nil
  18. }
  19. baseURL := constant.ChannelBaseURLs[channel.Type]
  20. if channel.GetBaseURL() != "" {
  21. baseURL = channel.GetBaseURL()
  22. }
  23. adaptor := relay.GetTaskAdaptor(constant.TaskPlatform(strconv.Itoa(channel.Type)))
  24. if adaptor == nil {
  25. return "", fmt.Errorf("gemini task adaptor not found")
  26. }
  27. if apiKey == "" {
  28. return "", fmt.Errorf("api key not available for task")
  29. }
  30. proxy := channel.GetSetting().Proxy
  31. resp, err := adaptor.FetchTask(baseURL, apiKey, map[string]any{
  32. "task_id": task.GetUpstreamTaskID(),
  33. "action": task.Action,
  34. }, proxy)
  35. if err != nil {
  36. return "", fmt.Errorf("fetch task failed: %w", err)
  37. }
  38. defer resp.Body.Close()
  39. body, err := io.ReadAll(resp.Body)
  40. if err != nil {
  41. return "", fmt.Errorf("read task response failed: %w", err)
  42. }
  43. taskInfo, parseErr := adaptor.ParseTaskResult(body)
  44. if parseErr == nil && taskInfo != nil && taskInfo.RemoteUrl != "" {
  45. return ensureAPIKey(taskInfo.RemoteUrl, apiKey), nil
  46. }
  47. if url := extractGeminiVideoURLFromPayload(body); url != "" {
  48. return ensureAPIKey(url, apiKey), nil
  49. }
  50. if parseErr != nil {
  51. return "", fmt.Errorf("parse task result failed: %w", parseErr)
  52. }
  53. return "", fmt.Errorf("gemini video url not found")
  54. }
  55. func extractGeminiVideoURLFromTaskData(task *model.Task) string {
  56. if task == nil || len(task.Data) == 0 {
  57. return ""
  58. }
  59. var payload map[string]any
  60. if err := common.Unmarshal(task.Data, &payload); err != nil {
  61. return ""
  62. }
  63. return extractGeminiVideoURLFromMap(payload)
  64. }
  65. func extractGeminiVideoURLFromPayload(body []byte) string {
  66. var payload map[string]any
  67. if err := common.Unmarshal(body, &payload); err != nil {
  68. return ""
  69. }
  70. return extractGeminiVideoURLFromMap(payload)
  71. }
  72. func extractGeminiVideoURLFromMap(payload map[string]any) string {
  73. if payload == nil {
  74. return ""
  75. }
  76. if uri, ok := payload["uri"].(string); ok && uri != "" {
  77. return uri
  78. }
  79. if resp, ok := payload["response"].(map[string]any); ok {
  80. if uri := extractGeminiVideoURLFromResponse(resp); uri != "" {
  81. return uri
  82. }
  83. }
  84. return ""
  85. }
  86. func extractGeminiVideoURLFromResponse(resp map[string]any) string {
  87. if resp == nil {
  88. return ""
  89. }
  90. if gvr, ok := resp["generateVideoResponse"].(map[string]any); ok {
  91. if uri := extractGeminiVideoURLFromGeneratedSamples(gvr); uri != "" {
  92. return uri
  93. }
  94. }
  95. if videos, ok := resp["videos"].([]any); ok {
  96. for _, video := range videos {
  97. if vm, ok := video.(map[string]any); ok {
  98. if uri, ok := vm["uri"].(string); ok && uri != "" {
  99. return uri
  100. }
  101. }
  102. }
  103. }
  104. if uri, ok := resp["video"].(string); ok && uri != "" {
  105. return uri
  106. }
  107. if uri, ok := resp["uri"].(string); ok && uri != "" {
  108. return uri
  109. }
  110. return ""
  111. }
  // extractGeminiVideoURLFromGeneratedSamples walks the "generatedSamples"
  // array of gvr and returns the first non-empty "uri" string found under a
  // sample's "video" object. Entries of an unexpected type are skipped. It
  // returns "" when gvr is nil or no sample carries a URI.
  func extractGeminiVideoURLFromGeneratedSamples(gvr map[string]any) string {
  	if gvr == nil {
  		return ""
  	}

  	list, isArray := gvr["generatedSamples"].([]any)
  	if !isArray {
  		return ""
  	}
  	for _, item := range list {
  		entry, isObject := item.(map[string]any)
  		if !isObject {
  			continue
  		}
  		clip, isObject := entry["video"].(map[string]any)
  		if !isObject {
  			continue
  		}
  		if link, _ := clip["uri"].(string); link != "" {
  			return link
  		}
  	}
  	return ""
  }
  129. func getVertexVideoURL(channel *model.Channel, task *model.Task) (string, error) {
  130. if channel == nil || task == nil {
  131. return "", fmt.Errorf("invalid channel or task")
  132. }
  133. if url := strings.TrimSpace(task.GetResultURL()); url != "" {
  134. return url, nil
  135. }
  136. if url := extractVertexVideoURLFromTaskData(task); url != "" {
  137. return url, nil
  138. }
  139. baseURL := constant.ChannelBaseURLs[channel.Type]
  140. if channel.GetBaseURL() != "" {
  141. baseURL = channel.GetBaseURL()
  142. }
  143. adaptor := relay.GetTaskAdaptor(constant.TaskPlatform(strconv.Itoa(channel.Type)))
  144. if adaptor == nil {
  145. return "", fmt.Errorf("vertex task adaptor not found")
  146. }
  147. resp, err := adaptor.FetchTask(baseURL, channel.Key, map[string]any{
  148. "task_id": task.GetUpstreamTaskID(),
  149. "action": task.Action,
  150. }, channel.GetSetting().Proxy)
  151. if err != nil {
  152. return "", fmt.Errorf("fetch task failed: %w", err)
  153. }
  154. defer resp.Body.Close()
  155. body, err := io.ReadAll(resp.Body)
  156. if err != nil {
  157. return "", fmt.Errorf("read task response failed: %w", err)
  158. }
  159. taskInfo, parseErr := adaptor.ParseTaskResult(body)
  160. if parseErr == nil && taskInfo != nil && strings.TrimSpace(taskInfo.Url) != "" {
  161. return taskInfo.Url, nil
  162. }
  163. if url := extractVertexVideoURLFromPayload(body); url != "" {
  164. return url, nil
  165. }
  166. if parseErr != nil {
  167. return "", fmt.Errorf("parse task result failed: %w", parseErr)
  168. }
  169. return "", fmt.Errorf("vertex video url not found")
  170. }
  171. func extractVertexVideoURLFromTaskData(task *model.Task) string {
  172. if task == nil || len(task.Data) == 0 {
  173. return ""
  174. }
  175. return extractVertexVideoURLFromPayload(task.Data)
  176. }
  177. func extractVertexVideoURLFromPayload(body []byte) string {
  178. var payload map[string]any
  179. if err := common.Unmarshal(body, &payload); err != nil {
  180. return ""
  181. }
  182. resp, ok := payload["response"].(map[string]any)
  183. if !ok || resp == nil {
  184. return ""
  185. }
  186. if videos, ok := resp["videos"].([]any); ok && len(videos) > 0 {
  187. if video, ok := videos[0].(map[string]any); ok && video != nil {
  188. if b64, _ := video["bytesBase64Encoded"].(string); strings.TrimSpace(b64) != "" {
  189. mime, _ := video["mimeType"].(string)
  190. enc, _ := video["encoding"].(string)
  191. return buildVideoDataURL(mime, enc, b64)
  192. }
  193. }
  194. }
  195. if b64, _ := resp["bytesBase64Encoded"].(string); strings.TrimSpace(b64) != "" {
  196. enc, _ := resp["encoding"].(string)
  197. return buildVideoDataURL("", enc, b64)
  198. }
  199. if video, _ := resp["video"].(string); strings.TrimSpace(video) != "" {
  200. if strings.HasPrefix(video, "data:") || strings.HasPrefix(video, "http://") || strings.HasPrefix(video, "https://") {
  201. return video
  202. }
  203. enc, _ := resp["encoding"].(string)
  204. return buildVideoDataURL("", enc, video)
  205. }
  206. return ""
  207. }
  // buildVideoDataURL assembles a "data:<mime>;base64,<data>" URL.
  //
  // The media type is mimeType with surrounding whitespace trimmed. When that
  // is empty it is derived from encoding instead: an empty encoding defaults to
  // "mp4", an encoding containing "/" is used as the full media type, and any
  // other value is prefixed with "video/". base64Data is appended verbatim.
  func buildVideoDataURL(mimeType string, encoding string, base64Data string) string {
  	mediaType := strings.TrimSpace(mimeType)
  	if mediaType != "" {
  		return "data:" + mediaType + ";base64," + base64Data
  	}

  	format := strings.TrimSpace(encoding)
  	if format == "" {
  		format = "mp4"
  	}
  	if !strings.Contains(format, "/") {
  		format = "video/" + format
  	}
  	return "data:" + format + ";base64," + base64Data
  }
  // ensureAPIKey returns uri with a "key=<key>" query parameter added, unless
  // the query string already contains a parameter named exactly "key".
  //
  // uri is returned unchanged when uri or key is empty. The parameter name is
  // matched against real query parameters only, so "apikey=..." or a path
  // segment that merely contains "key=" does not suppress the addition. The
  // parameter is inserted before any "#fragment" so it stays part of the query.
  // key is appended verbatim, without URL escaping.
  func ensureAPIKey(uri, key string) string {
  	if key == "" || uri == "" {
  		return uri
  	}

  	// Set the fragment aside: text after '#' is not part of the query.
  	base, fragment, hasFragment := strings.Cut(uri, "#")
  	_, rawQuery, hasQuery := strings.Cut(base, "?")

  	for _, pair := range strings.Split(rawQuery, "&") {
  		if name, _, _ := strings.Cut(pair, "="); name == "key" {
  			return uri
  		}
  	}

  	// Pick the separator so no "?&" or "&&" sequence is produced.
  	sep := "&"
  	switch {
  	case !hasQuery:
  		sep = "?"
  	case rawQuery == "" || strings.HasSuffix(rawQuery, "&"):
  		sep = ""
  	}

  	out := base + sep + "key=" + key
  	if hasFragment {
  		out += "#" + fragment
  	}
  	return out
  }