video_proxy_gemini.go 7.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294
  1. package controller
import (
	"fmt"
	"io"
	"net/url"
	"strconv"
	"strings"

	"github.com/QuantumNous/new-api/common"
	"github.com/QuantumNous/new-api/constant"
	"github.com/QuantumNous/new-api/model"
	"github.com/QuantumNous/new-api/relay"
)
  12. func getGeminiVideoURL(channel *model.Channel, task *model.Task, apiKey string) (string, error) {
  13. if channel == nil || task == nil {
  14. return "", fmt.Errorf("invalid channel or task")
  15. }
  16. if url := extractGeminiVideoURLFromTaskData(task); url != "" {
  17. return ensureAPIKey(url, apiKey), nil
  18. }
  19. baseURL := constant.ChannelBaseURLs[channel.Type]
  20. if channel.GetBaseURL() != "" {
  21. baseURL = channel.GetBaseURL()
  22. }
  23. adaptor := relay.GetTaskAdaptor(constant.TaskPlatform(strconv.Itoa(channel.Type)))
  24. if adaptor == nil {
  25. return "", fmt.Errorf("gemini task adaptor not found")
  26. }
  27. if apiKey == "" {
  28. return "", fmt.Errorf("api key not available for task")
  29. }
  30. proxy := channel.GetSetting().Proxy
  31. resp, err := adaptor.FetchTask(baseURL, apiKey, map[string]any{
  32. "task_id": task.GetUpstreamTaskID(),
  33. "action": task.Action,
  34. }, proxy)
  35. if err != nil {
  36. return "", fmt.Errorf("fetch task failed: %w", err)
  37. }
  38. defer resp.Body.Close()
  39. body, err := io.ReadAll(resp.Body)
  40. if err != nil {
  41. return "", fmt.Errorf("read task response failed: %w", err)
  42. }
  43. taskInfo, parseErr := adaptor.ParseTaskResult(body)
  44. if parseErr == nil && taskInfo != nil && taskInfo.RemoteUrl != "" {
  45. return ensureAPIKey(taskInfo.RemoteUrl, apiKey), nil
  46. }
  47. if url := extractGeminiVideoURLFromPayload(body); url != "" {
  48. return ensureAPIKey(url, apiKey), nil
  49. }
  50. if parseErr != nil {
  51. return "", fmt.Errorf("parse task result failed: %w", parseErr)
  52. }
  53. return "", fmt.Errorf("gemini video url not found")
  54. }
  55. func extractGeminiVideoURLFromTaskData(task *model.Task) string {
  56. if task == nil || len(task.Data) == 0 {
  57. return ""
  58. }
  59. var payload map[string]any
  60. if err := common.Unmarshal(task.Data, &payload); err != nil {
  61. return ""
  62. }
  63. return extractGeminiVideoURLFromMap(payload)
  64. }
  65. func extractGeminiVideoURLFromPayload(body []byte) string {
  66. var payload map[string]any
  67. if err := common.Unmarshal(body, &payload); err != nil {
  68. return ""
  69. }
  70. return extractGeminiVideoURLFromMap(payload)
  71. }
  72. func extractGeminiVideoURLFromMap(payload map[string]any) string {
  73. if payload == nil {
  74. return ""
  75. }
  76. if uri, ok := payload["uri"].(string); ok && uri != "" {
  77. return uri
  78. }
  79. if resp, ok := payload["response"].(map[string]any); ok {
  80. if uri := extractGeminiVideoURLFromResponse(resp); uri != "" {
  81. return uri
  82. }
  83. }
  84. return ""
  85. }
  86. func extractGeminiVideoURLFromResponse(resp map[string]any) string {
  87. if resp == nil {
  88. return ""
  89. }
  90. if gvr, ok := resp["generateVideoResponse"].(map[string]any); ok {
  91. if uri := extractGeminiVideoURLFromGeneratedSamples(gvr); uri != "" {
  92. return uri
  93. }
  94. }
  95. if videos, ok := resp["videos"].([]any); ok {
  96. for _, video := range videos {
  97. if vm, ok := video.(map[string]any); ok {
  98. if uri, ok := vm["uri"].(string); ok && uri != "" {
  99. return uri
  100. }
  101. }
  102. }
  103. }
  104. if uri, ok := resp["video"].(string); ok && uri != "" {
  105. return uri
  106. }
  107. if uri, ok := resp["uri"].(string); ok && uri != "" {
  108. return uri
  109. }
  110. return ""
  111. }
  112. func extractGeminiVideoURLFromGeneratedSamples(gvr map[string]any) string {
  113. if gvr == nil {
  114. return ""
  115. }
  116. if samples, ok := gvr["generatedSamples"].([]any); ok {
  117. for _, sample := range samples {
  118. if sm, ok := sample.(map[string]any); ok {
  119. if video, ok := sm["video"].(map[string]any); ok {
  120. if uri, ok := video["uri"].(string); ok && uri != "" {
  121. return uri
  122. }
  123. }
  124. }
  125. }
  126. }
  127. return ""
  128. }
  129. func getVertexVideoURL(channel *model.Channel, task *model.Task) (string, error) {
  130. if channel == nil || task == nil {
  131. return "", fmt.Errorf("invalid channel or task")
  132. }
  133. if url := strings.TrimSpace(task.GetResultURL()); url != "" && !isTaskProxyContentURL(url, task.TaskID) {
  134. return url, nil
  135. }
  136. if url := extractVertexVideoURLFromTaskData(task); url != "" {
  137. return url, nil
  138. }
  139. baseURL := constant.ChannelBaseURLs[channel.Type]
  140. if channel.GetBaseURL() != "" {
  141. baseURL = channel.GetBaseURL()
  142. }
  143. adaptor := relay.GetTaskAdaptor(constant.TaskPlatform(strconv.Itoa(channel.Type)))
  144. if adaptor == nil {
  145. return "", fmt.Errorf("vertex task adaptor not found")
  146. }
  147. key := getVertexTaskKey(channel, task)
  148. if key == "" {
  149. return "", fmt.Errorf("vertex key not available for task")
  150. }
  151. resp, err := adaptor.FetchTask(baseURL, key, map[string]any{
  152. "task_id": task.GetUpstreamTaskID(),
  153. "action": task.Action,
  154. }, channel.GetSetting().Proxy)
  155. if err != nil {
  156. return "", fmt.Errorf("fetch task failed: %w", err)
  157. }
  158. defer resp.Body.Close()
  159. body, err := io.ReadAll(resp.Body)
  160. if err != nil {
  161. return "", fmt.Errorf("read task response failed: %w", err)
  162. }
  163. taskInfo, parseErr := adaptor.ParseTaskResult(body)
  164. if parseErr == nil && taskInfo != nil && strings.TrimSpace(taskInfo.Url) != "" {
  165. return taskInfo.Url, nil
  166. }
  167. if url := extractVertexVideoURLFromPayload(body); url != "" {
  168. return url, nil
  169. }
  170. if parseErr != nil {
  171. return "", fmt.Errorf("parse task result failed: %w", parseErr)
  172. }
  173. return "", fmt.Errorf("vertex video url not found")
  174. }
  175. func isTaskProxyContentURL(url string, taskID string) bool {
  176. if strings.TrimSpace(url) == "" || strings.TrimSpace(taskID) == "" {
  177. return false
  178. }
  179. return strings.Contains(url, "/v1/videos/"+taskID+"/content")
  180. }
  181. func getVertexTaskKey(channel *model.Channel, task *model.Task) string {
  182. if task != nil {
  183. if key := strings.TrimSpace(task.PrivateData.Key); key != "" {
  184. return key
  185. }
  186. }
  187. if channel == nil {
  188. return ""
  189. }
  190. keys := channel.GetKeys()
  191. for _, key := range keys {
  192. key = strings.TrimSpace(key)
  193. if key != "" {
  194. return key
  195. }
  196. }
  197. return strings.TrimSpace(channel.Key)
  198. }
  199. func extractVertexVideoURLFromTaskData(task *model.Task) string {
  200. if task == nil || len(task.Data) == 0 {
  201. return ""
  202. }
  203. return extractVertexVideoURLFromPayload(task.Data)
  204. }
  205. func extractVertexVideoURLFromPayload(body []byte) string {
  206. var payload map[string]any
  207. if err := common.Unmarshal(body, &payload); err != nil {
  208. return ""
  209. }
  210. resp, ok := payload["response"].(map[string]any)
  211. if !ok || resp == nil {
  212. return ""
  213. }
  214. if videos, ok := resp["videos"].([]any); ok && len(videos) > 0 {
  215. if video, ok := videos[0].(map[string]any); ok && video != nil {
  216. if b64, _ := video["bytesBase64Encoded"].(string); strings.TrimSpace(b64) != "" {
  217. mime, _ := video["mimeType"].(string)
  218. enc, _ := video["encoding"].(string)
  219. return buildVideoDataURL(mime, enc, b64)
  220. }
  221. }
  222. }
  223. if b64, _ := resp["bytesBase64Encoded"].(string); strings.TrimSpace(b64) != "" {
  224. enc, _ := resp["encoding"].(string)
  225. return buildVideoDataURL("", enc, b64)
  226. }
  227. if video, _ := resp["video"].(string); strings.TrimSpace(video) != "" {
  228. if strings.HasPrefix(video, "data:") || strings.HasPrefix(video, "http://") || strings.HasPrefix(video, "https://") {
  229. return video
  230. }
  231. enc, _ := resp["encoding"].(string)
  232. return buildVideoDataURL("", enc, video)
  233. }
  234. return ""
  235. }
  236. func buildVideoDataURL(mimeType string, encoding string, base64Data string) string {
  237. mime := strings.TrimSpace(mimeType)
  238. if mime == "" {
  239. enc := strings.TrimSpace(encoding)
  240. if enc == "" {
  241. enc = "mp4"
  242. }
  243. if strings.Contains(enc, "/") {
  244. mime = enc
  245. } else {
  246. mime = "video/" + enc
  247. }
  248. }
  249. return "data:" + mime + ";base64," + base64Data
  250. }
  251. func ensureAPIKey(uri, key string) string {
  252. if key == "" || uri == "" {
  253. return uri
  254. }
  255. if strings.Contains(uri, "key=") {
  256. return uri
  257. }
  258. if strings.Contains(uri, "?") {
  259. return fmt.Sprintf("%s&key=%s", uri, key)
  260. }
  261. return fmt.Sprintf("%s?key=%s", uri, key)
  262. }