video_proxy_gemini.go 7.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287
  1. package controller
  import (
  	"fmt"
  	"io"
  	"net/url"
  	"strconv"
  	"strings"

  	"github.com/QuantumNous/new-api/common"
  	"github.com/QuantumNous/new-api/constant"
  	"github.com/QuantumNous/new-api/model"
  	"github.com/QuantumNous/new-api/relay"
  )
  12. func getGeminiVideoURL(channel *model.Channel, task *model.Task, apiKey string) (string, error) {
  13. if channel == nil || task == nil {
  14. return "", fmt.Errorf("invalid channel or task")
  15. }
  16. if url := extractGeminiVideoURLFromTaskData(task); url != "" {
  17. return ensureAPIKey(url, apiKey), nil
  18. }
  19. baseURL := constant.ChannelBaseURLs[channel.Type]
  20. if channel.GetBaseURL() != "" {
  21. baseURL = channel.GetBaseURL()
  22. }
  23. adaptor := relay.GetTaskAdaptor(constant.TaskPlatform(strconv.Itoa(channel.Type)))
  24. if adaptor == nil {
  25. return "", fmt.Errorf("gemini task adaptor not found")
  26. }
  27. if apiKey == "" {
  28. return "", fmt.Errorf("api key not available for task")
  29. }
  30. proxy := channel.GetSetting().Proxy
  31. resp, err := adaptor.FetchTask(baseURL, apiKey, map[string]any{
  32. "task_id": task.GetUpstreamTaskID(),
  33. "action": task.Action,
  34. }, proxy)
  35. if err != nil {
  36. return "", fmt.Errorf("fetch task failed: %w", err)
  37. }
  38. defer resp.Body.Close()
  39. body, err := io.ReadAll(resp.Body)
  40. if err != nil {
  41. return "", fmt.Errorf("read task response failed: %w", err)
  42. }
  43. taskInfo, parseErr := adaptor.ParseTaskResult(body)
  44. if parseErr == nil && taskInfo != nil && taskInfo.RemoteUrl != "" {
  45. return ensureAPIKey(taskInfo.RemoteUrl, apiKey), nil
  46. }
  47. if url := extractGeminiVideoURLFromPayload(body); url != "" {
  48. return ensureAPIKey(url, apiKey), nil
  49. }
  50. if parseErr != nil {
  51. return "", fmt.Errorf("parse task result failed: %w", parseErr)
  52. }
  53. return "", fmt.Errorf("gemini video url not found")
  54. }
  55. func extractGeminiVideoURLFromTaskData(task *model.Task) string {
  56. if task == nil || len(task.Data) == 0 {
  57. return ""
  58. }
  59. var payload map[string]any
  60. if err := common.Unmarshal(task.Data, &payload); err != nil {
  61. return ""
  62. }
  63. return extractGeminiVideoURLFromMap(payload)
  64. }
  65. func extractGeminiVideoURLFromPayload(body []byte) string {
  66. var payload map[string]any
  67. if err := common.Unmarshal(body, &payload); err != nil {
  68. return ""
  69. }
  70. return extractGeminiVideoURLFromMap(payload)
  71. }
  72. func extractGeminiVideoURLFromMap(payload map[string]any) string {
  73. if payload == nil {
  74. return ""
  75. }
  76. if uri, ok := payload["uri"].(string); ok && uri != "" {
  77. return uri
  78. }
  79. if resp, ok := payload["response"].(map[string]any); ok {
  80. if uri := extractGeminiVideoURLFromResponse(resp); uri != "" {
  81. return uri
  82. }
  83. }
  84. return ""
  85. }
  86. func extractGeminiVideoURLFromResponse(resp map[string]any) string {
  87. if resp == nil {
  88. return ""
  89. }
  90. if gvr, ok := resp["generateVideoResponse"].(map[string]any); ok {
  91. if uri := extractGeminiVideoURLFromGeneratedSamples(gvr); uri != "" {
  92. return uri
  93. }
  94. }
  95. if videos, ok := resp["videos"].([]any); ok {
  96. for _, video := range videos {
  97. if vm, ok := video.(map[string]any); ok {
  98. if uri, ok := vm["uri"].(string); ok && uri != "" {
  99. return uri
  100. }
  101. }
  102. }
  103. }
  104. if uri, ok := resp["video"].(string); ok && uri != "" {
  105. return uri
  106. }
  107. if uri, ok := resp["uri"].(string); ok && uri != "" {
  108. return uri
  109. }
  110. return ""
  111. }
  // extractGeminiVideoURLFromGeneratedSamples walks the "generatedSamples"
  // array of gvr and returns the first non-empty sample["video"]["uri"]
  // string. Entries that are not objects, or whose "video" value is not an
  // object, are skipped. It returns "" when nothing matches.
  func extractGeminiVideoURLFromGeneratedSamples(gvr map[string]any) string {
  	// Indexing a nil map is safe; a failed assertion leaves samples nil and
  	// the loop body never runs.
  	samples, _ := gvr["generatedSamples"].([]any)
  	for _, raw := range samples {
  		sample, isObject := raw.(map[string]any)
  		if !isObject {
  			continue
  		}
  		video, isObject := sample["video"].(map[string]any)
  		if !isObject {
  			continue
  		}
  		if found, _ := video["uri"].(string); found != "" {
  			return found
  		}
  	}
  	return ""
  }
  129. func getVertexVideoURL(channel *model.Channel, task *model.Task) (string, error) {
  130. if channel == nil || task == nil {
  131. return "", fmt.Errorf("invalid channel or task")
  132. }
  133. if url := strings.TrimSpace(task.GetResultURL()); url != "" {
  134. return url, nil
  135. }
  136. if url := extractVertexVideoURLFromTaskData(task); url != "" {
  137. return url, nil
  138. }
  139. baseURL := constant.ChannelBaseURLs[channel.Type]
  140. if channel.GetBaseURL() != "" {
  141. baseURL = channel.GetBaseURL()
  142. }
  143. adaptor := relay.GetTaskAdaptor(constant.TaskPlatform(strconv.Itoa(channel.Type)))
  144. if adaptor == nil {
  145. return "", fmt.Errorf("vertex task adaptor not found")
  146. }
  147. key := getVertexTaskKey(channel, task)
  148. if key == "" {
  149. return "", fmt.Errorf("vertex key not available for task")
  150. }
  151. resp, err := adaptor.FetchTask(baseURL, key, map[string]any{
  152. "task_id": task.GetUpstreamTaskID(),
  153. "action": task.Action,
  154. }, channel.GetSetting().Proxy)
  155. if err != nil {
  156. return "", fmt.Errorf("fetch task failed: %w", err)
  157. }
  158. defer resp.Body.Close()
  159. body, err := io.ReadAll(resp.Body)
  160. if err != nil {
  161. return "", fmt.Errorf("read task response failed: %w", err)
  162. }
  163. taskInfo, parseErr := adaptor.ParseTaskResult(body)
  164. if parseErr == nil && taskInfo != nil && strings.TrimSpace(taskInfo.Url) != "" {
  165. return taskInfo.Url, nil
  166. }
  167. if url := extractVertexVideoURLFromPayload(body); url != "" {
  168. return url, nil
  169. }
  170. if parseErr != nil {
  171. return "", fmt.Errorf("parse task result failed: %w", parseErr)
  172. }
  173. return "", fmt.Errorf("vertex video url not found")
  174. }
  175. func getVertexTaskKey(channel *model.Channel, task *model.Task) string {
  176. if task != nil {
  177. if key := strings.TrimSpace(task.PrivateData.Key); key != "" {
  178. return key
  179. }
  180. }
  181. if channel == nil {
  182. return ""
  183. }
  184. keys := channel.GetKeys()
  185. for _, key := range keys {
  186. key = strings.TrimSpace(key)
  187. if key != "" {
  188. return key
  189. }
  190. }
  191. return strings.TrimSpace(channel.Key)
  192. }
  193. func extractVertexVideoURLFromTaskData(task *model.Task) string {
  194. if task == nil || len(task.Data) == 0 {
  195. return ""
  196. }
  197. return extractVertexVideoURLFromPayload(task.Data)
  198. }
  199. func extractVertexVideoURLFromPayload(body []byte) string {
  200. var payload map[string]any
  201. if err := common.Unmarshal(body, &payload); err != nil {
  202. return ""
  203. }
  204. resp, ok := payload["response"].(map[string]any)
  205. if !ok || resp == nil {
  206. return ""
  207. }
  208. if videos, ok := resp["videos"].([]any); ok && len(videos) > 0 {
  209. if video, ok := videos[0].(map[string]any); ok && video != nil {
  210. if b64, _ := video["bytesBase64Encoded"].(string); strings.TrimSpace(b64) != "" {
  211. mime, _ := video["mimeType"].(string)
  212. enc, _ := video["encoding"].(string)
  213. return buildVideoDataURL(mime, enc, b64)
  214. }
  215. }
  216. }
  217. if b64, _ := resp["bytesBase64Encoded"].(string); strings.TrimSpace(b64) != "" {
  218. enc, _ := resp["encoding"].(string)
  219. return buildVideoDataURL("", enc, b64)
  220. }
  221. if video, _ := resp["video"].(string); strings.TrimSpace(video) != "" {
  222. if strings.HasPrefix(video, "data:") || strings.HasPrefix(video, "http://") || strings.HasPrefix(video, "https://") {
  223. return video
  224. }
  225. enc, _ := resp["encoding"].(string)
  226. return buildVideoDataURL("", enc, video)
  227. }
  228. return ""
  229. }
  // buildVideoDataURL assembles "data:<mime>;base64,<base64Data>".
  //
  // The media type is mimeType (trimmed) when non-blank. Otherwise it is
  // derived from encoding (trimmed): a blank encoding gives "video/mp4", an
  // encoding containing "/" is used verbatim, and anything else is prefixed
  // with "video/". base64Data is appended unchanged.
  func buildVideoDataURL(mimeType string, encoding string, base64Data string) string {
  	mediaType := strings.TrimSpace(mimeType)
  	if mediaType == "" {
  		switch format := strings.TrimSpace(encoding); {
  		case format == "":
  			mediaType = "video/mp4"
  		case strings.Contains(format, "/"):
  			mediaType = format
  		default:
  			mediaType = "video/" + format
  		}
  	}
  	return strings.Join([]string{"data:", mediaType, ";base64,", base64Data}, "")
  }
  // ensureAPIKey returns uri with a "key" query parameter carrying key.
  //
  // uri is returned unchanged when uri or key is empty, or when the query
  // string already contains a parameter named exactly "key". Only parameter
  // names are inspected, so "key=" appearing in the path or inside another
  // parameter name (for example "apikey=") does not suppress the addition.
  //
  // The key is query-escaped, and it is inserted before any "#fragment" so it
  // remains part of the query component.
  func ensureAPIKey(uri, key string) string {
  	if key == "" || uri == "" {
  		return uri
  	}

  	// Set the fragment aside; everything after '#' is not part of the query.
  	base, fragment, hasFragment := strings.Cut(uri, "#")
  	_, rawQuery, hasQuery := strings.Cut(base, "?")

  	for _, pair := range strings.Split(rawQuery, "&") {
  		if name, _, _ := strings.Cut(pair, "="); name == "key" {
  			return uri
  		}
  	}

  	var b strings.Builder
  	b.WriteString(base)
  	switch {
  	case !hasQuery:
  		b.WriteByte('?')
  	case rawQuery != "" && !strings.HasSuffix(rawQuery, "&"):
  		// Avoid emitting "?&key=" or "&&key=" for a dangling separator.
  		b.WriteByte('&')
  	}
  	b.WriteString("key=")
  	b.WriteString(url.QueryEscape(key))
  	if hasFragment {
  		b.WriteByte('#')
  		b.WriteString(fragment)
  	}
  	return b.String()
  }