openai_request.go 6.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221
  1. package dto
  2. import "encoding/json"
  3. type ResponseFormat struct {
  4. Type string `json:"type,omitempty"`
  5. JsonSchema *FormatJsonSchema `json:"json_schema,omitempty"`
  6. }
  7. type FormatJsonSchema struct {
  8. Description string `json:"description,omitempty"`
  9. Name string `json:"name"`
  10. Schema any `json:"schema,omitempty"`
  11. Strict any `json:"strict,omitempty"`
  12. }
  13. type GeneralOpenAIRequest struct {
  14. Model string `json:"model,omitempty"`
  15. Messages []Message `json:"messages,omitempty"`
  16. Prompt any `json:"prompt,omitempty"`
  17. Suffix any `json:"suffix,omitempty"`
  18. Stream bool `json:"stream,omitempty"`
  19. StreamOptions *StreamOptions `json:"stream_options,omitempty"`
  20. MaxTokens uint `json:"max_tokens,omitempty"`
  21. MaxCompletionTokens uint `json:"max_completion_tokens,omitempty"`
  22. ReasoningEffort string `json:"reasoning_effort,omitempty"`
  23. Temperature *float64 `json:"temperature,omitempty"`
  24. TopP float64 `json:"top_p,omitempty"`
  25. TopK int `json:"top_k,omitempty"`
  26. Stop any `json:"stop,omitempty"`
  27. N int `json:"n,omitempty"`
  28. Input any `json:"input,omitempty"`
  29. Instruction string `json:"instruction,omitempty"`
  30. Size string `json:"size,omitempty"`
  31. Functions any `json:"functions,omitempty"`
  32. FrequencyPenalty float64 `json:"frequency_penalty,omitempty"`
  33. PresencePenalty float64 `json:"presence_penalty,omitempty"`
  34. ResponseFormat *ResponseFormat `json:"response_format,omitempty"`
  35. EncodingFormat any `json:"encoding_format,omitempty"`
  36. Seed float64 `json:"seed,omitempty"`
  37. Tools []ToolCall `json:"tools,omitempty"`
  38. ToolChoice any `json:"tool_choice,omitempty"`
  39. User string `json:"user,omitempty"`
  40. LogProbs bool `json:"logprobs,omitempty"`
  41. TopLogProbs int `json:"top_logprobs,omitempty"`
  42. Dimensions int `json:"dimensions,omitempty"`
  43. Modalities any `json:"modalities,omitempty"`
  44. Audio any `json:"audio,omitempty"`
  45. }
  46. type OpenAITools struct {
  47. Type string `json:"type"`
  48. Function OpenAIFunction `json:"function"`
  49. }
  50. type OpenAIFunction struct {
  51. Description string `json:"description,omitempty"`
  52. Name string `json:"name"`
  53. Parameters any `json:"parameters,omitempty"`
  54. }
  55. type StreamOptions struct {
  56. IncludeUsage bool `json:"include_usage,omitempty"`
  57. }
  58. func (r GeneralOpenAIRequest) GetMaxTokens() int {
  59. return int(r.MaxTokens)
  60. }
  61. func (r GeneralOpenAIRequest) ParseInput() []string {
  62. if r.Input == nil {
  63. return nil
  64. }
  65. var input []string
  66. switch r.Input.(type) {
  67. case string:
  68. input = []string{r.Input.(string)}
  69. case []any:
  70. input = make([]string, 0, len(r.Input.([]any)))
  71. for _, item := range r.Input.([]any) {
  72. if str, ok := item.(string); ok {
  73. input = append(input, str)
  74. }
  75. }
  76. }
  77. return input
  78. }
  79. type Message struct {
  80. Role string `json:"role"`
  81. Content json.RawMessage `json:"content"`
  82. Name *string `json:"name,omitempty"`
  83. ToolCalls json.RawMessage `json:"tool_calls,omitempty"`
  84. ToolCallId string `json:"tool_call_id,omitempty"`
  85. }
  86. type MediaContent struct {
  87. Type string `json:"type"`
  88. Text string `json:"text"`
  89. ImageUrl any `json:"image_url,omitempty"`
  90. InputAudio any `json:"input_audio,omitempty"`
  91. }
  92. type MessageImageUrl struct {
  93. Url string `json:"url"`
  94. Detail string `json:"detail"`
  95. }
  96. type MessageInputAudio struct {
  97. Data string `json:"data"` //base64
  98. Format string `json:"format"`
  99. }
  100. const (
  101. ContentTypeText = "text"
  102. ContentTypeImageURL = "image_url"
  103. ContentTypeInputAudio = "input_audio"
  104. )
  105. func (m *Message) ParseToolCalls() []ToolCall {
  106. if m.ToolCalls == nil {
  107. return nil
  108. }
  109. var toolCalls []ToolCall
  110. if err := json.Unmarshal(m.ToolCalls, &toolCalls); err == nil {
  111. return toolCalls
  112. }
  113. return toolCalls
  114. }
  115. func (m *Message) SetToolCalls(toolCalls any) {
  116. toolCallsJson, _ := json.Marshal(toolCalls)
  117. m.ToolCalls = toolCallsJson
  118. }
  119. func (m *Message) StringContent() string {
  120. var stringContent string
  121. if err := json.Unmarshal(m.Content, &stringContent); err == nil {
  122. return stringContent
  123. }
  124. return string(m.Content)
  125. }
  126. func (m *Message) SetStringContent(content string) {
  127. jsonContent, _ := json.Marshal(content)
  128. m.Content = jsonContent
  129. }
  130. func (m *Message) IsStringContent() bool {
  131. var stringContent string
  132. if err := json.Unmarshal(m.Content, &stringContent); err == nil {
  133. return true
  134. }
  135. return false
  136. }
  137. func (m *Message) ParseContent() []MediaContent {
  138. var contentList []MediaContent
  139. var stringContent string
  140. if err := json.Unmarshal(m.Content, &stringContent); err == nil {
  141. contentList = append(contentList, MediaContent{
  142. Type: ContentTypeText,
  143. Text: stringContent,
  144. })
  145. return contentList
  146. }
  147. var arrayContent []json.RawMessage
  148. if err := json.Unmarshal(m.Content, &arrayContent); err == nil {
  149. for _, contentItem := range arrayContent {
  150. var contentMap map[string]any
  151. if err := json.Unmarshal(contentItem, &contentMap); err != nil {
  152. continue
  153. }
  154. switch contentMap["type"] {
  155. case ContentTypeText:
  156. if subStr, ok := contentMap["text"].(string); ok {
  157. contentList = append(contentList, MediaContent{
  158. Type: ContentTypeText,
  159. Text: subStr,
  160. })
  161. }
  162. case ContentTypeImageURL:
  163. if subObj, ok := contentMap["image_url"].(map[string]any); ok {
  164. detail, ok := subObj["detail"]
  165. if ok {
  166. subObj["detail"] = detail.(string)
  167. } else {
  168. subObj["detail"] = "high"
  169. }
  170. contentList = append(contentList, MediaContent{
  171. Type: ContentTypeImageURL,
  172. ImageUrl: MessageImageUrl{
  173. Url: subObj["url"].(string),
  174. Detail: subObj["detail"].(string),
  175. },
  176. })
  177. } else if url, ok := contentMap["image_url"].(string); ok {
  178. contentList = append(contentList, MediaContent{
  179. Type: ContentTypeImageURL,
  180. ImageUrl: MessageImageUrl{
  181. Url: url,
  182. Detail: "high",
  183. },
  184. })
  185. }
  186. case ContentTypeInputAudio:
  187. if subObj, ok := contentMap["input_audio"].(map[string]any); ok {
  188. contentList = append(contentList, MediaContent{
  189. Type: ContentTypeInputAudio,
  190. InputAudio: MessageInputAudio{
  191. Data: subObj["data"].(string),
  192. Format: subObj["format"].(string),
  193. },
  194. })
  195. }
  196. }
  197. }
  198. return contentList
  199. }
  200. return nil
  201. }