| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309 |
- package gemini
- import (
- "bufio"
- "encoding/json"
- "fmt"
- "io"
- "log"
- "net/http"
- "one-api/common"
- "one-api/constant"
- "one-api/dto"
- relaycommon "one-api/relay/common"
- "one-api/service"
- "strings"
- "time"
- "github.com/gin-gonic/gin"
- )
- // Setting safety to the lowest possible values since Gemini is already powerless enough
- func CovertGemini2OpenAI(textRequest dto.GeneralOpenAIRequest) *GeminiChatRequest {
- geminiRequest := GeminiChatRequest{
- Contents: make([]GeminiChatContent, 0, len(textRequest.Messages)),
- SafetySettings: []GeminiChatSafetySettings{
- {
- Category: "HARM_CATEGORY_HARASSMENT",
- Threshold: common.GeminiSafetySetting,
- },
- {
- Category: "HARM_CATEGORY_HATE_SPEECH",
- Threshold: common.GeminiSafetySetting,
- },
- {
- Category: "HARM_CATEGORY_SEXUALLY_EXPLICIT",
- Threshold: common.GeminiSafetySetting,
- },
- {
- Category: "HARM_CATEGORY_DANGEROUS_CONTENT",
- Threshold: common.GeminiSafetySetting,
- },
- },
- GenerationConfig: GeminiChatGenerationConfig{
- Temperature: textRequest.Temperature,
- TopP: textRequest.TopP,
- MaxOutputTokens: textRequest.MaxTokens,
- },
- }
- if textRequest.Functions != nil {
- geminiRequest.Tools = []GeminiChatTools{
- {
- FunctionDeclarations: textRequest.Functions,
- },
- }
- }
- shouldAddDummyModelMessage := false
- for _, message := range textRequest.Messages {
- content := GeminiChatContent{
- Role: message.Role,
- Parts: []GeminiPart{
- {
- Text: message.StringContent(),
- },
- },
- }
- openaiContent := message.ParseContent()
- var parts []GeminiPart
- imageNum := 0
- for _, part := range openaiContent {
- if part.Type == dto.ContentTypeText {
- parts = append(parts, GeminiPart{
- Text: part.Text,
- })
- } else if part.Type == dto.ContentTypeImageURL {
- imageNum += 1
- if imageNum > GeminiVisionMaxImageNum {
- continue
- }
- mimeType, data, _ := service.GetImageFromUrl(part.ImageUrl.(dto.MessageImageUrl).Url)
- parts = append(parts, GeminiPart{
- InlineData: &GeminiInlineData{
- MimeType: mimeType,
- Data: data,
- },
- })
- }
- }
- content.Parts = parts
- // there's no assistant role in gemini and API shall vomit if Role is not user or model
- if content.Role == "assistant" {
- content.Role = "model"
- }
- // Converting system prompt to prompt from user for the same reason
- if content.Role == "system" {
- content.Role = "user"
- shouldAddDummyModelMessage = true
- }
- geminiRequest.Contents = append(geminiRequest.Contents, content)
- // If a system message is the last message, we need to add a dummy model message to make gemini happy
- if shouldAddDummyModelMessage {
- geminiRequest.Contents = append(geminiRequest.Contents, GeminiChatContent{
- Role: "model",
- Parts: []GeminiPart{
- {
- Text: "Okay",
- },
- },
- })
- shouldAddDummyModelMessage = false
- }
- }
- return &geminiRequest
- }
- func (g *GeminiChatResponse) GetResponseText() string {
- if g == nil {
- return ""
- }
- if len(g.Candidates) > 0 && len(g.Candidates[0].Content.Parts) > 0 {
- return g.Candidates[0].Content.Parts[0].Text
- }
- return ""
- }
- func responseGeminiChat2OpenAI(response *GeminiChatResponse) *dto.OpenAITextResponse {
- fullTextResponse := dto.OpenAITextResponse{
- Id: fmt.Sprintf("chatcmpl-%s", common.GetUUID()),
- Object: "chat.completion",
- Created: common.GetTimestamp(),
- Choices: make([]dto.OpenAITextResponseChoice, 0, len(response.Candidates)),
- }
- content, _ := json.Marshal("")
- for i, candidate := range response.Candidates {
- choice := dto.OpenAITextResponseChoice{
- Index: i,
- Message: dto.Message{
- Role: "assistant",
- Content: content,
- },
- FinishReason: relaycommon.StopFinishReason,
- }
- if len(candidate.Content.Parts) > 0 {
- content, _ = json.Marshal(candidate.Content.Parts[0].Text)
- choice.Message.Content = content
- }
- fullTextResponse.Choices = append(fullTextResponse.Choices, choice)
- }
- return &fullTextResponse
- }
- func streamResponseGeminiChat2OpenAI(geminiResponse *GeminiChatResponse) *dto.ChatCompletionsStreamResponse {
- var choice dto.ChatCompletionsStreamResponseChoice
- choice.Delta.SetContentString(geminiResponse.GetResponseText())
- choice.FinishReason = &relaycommon.StopFinishReason
- var response dto.ChatCompletionsStreamResponse
- response.Object = "chat.completion.chunk"
- response.Model = "gemini"
- response.Choices = []dto.ChatCompletionsStreamResponseChoice{choice}
- return &response
- }
- func geminiChatStreamHandler(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo) (*dto.OpenAIErrorWithStatusCode, *dto.Usage) {
- responseText := ""
- responseJson := ""
- id := fmt.Sprintf("chatcmpl-%s", common.GetUUID())
- createAt := common.GetTimestamp()
- var usage = &dto.Usage{}
- dataChan := make(chan string, 5)
- stopChan := make(chan bool, 2)
- scanner := bufio.NewScanner(resp.Body)
- scanner.Split(func(data []byte, atEOF bool) (advance int, token []byte, err error) {
- if atEOF && len(data) == 0 {
- return 0, nil, nil
- }
- if i := strings.Index(string(data), "\n"); i >= 0 {
- return i + 1, data[0:i], nil
- }
- if atEOF {
- return len(data), data, nil
- }
- return 0, nil, nil
- })
- go func() {
- for scanner.Scan() {
- data := scanner.Text()
- responseJson += data
- data = strings.TrimSpace(data)
- if !strings.HasPrefix(data, "\"text\": \"") {
- continue
- }
- data = strings.TrimPrefix(data, "\"text\": \"")
- data = strings.TrimSuffix(data, "\"")
- if !common.SafeSendStringTimeout(dataChan, data, constant.StreamingTimeout) {
- // send data timeout, stop the stream
- common.LogError(c, "send data timeout, stop the stream")
- break
- }
- }
- stopChan <- true
- }()
- isFirst := true
- service.SetEventStreamHeaders(c)
- c.Stream(func(w io.Writer) bool {
- select {
- case data := <-dataChan:
- if isFirst {
- isFirst = false
- info.FirstResponseTime = time.Now()
- }
- // this is used to prevent annoying \ related format bug
- data = fmt.Sprintf("{\"content\": \"%s\"}", data)
- type dummyStruct struct {
- Content string `json:"content"`
- }
- var dummy dummyStruct
- err := json.Unmarshal([]byte(data), &dummy)
- responseText += dummy.Content
- var choice dto.ChatCompletionsStreamResponseChoice
- choice.Delta.SetContentString(dummy.Content)
- response := dto.ChatCompletionsStreamResponse{
- Id: id,
- Object: "chat.completion.chunk",
- Created: createAt,
- Model: info.UpstreamModelName,
- Choices: []dto.ChatCompletionsStreamResponseChoice{choice},
- }
- jsonResponse, err := json.Marshal(response)
- if err != nil {
- common.SysError("error marshalling stream response: " + err.Error())
- return true
- }
- c.Render(-1, common.CustomEvent{Data: "data: " + string(jsonResponse)})
- return true
- case <-stopChan:
- return false
- }
- })
- var geminiChatResponses []GeminiChatResponse
- err := json.Unmarshal([]byte(responseJson), &geminiChatResponses)
- if err != nil {
- log.Printf("cannot get gemini usage: %s", err.Error())
- usage, _ = service.ResponseText2Usage(responseText, info.UpstreamModelName, info.PromptTokens)
- } else {
- for _, response := range geminiChatResponses {
- usage.PromptTokens = response.UsageMetadata.PromptTokenCount
- usage.CompletionTokens = response.UsageMetadata.CandidatesTokenCount
- }
- usage.TotalTokens = usage.PromptTokens + usage.CompletionTokens
- }
- if info.ShouldIncludeUsage {
- response := service.GenerateFinalUsageResponse(id, createAt, info.UpstreamModelName, *usage)
- err := service.ObjectData(c, response)
- if err != nil {
- common.SysError("send final response failed: " + err.Error())
- }
- }
- service.Done(c)
- err = resp.Body.Close()
- if err != nil {
- return service.OpenAIErrorWrapper(err, "close_response_body_failed", http.StatusInternalServerError), usage
- }
- return nil, usage
- }
- func geminiChatHandler(c *gin.Context, resp *http.Response, promptTokens int, model string) (*dto.OpenAIErrorWithStatusCode, *dto.Usage) {
- responseBody, err := io.ReadAll(resp.Body)
- if err != nil {
- return service.OpenAIErrorWrapper(err, "read_response_body_failed", http.StatusInternalServerError), nil
- }
- err = resp.Body.Close()
- if err != nil {
- return service.OpenAIErrorWrapper(err, "close_response_body_failed", http.StatusInternalServerError), nil
- }
- var geminiResponse GeminiChatResponse
- err = json.Unmarshal(responseBody, &geminiResponse)
- if err != nil {
- return service.OpenAIErrorWrapper(err, "unmarshal_response_body_failed", http.StatusInternalServerError), nil
- }
- if len(geminiResponse.Candidates) == 0 {
- return &dto.OpenAIErrorWithStatusCode{
- Error: dto.OpenAIError{
- Message: "No candidates returned",
- Type: "server_error",
- Param: "",
- Code: 500,
- },
- StatusCode: resp.StatusCode,
- }, nil
- }
- fullTextResponse := responseGeminiChat2OpenAI(&geminiResponse)
- usage := dto.Usage{
- PromptTokens: geminiResponse.UsageMetadata.PromptTokenCount,
- CompletionTokens: geminiResponse.UsageMetadata.CandidatesTokenCount,
- TotalTokens: geminiResponse.UsageMetadata.TotalTokenCount,
- }
- fullTextResponse.Usage = usage
- jsonResponse, err := json.Marshal(fullTextResponse)
- if err != nil {
- return service.OpenAIErrorWrapper(err, "marshal_response_body_failed", http.StatusInternalServerError), nil
- }
- c.Writer.Header().Set("Content-Type", "application/json")
- c.Writer.WriteHeader(resp.StatusCode)
- _, err = c.Writer.Write(jsonResponse)
- return nil, &usage
- }
|