relay-openai.go 4.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148
  1. package controller
  2. import (
  3. "bufio"
  4. "bytes"
  5. "encoding/json"
  6. "github.com/gin-gonic/gin"
  7. "io"
  8. "net/http"
  9. "one-api/common"
  10. "strings"
  11. )
  12. func openaiStreamHandler(c *gin.Context, resp *http.Response, relayMode int) (*OpenAIErrorWithStatusCode, string) {
  13. responseText := ""
  14. scanner := bufio.NewScanner(resp.Body)
  15. scanner.Split(func(data []byte, atEOF bool) (advance int, token []byte, err error) {
  16. if atEOF && len(data) == 0 {
  17. return 0, nil, nil
  18. }
  19. if i := strings.Index(string(data), "\n"); i >= 0 {
  20. return i + 1, data[0:i], nil
  21. }
  22. if atEOF {
  23. return len(data), data, nil
  24. }
  25. return 0, nil, nil
  26. })
  27. dataChan := make(chan string)
  28. stopChan := make(chan bool)
  29. go func() {
  30. for scanner.Scan() {
  31. data := scanner.Text()
  32. if len(data) < 6 { // ignore blank line or wrong format
  33. continue
  34. }
  35. if data[:6] != "data: " && data[:6] != "[DONE]" {
  36. continue
  37. }
  38. dataChan <- data
  39. data = data[6:]
  40. if !strings.HasPrefix(data, "[DONE]") {
  41. switch relayMode {
  42. case RelayModeChatCompletions:
  43. var streamResponse ChatCompletionsStreamResponse
  44. err := json.Unmarshal([]byte(data), &streamResponse)
  45. if err != nil {
  46. common.SysError("error unmarshalling stream response: " + err.Error())
  47. continue // just ignore the error
  48. }
  49. for _, choice := range streamResponse.Choices {
  50. responseText += choice.Delta.Content
  51. }
  52. case RelayModeCompletions:
  53. var streamResponse CompletionsStreamResponse
  54. err := json.Unmarshal([]byte(data), &streamResponse)
  55. if err != nil {
  56. common.SysError("error unmarshalling stream response: " + err.Error())
  57. continue
  58. }
  59. for _, choice := range streamResponse.Choices {
  60. responseText += choice.Text
  61. }
  62. }
  63. }
  64. }
  65. stopChan <- true
  66. }()
  67. c.Writer.Header().Set("Content-Type", "text/event-stream")
  68. c.Writer.Header().Set("Cache-Control", "no-cache")
  69. c.Writer.Header().Set("Connection", "keep-alive")
  70. c.Writer.Header().Set("Transfer-Encoding", "chunked")
  71. c.Writer.Header().Set("X-Accel-Buffering", "no")
  72. c.Stream(func(w io.Writer) bool {
  73. select {
  74. case data := <-dataChan:
  75. if strings.HasPrefix(data, "data: [DONE]") {
  76. data = data[:12]
  77. }
  78. // some implementations may add \r at the end of data
  79. data = strings.TrimSuffix(data, "\r")
  80. c.Render(-1, common.CustomEvent{Data: data})
  81. return true
  82. case <-stopChan:
  83. return false
  84. }
  85. })
  86. err := resp.Body.Close()
  87. if err != nil {
  88. return errorWrapper(err, "close_response_body_failed", http.StatusInternalServerError), ""
  89. }
  90. return nil, responseText
  91. }
  92. func openaiHandler(c *gin.Context, resp *http.Response, consumeQuota bool, promptTokens int, model string) (*OpenAIErrorWithStatusCode, *Usage) {
  93. var textResponse TextResponse
  94. if consumeQuota {
  95. responseBody, err := io.ReadAll(resp.Body)
  96. if err != nil {
  97. return errorWrapper(err, "read_response_body_failed", http.StatusInternalServerError), nil
  98. }
  99. err = resp.Body.Close()
  100. if err != nil {
  101. return errorWrapper(err, "close_response_body_failed", http.StatusInternalServerError), nil
  102. }
  103. err = json.Unmarshal(responseBody, &textResponse)
  104. if err != nil {
  105. return errorWrapper(err, "unmarshal_response_body_failed", http.StatusInternalServerError), nil
  106. }
  107. if textResponse.Error.Type != "" {
  108. return &OpenAIErrorWithStatusCode{
  109. OpenAIError: textResponse.Error,
  110. StatusCode: resp.StatusCode,
  111. }, nil
  112. }
  113. // Reset response body
  114. resp.Body = io.NopCloser(bytes.NewBuffer(responseBody))
  115. }
  116. // We shouldn't set the header before we parse the response body, because the parse part may fail.
  117. // And then we will have to send an error response, but in this case, the header has already been set.
  118. // So the httpClient will be confused by the response.
  119. // For example, Postman will report error, and we cannot check the response at all.
  120. for k, v := range resp.Header {
  121. c.Writer.Header().Set(k, v[0])
  122. }
  123. c.Writer.WriteHeader(resp.StatusCode)
  124. _, err := io.Copy(c.Writer, resp.Body)
  125. if err != nil {
  126. return errorWrapper(err, "copy_response_body_failed", http.StatusInternalServerError), nil
  127. }
  128. err = resp.Body.Close()
  129. if err != nil {
  130. return errorWrapper(err, "close_response_body_failed", http.StatusInternalServerError), nil
  131. }
  132. if textResponse.Usage.TotalTokens == 0 {
  133. completionTokens := 0
  134. for _, choice := range textResponse.Choices {
  135. completionTokens += countTokenText(choice.Message.Content, model)
  136. }
  137. textResponse.Usage = Usage{
  138. PromptTokens: promptTokens,
  139. CompletionTokens: completionTokens,
  140. TotalTokens: promptTokens + completionTokens,
  141. }
  142. }
  143. return nil, &textResponse.Usage
  144. }