relay-utils.go 4.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173
  1. package controller
  import (
  	"encoding/json"
  	"fmt"
  	"io"
  	"net/http"
  	"strconv"
  	"strings"

  	"github.com/gin-gonic/gin"
  	"github.com/pkoukk/tiktoken-go"

  	"one-api/common"
  )
  12. var stopFinishReason = "stop"
  13. var tokenEncoderMap = map[string]*tiktoken.Tiktoken{}
  14. func InitTokenEncoders() {
  15. common.SysLog("initializing token encoders")
  16. fallbackTokenEncoder, err := tiktoken.EncodingForModel("gpt-3.5-turbo")
  17. if err != nil {
  18. common.FatalLog(fmt.Sprintf("failed to get fallback token encoder: %s", err.Error()))
  19. }
  20. for model, _ := range common.ModelRatio {
  21. tokenEncoder, err := tiktoken.EncodingForModel(model)
  22. if err != nil {
  23. common.SysError(fmt.Sprintf("using fallback encoder for model %s", model))
  24. tokenEncoderMap[model] = fallbackTokenEncoder
  25. continue
  26. }
  27. tokenEncoderMap[model] = tokenEncoder
  28. }
  29. common.SysLog("token encoders initialized")
  30. }
  31. func getTokenEncoder(model string) *tiktoken.Tiktoken {
  32. if tokenEncoder, ok := tokenEncoderMap[model]; ok {
  33. return tokenEncoder
  34. }
  35. tokenEncoder, err := tiktoken.EncodingForModel(model)
  36. if err != nil {
  37. common.SysError(fmt.Sprintf("failed to get token encoder for model %s: %s, using encoder for gpt-3.5-turbo", model, err.Error()))
  38. tokenEncoder, err = tiktoken.EncodingForModel("gpt-3.5-turbo")
  39. if err != nil {
  40. common.FatalLog(fmt.Sprintf("failed to get token encoder for model gpt-3.5-turbo: %s", err.Error()))
  41. }
  42. }
  43. tokenEncoderMap[model] = tokenEncoder
  44. return tokenEncoder
  45. }
  46. func getTokenNum(tokenEncoder *tiktoken.Tiktoken, text string) int {
  47. if common.ApproximateTokenEnabled {
  48. return int(float64(len(text)) * 0.38)
  49. }
  50. return len(tokenEncoder.Encode(text, nil, nil))
  51. }
  52. func countTokenMessages(messages []Message, model string) int {
  53. tokenEncoder := getTokenEncoder(model)
  54. // Reference:
  55. // https://github.com/openai/openai-cookbook/blob/main/examples/How_to_count_tokens_with_tiktoken.ipynb
  56. // https://github.com/pkoukk/tiktoken-go/issues/6
  57. //
  58. // Every message follows <|start|>{role/name}\n{content}<|end|>\n
  59. var tokensPerMessage int
  60. var tokensPerName int
  61. if model == "gpt-3.5-turbo-0301" {
  62. tokensPerMessage = 4
  63. tokensPerName = -1 // If there's a name, the role is omitted
  64. } else {
  65. tokensPerMessage = 3
  66. tokensPerName = 1
  67. }
  68. tokenNum := 0
  69. for _, message := range messages {
  70. tokenNum += tokensPerMessage
  71. tokenNum += getTokenNum(tokenEncoder, message.Content)
  72. tokenNum += getTokenNum(tokenEncoder, message.Role)
  73. if message.Name != nil {
  74. tokenNum += tokensPerName
  75. tokenNum += getTokenNum(tokenEncoder, *message.Name)
  76. }
  77. }
  78. tokenNum += 3 // Every reply is primed with <|start|>assistant<|message|>
  79. return tokenNum
  80. }
  81. func countTokenInput(input any, model string) int {
  82. switch input.(type) {
  83. case string:
  84. return countTokenText(input.(string), model)
  85. case []string:
  86. text := ""
  87. for _, s := range input.([]string) {
  88. text += s
  89. }
  90. return countTokenText(text, model)
  91. }
  92. return 0
  93. }
  94. func countTokenText(text string, model string) int {
  95. tokenEncoder := getTokenEncoder(model)
  96. return getTokenNum(tokenEncoder, text)
  97. }
  98. func errorWrapper(err error, code string, statusCode int) *OpenAIErrorWithStatusCode {
  99. if statusCode == http.StatusInternalServerError {
  100. //避免暴露内部错误
  101. err = fmt.Errorf("internal server error")
  102. }
  103. openAIError := OpenAIError{
  104. Message: err.Error(),
  105. Type: "one_api_error",
  106. Code: code,
  107. }
  108. return &OpenAIErrorWithStatusCode{
  109. OpenAIError: openAIError,
  110. StatusCode: statusCode,
  111. }
  112. }
  113. func shouldDisableChannel(err *OpenAIError, statusCode int) bool {
  114. if !common.AutomaticDisableChannelEnabled {
  115. return false
  116. }
  117. if err == nil {
  118. return false
  119. }
  120. if statusCode == http.StatusUnauthorized {
  121. return true
  122. }
  123. if err.Type == "insufficient_quota" || err.Code == "invalid_api_key" || err.Code == "account_deactivated" {
  124. return true
  125. }
  126. return false
  127. }
  128. func setEventStreamHeaders(c *gin.Context) {
  129. c.Writer.Header().Set("Content-Type", "text/event-stream")
  130. c.Writer.Header().Set("Cache-Control", "no-cache")
  131. c.Writer.Header().Set("Connection", "keep-alive")
  132. c.Writer.Header().Set("Transfer-Encoding", "chunked")
  133. c.Writer.Header().Set("X-Accel-Buffering", "no")
  134. }
  135. func relayErrorHandler(resp *http.Response) (openAIErrorWithStatusCode *OpenAIErrorWithStatusCode) {
  136. openAIErrorWithStatusCode = &OpenAIErrorWithStatusCode{
  137. StatusCode: resp.StatusCode,
  138. OpenAIError: OpenAIError{
  139. Message: fmt.Sprintf("bad response status code %d", resp.StatusCode),
  140. Type: "upstream_error",
  141. Code: "bad_response_status_code",
  142. Param: strconv.Itoa(resp.StatusCode),
  143. },
  144. }
  145. responseBody, err := io.ReadAll(resp.Body)
  146. if err != nil {
  147. return
  148. }
  149. err = resp.Body.Close()
  150. if err != nil {
  151. return
  152. }
  153. var textResponse TextResponse
  154. err = json.Unmarshal(responseBody, &textResponse)
  155. if err != nil {
  156. return
  157. }
  158. openAIErrorWithStatusCode.OpenAIError = textResponse.Error
  159. return
  160. }