relay-utils.go 3.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121
  1. package controller
  import (
  	"fmt"
  	"net/http"
  	"strings"
  	"sync"

  	"github.com/gin-gonic/gin"
  	"github.com/pkoukk/tiktoken-go"

  	"one-api/common"
  )
  9. var stopFinishReason = "stop"
  10. var tokenEncoderMap = map[string]*tiktoken.Tiktoken{}
  11. func getTokenEncoder(model string) *tiktoken.Tiktoken {
  12. if tokenEncoder, ok := tokenEncoderMap[model]; ok {
  13. return tokenEncoder
  14. }
  15. tokenEncoder, err := tiktoken.EncodingForModel(model)
  16. if err != nil {
  17. common.SysError(fmt.Sprintf("failed to get token encoder for model %s: %s, using encoder for gpt-3.5-turbo", model, err.Error()))
  18. tokenEncoder, err = tiktoken.EncodingForModel("gpt-3.5-turbo")
  19. if err != nil {
  20. common.FatalLog(fmt.Sprintf("failed to get token encoder for model gpt-3.5-turbo: %s", err.Error()))
  21. }
  22. }
  23. tokenEncoderMap[model] = tokenEncoder
  24. return tokenEncoder
  25. }
  26. func getTokenNum(tokenEncoder *tiktoken.Tiktoken, text string) int {
  27. if common.ApproximateTokenEnabled {
  28. return int(float64(len(text)) * 0.38)
  29. }
  30. return len(tokenEncoder.Encode(text, nil, nil))
  31. }
  32. func countTokenMessages(messages []Message, model string) int {
  33. tokenEncoder := getTokenEncoder(model)
  34. // Reference:
  35. // https://github.com/openai/openai-cookbook/blob/main/examples/How_to_count_tokens_with_tiktoken.ipynb
  36. // https://github.com/pkoukk/tiktoken-go/issues/6
  37. //
  38. // Every message follows <|start|>{role/name}\n{content}<|end|>\n
  39. var tokensPerMessage int
  40. var tokensPerName int
  41. if model == "gpt-3.5-turbo-0301" {
  42. tokensPerMessage = 4
  43. tokensPerName = -1 // If there's a name, the role is omitted
  44. } else {
  45. tokensPerMessage = 3
  46. tokensPerName = 1
  47. }
  48. tokenNum := 0
  49. for _, message := range messages {
  50. tokenNum += tokensPerMessage
  51. tokenNum += getTokenNum(tokenEncoder, message.Content)
  52. tokenNum += getTokenNum(tokenEncoder, message.Role)
  53. if message.Name != nil {
  54. tokenNum += tokensPerName
  55. tokenNum += getTokenNum(tokenEncoder, *message.Name)
  56. }
  57. }
  58. tokenNum += 3 // Every reply is primed with <|start|>assistant<|message|>
  59. return tokenNum
  60. }
  61. func countTokenInput(input any, model string) int {
  62. switch input.(type) {
  63. case string:
  64. return countTokenText(input.(string), model)
  65. case []string:
  66. text := ""
  67. for _, s := range input.([]string) {
  68. text += s
  69. }
  70. return countTokenText(text, model)
  71. }
  72. return 0
  73. }
  74. func countTokenText(text string, model string) int {
  75. tokenEncoder := getTokenEncoder(model)
  76. return getTokenNum(tokenEncoder, text)
  77. }
  78. func errorWrapper(err error, code string, statusCode int) *OpenAIErrorWithStatusCode {
  79. openAIError := OpenAIError{
  80. Message: err.Error(),
  81. Type: "one_api_error",
  82. Code: code,
  83. }
  84. return &OpenAIErrorWithStatusCode{
  85. OpenAIError: openAIError,
  86. StatusCode: statusCode,
  87. }
  88. }
  89. func shouldDisableChannel(err *OpenAIError, statusCode int) bool {
  90. if !common.AutomaticDisableChannelEnabled {
  91. return false
  92. }
  93. if err == nil {
  94. return false
  95. }
  96. if statusCode == http.StatusUnauthorized {
  97. return true
  98. }
  99. if err.Type == "insufficient_quota" || err.Code == "invalid_api_key" || err.Code == "account_deactivated" {
  100. return true
  101. }
  102. return false
  103. }
  104. func setEventStreamHeaders(c *gin.Context) {
  105. c.Writer.Header().Set("Content-Type", "text/event-stream")
  106. c.Writer.Header().Set("Cache-Control", "no-cache")
  107. c.Writer.Header().Set("Connection", "keep-alive")
  108. c.Writer.Header().Set("Transfer-Encoding", "chunked")
  109. c.Writer.Header().Set("X-Accel-Buffering", "no")
  110. }