relay-utils.go 4.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178
  1. package controller
  import (
  	"encoding/json"
  	"fmt"
  	"io"
  	"net/http"
  	"strconv"
  	"strings"
  	"sync"

  	"github.com/gin-gonic/gin"
  	"github.com/pkoukk/tiktoken-go"
  	"one-api/common"
  )
  13. var stopFinishReason = "stop"
  14. // tokenEncoderMap won't grow after initialization
  15. var tokenEncoderMap = map[string]*tiktoken.Tiktoken{}
  16. var defaultTokenEncoder *tiktoken.Tiktoken
  17. func InitTokenEncoders() {
  18. common.SysLog("initializing token encoders")
  19. gpt35TokenEncoder, err := tiktoken.EncodingForModel("gpt-3.5-turbo")
  20. if err != nil {
  21. common.FatalLog(fmt.Sprintf("failed to get gpt-3.5-turbo token encoder: %s", err.Error()))
  22. }
  23. defaultTokenEncoder = gpt35TokenEncoder
  24. gpt4TokenEncoder, err := tiktoken.EncodingForModel("gpt-4")
  25. if err != nil {
  26. common.FatalLog(fmt.Sprintf("failed to get gpt-4 token encoder: %s", err.Error()))
  27. }
  28. for model, _ := range common.ModelRatio {
  29. if strings.HasPrefix(model, "gpt-3.5") {
  30. tokenEncoderMap[model] = gpt35TokenEncoder
  31. } else if strings.HasPrefix(model, "gpt-4") {
  32. tokenEncoderMap[model] = gpt4TokenEncoder
  33. } else {
  34. tokenEncoderMap[model] = nil
  35. }
  36. }
  37. common.SysLog("token encoders initialized")
  38. }
  39. func getTokenEncoder(model string) *tiktoken.Tiktoken {
  40. tokenEncoder, ok := tokenEncoderMap[model]
  41. if ok && tokenEncoder != nil {
  42. return tokenEncoder
  43. }
  44. if ok {
  45. tokenEncoder, err := tiktoken.EncodingForModel(model)
  46. if err != nil {
  47. common.SysError(fmt.Sprintf("failed to get token encoder for model %s: %s, using encoder for gpt-3.5-turbo", model, err.Error()))
  48. tokenEncoder = defaultTokenEncoder
  49. }
  50. tokenEncoderMap[model] = tokenEncoder
  51. return tokenEncoder
  52. }
  53. return defaultTokenEncoder
  54. }
  55. func getTokenNum(tokenEncoder *tiktoken.Tiktoken, text string) int {
  56. if common.ApproximateTokenEnabled {
  57. return int(float64(len(text)) * 0.38)
  58. }
  59. return len(tokenEncoder.Encode(text, nil, nil))
  60. }
  61. func countTokenMessages(messages []Message, model string) int {
  62. tokenEncoder := getTokenEncoder(model)
  63. // Reference:
  64. // https://github.com/openai/openai-cookbook/blob/main/examples/How_to_count_tokens_with_tiktoken.ipynb
  65. // https://github.com/pkoukk/tiktoken-go/issues/6
  66. //
  67. // Every message follows <|start|>{role/name}\n{content}<|end|>\n
  68. var tokensPerMessage int
  69. var tokensPerName int
  70. if model == "gpt-3.5-turbo-0301" {
  71. tokensPerMessage = 4
  72. tokensPerName = -1 // If there's a name, the role is omitted
  73. } else {
  74. tokensPerMessage = 3
  75. tokensPerName = 1
  76. }
  77. tokenNum := 0
  78. for _, message := range messages {
  79. tokenNum += tokensPerMessage
  80. tokenNum += getTokenNum(tokenEncoder, message.Content)
  81. tokenNum += getTokenNum(tokenEncoder, message.Role)
  82. if message.Name != nil {
  83. tokenNum += tokensPerName
  84. tokenNum += getTokenNum(tokenEncoder, *message.Name)
  85. }
  86. }
  87. tokenNum += 3 // Every reply is primed with <|start|>assistant<|message|>
  88. return tokenNum
  89. }
  90. func countTokenInput(input any, model string) int {
  91. switch input.(type) {
  92. case string:
  93. return countTokenText(input.(string), model)
  94. case []string:
  95. text := ""
  96. for _, s := range input.([]string) {
  97. text += s
  98. }
  99. return countTokenText(text, model)
  100. }
  101. return 0
  102. }
  103. func countTokenText(text string, model string) int {
  104. tokenEncoder := getTokenEncoder(model)
  105. return getTokenNum(tokenEncoder, text)
  106. }
  107. func errorWrapper(err error, code string, statusCode int) *OpenAIErrorWithStatusCode {
  108. openAIError := OpenAIError{
  109. Message: err.Error(),
  110. Type: "one_api_error",
  111. Code: code,
  112. }
  113. return &OpenAIErrorWithStatusCode{
  114. OpenAIError: openAIError,
  115. StatusCode: statusCode,
  116. }
  117. }
  118. func shouldDisableChannel(err *OpenAIError, statusCode int) bool {
  119. if !common.AutomaticDisableChannelEnabled {
  120. return false
  121. }
  122. if err == nil {
  123. return false
  124. }
  125. if statusCode == http.StatusUnauthorized {
  126. return true
  127. }
  128. if err.Type == "insufficient_quota" || err.Code == "invalid_api_key" || err.Code == "account_deactivated" {
  129. return true
  130. }
  131. return false
  132. }
  133. func setEventStreamHeaders(c *gin.Context) {
  134. c.Writer.Header().Set("Content-Type", "text/event-stream")
  135. c.Writer.Header().Set("Cache-Control", "no-cache")
  136. c.Writer.Header().Set("Connection", "keep-alive")
  137. c.Writer.Header().Set("Transfer-Encoding", "chunked")
  138. c.Writer.Header().Set("X-Accel-Buffering", "no")
  139. }
  140. func relayErrorHandler(resp *http.Response) (openAIErrorWithStatusCode *OpenAIErrorWithStatusCode) {
  141. openAIErrorWithStatusCode = &OpenAIErrorWithStatusCode{
  142. StatusCode: resp.StatusCode,
  143. OpenAIError: OpenAIError{
  144. Message: fmt.Sprintf("bad response status code %d", resp.StatusCode),
  145. Type: "upstream_error",
  146. Code: "bad_response_status_code",
  147. Param: strconv.Itoa(resp.StatusCode),
  148. },
  149. }
  150. responseBody, err := io.ReadAll(resp.Body)
  151. if err != nil {
  152. return
  153. }
  154. err = resp.Body.Close()
  155. if err != nil {
  156. return
  157. }
  158. var textResponse TextResponse
  159. err = json.Unmarshal(responseBody, &textResponse)
  160. if err != nil {
  161. return
  162. }
  163. openAIErrorWithStatusCode.OpenAIError = textResponse.Error
  164. return
  165. }