relay-utils.go

package controller

import (
	"encoding/json"
	"fmt"
	"io"
	"net/http"
	"strconv"
	"sync"

	"github.com/gin-gonic/gin"
	"github.com/pkoukk/tiktoken-go"

	"one-api/common"
)
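
// stopFinishReason is the finish_reason value reported when a completion
// ends normally.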
var stopFinishReason = "stop"

// tokenEncoderMap caches one tiktoken encoder per model name. It is filled by
// InitTokenEncoders at startup and extended lazily by getTokenEncoder, so the
// lazy path guards it with tokenEncoderMutex: plain Go maps are not safe for
// concurrent use, and relay handlers run concurrently.
var (
	tokenEncoderMap   = map[string]*tiktoken.Tiktoken{}
	tokenEncoderMutex sync.RWMutex
)
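
// InitTokenEncoders warms the encoder cache for every model listed in
// common.ModelRatio, using the gpt-3.5-turbo encoder as a fallback for models
// tiktoken does not recognize. It is meant to run once at startup, before any
// traffic is served.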
func InitTokenEncoders() {
	common.SysLog("initializing token encoders")
	fallbackTokenEncoder, err := tiktoken.EncodingForModel("gpt-3.5-turbo")
	if err != nil {
		common.FatalLog(fmt.Sprintf("failed to get fallback token encoder: %s", err.Error()))
	}
	for model := range common.ModelRatio {
		tokenEncoder, err := tiktoken.EncodingForModel(model)
		if err != nil {
			common.SysError(fmt.Sprintf("using fallback encoder for model %s", model))
			tokenEncoderMap[model] = fallbackTokenEncoder
			continue
		}
		tokenEncoderMap[model] = tokenEncoder
	}
	common.SysLog("token encoders initialized")
}
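
// getTokenEncoder returns the cached encoder for model, resolving and caching
// it on first use. Unknown models fall back to the gpt-3.5-turbo encoder so
// token counting still yields a usable estimate.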
func getTokenEncoder(model string) *tiktoken.Tiktoken {
	tokenEncoderMutex.RLock()
	tokenEncoder, ok := tokenEncoderMap[model]
	tokenEncoderMutex.RUnlock()
	if ok {
		return tokenEncoder
	}
	tokenEncoder, err := tiktoken.EncodingForModel(model)
	if err != nil {
		common.SysError(fmt.Sprintf("failed to get token encoder for model %s: %s, using encoder for gpt-3.5-turbo", model, err.Error()))
		tokenEncoder, err = tiktoken.EncodingForModel("gpt-3.5-turbo")
		if err != nil {
			common.FatalLog(fmt.Sprintf("failed to get token encoder for model gpt-3.5-turbo: %s", err.Error()))
		}
	}
	// cache the resolved encoder (fallback or not) for subsequent calls
	tokenEncoderMutex.Lock()
	tokenEncoderMap[model] = tokenEncoder
	tokenEncoderMutex.Unlock()
	return tokenEncoder
}
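
// getTokenNum counts the tokens in text with the given encoder. When
// approximate counting is enabled it skips encoding entirely and estimates
// roughly 0.38 tokens per byte of text, trading accuracy for speed.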
func getTokenNum(tokenEncoder *tiktoken.Tiktoken, text string) int {
	if common.ApproximateTokenEnabled {
		return int(float64(len(text)) * 0.38)
	}
	return len(tokenEncoder.Encode(text, nil, nil))
}
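
// countTokenMessages estimates the prompt token count for a chat completion
// request, following the per-message overhead rules from the OpenAI cookbook
// (see the references below): each message costs a fixed overhead plus the
// tokens of its role, content, and optional name, and every reply is primed
// with a fixed 3-token prefix.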
func countTokenMessages(messages []Message, model string) int {
	tokenEncoder := getTokenEncoder(model)
	// Reference:
	// https://github.com/openai/openai-cookbook/blob/main/examples/How_to_count_tokens_with_tiktoken.ipynb
	// https://github.com/pkoukk/tiktoken-go/issues/6
	//
	// Every message follows <|start|>{role/name}\n{content}<|end|>\n
	var tokensPerMessage int
	var tokensPerName int
	if model == "gpt-3.5-turbo-0301" {
		tokensPerMessage = 4
		tokensPerName = -1 // If there's a name, the role is omitted
	} else {
		tokensPerMessage = 3
		tokensPerName = 1
	}
	tokenNum := 0
	for _, message := range messages {
		tokenNum += tokensPerMessage
		tokenNum += getTokenNum(tokenEncoder, message.Content)
		tokenNum += getTokenNum(tokenEncoder, message.Role)
		if message.Name != nil {
			tokenNum += tokensPerName
			tokenNum += getTokenNum(tokenEncoder, *message.Name)
		}
	}
	tokenNum += 3 // Every reply is primed with <|start|>assistant<|message|>
	return tokenNum
}
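
// countTokenInput counts tokens for an embeddings-style input, which may be a
// single string or a list of strings; any other payload type counts as zero.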
func countTokenInput(input any, model string) int {
	switch v := input.(type) {
	case string:
		return countTokenText(v, model)
	case []string:
		text := ""
		for _, s := range v {
			text += s
		}
		return countTokenText(text, model)
	}
	return 0
}
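
// countTokenText counts the tokens in a plain string using the encoder
// registered for model.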
func countTokenText(text string, model string) int {
	tokenEncoder := getTokenEncoder(model)
	return getTokenNum(tokenEncoder, text)
}
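
// errorWrapper wraps an internal error in an OpenAI-style error body with the
// given error code and HTTP status code.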
func errorWrapper(err error, code string, statusCode int) *OpenAIErrorWithStatusCode {
	openAIError := OpenAIError{
		Message: err.Error(),
		Type:    "one_api_error",
		Code:    code,
	}
	return &OpenAIErrorWithStatusCode{
		OpenAIError: openAIError,
		StatusCode:  statusCode,
	}
}
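
// shouldDisableChannel reports whether an upstream error is severe enough to
// automatically disable the channel: an unauthorized response, exhausted
// quota, a revoked API key, or a deactivated account.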
func shouldDisableChannel(err *OpenAIError, statusCode int) bool {
	if !common.AutomaticDisableChannelEnabled {
		return false
	}
	if err == nil {
		return false
	}
	if statusCode == http.StatusUnauthorized {
		return true
	}
	if err.Type == "insufficient_quota" || err.Code == "invalid_api_key" || err.Code == "account_deactivated" {
		return true
	}
	return false
}
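
// setEventStreamHeaders prepares the response for server-sent events:
// text/event-stream content type, with caching and proxy buffering disabled
// so chunks reach the client as soon as they are written.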
func setEventStreamHeaders(c *gin.Context) {
	c.Writer.Header().Set("Content-Type", "text/event-stream")
	c.Writer.Header().Set("Cache-Control", "no-cache")
	c.Writer.Header().Set("Connection", "keep-alive")
	c.Writer.Header().Set("Transfer-Encoding", "chunked")
	c.Writer.Header().Set("X-Accel-Buffering", "no")
}
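
// relayErrorHandler converts a non-2xx upstream response into an
// OpenAIErrorWithStatusCode. It starts from a generic bad-status error and,
// if the body parses as an OpenAI error payload, substitutes the upstream
// error so the client sees the original message.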
func relayErrorHandler(resp *http.Response) (openAIErrorWithStatusCode *OpenAIErrorWithStatusCode) {
	openAIErrorWithStatusCode = &OpenAIErrorWithStatusCode{
		StatusCode: resp.StatusCode,
		OpenAIError: OpenAIError{
			Message: fmt.Sprintf("bad response status code %d", resp.StatusCode),
			Type:    "one_api_error",
			Code:    "bad_response_status_code",
			Param:   strconv.Itoa(resp.StatusCode),
		},
	}
	defer resp.Body.Close() // always release the connection, even if reading fails
	responseBody, err := io.ReadAll(resp.Body)
	if err != nil {
		return
	}
	var textResponse TextResponse
	err = json.Unmarshal(responseBody, &textResponse)
	if err != nil {
		return
	}
	openAIErrorWithStatusCode.OpenAIError = textResponse.Error
	return
}