claude_handler.go 7.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195
  1. package relay
  2. import (
  3. "bytes"
  4. "encoding/json"
  5. "fmt"
  6. "io"
  7. "net/http"
  8. "strings"
  9. "github.com/QuantumNous/new-api/common"
  10. "github.com/QuantumNous/new-api/constant"
  11. "github.com/QuantumNous/new-api/dto"
  12. relaycommon "github.com/QuantumNous/new-api/relay/common"
  13. "github.com/QuantumNous/new-api/relay/helper"
  14. "github.com/QuantumNous/new-api/service"
  15. "github.com/QuantumNous/new-api/setting/model_setting"
  16. "github.com/QuantumNous/new-api/setting/reasoning"
  17. "github.com/QuantumNous/new-api/types"
  18. "github.com/gin-gonic/gin"
  19. )
  20. func ClaudeHelper(c *gin.Context, info *relaycommon.RelayInfo) (newAPIError *types.NewAPIError) {
  21. info.InitChannelMeta(c)
  22. claudeReq, ok := info.Request.(*dto.ClaudeRequest)
  23. if !ok {
  24. return types.NewErrorWithStatusCode(fmt.Errorf("invalid request type, expected *dto.ClaudeRequest, got %T", info.Request), types.ErrorCodeInvalidRequest, http.StatusBadRequest, types.ErrOptionWithSkipRetry())
  25. }
  26. request, err := common.DeepCopy(claudeReq)
  27. if err != nil {
  28. return types.NewError(fmt.Errorf("failed to copy request to ClaudeRequest: %w", err), types.ErrorCodeInvalidRequest, types.ErrOptionWithSkipRetry())
  29. }
  30. err = helper.ModelMappedHelper(c, info, request)
  31. if err != nil {
  32. return types.NewError(err, types.ErrorCodeChannelModelMappedError, types.ErrOptionWithSkipRetry())
  33. }
  34. adaptor := GetAdaptor(info.ApiType)
  35. if adaptor == nil {
  36. return types.NewError(fmt.Errorf("invalid api type: %d", info.ApiType), types.ErrorCodeInvalidApiType, types.ErrOptionWithSkipRetry())
  37. }
  38. adaptor.Init(info)
  39. if request.MaxTokens == nil || *request.MaxTokens == 0 {
  40. defaultMaxTokens := uint(model_setting.GetClaudeSettings().GetDefaultMaxTokens(request.Model))
  41. request.MaxTokens = &defaultMaxTokens
  42. }
  43. if baseModel, effortLevel, ok := reasoning.TrimEffortSuffix(request.Model); ok && effortLevel != "" &&
  44. strings.HasPrefix(request.Model, "claude-opus-4-6") {
  45. request.Model = baseModel
  46. request.Thinking = &dto.Thinking{
  47. Type: "adaptive",
  48. }
  49. request.OutputConfig = json.RawMessage(fmt.Sprintf(`{"effort":"%s"}`, effortLevel))
  50. request.Temperature = common.GetPointer[float64](1.0)
  51. info.UpstreamModelName = request.Model
  52. } else if model_setting.GetClaudeSettings().ThinkingAdapterEnabled &&
  53. strings.HasSuffix(request.Model, "-thinking") {
  54. if request.Thinking == nil {
  55. // 因为BudgetTokens 必须大于1024
  56. if request.MaxTokens == nil || *request.MaxTokens < 1280 {
  57. request.MaxTokens = common.GetPointer[uint](1280)
  58. }
  59. // BudgetTokens 为 max_tokens 的 80%
  60. request.Thinking = &dto.Thinking{
  61. Type: "enabled",
  62. BudgetTokens: common.GetPointer[int](int(float64(*request.MaxTokens) * model_setting.GetClaudeSettings().ThinkingAdapterBudgetTokensPercentage)),
  63. }
  64. // TODO: 临时处理
  65. // https://docs.anthropic.com/en/docs/build-with-claude/extended-thinking#important-considerations-when-using-extended-thinking
  66. request.Temperature = common.GetPointer[float64](1.0)
  67. }
  68. if !model_setting.ShouldPreserveThinkingSuffix(info.OriginModelName) {
  69. request.Model = strings.TrimSuffix(request.Model, "-thinking")
  70. }
  71. info.UpstreamModelName = request.Model
  72. }
  73. if info.ChannelSetting.SystemPrompt != "" {
  74. if request.System == nil {
  75. request.SetStringSystem(info.ChannelSetting.SystemPrompt)
  76. } else if info.ChannelSetting.SystemPromptOverride {
  77. common.SetContextKey(c, constant.ContextKeySystemPromptOverride, true)
  78. if request.IsStringSystem() {
  79. existing := strings.TrimSpace(request.GetStringSystem())
  80. if existing == "" {
  81. request.SetStringSystem(info.ChannelSetting.SystemPrompt)
  82. } else {
  83. request.SetStringSystem(info.ChannelSetting.SystemPrompt + "\n" + existing)
  84. }
  85. } else {
  86. systemContents := request.ParseSystem()
  87. newSystem := dto.ClaudeMediaMessage{Type: dto.ContentTypeText}
  88. newSystem.SetText(info.ChannelSetting.SystemPrompt)
  89. if len(systemContents) == 0 {
  90. request.System = []dto.ClaudeMediaMessage{newSystem}
  91. } else {
  92. request.System = append([]dto.ClaudeMediaMessage{newSystem}, systemContents...)
  93. }
  94. }
  95. }
  96. }
  97. if !model_setting.GetGlobalSettings().PassThroughRequestEnabled &&
  98. !info.ChannelSetting.PassThroughBodyEnabled &&
  99. service.ShouldChatCompletionsUseResponsesGlobal(info.ChannelId, info.ChannelType, info.OriginModelName) {
  100. openAIRequest, convErr := service.ClaudeToOpenAIRequest(*request, info)
  101. if convErr != nil {
  102. return types.NewError(convErr, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
  103. }
  104. usage, newApiErr := chatCompletionsViaResponses(c, info, adaptor, openAIRequest)
  105. if newApiErr != nil {
  106. return newApiErr
  107. }
  108. service.PostTextConsumeQuota(c, info, usage, nil)
  109. return nil
  110. }
  111. var requestBody io.Reader
  112. if model_setting.GetGlobalSettings().PassThroughRequestEnabled || info.ChannelSetting.PassThroughBodyEnabled {
  113. storage, err := common.GetBodyStorage(c)
  114. if err != nil {
  115. return types.NewErrorWithStatusCode(err, types.ErrorCodeReadRequestBodyFailed, http.StatusBadRequest, types.ErrOptionWithSkipRetry())
  116. }
  117. requestBody = common.ReaderOnly(storage)
  118. } else {
  119. convertedRequest, err := adaptor.ConvertClaudeRequest(c, info, request)
  120. if err != nil {
  121. return types.NewError(err, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
  122. }
  123. relaycommon.AppendRequestConversionFromRequest(info, convertedRequest)
  124. jsonData, err := common.Marshal(convertedRequest)
  125. if err != nil {
  126. return types.NewError(err, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
  127. }
  128. // remove disabled fields for Claude API
  129. jsonData, err = relaycommon.RemoveDisabledFields(jsonData, info.ChannelOtherSettings, info.ChannelSetting.PassThroughBodyEnabled)
  130. if err != nil {
  131. return types.NewError(err, types.ErrorCodeConvertRequestFailed, types.ErrOptionWithSkipRetry())
  132. }
  133. // apply param override
  134. if len(info.ParamOverride) > 0 {
  135. jsonData, err = relaycommon.ApplyParamOverrideWithRelayInfo(jsonData, info)
  136. if err != nil {
  137. return newAPIErrorFromParamOverride(err)
  138. }
  139. }
  140. if common.DebugEnabled {
  141. println("requestBody: ", string(jsonData))
  142. }
  143. requestBody = bytes.NewBuffer(jsonData)
  144. }
  145. statusCodeMappingStr := c.GetString("status_code_mapping")
  146. var httpResp *http.Response
  147. resp, err := adaptor.DoRequest(c, info, requestBody)
  148. if err != nil {
  149. return types.NewOpenAIError(err, types.ErrorCodeDoRequestFailed, http.StatusInternalServerError)
  150. }
  151. if resp != nil {
  152. httpResp = resp.(*http.Response)
  153. info.IsStream = info.IsStream || strings.HasPrefix(httpResp.Header.Get("Content-Type"), "text/event-stream")
  154. if httpResp.StatusCode != http.StatusOK {
  155. newAPIError = service.RelayErrorHandler(c.Request.Context(), httpResp, false)
  156. // reset status code 重置状态码
  157. service.ResetStatusCode(newAPIError, statusCodeMappingStr)
  158. return newAPIError
  159. }
  160. }
  161. usage, newAPIError := adaptor.DoResponse(c, httpResp, info)
  162. //log.Printf("usage: %v", usage)
  163. if newAPIError != nil {
  164. // reset status code 重置状态码
  165. service.ResetStatusCode(newAPIError, statusCodeMappingStr)
  166. return newAPIError
  167. }
  168. service.PostTextConsumeQuota(c, info, usage.(*dto.Usage), nil)
  169. return nil
  170. }