relay.go 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500
  1. package controller
  2. import (
  3. "bytes"
  4. "fmt"
  5. "io"
  6. "log"
  7. "net/http"
  8. "strings"
  9. "github.com/QuantumNous/new-api/common"
  10. "github.com/QuantumNous/new-api/constant"
  11. "github.com/QuantumNous/new-api/dto"
  12. "github.com/QuantumNous/new-api/logger"
  13. "github.com/QuantumNous/new-api/middleware"
  14. "github.com/QuantumNous/new-api/model"
  15. "github.com/QuantumNous/new-api/relay"
  16. relaycommon "github.com/QuantumNous/new-api/relay/common"
  17. relayconstant "github.com/QuantumNous/new-api/relay/constant"
  18. "github.com/QuantumNous/new-api/relay/helper"
  19. "github.com/QuantumNous/new-api/service"
  20. "github.com/QuantumNous/new-api/setting"
  21. "github.com/QuantumNous/new-api/types"
  22. "github.com/bytedance/gopkg/util/gopool"
  23. "github.com/gin-gonic/gin"
  24. "github.com/gorilla/websocket"
  25. )
  26. func relayHandler(c *gin.Context, info *relaycommon.RelayInfo) *types.NewAPIError {
  27. var err *types.NewAPIError
  28. switch info.RelayMode {
  29. case relayconstant.RelayModeImagesGenerations, relayconstant.RelayModeImagesEdits:
  30. err = relay.ImageHelper(c, info)
  31. case relayconstant.RelayModeAudioSpeech:
  32. fallthrough
  33. case relayconstant.RelayModeAudioTranslation:
  34. fallthrough
  35. case relayconstant.RelayModeAudioTranscription:
  36. err = relay.AudioHelper(c, info)
  37. case relayconstant.RelayModeRerank:
  38. err = relay.RerankHelper(c, info)
  39. case relayconstant.RelayModeEmbeddings:
  40. err = relay.EmbeddingHelper(c, info)
  41. case relayconstant.RelayModeResponses:
  42. err = relay.ResponsesHelper(c, info)
  43. default:
  44. err = relay.TextHelper(c, info)
  45. }
  46. return err
  47. }
  48. func geminiRelayHandler(c *gin.Context, info *relaycommon.RelayInfo) *types.NewAPIError {
  49. var err *types.NewAPIError
  50. if strings.Contains(c.Request.URL.Path, "embed") {
  51. err = relay.GeminiEmbeddingHandler(c, info)
  52. } else {
  53. err = relay.GeminiHelper(c, info)
  54. }
  55. return err
  56. }
  57. func Relay(c *gin.Context, relayFormat types.RelayFormat) {
  58. requestId := c.GetString(common.RequestIdKey)
  59. //group := common.GetContextKeyString(c, constant.ContextKeyUsingGroup)
  60. //originalModel := common.GetContextKeyString(c, constant.ContextKeyOriginalModel)
  61. var (
  62. newAPIError *types.NewAPIError
  63. ws *websocket.Conn
  64. )
  65. if relayFormat == types.RelayFormatOpenAIRealtime {
  66. var err error
  67. ws, err = upgrader.Upgrade(c.Writer, c.Request, nil)
  68. if err != nil {
  69. helper.WssError(c, ws, types.NewError(err, types.ErrorCodeGetChannelFailed, types.ErrOptionWithSkipRetry()).ToOpenAIError())
  70. return
  71. }
  72. defer ws.Close()
  73. }
  74. defer func() {
  75. if newAPIError != nil {
  76. logger.LogError(c, fmt.Sprintf("relay error: %s", newAPIError.Error()))
  77. newAPIError.SetMessage(common.MessageWithRequestId(newAPIError.Error(), requestId))
  78. switch relayFormat {
  79. case types.RelayFormatOpenAIRealtime:
  80. helper.WssError(c, ws, newAPIError.ToOpenAIError())
  81. case types.RelayFormatClaude:
  82. c.JSON(newAPIError.StatusCode, gin.H{
  83. "type": "error",
  84. "error": newAPIError.ToClaudeError(),
  85. })
  86. default:
  87. c.JSON(newAPIError.StatusCode, gin.H{
  88. "error": newAPIError.ToOpenAIError(),
  89. })
  90. }
  91. }
  92. }()
  93. request, err := helper.GetAndValidateRequest(c, relayFormat)
  94. if err != nil {
  95. newAPIError = types.NewError(err, types.ErrorCodeInvalidRequest)
  96. return
  97. }
  98. relayInfo, err := relaycommon.GenRelayInfo(c, relayFormat, request, ws)
  99. if err != nil {
  100. newAPIError = types.NewError(err, types.ErrorCodeGenRelayInfoFailed)
  101. return
  102. }
  103. meta := request.GetTokenCountMeta()
  104. if setting.ShouldCheckPromptSensitive() {
  105. contains, words := service.CheckSensitiveText(meta.CombineText)
  106. if contains {
  107. logger.LogWarn(c, fmt.Sprintf("user sensitive words detected: %s", strings.Join(words, ", ")))
  108. newAPIError = types.NewError(err, types.ErrorCodeSensitiveWordsDetected)
  109. return
  110. }
  111. }
  112. tokens, err := service.EstimateRequestToken(c, meta, relayInfo)
  113. if err != nil {
  114. newAPIError = types.NewError(err, types.ErrorCodeCountTokenFailed)
  115. return
  116. }
  117. relayInfo.SetEstimatePromptTokens(tokens)
  118. priceData, err := helper.ModelPriceHelper(c, relayInfo, tokens, meta)
  119. if err != nil {
  120. newAPIError = types.NewError(err, types.ErrorCodeModelPriceError)
  121. return
  122. }
  123. // common.SetContextKey(c, constant.ContextKeyTokenCountMeta, meta)
  124. if priceData.FreeModel {
  125. logger.LogInfo(c, fmt.Sprintf("模型 %s 免费,跳过预扣费", relayInfo.OriginModelName))
  126. } else {
  127. newAPIError = service.PreConsumeQuota(c, priceData.QuotaToPreConsume, relayInfo)
  128. if newAPIError != nil {
  129. return
  130. }
  131. }
  132. defer func() {
  133. // Only return quota if downstream failed and quota was actually pre-consumed
  134. if newAPIError != nil && relayInfo.FinalPreConsumedQuota != 0 {
  135. service.ReturnPreConsumedQuota(c, relayInfo)
  136. }
  137. }()
  138. retryParam := &service.RetryParam{
  139. Ctx: c,
  140. TokenGroup: relayInfo.TokenGroup,
  141. ModelName: relayInfo.OriginModelName,
  142. Retry: common.GetPointer(0),
  143. }
  144. for ; retryParam.GetRetry() <= common.RetryTimes; retryParam.IncreaseRetry() {
  145. channel, err := getChannel(c, relayInfo, retryParam)
  146. if err != nil {
  147. logger.LogError(c, err.Error())
  148. newAPIError = err
  149. break
  150. }
  151. addUsedChannel(c, channel.Id)
  152. requestBody, _ := common.GetRequestBody(c)
  153. c.Request.Body = io.NopCloser(bytes.NewBuffer(requestBody))
  154. switch relayFormat {
  155. case types.RelayFormatOpenAIRealtime:
  156. newAPIError = relay.WssHelper(c, relayInfo)
  157. case types.RelayFormatClaude:
  158. newAPIError = relay.ClaudeHelper(c, relayInfo)
  159. case types.RelayFormatGemini:
  160. newAPIError = geminiRelayHandler(c, relayInfo)
  161. default:
  162. newAPIError = relayHandler(c, relayInfo)
  163. }
  164. if newAPIError == nil {
  165. return
  166. }
  167. processChannelError(c, *types.NewChannelError(channel.Id, channel.Type, channel.Name, channel.ChannelInfo.IsMultiKey, common.GetContextKeyString(c, constant.ContextKeyChannelKey), channel.GetAutoBan()), newAPIError)
  168. if !shouldRetry(c, newAPIError, common.RetryTimes-retryParam.GetRetry()) {
  169. break
  170. }
  171. }
  172. useChannel := c.GetStringSlice("use_channel")
  173. if len(useChannel) > 1 {
  174. retryLogStr := fmt.Sprintf("重试:%s", strings.Trim(strings.Join(strings.Fields(fmt.Sprint(useChannel)), "->"), "[]"))
  175. logger.LogInfo(c, retryLogStr)
  176. }
  177. }
  178. var upgrader = websocket.Upgrader{
  179. Subprotocols: []string{"realtime"}, // WS 握手支持的协议,如果有使用 Sec-WebSocket-Protocol,则必须在此声明对应的 Protocol TODO add other protocol
  180. CheckOrigin: func(r *http.Request) bool {
  181. return true // 允许跨域
  182. },
  183. }
  184. func addUsedChannel(c *gin.Context, channelId int) {
  185. useChannel := c.GetStringSlice("use_channel")
  186. useChannel = append(useChannel, fmt.Sprintf("%d", channelId))
  187. c.Set("use_channel", useChannel)
  188. }
  189. func getChannel(c *gin.Context, info *relaycommon.RelayInfo, retryParam *service.RetryParam) (*model.Channel, *types.NewAPIError) {
  190. if info.ChannelMeta == nil {
  191. autoBan := c.GetBool("auto_ban")
  192. autoBanInt := 1
  193. if !autoBan {
  194. autoBanInt = 0
  195. }
  196. return &model.Channel{
  197. Id: c.GetInt("channel_id"),
  198. Type: c.GetInt("channel_type"),
  199. Name: c.GetString("channel_name"),
  200. AutoBan: &autoBanInt,
  201. }, nil
  202. }
  203. channel, selectGroup, err := service.CacheGetRandomSatisfiedChannel(retryParam)
  204. info.PriceData.GroupRatioInfo = helper.HandleGroupRatio(c, info)
  205. if err != nil {
  206. return nil, types.NewError(fmt.Errorf("获取分组 %s 下模型 %s 的可用渠道失败(retry): %s", selectGroup, info.OriginModelName, err.Error()), types.ErrorCodeGetChannelFailed, types.ErrOptionWithSkipRetry())
  207. }
  208. if channel == nil {
  209. return nil, types.NewError(fmt.Errorf("分组 %s 下模型 %s 的可用渠道不存在(retry)", selectGroup, info.OriginModelName), types.ErrorCodeGetChannelFailed, types.ErrOptionWithSkipRetry())
  210. }
  211. newAPIError := middleware.SetupContextForSelectedChannel(c, channel, info.OriginModelName)
  212. if newAPIError != nil {
  213. return nil, newAPIError
  214. }
  215. return channel, nil
  216. }
  217. func shouldRetry(c *gin.Context, openaiErr *types.NewAPIError, retryTimes int) bool {
  218. if openaiErr == nil {
  219. return false
  220. }
  221. if types.IsChannelError(openaiErr) {
  222. return true
  223. }
  224. if types.IsSkipRetryError(openaiErr) {
  225. return false
  226. }
  227. if retryTimes <= 0 {
  228. return false
  229. }
  230. if _, ok := c.Get("specific_channel_id"); ok {
  231. return false
  232. }
  233. if openaiErr.StatusCode == http.StatusTooManyRequests {
  234. return true
  235. }
  236. if openaiErr.StatusCode == 307 {
  237. return true
  238. }
  239. if openaiErr.StatusCode/100 == 5 {
  240. // 超时不重试
  241. if openaiErr.StatusCode == 504 || openaiErr.StatusCode == 524 {
  242. return false
  243. }
  244. return true
  245. }
  246. if openaiErr.StatusCode == http.StatusBadRequest {
  247. return false
  248. }
  249. if openaiErr.StatusCode == 408 {
  250. // azure处理超时不重试
  251. return false
  252. }
  253. if openaiErr.StatusCode/100 == 2 {
  254. return false
  255. }
  256. return true
  257. }
  258. func processChannelError(c *gin.Context, channelError types.ChannelError, err *types.NewAPIError) {
  259. logger.LogError(c, fmt.Sprintf("channel error (channel #%d, status code: %d): %s", channelError.ChannelId, err.StatusCode, err.Error()))
  260. // 不要使用context获取渠道信息,异步处理时可能会出现渠道信息不一致的情况
  261. // do not use context to get channel info, there may be inconsistent channel info when processing asynchronously
  262. if service.ShouldDisableChannel(channelError.ChannelType, err) && channelError.AutoBan {
  263. gopool.Go(func() {
  264. service.DisableChannel(channelError, err.Error())
  265. })
  266. }
  267. if constant.ErrorLogEnabled && types.IsRecordErrorLog(err) {
  268. // 保存错误日志到mysql中
  269. userId := c.GetInt("id")
  270. tokenName := c.GetString("token_name")
  271. modelName := c.GetString("original_model")
  272. tokenId := c.GetInt("token_id")
  273. userGroup := c.GetString("group")
  274. channelId := c.GetInt("channel_id")
  275. other := make(map[string]interface{})
  276. if c.Request != nil && c.Request.URL != nil {
  277. other["request_path"] = c.Request.URL.Path
  278. }
  279. other["error_type"] = err.GetErrorType()
  280. other["error_code"] = err.GetErrorCode()
  281. other["status_code"] = err.StatusCode
  282. other["channel_id"] = channelId
  283. other["channel_name"] = c.GetString("channel_name")
  284. other["channel_type"] = c.GetInt("channel_type")
  285. adminInfo := make(map[string]interface{})
  286. adminInfo["use_channel"] = c.GetStringSlice("use_channel")
  287. isMultiKey := common.GetContextKeyBool(c, constant.ContextKeyChannelIsMultiKey)
  288. if isMultiKey {
  289. adminInfo["is_multi_key"] = true
  290. adminInfo["multi_key_index"] = common.GetContextKeyInt(c, constant.ContextKeyChannelMultiKeyIndex)
  291. }
  292. other["admin_info"] = adminInfo
  293. model.RecordErrorLog(c, userId, channelId, modelName, tokenName, err.MaskSensitiveError(), tokenId, 0, false, userGroup, other)
  294. }
  295. }
  296. func RelayMidjourney(c *gin.Context) {
  297. relayInfo, err := relaycommon.GenRelayInfo(c, types.RelayFormatMjProxy, nil, nil)
  298. if err != nil {
  299. c.JSON(http.StatusInternalServerError, gin.H{
  300. "description": fmt.Sprintf("failed to generate relay info: %s", err.Error()),
  301. "type": "upstream_error",
  302. "code": 4,
  303. })
  304. return
  305. }
  306. var mjErr *dto.MidjourneyResponse
  307. switch relayInfo.RelayMode {
  308. case relayconstant.RelayModeMidjourneyNotify:
  309. mjErr = relay.RelayMidjourneyNotify(c)
  310. case relayconstant.RelayModeMidjourneyTaskFetch, relayconstant.RelayModeMidjourneyTaskFetchByCondition:
  311. mjErr = relay.RelayMidjourneyTask(c, relayInfo.RelayMode)
  312. case relayconstant.RelayModeMidjourneyTaskImageSeed:
  313. mjErr = relay.RelayMidjourneyTaskImageSeed(c)
  314. case relayconstant.RelayModeSwapFace:
  315. mjErr = relay.RelaySwapFace(c, relayInfo)
  316. default:
  317. mjErr = relay.RelayMidjourneySubmit(c, relayInfo)
  318. }
  319. //err = relayMidjourneySubmit(c, relayMode)
  320. log.Println(mjErr)
  321. if mjErr != nil {
  322. statusCode := http.StatusBadRequest
  323. if mjErr.Code == 30 {
  324. mjErr.Result = "当前分组负载已饱和,请稍后再试,或升级账户以提升服务质量。"
  325. statusCode = http.StatusTooManyRequests
  326. }
  327. c.JSON(statusCode, gin.H{
  328. "description": fmt.Sprintf("%s %s", mjErr.Description, mjErr.Result),
  329. "type": "upstream_error",
  330. "code": mjErr.Code,
  331. })
  332. channelId := c.GetInt("channel_id")
  333. logger.LogError(c, fmt.Sprintf("relay error (channel #%d, status code %d): %s", channelId, statusCode, fmt.Sprintf("%s %s", mjErr.Description, mjErr.Result)))
  334. }
  335. }
  336. func RelayNotImplemented(c *gin.Context) {
  337. err := types.OpenAIError{
  338. Message: "API not implemented",
  339. Type: "new_api_error",
  340. Param: "",
  341. Code: "api_not_implemented",
  342. }
  343. c.JSON(http.StatusNotImplemented, gin.H{
  344. "error": err,
  345. })
  346. }
  347. func RelayNotFound(c *gin.Context) {
  348. err := types.OpenAIError{
  349. Message: fmt.Sprintf("Invalid URL (%s %s)", c.Request.Method, c.Request.URL.Path),
  350. Type: "invalid_request_error",
  351. Param: "",
  352. Code: "",
  353. }
  354. c.JSON(http.StatusNotFound, gin.H{
  355. "error": err,
  356. })
  357. }
  358. func RelayTask(c *gin.Context) {
  359. retryTimes := common.RetryTimes
  360. channelId := c.GetInt("channel_id")
  361. c.Set("use_channel", []string{fmt.Sprintf("%d", channelId)})
  362. relayInfo, err := relaycommon.GenRelayInfo(c, types.RelayFormatTask, nil, nil)
  363. if err != nil {
  364. return
  365. }
  366. taskErr := taskRelayHandler(c, relayInfo)
  367. if taskErr == nil {
  368. retryTimes = 0
  369. }
  370. retryParam := &service.RetryParam{
  371. Ctx: c,
  372. TokenGroup: relayInfo.TokenGroup,
  373. ModelName: relayInfo.OriginModelName,
  374. Retry: common.GetPointer(0),
  375. }
  376. for ; shouldRetryTaskRelay(c, channelId, taskErr, retryTimes) && retryParam.GetRetry() < retryTimes; retryParam.IncreaseRetry() {
  377. channel, newAPIError := getChannel(c, relayInfo, retryParam)
  378. if newAPIError != nil {
  379. logger.LogError(c, fmt.Sprintf("CacheGetRandomSatisfiedChannel failed: %s", newAPIError.Error()))
  380. taskErr = service.TaskErrorWrapperLocal(newAPIError.Err, "get_channel_failed", http.StatusInternalServerError)
  381. break
  382. }
  383. channelId = channel.Id
  384. useChannel := c.GetStringSlice("use_channel")
  385. useChannel = append(useChannel, fmt.Sprintf("%d", channelId))
  386. c.Set("use_channel", useChannel)
  387. logger.LogInfo(c, fmt.Sprintf("using channel #%d to retry (remain times %d)", channel.Id, retryParam.GetRetry()))
  388. //middleware.SetupContextForSelectedChannel(c, channel, originalModel)
  389. requestBody, _ := common.GetRequestBody(c)
  390. c.Request.Body = io.NopCloser(bytes.NewBuffer(requestBody))
  391. taskErr = taskRelayHandler(c, relayInfo)
  392. }
  393. useChannel := c.GetStringSlice("use_channel")
  394. if len(useChannel) > 1 {
  395. retryLogStr := fmt.Sprintf("重试:%s", strings.Trim(strings.Join(strings.Fields(fmt.Sprint(useChannel)), "->"), "[]"))
  396. logger.LogInfo(c, retryLogStr)
  397. }
  398. if taskErr != nil {
  399. if taskErr.StatusCode == http.StatusTooManyRequests {
  400. taskErr.Message = "当前分组上游负载已饱和,请稍后再试"
  401. }
  402. c.JSON(taskErr.StatusCode, taskErr)
  403. }
  404. }
  405. func taskRelayHandler(c *gin.Context, relayInfo *relaycommon.RelayInfo) *dto.TaskError {
  406. var err *dto.TaskError
  407. switch relayInfo.RelayMode {
  408. case relayconstant.RelayModeSunoFetch, relayconstant.RelayModeSunoFetchByID, relayconstant.RelayModeVideoFetchByID:
  409. err = relay.RelayTaskFetch(c, relayInfo.RelayMode)
  410. default:
  411. err = relay.RelayTaskSubmit(c, relayInfo)
  412. }
  413. return err
  414. }
  415. func shouldRetryTaskRelay(c *gin.Context, channelId int, taskErr *dto.TaskError, retryTimes int) bool {
  416. if taskErr == nil {
  417. return false
  418. }
  419. if retryTimes <= 0 {
  420. return false
  421. }
  422. if _, ok := c.Get("specific_channel_id"); ok {
  423. return false
  424. }
  425. if taskErr.StatusCode == http.StatusTooManyRequests {
  426. return true
  427. }
  428. if taskErr.StatusCode == 307 {
  429. return true
  430. }
  431. if taskErr.StatusCode/100 == 5 {
  432. // 超时不重试
  433. if taskErr.StatusCode == 504 || taskErr.StatusCode == 524 {
  434. return false
  435. }
  436. return true
  437. }
  438. if taskErr.StatusCode == http.StatusBadRequest {
  439. return false
  440. }
  441. if taskErr.StatusCode == 408 {
  442. // azure处理超时不重试
  443. return false
  444. }
  445. if taskErr.LocalError {
  446. return false
  447. }
  448. if taskErr.StatusCode/100 == 2 {
  449. return false
  450. }
  451. return true
  452. }