rerank.go 2.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475
  1. package common_handler
  2. import (
  3. "io"
  4. "net/http"
  5. "github.com/QuantumNous/new-api/common"
  6. "github.com/QuantumNous/new-api/constant"
  7. "github.com/QuantumNous/new-api/dto"
  8. "github.com/QuantumNous/new-api/relay/channel/xinference"
  9. relaycommon "github.com/QuantumNous/new-api/relay/common"
  10. "github.com/QuantumNous/new-api/service"
  11. "github.com/QuantumNous/new-api/types"
  12. "github.com/gin-gonic/gin"
  13. )
  14. func RerankHandler(c *gin.Context, info *relaycommon.RelayInfo, resp *http.Response) (*dto.Usage, *types.NewAPIError) {
  15. responseBody, err := io.ReadAll(resp.Body)
  16. if err != nil {
  17. return nil, types.NewOpenAIError(err, types.ErrorCodeReadResponseBodyFailed, http.StatusInternalServerError)
  18. }
  19. service.CloseResponseBodyGracefully(resp)
  20. if common.DebugEnabled {
  21. println("reranker response body: ", string(responseBody))
  22. }
  23. var jinaResp dto.RerankResponse
  24. if info.ChannelType == constant.ChannelTypeXinference {
  25. var xinRerankResponse xinference.XinRerankResponse
  26. err = common.Unmarshal(responseBody, &xinRerankResponse)
  27. if err != nil {
  28. return nil, types.NewOpenAIError(err, types.ErrorCodeBadResponseBody, http.StatusInternalServerError)
  29. }
  30. jinaRespResults := make([]dto.RerankResponseResult, len(xinRerankResponse.Results))
  31. for i, result := range xinRerankResponse.Results {
  32. respResult := dto.RerankResponseResult{
  33. Index: result.Index,
  34. RelevanceScore: result.RelevanceScore,
  35. }
  36. if info.ReturnDocuments {
  37. var document any
  38. if result.Document != nil {
  39. if doc, ok := result.Document.(string); ok {
  40. if doc == "" {
  41. document = info.Documents[result.Index]
  42. } else {
  43. document = doc
  44. }
  45. } else {
  46. document = result.Document
  47. }
  48. }
  49. respResult.Document = document
  50. }
  51. jinaRespResults[i] = respResult
  52. }
  53. jinaResp = dto.RerankResponse{
  54. Results: jinaRespResults,
  55. Usage: dto.Usage{
  56. PromptTokens: info.PromptTokens,
  57. TotalTokens: info.PromptTokens,
  58. },
  59. }
  60. } else {
  61. err = common.Unmarshal(responseBody, &jinaResp)
  62. if err != nil {
  63. return nil, types.NewOpenAIError(err, types.ErrorCodeBadResponseBody, http.StatusInternalServerError)
  64. }
  65. jinaResp.Usage.PromptTokens = jinaResp.Usage.TotalTokens
  66. }
  67. c.Writer.Header().Set("Content-Type", "application/json")
  68. c.JSON(http.StatusOK, jinaResp)
  69. return &jinaResp.Usage, nil
  70. }