adaptor.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383
  1. package vertex
  2. import (
  3. "encoding/json"
  4. "errors"
  5. "fmt"
  6. "io"
  7. "net/http"
  8. "strings"
  9. "github.com/QuantumNous/new-api/common"
  10. "github.com/QuantumNous/new-api/dto"
  11. "github.com/QuantumNous/new-api/relay/channel"
  12. "github.com/QuantumNous/new-api/relay/channel/claude"
  13. "github.com/QuantumNous/new-api/relay/channel/gemini"
  14. "github.com/QuantumNous/new-api/relay/channel/openai"
  15. relaycommon "github.com/QuantumNous/new-api/relay/common"
  16. "github.com/QuantumNous/new-api/relay/constant"
  17. "github.com/QuantumNous/new-api/setting/model_setting"
  18. "github.com/QuantumNous/new-api/types"
  19. "github.com/gin-gonic/gin"
  20. )
  21. const (
  22. RequestModeClaude = 1
  23. RequestModeGemini = 2
  24. RequestModeLlama = 3
  25. )
  26. var claudeModelMap = map[string]string{
  27. "claude-3-sonnet-20240229": "claude-3-sonnet@20240229",
  28. "claude-3-opus-20240229": "claude-3-opus@20240229",
  29. "claude-3-haiku-20240307": "claude-3-haiku@20240307",
  30. "claude-3-5-sonnet-20240620": "claude-3-5-sonnet@20240620",
  31. "claude-3-5-sonnet-20241022": "claude-3-5-sonnet-v2@20241022",
  32. "claude-3-7-sonnet-20250219": "claude-3-7-sonnet@20250219",
  33. "claude-sonnet-4-20250514": "claude-sonnet-4@20250514",
  34. "claude-opus-4-20250514": "claude-opus-4@20250514",
  35. "claude-opus-4-1-20250805": "claude-opus-4-1@20250805",
  36. "claude-sonnet-4-5-20250929": "claude-sonnet-4-5@20250929",
  37. "claude-opus-4-5-20251101": "claude-opus-4-5@20251101",
  38. }
  39. const anthropicVersion = "vertex-2023-10-16"
  40. type Adaptor struct {
  41. RequestMode int
  42. AccountCredentials Credentials
  43. }
  44. func (a *Adaptor) ConvertGeminiRequest(c *gin.Context, info *relaycommon.RelayInfo, request *dto.GeminiChatRequest) (any, error) {
  45. geminiAdaptor := gemini.Adaptor{}
  46. return geminiAdaptor.ConvertGeminiRequest(c, info, request)
  47. }
  48. func (a *Adaptor) ConvertClaudeRequest(c *gin.Context, info *relaycommon.RelayInfo, request *dto.ClaudeRequest) (any, error) {
  49. if v, ok := claudeModelMap[info.UpstreamModelName]; ok {
  50. c.Set("request_model", v)
  51. } else {
  52. c.Set("request_model", request.Model)
  53. }
  54. vertexClaudeReq := copyRequest(request, anthropicVersion)
  55. return vertexClaudeReq, nil
  56. }
  57. func (a *Adaptor) ConvertAudioRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.AudioRequest) (io.Reader, error) {
  58. //TODO implement me
  59. return nil, errors.New("not implemented")
  60. }
  61. func (a *Adaptor) ConvertImageRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.ImageRequest) (any, error) {
  62. geminiAdaptor := gemini.Adaptor{}
  63. return geminiAdaptor.ConvertImageRequest(c, info, request)
  64. }
  65. func (a *Adaptor) Init(info *relaycommon.RelayInfo) {
  66. if strings.HasPrefix(info.UpstreamModelName, "claude") {
  67. a.RequestMode = RequestModeClaude
  68. } else if strings.Contains(info.UpstreamModelName, "llama") ||
  69. // open source models
  70. strings.Contains(info.UpstreamModelName, "-maas") {
  71. a.RequestMode = RequestModeLlama
  72. } else {
  73. a.RequestMode = RequestModeGemini
  74. }
  75. }
  76. func (a *Adaptor) getRequestUrl(info *relaycommon.RelayInfo, modelName, suffix string) (string, error) {
  77. region := GetModelRegion(info.ApiVersion, info.OriginModelName)
  78. if info.ChannelOtherSettings.VertexKeyType != dto.VertexKeyTypeAPIKey {
  79. adc := &Credentials{}
  80. if err := common.Unmarshal([]byte(info.ApiKey), adc); err != nil {
  81. return "", fmt.Errorf("failed to decode credentials file: %w", err)
  82. }
  83. a.AccountCredentials = *adc
  84. if a.RequestMode == RequestModeGemini {
  85. if region == "global" {
  86. return fmt.Sprintf(
  87. "https://aiplatform.googleapis.com/v1/projects/%s/locations/global/publishers/google/models/%s:%s",
  88. adc.ProjectID,
  89. modelName,
  90. suffix,
  91. ), nil
  92. } else {
  93. return fmt.Sprintf(
  94. "https://%s-aiplatform.googleapis.com/v1/projects/%s/locations/%s/publishers/google/models/%s:%s",
  95. region,
  96. adc.ProjectID,
  97. region,
  98. modelName,
  99. suffix,
  100. ), nil
  101. }
  102. } else if a.RequestMode == RequestModeClaude {
  103. if region == "global" {
  104. return fmt.Sprintf(
  105. "https://aiplatform.googleapis.com/v1/projects/%s/locations/global/publishers/anthropic/models/%s:%s",
  106. adc.ProjectID,
  107. modelName,
  108. suffix,
  109. ), nil
  110. } else {
  111. return fmt.Sprintf(
  112. "https://%s-aiplatform.googleapis.com/v1/projects/%s/locations/%s/publishers/anthropic/models/%s:%s",
  113. region,
  114. adc.ProjectID,
  115. region,
  116. modelName,
  117. suffix,
  118. ), nil
  119. }
  120. } else if a.RequestMode == RequestModeLlama {
  121. return fmt.Sprintf(
  122. "https://%s-aiplatform.googleapis.com/v1beta1/projects/%s/locations/%s/endpoints/openapi/chat/completions",
  123. region,
  124. adc.ProjectID,
  125. region,
  126. ), nil
  127. }
  128. } else {
  129. var keyPrefix string
  130. if strings.HasSuffix(suffix, "?alt=sse") {
  131. keyPrefix = "&"
  132. } else {
  133. keyPrefix = "?"
  134. }
  135. if region == "global" {
  136. return fmt.Sprintf(
  137. "https://aiplatform.googleapis.com/v1/publishers/google/models/%s:%s%skey=%s",
  138. modelName,
  139. suffix,
  140. keyPrefix,
  141. info.ApiKey,
  142. ), nil
  143. } else {
  144. return fmt.Sprintf(
  145. "https://%s-aiplatform.googleapis.com/v1/publishers/google/models/%s:%s%skey=%s",
  146. region,
  147. modelName,
  148. suffix,
  149. keyPrefix,
  150. info.ApiKey,
  151. ), nil
  152. }
  153. }
  154. return "", errors.New("unsupported request mode")
  155. }
  156. func (a *Adaptor) GetRequestURL(info *relaycommon.RelayInfo) (string, error) {
  157. suffix := ""
  158. if a.RequestMode == RequestModeGemini {
  159. if model_setting.GetGeminiSettings().ThinkingAdapterEnabled &&
  160. !model_setting.ShouldPreserveThinkingSuffix(info.OriginModelName) {
  161. // 新增逻辑:处理 -thinking-<budget> 格式
  162. if strings.Contains(info.UpstreamModelName, "-thinking-") {
  163. parts := strings.Split(info.UpstreamModelName, "-thinking-")
  164. info.UpstreamModelName = parts[0]
  165. } else if strings.HasSuffix(info.UpstreamModelName, "-thinking") { // 旧的适配
  166. info.UpstreamModelName = strings.TrimSuffix(info.UpstreamModelName, "-thinking")
  167. } else if strings.HasSuffix(info.UpstreamModelName, "-nothinking") {
  168. info.UpstreamModelName = strings.TrimSuffix(info.UpstreamModelName, "-nothinking")
  169. }
  170. }
  171. if info.IsStream {
  172. suffix = "streamGenerateContent?alt=sse"
  173. } else {
  174. suffix = "generateContent"
  175. }
  176. if strings.HasPrefix(info.UpstreamModelName, "imagen") {
  177. suffix = "predict"
  178. }
  179. return a.getRequestUrl(info, info.UpstreamModelName, suffix)
  180. } else if a.RequestMode == RequestModeClaude {
  181. if info.IsStream {
  182. suffix = "streamRawPredict?alt=sse"
  183. } else {
  184. suffix = "rawPredict"
  185. }
  186. model := info.UpstreamModelName
  187. if v, ok := claudeModelMap[info.UpstreamModelName]; ok {
  188. model = v
  189. }
  190. return a.getRequestUrl(info, model, suffix)
  191. } else if a.RequestMode == RequestModeLlama {
  192. return a.getRequestUrl(info, "", "")
  193. }
  194. return "", errors.New("unsupported request mode")
  195. }
  196. func (a *Adaptor) SetupRequestHeader(c *gin.Context, req *http.Header, info *relaycommon.RelayInfo) error {
  197. channel.SetupApiRequestHeader(info, c, req)
  198. if info.ChannelOtherSettings.VertexKeyType != dto.VertexKeyTypeAPIKey {
  199. accessToken, err := getAccessToken(a, info)
  200. if err != nil {
  201. return err
  202. }
  203. req.Set("Authorization", "Bearer "+accessToken)
  204. }
  205. if a.AccountCredentials.ProjectID != "" {
  206. req.Set("x-goog-user-project", a.AccountCredentials.ProjectID)
  207. }
  208. if strings.Contains(info.UpstreamModelName, "claude") {
  209. claude.CommonClaudeHeadersOperation(c, req, info)
  210. }
  211. return nil
  212. }
  213. func (a *Adaptor) ConvertOpenAIRequest(c *gin.Context, info *relaycommon.RelayInfo, request *dto.GeneralOpenAIRequest) (any, error) {
  214. if request == nil {
  215. return nil, errors.New("request is nil")
  216. }
  217. if a.RequestMode == RequestModeGemini && strings.HasPrefix(info.UpstreamModelName, "imagen") {
  218. prompt := ""
  219. for _, m := range request.Messages {
  220. if m.Role == "user" {
  221. prompt = m.StringContent()
  222. if prompt != "" {
  223. break
  224. }
  225. }
  226. }
  227. if prompt == "" {
  228. if p, ok := request.Prompt.(string); ok {
  229. prompt = p
  230. }
  231. }
  232. if prompt == "" {
  233. return nil, errors.New("prompt is required for image generation")
  234. }
  235. imgReq := dto.ImageRequest{
  236. Model: request.Model,
  237. Prompt: prompt,
  238. N: 1,
  239. Size: "1024x1024",
  240. }
  241. if request.N > 0 {
  242. imgReq.N = uint(request.N)
  243. }
  244. if request.Size != "" {
  245. imgReq.Size = request.Size
  246. }
  247. if len(request.ExtraBody) > 0 {
  248. var extra map[string]any
  249. if err := json.Unmarshal(request.ExtraBody, &extra); err == nil {
  250. if n, ok := extra["n"].(float64); ok && n > 0 {
  251. imgReq.N = uint(n)
  252. }
  253. if size, ok := extra["size"].(string); ok {
  254. imgReq.Size = size
  255. }
  256. // accept aspectRatio in extra body (top-level or under parameters)
  257. if ar, ok := extra["aspectRatio"].(string); ok && ar != "" {
  258. imgReq.Size = ar
  259. }
  260. if params, ok := extra["parameters"].(map[string]any); ok {
  261. if ar, ok := params["aspectRatio"].(string); ok && ar != "" {
  262. imgReq.Size = ar
  263. }
  264. }
  265. }
  266. }
  267. c.Set("request_model", request.Model)
  268. return a.ConvertImageRequest(c, info, imgReq)
  269. }
  270. if a.RequestMode == RequestModeClaude {
  271. claudeReq, err := claude.RequestOpenAI2ClaudeMessage(c, *request)
  272. if err != nil {
  273. return nil, err
  274. }
  275. vertexClaudeReq := copyRequest(claudeReq, anthropicVersion)
  276. c.Set("request_model", claudeReq.Model)
  277. info.UpstreamModelName = claudeReq.Model
  278. return vertexClaudeReq, nil
  279. } else if a.RequestMode == RequestModeGemini {
  280. geminiRequest, err := gemini.CovertOpenAI2Gemini(c, *request, info)
  281. if err != nil {
  282. return nil, err
  283. }
  284. c.Set("request_model", request.Model)
  285. return geminiRequest, nil
  286. } else if a.RequestMode == RequestModeLlama {
  287. return request, nil
  288. }
  289. return nil, errors.New("unsupported request mode")
  290. }
  291. func (a *Adaptor) ConvertRerankRequest(c *gin.Context, relayMode int, request dto.RerankRequest) (any, error) {
  292. return nil, nil
  293. }
  294. func (a *Adaptor) ConvertEmbeddingRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.EmbeddingRequest) (any, error) {
  295. //TODO implement me
  296. return nil, errors.New("not implemented")
  297. }
  298. func (a *Adaptor) ConvertOpenAIResponsesRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.OpenAIResponsesRequest) (any, error) {
  299. // TODO implement me
  300. return nil, errors.New("not implemented")
  301. }
  302. func (a *Adaptor) DoRequest(c *gin.Context, info *relaycommon.RelayInfo, requestBody io.Reader) (any, error) {
  303. return channel.DoApiRequest(a, c, info, requestBody)
  304. }
  305. func (a *Adaptor) DoResponse(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo) (usage any, err *types.NewAPIError) {
  306. if info.IsStream {
  307. switch a.RequestMode {
  308. case RequestModeClaude:
  309. return claude.ClaudeStreamHandler(c, resp, info, claude.RequestModeMessage)
  310. case RequestModeGemini:
  311. if info.RelayMode == constant.RelayModeGemini {
  312. return gemini.GeminiTextGenerationStreamHandler(c, info, resp)
  313. } else {
  314. return gemini.GeminiChatStreamHandler(c, info, resp)
  315. }
  316. case RequestModeLlama:
  317. return openai.OaiStreamHandler(c, info, resp)
  318. }
  319. } else {
  320. switch a.RequestMode {
  321. case RequestModeClaude:
  322. return claude.ClaudeHandler(c, resp, info, claude.RequestModeMessage)
  323. case RequestModeGemini:
  324. if info.RelayMode == constant.RelayModeGemini {
  325. return gemini.GeminiTextGenerationHandler(c, info, resp)
  326. } else {
  327. if strings.HasPrefix(info.UpstreamModelName, "imagen") {
  328. return gemini.GeminiImageHandler(c, info, resp)
  329. }
  330. return gemini.GeminiChatHandler(c, info, resp)
  331. }
  332. case RequestModeLlama:
  333. return openai.OpenaiHandler(c, info, resp)
  334. }
  335. }
  336. return
  337. }
  338. func (a *Adaptor) GetModelList() []string {
  339. var modelList []string
  340. for i, s := range ModelList {
  341. modelList = append(modelList, s)
  342. ModelList[i] = s
  343. }
  344. for i, s := range claude.ModelList {
  345. modelList = append(modelList, s)
  346. claude.ModelList[i] = s
  347. }
  348. for i, s := range gemini.ModelList {
  349. modelList = append(modelList, s)
  350. gemini.ModelList[i] = s
  351. }
  352. return modelList
  353. }
  354. func (a *Adaptor) GetChannelName() string {
  355. return ChannelName
  356. }