convert.go 28 KB


  1. package service
  2. import (
  3. "encoding/json"
  4. "fmt"
  5. "strings"
  6. "github.com/QuantumNous/new-api/common"
  7. "github.com/QuantumNous/new-api/constant"
  8. "github.com/QuantumNous/new-api/dto"
  9. "github.com/QuantumNous/new-api/relay/channel/openrouter"
  10. relaycommon "github.com/QuantumNous/new-api/relay/common"
  11. )
  12. func ClaudeToOpenAIRequest(claudeRequest dto.ClaudeRequest, info *relaycommon.RelayInfo) (*dto.GeneralOpenAIRequest, error) {
  13. openAIRequest := dto.GeneralOpenAIRequest{
  14. Model: claudeRequest.Model,
  15. MaxTokens: claudeRequest.MaxTokens,
  16. Temperature: claudeRequest.Temperature,
  17. TopP: claudeRequest.TopP,
  18. Stream: claudeRequest.Stream,
  19. }
  20. isOpenRouter := info.ChannelType == constant.ChannelTypeOpenRouter
  21. if claudeRequest.Thinking != nil && claudeRequest.Thinking.Type == "enabled" {
  22. if isOpenRouter {
  23. reasoning := openrouter.RequestReasoning{
  24. MaxTokens: claudeRequest.Thinking.GetBudgetTokens(),
  25. }
  26. reasoningJSON, err := json.Marshal(reasoning)
  27. if err != nil {
  28. return nil, fmt.Errorf("failed to marshal reasoning: %w", err)
  29. }
  30. openAIRequest.Reasoning = reasoningJSON
  31. } else {
  32. thinkingSuffix := "-thinking"
  33. if strings.HasSuffix(info.OriginModelName, thinkingSuffix) &&
  34. !strings.HasSuffix(openAIRequest.Model, thinkingSuffix) {
  35. openAIRequest.Model = openAIRequest.Model + thinkingSuffix
  36. }
  37. }
  38. }
  39. // Convert stop sequences
  40. if len(claudeRequest.StopSequences) == 1 {
  41. openAIRequest.Stop = claudeRequest.StopSequences[0]
  42. } else if len(claudeRequest.StopSequences) > 1 {
  43. openAIRequest.Stop = claudeRequest.StopSequences
  44. }
  45. // Convert tools
  46. tools, _ := common.Any2Type[[]dto.Tool](claudeRequest.Tools)
  47. openAITools := make([]dto.ToolCallRequest, 0)
  48. for _, claudeTool := range tools {
  49. openAITool := dto.ToolCallRequest{
  50. Type: "function",
  51. Function: dto.FunctionRequest{
  52. Name: claudeTool.Name,
  53. Description: claudeTool.Description,
  54. Parameters: claudeTool.InputSchema,
  55. },
  56. }
  57. openAITools = append(openAITools, openAITool)
  58. }
  59. openAIRequest.Tools = openAITools
  60. // Convert messages
  61. openAIMessages := make([]dto.Message, 0)
  62. // Add system message if present
  63. if claudeRequest.System != nil {
  64. if claudeRequest.IsStringSystem() && claudeRequest.GetStringSystem() != "" {
  65. openAIMessage := dto.Message{
  66. Role: "system",
  67. }
  68. openAIMessage.SetStringContent(claudeRequest.GetStringSystem())
  69. openAIMessages = append(openAIMessages, openAIMessage)
  70. } else {
  71. systems := claudeRequest.ParseSystem()
  72. if len(systems) > 0 {
  73. openAIMessage := dto.Message{
  74. Role: "system",
  75. }
  76. isOpenRouterClaude := isOpenRouter && strings.HasPrefix(info.UpstreamModelName, "anthropic/claude")
  77. if isOpenRouterClaude {
  78. systemMediaMessages := make([]dto.MediaContent, 0, len(systems))
  79. for _, system := range systems {
  80. message := dto.MediaContent{
  81. Type: "text",
  82. Text: system.GetText(),
  83. CacheControl: system.CacheControl,
  84. }
  85. systemMediaMessages = append(systemMediaMessages, message)
  86. }
  87. openAIMessage.SetMediaContent(systemMediaMessages)
  88. } else {
  89. systemStr := ""
  90. for _, system := range systems {
  91. if system.Text != nil {
  92. systemStr += *system.Text
  93. }
  94. }
  95. openAIMessage.SetStringContent(systemStr)
  96. }
  97. openAIMessages = append(openAIMessages, openAIMessage)
  98. }
  99. }
  100. }
  101. for _, claudeMessage := range claudeRequest.Messages {
  102. openAIMessage := dto.Message{
  103. Role: claudeMessage.Role,
  104. }
  105. //log.Printf("claudeMessage.Content: %v", claudeMessage.Content)
  106. if claudeMessage.IsStringContent() {
  107. openAIMessage.SetStringContent(claudeMessage.GetStringContent())
  108. } else {
  109. content, err := claudeMessage.ParseContent()
  110. if err != nil {
  111. return nil, err
  112. }
  113. contents := content
  114. var toolCalls []dto.ToolCallRequest
  115. mediaMessages := make([]dto.MediaContent, 0, len(contents))
  116. for _, mediaMsg := range contents {
  117. switch mediaMsg.Type {
  118. case "text":
  119. message := dto.MediaContent{
  120. Type: "text",
  121. Text: mediaMsg.GetText(),
  122. CacheControl: mediaMsg.CacheControl,
  123. }
  124. mediaMessages = append(mediaMessages, message)
  125. case "image":
  126. // Handle image conversion (base64 to URL or keep as is)
  127. imageData := fmt.Sprintf("data:%s;base64,%s", mediaMsg.Source.MediaType, mediaMsg.Source.Data)
  128. //textContent += fmt.Sprintf("[Image: %s]", imageData)
  129. mediaMessage := dto.MediaContent{
  130. Type: "image_url",
  131. ImageUrl: &dto.MessageImageUrl{Url: imageData},
  132. }
  133. mediaMessages = append(mediaMessages, mediaMessage)
  134. case "tool_use":
  135. toolCall := dto.ToolCallRequest{
  136. ID: mediaMsg.Id,
  137. Type: "function",
  138. Function: dto.FunctionRequest{
  139. Name: mediaMsg.Name,
  140. Arguments: toJSONString(mediaMsg.Input),
  141. },
  142. }
  143. toolCalls = append(toolCalls, toolCall)
  144. case "tool_result":
  145. // Add tool result as a separate message
  146. toolName := mediaMsg.Name
  147. if toolName == "" {
  148. toolName = claudeRequest.SearchToolNameByToolCallId(mediaMsg.ToolUseId)
  149. }
  150. oaiToolMessage := dto.Message{
  151. Role: "tool",
  152. Name: &toolName,
  153. ToolCallId: mediaMsg.ToolUseId,
  154. }
  155. //oaiToolMessage.SetStringContent(*mediaMsg.GetMediaContent().Text)
  156. if mediaMsg.IsStringContent() {
  157. oaiToolMessage.SetStringContent(mediaMsg.GetStringContent())
  158. } else {
  159. mediaContents := mediaMsg.ParseMediaContent()
  160. encodeJson, _ := common.Marshal(mediaContents)
  161. oaiToolMessage.SetStringContent(string(encodeJson))
  162. }
  163. openAIMessages = append(openAIMessages, oaiToolMessage)
  164. }
  165. }
  166. if len(toolCalls) > 0 {
  167. openAIMessage.SetToolCalls(toolCalls)
  168. }
  169. if len(mediaMessages) > 0 && len(toolCalls) == 0 {
  170. openAIMessage.SetMediaContent(mediaMessages)
  171. }
  172. }
  173. if len(openAIMessage.ParseContent()) > 0 || len(openAIMessage.ToolCalls) > 0 {
  174. openAIMessages = append(openAIMessages, openAIMessage)
  175. }
  176. }
  177. openAIRequest.Messages = openAIMessages
  178. return &openAIRequest, nil
  179. }
  180. func generateStopBlock(index int) *dto.ClaudeResponse {
  181. return &dto.ClaudeResponse{
  182. Type: "content_block_stop",
  183. Index: common.GetPointer[int](index),
  184. }
  185. }
  186. func StreamResponseOpenAI2Claude(openAIResponse *dto.ChatCompletionsStreamResponse, info *relaycommon.RelayInfo) []*dto.ClaudeResponse {
  187. if info.ClaudeConvertInfo.Done {
  188. return nil
  189. }
  190. var claudeResponses []*dto.ClaudeResponse
  191. if info.SendResponseCount == 1 {
  192. msg := &dto.ClaudeMediaMessage{
  193. Id: openAIResponse.Id,
  194. Model: openAIResponse.Model,
  195. Type: "message",
  196. Role: "assistant",
  197. Usage: &dto.ClaudeUsage{
  198. InputTokens: info.GetEstimatePromptTokens(),
  199. OutputTokens: 0,
  200. },
  201. }
  202. msg.SetContent(make([]any, 0))
  203. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  204. Type: "message_start",
  205. Message: msg,
  206. })
  207. //claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  208. // Type: "ping",
  209. //})
  210. if openAIResponse.IsToolCall() {
  211. info.ClaudeConvertInfo.LastMessagesType = relaycommon.LastMessageTypeTools
  212. var toolCall dto.ToolCallResponse
  213. if len(openAIResponse.Choices) > 0 && len(openAIResponse.Choices[0].Delta.ToolCalls) > 0 {
  214. toolCall = openAIResponse.Choices[0].Delta.ToolCalls[0]
  215. } else {
  216. first := openAIResponse.GetFirstToolCall()
  217. if first != nil {
  218. toolCall = *first
  219. } else {
  220. toolCall = dto.ToolCallResponse{}
  221. }
  222. }
  223. resp := &dto.ClaudeResponse{
  224. Type: "content_block_start",
  225. ContentBlock: &dto.ClaudeMediaMessage{
  226. Id: toolCall.ID,
  227. Type: "tool_use",
  228. Name: toolCall.Function.Name,
  229. Input: map[string]interface{}{},
  230. },
  231. }
  232. resp.SetIndex(0)
  233. claudeResponses = append(claudeResponses, resp)
  234. // 首块包含工具 delta,则追加 input_json_delta
  235. if toolCall.Function.Arguments != "" {
  236. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  237. Index: &info.ClaudeConvertInfo.Index,
  238. Type: "content_block_delta",
  239. Delta: &dto.ClaudeMediaMessage{
  240. Type: "input_json_delta",
  241. PartialJson: &toolCall.Function.Arguments,
  242. },
  243. })
  244. }
  245. } else {
  246. }
  247. // 判断首个响应是否存在内容(非标准的 OpenAI 响应)
  248. if len(openAIResponse.Choices) > 0 {
  249. reasoning := openAIResponse.Choices[0].Delta.GetReasoningContent()
  250. content := openAIResponse.Choices[0].Delta.GetContentString()
  251. if reasoning != "" {
  252. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  253. Index: &info.ClaudeConvertInfo.Index,
  254. Type: "content_block_start",
  255. ContentBlock: &dto.ClaudeMediaMessage{
  256. Type: "thinking",
  257. Thinking: common.GetPointer[string](""),
  258. },
  259. })
  260. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  261. Index: &info.ClaudeConvertInfo.Index,
  262. Type: "content_block_delta",
  263. Delta: &dto.ClaudeMediaMessage{
  264. Type: "thinking_delta",
  265. Thinking: &reasoning,
  266. },
  267. })
  268. info.ClaudeConvertInfo.LastMessagesType = relaycommon.LastMessageTypeThinking
  269. } else if content != "" {
  270. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  271. Index: &info.ClaudeConvertInfo.Index,
  272. Type: "content_block_start",
  273. ContentBlock: &dto.ClaudeMediaMessage{
  274. Type: "text",
  275. Text: common.GetPointer[string](""),
  276. },
  277. })
  278. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  279. Index: &info.ClaudeConvertInfo.Index,
  280. Type: "content_block_delta",
  281. Delta: &dto.ClaudeMediaMessage{
  282. Type: "text_delta",
  283. Text: common.GetPointer[string](content),
  284. },
  285. })
  286. info.ClaudeConvertInfo.LastMessagesType = relaycommon.LastMessageTypeText
  287. }
  288. }
  289. // 如果首块就带 finish_reason,需要立即发送停止块
  290. if len(openAIResponse.Choices) > 0 && openAIResponse.Choices[0].FinishReason != nil && *openAIResponse.Choices[0].FinishReason != "" {
  291. info.FinishReason = *openAIResponse.Choices[0].FinishReason
  292. claudeResponses = append(claudeResponses, generateStopBlock(info.ClaudeConvertInfo.Index))
  293. oaiUsage := openAIResponse.Usage
  294. if oaiUsage == nil {
  295. oaiUsage = info.ClaudeConvertInfo.Usage
  296. }
  297. if oaiUsage != nil {
  298. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  299. Type: "message_delta",
  300. Usage: &dto.ClaudeUsage{
  301. InputTokens: oaiUsage.PromptTokens,
  302. OutputTokens: oaiUsage.CompletionTokens,
  303. CacheCreationInputTokens: oaiUsage.PromptTokensDetails.CachedCreationTokens,
  304. CacheReadInputTokens: oaiUsage.PromptTokensDetails.CachedTokens,
  305. },
  306. Delta: &dto.ClaudeMediaMessage{
  307. StopReason: common.GetPointer[string](stopReasonOpenAI2Claude(info.FinishReason)),
  308. },
  309. })
  310. }
  311. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  312. Type: "message_stop",
  313. })
  314. info.ClaudeConvertInfo.Done = true
  315. }
  316. return claudeResponses
  317. }
  318. if len(openAIResponse.Choices) == 0 {
  319. // no choices
  320. // 可能为非标准的 OpenAI 响应,判断是否已经完成
  321. if info.ClaudeConvertInfo.Done {
  322. claudeResponses = append(claudeResponses, generateStopBlock(info.ClaudeConvertInfo.Index))
  323. oaiUsage := info.ClaudeConvertInfo.Usage
  324. if oaiUsage != nil {
  325. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  326. Type: "message_delta",
  327. Usage: &dto.ClaudeUsage{
  328. InputTokens: oaiUsage.PromptTokens,
  329. OutputTokens: oaiUsage.CompletionTokens,
  330. CacheCreationInputTokens: oaiUsage.PromptTokensDetails.CachedCreationTokens,
  331. CacheReadInputTokens: oaiUsage.PromptTokensDetails.CachedTokens,
  332. },
  333. Delta: &dto.ClaudeMediaMessage{
  334. StopReason: common.GetPointer[string](stopReasonOpenAI2Claude(info.FinishReason)),
  335. },
  336. })
  337. }
  338. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  339. Type: "message_stop",
  340. })
  341. }
  342. return claudeResponses
  343. } else {
  344. chosenChoice := openAIResponse.Choices[0]
  345. doneChunk := chosenChoice.FinishReason != nil && *chosenChoice.FinishReason != ""
  346. if doneChunk {
  347. info.FinishReason = *chosenChoice.FinishReason
  348. }
  349. var claudeResponse dto.ClaudeResponse
  350. var isEmpty bool
  351. claudeResponse.Type = "content_block_delta"
  352. if len(chosenChoice.Delta.ToolCalls) > 0 {
  353. toolCalls := chosenChoice.Delta.ToolCalls
  354. if info.ClaudeConvertInfo.LastMessagesType != relaycommon.LastMessageTypeTools {
  355. claudeResponses = append(claudeResponses, generateStopBlock(info.ClaudeConvertInfo.Index))
  356. info.ClaudeConvertInfo.Index++
  357. }
  358. info.ClaudeConvertInfo.LastMessagesType = relaycommon.LastMessageTypeTools
  359. for i, toolCall := range toolCalls {
  360. blockIndex := info.ClaudeConvertInfo.Index
  361. if toolCall.Index != nil {
  362. blockIndex = *toolCall.Index
  363. } else if len(toolCalls) > 1 {
  364. blockIndex = info.ClaudeConvertInfo.Index + i
  365. }
  366. idx := blockIndex
  367. if toolCall.Function.Name != "" {
  368. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  369. Index: &idx,
  370. Type: "content_block_start",
  371. ContentBlock: &dto.ClaudeMediaMessage{
  372. Id: toolCall.ID,
  373. Type: "tool_use",
  374. Name: toolCall.Function.Name,
  375. Input: map[string]interface{}{},
  376. },
  377. })
  378. }
  379. if len(toolCall.Function.Arguments) > 0 {
  380. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  381. Index: &idx,
  382. Type: "content_block_delta",
  383. Delta: &dto.ClaudeMediaMessage{
  384. Type: "input_json_delta",
  385. PartialJson: &toolCall.Function.Arguments,
  386. },
  387. })
  388. }
  389. info.ClaudeConvertInfo.Index = blockIndex
  390. }
  391. } else {
  392. reasoning := chosenChoice.Delta.GetReasoningContent()
  393. textContent := chosenChoice.Delta.GetContentString()
  394. if reasoning != "" || textContent != "" {
  395. if reasoning != "" {
  396. if info.ClaudeConvertInfo.LastMessagesType != relaycommon.LastMessageTypeThinking {
  397. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  398. Index: &info.ClaudeConvertInfo.Index,
  399. Type: "content_block_start",
  400. ContentBlock: &dto.ClaudeMediaMessage{
  401. Type: "thinking",
  402. Thinking: common.GetPointer[string](""),
  403. },
  404. })
  405. }
  406. info.ClaudeConvertInfo.LastMessagesType = relaycommon.LastMessageTypeThinking
  407. claudeResponse.Delta = &dto.ClaudeMediaMessage{
  408. Type: "thinking_delta",
  409. Thinking: &reasoning,
  410. }
  411. } else {
  412. if info.ClaudeConvertInfo.LastMessagesType != relaycommon.LastMessageTypeText {
  413. if info.ClaudeConvertInfo.LastMessagesType == relaycommon.LastMessageTypeThinking || info.ClaudeConvertInfo.LastMessagesType == relaycommon.LastMessageTypeTools {
  414. claudeResponses = append(claudeResponses, generateStopBlock(info.ClaudeConvertInfo.Index))
  415. info.ClaudeConvertInfo.Index++
  416. }
  417. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  418. Index: &info.ClaudeConvertInfo.Index,
  419. Type: "content_block_start",
  420. ContentBlock: &dto.ClaudeMediaMessage{
  421. Type: "text",
  422. Text: common.GetPointer[string](""),
  423. },
  424. })
  425. }
  426. info.ClaudeConvertInfo.LastMessagesType = relaycommon.LastMessageTypeText
  427. claudeResponse.Delta = &dto.ClaudeMediaMessage{
  428. Type: "text_delta",
  429. Text: common.GetPointer[string](textContent),
  430. }
  431. }
  432. } else {
  433. isEmpty = true
  434. }
  435. }
  436. claudeResponse.Index = &info.ClaudeConvertInfo.Index
  437. if !isEmpty && claudeResponse.Delta != nil {
  438. claudeResponses = append(claudeResponses, &claudeResponse)
  439. }
  440. if doneChunk || info.ClaudeConvertInfo.Done {
  441. claudeResponses = append(claudeResponses, generateStopBlock(info.ClaudeConvertInfo.Index))
  442. oaiUsage := openAIResponse.Usage
  443. if oaiUsage == nil {
  444. oaiUsage = info.ClaudeConvertInfo.Usage
  445. }
  446. if oaiUsage != nil {
  447. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  448. Type: "message_delta",
  449. Usage: &dto.ClaudeUsage{
  450. InputTokens: oaiUsage.PromptTokens,
  451. OutputTokens: oaiUsage.CompletionTokens,
  452. CacheCreationInputTokens: oaiUsage.PromptTokensDetails.CachedCreationTokens,
  453. CacheReadInputTokens: oaiUsage.PromptTokensDetails.CachedTokens,
  454. },
  455. Delta: &dto.ClaudeMediaMessage{
  456. StopReason: common.GetPointer[string](stopReasonOpenAI2Claude(info.FinishReason)),
  457. },
  458. })
  459. }
  460. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  461. Type: "message_stop",
  462. })
  463. info.ClaudeConvertInfo.Done = true
  464. return claudeResponses
  465. }
  466. }
  467. return claudeResponses
  468. }
  469. func ResponseOpenAI2Claude(openAIResponse *dto.OpenAITextResponse, info *relaycommon.RelayInfo) *dto.ClaudeResponse {
  470. var stopReason string
  471. contents := make([]dto.ClaudeMediaMessage, 0)
  472. claudeResponse := &dto.ClaudeResponse{
  473. Id: openAIResponse.Id,
  474. Type: "message",
  475. Role: "assistant",
  476. Model: openAIResponse.Model,
  477. }
  478. for _, choice := range openAIResponse.Choices {
  479. stopReason = stopReasonOpenAI2Claude(choice.FinishReason)
  480. if choice.FinishReason == "tool_calls" {
  481. for _, toolUse := range choice.Message.ParseToolCalls() {
  482. claudeContent := dto.ClaudeMediaMessage{}
  483. claudeContent.Type = "tool_use"
  484. claudeContent.Id = toolUse.ID
  485. claudeContent.Name = toolUse.Function.Name
  486. var mapParams map[string]interface{}
  487. if err := common.Unmarshal([]byte(toolUse.Function.Arguments), &mapParams); err == nil {
  488. claudeContent.Input = mapParams
  489. } else {
  490. claudeContent.Input = toolUse.Function.Arguments
  491. }
  492. contents = append(contents, claudeContent)
  493. }
  494. } else {
  495. claudeContent := dto.ClaudeMediaMessage{}
  496. claudeContent.Type = "text"
  497. claudeContent.SetText(choice.Message.StringContent())
  498. contents = append(contents, claudeContent)
  499. }
  500. }
  501. claudeResponse.Content = contents
  502. claudeResponse.StopReason = stopReason
  503. claudeResponse.Usage = &dto.ClaudeUsage{
  504. InputTokens: openAIResponse.PromptTokens,
  505. OutputTokens: openAIResponse.CompletionTokens,
  506. }
  507. return claudeResponse
  508. }
  // stopReasonOpenAI2Claude maps an OpenAI finish reason to the matching Claude
  // stop reason. Reasons without a known mapping are returned unchanged.
  func stopReasonOpenAI2Claude(reason string) string {
  	switch reason {
  	case "stop":
  		return "end_turn"
  	case "length", "max_tokens":
  		return "max_tokens"
  	case "tool_calls":
  		return "tool_use"
  	}
  	// "stop_sequence" and every unrecognised reason pass through as they are.
  	return reason
  }
  // toJSONString returns the JSON encoding of v, or "{}" when v cannot be
  // encoded.
  func toJSONString(v interface{}) string {
  	if encoded, err := json.Marshal(v); err == nil {
  		return string(encoded)
  	}
  	return "{}"
  }
  532. func GeminiToOpenAIRequest(geminiRequest *dto.GeminiChatRequest, info *relaycommon.RelayInfo) (*dto.GeneralOpenAIRequest, error) {
  533. openaiRequest := &dto.GeneralOpenAIRequest{
  534. Model: info.UpstreamModelName,
  535. Stream: info.IsStream,
  536. }
  537. // 转换 messages
  538. var messages []dto.Message
  539. for _, content := range geminiRequest.Contents {
  540. message := dto.Message{
  541. Role: convertGeminiRoleToOpenAI(content.Role),
  542. }
  543. // 处理 parts
  544. var mediaContents []dto.MediaContent
  545. var toolCalls []dto.ToolCallRequest
  546. for _, part := range content.Parts {
  547. if part.Text != "" {
  548. mediaContent := dto.MediaContent{
  549. Type: "text",
  550. Text: part.Text,
  551. }
  552. mediaContents = append(mediaContents, mediaContent)
  553. } else if part.InlineData != nil {
  554. mediaContent := dto.MediaContent{
  555. Type: "image_url",
  556. ImageUrl: &dto.MessageImageUrl{
  557. Url: fmt.Sprintf("data:%s;base64,%s", part.InlineData.MimeType, part.InlineData.Data),
  558. Detail: "auto",
  559. MimeType: part.InlineData.MimeType,
  560. },
  561. }
  562. mediaContents = append(mediaContents, mediaContent)
  563. } else if part.FileData != nil {
  564. mediaContent := dto.MediaContent{
  565. Type: "image_url",
  566. ImageUrl: &dto.MessageImageUrl{
  567. Url: part.FileData.FileUri,
  568. Detail: "auto",
  569. MimeType: part.FileData.MimeType,
  570. },
  571. }
  572. mediaContents = append(mediaContents, mediaContent)
  573. } else if part.FunctionCall != nil {
  574. // 处理 Gemini 的工具调用
  575. toolCall := dto.ToolCallRequest{
  576. ID: fmt.Sprintf("call_%d", len(toolCalls)+1), // 生成唯一ID
  577. Type: "function",
  578. Function: dto.FunctionRequest{
  579. Name: part.FunctionCall.FunctionName,
  580. Arguments: toJSONString(part.FunctionCall.Arguments),
  581. },
  582. }
  583. toolCalls = append(toolCalls, toolCall)
  584. } else if part.FunctionResponse != nil {
  585. // 处理 Gemini 的工具响应,创建单独的 tool 消息
  586. toolMessage := dto.Message{
  587. Role: "tool",
  588. ToolCallId: fmt.Sprintf("call_%d", len(toolCalls)), // 使用对应的调用ID
  589. }
  590. toolMessage.SetStringContent(toJSONString(part.FunctionResponse.Response))
  591. messages = append(messages, toolMessage)
  592. }
  593. }
  594. // 设置消息内容
  595. if len(toolCalls) > 0 {
  596. // 如果有工具调用,设置工具调用
  597. message.SetToolCalls(toolCalls)
  598. } else if len(mediaContents) == 1 && mediaContents[0].Type == "text" {
  599. // 如果只有一个文本内容,直接设置字符串
  600. message.Content = mediaContents[0].Text
  601. } else if len(mediaContents) > 0 {
  602. // 如果有多个内容或包含媒体,设置为数组
  603. message.SetMediaContent(mediaContents)
  604. }
  605. // 只有当消息有内容或工具调用时才添加
  606. if len(message.ParseContent()) > 0 || len(message.ToolCalls) > 0 {
  607. messages = append(messages, message)
  608. }
  609. }
  610. openaiRequest.Messages = messages
  611. if geminiRequest.GenerationConfig.Temperature != nil {
  612. openaiRequest.Temperature = geminiRequest.GenerationConfig.Temperature
  613. }
  614. if geminiRequest.GenerationConfig.TopP > 0 {
  615. openaiRequest.TopP = geminiRequest.GenerationConfig.TopP
  616. }
  617. if geminiRequest.GenerationConfig.TopK > 0 {
  618. openaiRequest.TopK = int(geminiRequest.GenerationConfig.TopK)
  619. }
  620. if geminiRequest.GenerationConfig.MaxOutputTokens > 0 {
  621. openaiRequest.MaxTokens = geminiRequest.GenerationConfig.MaxOutputTokens
  622. }
  623. // gemini stop sequences 最多 5 个,openai stop 最多 4 个
  624. if len(geminiRequest.GenerationConfig.StopSequences) > 0 {
  625. openaiRequest.Stop = geminiRequest.GenerationConfig.StopSequences[:4]
  626. }
  627. if geminiRequest.GenerationConfig.CandidateCount > 0 {
  628. openaiRequest.N = geminiRequest.GenerationConfig.CandidateCount
  629. }
  630. // 转换工具调用
  631. if len(geminiRequest.GetTools()) > 0 {
  632. var tools []dto.ToolCallRequest
  633. for _, tool := range geminiRequest.GetTools() {
  634. if tool.FunctionDeclarations != nil {
  635. // 将 Gemini 的 FunctionDeclarations 转换为 OpenAI 的 ToolCallRequest
  636. functionDeclarations, ok := tool.FunctionDeclarations.([]dto.FunctionRequest)
  637. if ok {
  638. for _, function := range functionDeclarations {
  639. openAITool := dto.ToolCallRequest{
  640. Type: "function",
  641. Function: dto.FunctionRequest{
  642. Name: function.Name,
  643. Description: function.Description,
  644. Parameters: function.Parameters,
  645. },
  646. }
  647. tools = append(tools, openAITool)
  648. }
  649. }
  650. }
  651. }
  652. if len(tools) > 0 {
  653. openaiRequest.Tools = tools
  654. }
  655. }
  656. // gemini system instructions
  657. if geminiRequest.SystemInstructions != nil {
  658. // 将系统指令作为第一条消息插入
  659. systemMessage := dto.Message{
  660. Role: "system",
  661. Content: extractTextFromGeminiParts(geminiRequest.SystemInstructions.Parts),
  662. }
  663. openaiRequest.Messages = append([]dto.Message{systemMessage}, openaiRequest.Messages...)
  664. }
  665. return openaiRequest, nil
  666. }
  // convertGeminiRoleToOpenAI maps a Gemini role name to its OpenAI counterpart:
  // "model" becomes "assistant", "function" stays "function", and everything
  // else (including "user") is treated as "user".
  func convertGeminiRoleToOpenAI(geminiRole string) string {
  	if geminiRole == "model" {
  		return "assistant"
  	}
  	if geminiRole == "function" {
  		return "function"
  	}
  	return "user"
  }
  679. func extractTextFromGeminiParts(parts []dto.GeminiPart) string {
  680. var texts []string
  681. for _, part := range parts {
  682. if part.Text != "" {
  683. texts = append(texts, part.Text)
  684. }
  685. }
  686. return strings.Join(texts, "\n")
  687. }
  688. // ResponseOpenAI2Gemini 将 OpenAI 响应转换为 Gemini 格式
  689. func ResponseOpenAI2Gemini(openAIResponse *dto.OpenAITextResponse, info *relaycommon.RelayInfo) *dto.GeminiChatResponse {
  690. geminiResponse := &dto.GeminiChatResponse{
  691. Candidates: make([]dto.GeminiChatCandidate, 0, len(openAIResponse.Choices)),
  692. UsageMetadata: dto.GeminiUsageMetadata{
  693. PromptTokenCount: openAIResponse.PromptTokens,
  694. CandidatesTokenCount: openAIResponse.CompletionTokens,
  695. TotalTokenCount: openAIResponse.PromptTokens + openAIResponse.CompletionTokens,
  696. },
  697. }
  698. for _, choice := range openAIResponse.Choices {
  699. candidate := dto.GeminiChatCandidate{
  700. Index: int64(choice.Index),
  701. SafetyRatings: []dto.GeminiChatSafetyRating{},
  702. }
  703. // 设置结束原因
  704. var finishReason string
  705. switch choice.FinishReason {
  706. case "stop":
  707. finishReason = "STOP"
  708. case "length":
  709. finishReason = "MAX_TOKENS"
  710. case "content_filter":
  711. finishReason = "SAFETY"
  712. case "tool_calls":
  713. finishReason = "STOP"
  714. default:
  715. finishReason = "STOP"
  716. }
  717. candidate.FinishReason = &finishReason
  718. // 转换消息内容
  719. content := dto.GeminiChatContent{
  720. Role: "model",
  721. Parts: make([]dto.GeminiPart, 0),
  722. }
  723. // 处理工具调用
  724. toolCalls := choice.Message.ParseToolCalls()
  725. if len(toolCalls) > 0 {
  726. for _, toolCall := range toolCalls {
  727. // 解析参数
  728. var args map[string]interface{}
  729. if toolCall.Function.Arguments != "" {
  730. if err := json.Unmarshal([]byte(toolCall.Function.Arguments), &args); err != nil {
  731. args = map[string]interface{}{"arguments": toolCall.Function.Arguments}
  732. }
  733. } else {
  734. args = make(map[string]interface{})
  735. }
  736. part := dto.GeminiPart{
  737. FunctionCall: &dto.FunctionCall{
  738. FunctionName: toolCall.Function.Name,
  739. Arguments: args,
  740. },
  741. }
  742. content.Parts = append(content.Parts, part)
  743. }
  744. } else {
  745. // 处理文本内容
  746. textContent := choice.Message.StringContent()
  747. if textContent != "" {
  748. part := dto.GeminiPart{
  749. Text: textContent,
  750. }
  751. content.Parts = append(content.Parts, part)
  752. }
  753. }
  754. candidate.Content = content
  755. geminiResponse.Candidates = append(geminiResponse.Candidates, candidate)
  756. }
  757. return geminiResponse
  758. }
  759. // StreamResponseOpenAI2Gemini 将 OpenAI 流式响应转换为 Gemini 格式
  760. func StreamResponseOpenAI2Gemini(openAIResponse *dto.ChatCompletionsStreamResponse, info *relaycommon.RelayInfo) *dto.GeminiChatResponse {
  761. // 检查是否有实际内容或结束标志
  762. hasContent := false
  763. hasFinishReason := false
  764. for _, choice := range openAIResponse.Choices {
  765. if len(choice.Delta.GetContentString()) > 0 || (choice.Delta.ToolCalls != nil && len(choice.Delta.ToolCalls) > 0) {
  766. hasContent = true
  767. }
  768. if choice.FinishReason != nil {
  769. hasFinishReason = true
  770. }
  771. }
  772. // 如果没有实际内容且没有结束标志,跳过。主要针对 openai 流响应开头的空数据
  773. if !hasContent && !hasFinishReason {
  774. return nil
  775. }
  776. geminiResponse := &dto.GeminiChatResponse{
  777. Candidates: make([]dto.GeminiChatCandidate, 0, len(openAIResponse.Choices)),
  778. UsageMetadata: dto.GeminiUsageMetadata{
  779. PromptTokenCount: info.GetEstimatePromptTokens(),
  780. CandidatesTokenCount: 0, // 流式响应中可能没有完整的 usage 信息
  781. TotalTokenCount: info.GetEstimatePromptTokens(),
  782. },
  783. }
  784. if openAIResponse.Usage != nil {
  785. geminiResponse.UsageMetadata.PromptTokenCount = openAIResponse.Usage.PromptTokens
  786. geminiResponse.UsageMetadata.CandidatesTokenCount = openAIResponse.Usage.CompletionTokens
  787. geminiResponse.UsageMetadata.TotalTokenCount = openAIResponse.Usage.TotalTokens
  788. }
  789. for _, choice := range openAIResponse.Choices {
  790. candidate := dto.GeminiChatCandidate{
  791. Index: int64(choice.Index),
  792. SafetyRatings: []dto.GeminiChatSafetyRating{},
  793. }
  794. // 设置结束原因
  795. if choice.FinishReason != nil {
  796. var finishReason string
  797. switch *choice.FinishReason {
  798. case "stop":
  799. finishReason = "STOP"
  800. case "length":
  801. finishReason = "MAX_TOKENS"
  802. case "content_filter":
  803. finishReason = "SAFETY"
  804. case "tool_calls":
  805. finishReason = "STOP"
  806. default:
  807. finishReason = "STOP"
  808. }
  809. candidate.FinishReason = &finishReason
  810. }
  811. // 转换消息内容
  812. content := dto.GeminiChatContent{
  813. Role: "model",
  814. Parts: make([]dto.GeminiPart, 0),
  815. }
  816. // 处理工具调用
  817. if choice.Delta.ToolCalls != nil {
  818. for _, toolCall := range choice.Delta.ToolCalls {
  819. // 解析参数
  820. var args map[string]interface{}
  821. if toolCall.Function.Arguments != "" {
  822. if err := json.Unmarshal([]byte(toolCall.Function.Arguments), &args); err != nil {
  823. args = map[string]interface{}{"arguments": toolCall.Function.Arguments}
  824. }
  825. } else {
  826. args = make(map[string]interface{})
  827. }
  828. part := dto.GeminiPart{
  829. FunctionCall: &dto.FunctionCall{
  830. FunctionName: toolCall.Function.Name,
  831. Arguments: args,
  832. },
  833. }
  834. content.Parts = append(content.Parts, part)
  835. }
  836. } else {
  837. // 处理文本内容
  838. textContent := choice.Delta.GetContentString()
  839. if textContent != "" {
  840. part := dto.GeminiPart{
  841. Text: textContent,
  842. }
  843. content.Parts = append(content.Parts, part)
  844. }
  845. }
  846. candidate.Content = content
  847. geminiResponse.Candidates = append(geminiResponse.Candidates, candidate)
  848. }
  849. return geminiResponse
  850. }