convert.go 25 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810
  1. package service
  2. import (
  3. "encoding/json"
  4. "fmt"
  5. "strings"
  6. "github.com/QuantumNous/new-api/common"
  7. "github.com/QuantumNous/new-api/constant"
  8. "github.com/QuantumNous/new-api/dto"
  9. "github.com/QuantumNous/new-api/relay/channel/openrouter"
  10. relaycommon "github.com/QuantumNous/new-api/relay/common"
  11. )
  12. func ClaudeToOpenAIRequest(claudeRequest dto.ClaudeRequest, info *relaycommon.RelayInfo) (*dto.GeneralOpenAIRequest, error) {
  13. openAIRequest := dto.GeneralOpenAIRequest{
  14. Model: claudeRequest.Model,
  15. MaxTokens: claudeRequest.MaxTokens,
  16. Temperature: claudeRequest.Temperature,
  17. TopP: claudeRequest.TopP,
  18. Stream: claudeRequest.Stream,
  19. }
  20. isOpenRouter := info.ChannelType == constant.ChannelTypeOpenRouter
  21. if claudeRequest.Thinking != nil && claudeRequest.Thinking.Type == "enabled" {
  22. if isOpenRouter {
  23. reasoning := openrouter.RequestReasoning{
  24. MaxTokens: claudeRequest.Thinking.GetBudgetTokens(),
  25. }
  26. reasoningJSON, err := json.Marshal(reasoning)
  27. if err != nil {
  28. return nil, fmt.Errorf("failed to marshal reasoning: %w", err)
  29. }
  30. openAIRequest.Reasoning = reasoningJSON
  31. } else {
  32. thinkingSuffix := "-thinking"
  33. if strings.HasSuffix(info.OriginModelName, thinkingSuffix) &&
  34. !strings.HasSuffix(openAIRequest.Model, thinkingSuffix) {
  35. openAIRequest.Model = openAIRequest.Model + thinkingSuffix
  36. }
  37. }
  38. }
  39. // Convert stop sequences
  40. if len(claudeRequest.StopSequences) == 1 {
  41. openAIRequest.Stop = claudeRequest.StopSequences[0]
  42. } else if len(claudeRequest.StopSequences) > 1 {
  43. openAIRequest.Stop = claudeRequest.StopSequences
  44. }
  45. // Convert tools
  46. tools, _ := common.Any2Type[[]dto.Tool](claudeRequest.Tools)
  47. openAITools := make([]dto.ToolCallRequest, 0)
  48. for _, claudeTool := range tools {
  49. openAITool := dto.ToolCallRequest{
  50. Type: "function",
  51. Function: dto.FunctionRequest{
  52. Name: claudeTool.Name,
  53. Description: claudeTool.Description,
  54. Parameters: claudeTool.InputSchema,
  55. },
  56. }
  57. openAITools = append(openAITools, openAITool)
  58. }
  59. openAIRequest.Tools = openAITools
  60. // Convert messages
  61. openAIMessages := make([]dto.Message, 0)
  62. // Add system message if present
  63. if claudeRequest.System != nil {
  64. if claudeRequest.IsStringSystem() && claudeRequest.GetStringSystem() != "" {
  65. openAIMessage := dto.Message{
  66. Role: "system",
  67. }
  68. openAIMessage.SetStringContent(claudeRequest.GetStringSystem())
  69. openAIMessages = append(openAIMessages, openAIMessage)
  70. } else {
  71. systems := claudeRequest.ParseSystem()
  72. if len(systems) > 0 {
  73. openAIMessage := dto.Message{
  74. Role: "system",
  75. }
  76. isOpenRouterClaude := isOpenRouter && strings.HasPrefix(info.UpstreamModelName, "anthropic/claude")
  77. if isOpenRouterClaude {
  78. systemMediaMessages := make([]dto.MediaContent, 0, len(systems))
  79. for _, system := range systems {
  80. message := dto.MediaContent{
  81. Type: "text",
  82. Text: system.GetText(),
  83. CacheControl: system.CacheControl,
  84. }
  85. systemMediaMessages = append(systemMediaMessages, message)
  86. }
  87. openAIMessage.SetMediaContent(systemMediaMessages)
  88. } else {
  89. systemStr := ""
  90. for _, system := range systems {
  91. if system.Text != nil {
  92. systemStr += *system.Text
  93. }
  94. }
  95. openAIMessage.SetStringContent(systemStr)
  96. }
  97. openAIMessages = append(openAIMessages, openAIMessage)
  98. }
  99. }
  100. }
  101. for _, claudeMessage := range claudeRequest.Messages {
  102. openAIMessage := dto.Message{
  103. Role: claudeMessage.Role,
  104. }
  105. //log.Printf("claudeMessage.Content: %v", claudeMessage.Content)
  106. if claudeMessage.IsStringContent() {
  107. openAIMessage.SetStringContent(claudeMessage.GetStringContent())
  108. } else {
  109. content, err := claudeMessage.ParseContent()
  110. if err != nil {
  111. return nil, err
  112. }
  113. contents := content
  114. var toolCalls []dto.ToolCallRequest
  115. mediaMessages := make([]dto.MediaContent, 0, len(contents))
  116. for _, mediaMsg := range contents {
  117. switch mediaMsg.Type {
  118. case "text":
  119. message := dto.MediaContent{
  120. Type: "text",
  121. Text: mediaMsg.GetText(),
  122. CacheControl: mediaMsg.CacheControl,
  123. }
  124. mediaMessages = append(mediaMessages, message)
  125. case "image":
  126. // Handle image conversion (base64 to URL or keep as is)
  127. imageData := fmt.Sprintf("data:%s;base64,%s", mediaMsg.Source.MediaType, mediaMsg.Source.Data)
  128. //textContent += fmt.Sprintf("[Image: %s]", imageData)
  129. mediaMessage := dto.MediaContent{
  130. Type: "image_url",
  131. ImageUrl: &dto.MessageImageUrl{Url: imageData},
  132. }
  133. mediaMessages = append(mediaMessages, mediaMessage)
  134. case "tool_use":
  135. toolCall := dto.ToolCallRequest{
  136. ID: mediaMsg.Id,
  137. Type: "function",
  138. Function: dto.FunctionRequest{
  139. Name: mediaMsg.Name,
  140. Arguments: toJSONString(mediaMsg.Input),
  141. },
  142. }
  143. toolCalls = append(toolCalls, toolCall)
  144. case "tool_result":
  145. // Add tool result as a separate message
  146. toolName := mediaMsg.Name
  147. if toolName == "" {
  148. toolName = claudeRequest.SearchToolNameByToolCallId(mediaMsg.ToolUseId)
  149. }
  150. oaiToolMessage := dto.Message{
  151. Role: "tool",
  152. Name: &toolName,
  153. ToolCallId: mediaMsg.ToolUseId,
  154. }
  155. //oaiToolMessage.SetStringContent(*mediaMsg.GetMediaContent().Text)
  156. if mediaMsg.IsStringContent() {
  157. oaiToolMessage.SetStringContent(mediaMsg.GetStringContent())
  158. } else {
  159. mediaContents := mediaMsg.ParseMediaContent()
  160. encodeJson, _ := common.Marshal(mediaContents)
  161. oaiToolMessage.SetStringContent(string(encodeJson))
  162. }
  163. openAIMessages = append(openAIMessages, oaiToolMessage)
  164. }
  165. }
  166. if len(toolCalls) > 0 {
  167. openAIMessage.SetToolCalls(toolCalls)
  168. }
  169. if len(mediaMessages) > 0 && len(toolCalls) == 0 {
  170. openAIMessage.SetMediaContent(mediaMessages)
  171. }
  172. }
  173. if len(openAIMessage.ParseContent()) > 0 || len(openAIMessage.ToolCalls) > 0 {
  174. openAIMessages = append(openAIMessages, openAIMessage)
  175. }
  176. }
  177. openAIRequest.Messages = openAIMessages
  178. return &openAIRequest, nil
  179. }
  180. func generateStopBlock(index int) *dto.ClaudeResponse {
  181. return &dto.ClaudeResponse{
  182. Type: "content_block_stop",
  183. Index: common.GetPointer[int](index),
  184. }
  185. }
  186. func StreamResponseOpenAI2Claude(openAIResponse *dto.ChatCompletionsStreamResponse, info *relaycommon.RelayInfo) []*dto.ClaudeResponse {
  187. var claudeResponses []*dto.ClaudeResponse
  188. if info.SendResponseCount == 1 {
  189. msg := &dto.ClaudeMediaMessage{
  190. Id: openAIResponse.Id,
  191. Model: openAIResponse.Model,
  192. Type: "message",
  193. Role: "assistant",
  194. Usage: &dto.ClaudeUsage{
  195. InputTokens: info.PromptTokens,
  196. OutputTokens: 0,
  197. },
  198. }
  199. msg.SetContent(make([]any, 0))
  200. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  201. Type: "message_start",
  202. Message: msg,
  203. })
  204. claudeResponses = append(claudeResponses)
  205. //claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  206. // Type: "ping",
  207. //})
  208. if openAIResponse.IsToolCall() {
  209. info.ClaudeConvertInfo.LastMessagesType = relaycommon.LastMessageTypeTools
  210. resp := &dto.ClaudeResponse{
  211. Type: "content_block_start",
  212. ContentBlock: &dto.ClaudeMediaMessage{
  213. Id: openAIResponse.GetFirstToolCall().ID,
  214. Type: "tool_use",
  215. Name: openAIResponse.GetFirstToolCall().Function.Name,
  216. Input: map[string]interface{}{},
  217. },
  218. }
  219. resp.SetIndex(0)
  220. claudeResponses = append(claudeResponses, resp)
  221. } else {
  222. }
  223. // 判断首个响应是否存在内容(非标准的 OpenAI 响应)
  224. if len(openAIResponse.Choices) > 0 && len(openAIResponse.Choices[0].Delta.GetContentString()) > 0 {
  225. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  226. Index: &info.ClaudeConvertInfo.Index,
  227. Type: "content_block_start",
  228. ContentBlock: &dto.ClaudeMediaMessage{
  229. Type: "text",
  230. Text: common.GetPointer[string](""),
  231. },
  232. })
  233. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  234. Index: &info.ClaudeConvertInfo.Index,
  235. Type: "content_block_delta",
  236. Delta: &dto.ClaudeMediaMessage{
  237. Type: "text_delta",
  238. Text: common.GetPointer[string](openAIResponse.Choices[0].Delta.GetContentString()),
  239. },
  240. })
  241. info.ClaudeConvertInfo.LastMessagesType = relaycommon.LastMessageTypeText
  242. }
  243. return claudeResponses
  244. }
  245. if len(openAIResponse.Choices) == 0 {
  246. // no choices
  247. // 可能为非标准的 OpenAI 响应,判断是否已经完成
  248. if info.Done {
  249. claudeResponses = append(claudeResponses, generateStopBlock(info.ClaudeConvertInfo.Index))
  250. oaiUsage := info.ClaudeConvertInfo.Usage
  251. if oaiUsage != nil {
  252. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  253. Type: "message_delta",
  254. Usage: &dto.ClaudeUsage{
  255. InputTokens: oaiUsage.PromptTokens,
  256. OutputTokens: oaiUsage.CompletionTokens,
  257. CacheCreationInputTokens: oaiUsage.PromptTokensDetails.CachedCreationTokens,
  258. CacheReadInputTokens: oaiUsage.PromptTokensDetails.CachedTokens,
  259. },
  260. Delta: &dto.ClaudeMediaMessage{
  261. StopReason: common.GetPointer[string](stopReasonOpenAI2Claude(info.FinishReason)),
  262. },
  263. })
  264. }
  265. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  266. Type: "message_stop",
  267. })
  268. }
  269. return claudeResponses
  270. } else {
  271. chosenChoice := openAIResponse.Choices[0]
  272. if chosenChoice.FinishReason != nil && *chosenChoice.FinishReason != "" {
  273. // should be done
  274. info.FinishReason = *chosenChoice.FinishReason
  275. if !info.Done {
  276. return claudeResponses
  277. }
  278. }
  279. if info.Done {
  280. claudeResponses = append(claudeResponses, generateStopBlock(info.ClaudeConvertInfo.Index))
  281. oaiUsage := info.ClaudeConvertInfo.Usage
  282. if oaiUsage != nil {
  283. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  284. Type: "message_delta",
  285. Usage: &dto.ClaudeUsage{
  286. InputTokens: oaiUsage.PromptTokens,
  287. OutputTokens: oaiUsage.CompletionTokens,
  288. CacheCreationInputTokens: oaiUsage.PromptTokensDetails.CachedCreationTokens,
  289. CacheReadInputTokens: oaiUsage.PromptTokensDetails.CachedTokens,
  290. },
  291. Delta: &dto.ClaudeMediaMessage{
  292. StopReason: common.GetPointer[string](stopReasonOpenAI2Claude(info.FinishReason)),
  293. },
  294. })
  295. }
  296. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  297. Type: "message_stop",
  298. })
  299. } else {
  300. var claudeResponse dto.ClaudeResponse
  301. var isEmpty bool
  302. claudeResponse.Type = "content_block_delta"
  303. if len(chosenChoice.Delta.ToolCalls) > 0 {
  304. if info.ClaudeConvertInfo.LastMessagesType != relaycommon.LastMessageTypeTools {
  305. claudeResponses = append(claudeResponses, generateStopBlock(info.ClaudeConvertInfo.Index))
  306. info.ClaudeConvertInfo.Index++
  307. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  308. Index: &info.ClaudeConvertInfo.Index,
  309. Type: "content_block_start",
  310. ContentBlock: &dto.ClaudeMediaMessage{
  311. Id: openAIResponse.GetFirstToolCall().ID,
  312. Type: "tool_use",
  313. Name: openAIResponse.GetFirstToolCall().Function.Name,
  314. Input: map[string]interface{}{},
  315. },
  316. })
  317. }
  318. info.ClaudeConvertInfo.LastMessagesType = relaycommon.LastMessageTypeTools
  319. // tools delta
  320. claudeResponse.Delta = &dto.ClaudeMediaMessage{
  321. Type: "input_json_delta",
  322. PartialJson: &chosenChoice.Delta.ToolCalls[0].Function.Arguments,
  323. }
  324. } else {
  325. reasoning := chosenChoice.Delta.GetReasoningContent()
  326. textContent := chosenChoice.Delta.GetContentString()
  327. if reasoning != "" || textContent != "" {
  328. if reasoning != "" {
  329. if info.ClaudeConvertInfo.LastMessagesType != relaycommon.LastMessageTypeThinking {
  330. //info.ClaudeConvertInfo.Index++
  331. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  332. Index: &info.ClaudeConvertInfo.Index,
  333. Type: "content_block_start",
  334. ContentBlock: &dto.ClaudeMediaMessage{
  335. Type: "thinking",
  336. Thinking: common.GetPointer[string](""),
  337. },
  338. })
  339. }
  340. info.ClaudeConvertInfo.LastMessagesType = relaycommon.LastMessageTypeThinking
  341. // text delta
  342. claudeResponse.Delta = &dto.ClaudeMediaMessage{
  343. Type: "thinking_delta",
  344. Thinking: &reasoning,
  345. }
  346. } else {
  347. if info.ClaudeConvertInfo.LastMessagesType != relaycommon.LastMessageTypeText {
  348. if info.LastMessagesType == relaycommon.LastMessageTypeThinking || info.LastMessagesType == relaycommon.LastMessageTypeTools {
  349. claudeResponses = append(claudeResponses, generateStopBlock(info.ClaudeConvertInfo.Index))
  350. info.ClaudeConvertInfo.Index++
  351. }
  352. claudeResponses = append(claudeResponses, &dto.ClaudeResponse{
  353. Index: &info.ClaudeConvertInfo.Index,
  354. Type: "content_block_start",
  355. ContentBlock: &dto.ClaudeMediaMessage{
  356. Type: "text",
  357. Text: common.GetPointer[string](""),
  358. },
  359. })
  360. }
  361. info.ClaudeConvertInfo.LastMessagesType = relaycommon.LastMessageTypeText
  362. // text delta
  363. claudeResponse.Delta = &dto.ClaudeMediaMessage{
  364. Type: "text_delta",
  365. Text: common.GetPointer[string](textContent),
  366. }
  367. }
  368. } else {
  369. isEmpty = true
  370. }
  371. }
  372. claudeResponse.Index = &info.ClaudeConvertInfo.Index
  373. if !isEmpty {
  374. claudeResponses = append(claudeResponses, &claudeResponse)
  375. }
  376. }
  377. }
  378. return claudeResponses
  379. }
  380. func ResponseOpenAI2Claude(openAIResponse *dto.OpenAITextResponse, info *relaycommon.RelayInfo) *dto.ClaudeResponse {
  381. var stopReason string
  382. contents := make([]dto.ClaudeMediaMessage, 0)
  383. claudeResponse := &dto.ClaudeResponse{
  384. Id: openAIResponse.Id,
  385. Type: "message",
  386. Role: "assistant",
  387. Model: openAIResponse.Model,
  388. }
  389. for _, choice := range openAIResponse.Choices {
  390. stopReason = stopReasonOpenAI2Claude(choice.FinishReason)
  391. if choice.FinishReason == "tool_calls" {
  392. for _, toolUse := range choice.Message.ParseToolCalls() {
  393. claudeContent := dto.ClaudeMediaMessage{}
  394. claudeContent.Type = "tool_use"
  395. claudeContent.Id = toolUse.ID
  396. claudeContent.Name = toolUse.Function.Name
  397. var mapParams map[string]interface{}
  398. if err := common.Unmarshal([]byte(toolUse.Function.Arguments), &mapParams); err == nil {
  399. claudeContent.Input = mapParams
  400. } else {
  401. claudeContent.Input = toolUse.Function.Arguments
  402. }
  403. contents = append(contents, claudeContent)
  404. }
  405. } else {
  406. claudeContent := dto.ClaudeMediaMessage{}
  407. claudeContent.Type = "text"
  408. claudeContent.SetText(choice.Message.StringContent())
  409. contents = append(contents, claudeContent)
  410. }
  411. }
  412. claudeResponse.Content = contents
  413. claudeResponse.StopReason = stopReason
  414. claudeResponse.Usage = &dto.ClaudeUsage{
  415. InputTokens: openAIResponse.PromptTokens,
  416. OutputTokens: openAIResponse.CompletionTokens,
  417. }
  418. return claudeResponse
  419. }
  420. func stopReasonOpenAI2Claude(reason string) string {
  421. switch reason {
  422. case "stop":
  423. return "end_turn"
  424. case "stop_sequence":
  425. return "stop_sequence"
  426. case "length":
  427. fallthrough
  428. case "max_tokens":
  429. return "max_tokens"
  430. case "tool_calls":
  431. return "tool_use"
  432. default:
  433. return reason
  434. }
  435. }
  436. func toJSONString(v interface{}) string {
  437. b, err := json.Marshal(v)
  438. if err != nil {
  439. return "{}"
  440. }
  441. return string(b)
  442. }
  443. func GeminiToOpenAIRequest(geminiRequest *dto.GeminiChatRequest, info *relaycommon.RelayInfo) (*dto.GeneralOpenAIRequest, error) {
  444. openaiRequest := &dto.GeneralOpenAIRequest{
  445. Model: info.UpstreamModelName,
  446. Stream: info.IsStream,
  447. }
  448. // 转换 messages
  449. var messages []dto.Message
  450. for _, content := range geminiRequest.Contents {
  451. message := dto.Message{
  452. Role: convertGeminiRoleToOpenAI(content.Role),
  453. }
  454. // 处理 parts
  455. var mediaContents []dto.MediaContent
  456. var toolCalls []dto.ToolCallRequest
  457. for _, part := range content.Parts {
  458. if part.Text != "" {
  459. mediaContent := dto.MediaContent{
  460. Type: "text",
  461. Text: part.Text,
  462. }
  463. mediaContents = append(mediaContents, mediaContent)
  464. } else if part.InlineData != nil {
  465. mediaContent := dto.MediaContent{
  466. Type: "image_url",
  467. ImageUrl: &dto.MessageImageUrl{
  468. Url: fmt.Sprintf("data:%s;base64,%s", part.InlineData.MimeType, part.InlineData.Data),
  469. Detail: "auto",
  470. MimeType: part.InlineData.MimeType,
  471. },
  472. }
  473. mediaContents = append(mediaContents, mediaContent)
  474. } else if part.FileData != nil {
  475. mediaContent := dto.MediaContent{
  476. Type: "image_url",
  477. ImageUrl: &dto.MessageImageUrl{
  478. Url: part.FileData.FileUri,
  479. Detail: "auto",
  480. MimeType: part.FileData.MimeType,
  481. },
  482. }
  483. mediaContents = append(mediaContents, mediaContent)
  484. } else if part.FunctionCall != nil {
  485. // 处理 Gemini 的工具调用
  486. toolCall := dto.ToolCallRequest{
  487. ID: fmt.Sprintf("call_%d", len(toolCalls)+1), // 生成唯一ID
  488. Type: "function",
  489. Function: dto.FunctionRequest{
  490. Name: part.FunctionCall.FunctionName,
  491. Arguments: toJSONString(part.FunctionCall.Arguments),
  492. },
  493. }
  494. toolCalls = append(toolCalls, toolCall)
  495. } else if part.FunctionResponse != nil {
  496. // 处理 Gemini 的工具响应,创建单独的 tool 消息
  497. toolMessage := dto.Message{
  498. Role: "tool",
  499. ToolCallId: fmt.Sprintf("call_%d", len(toolCalls)), // 使用对应的调用ID
  500. }
  501. toolMessage.SetStringContent(toJSONString(part.FunctionResponse.Response))
  502. messages = append(messages, toolMessage)
  503. }
  504. }
  505. // 设置消息内容
  506. if len(toolCalls) > 0 {
  507. // 如果有工具调用,设置工具调用
  508. message.SetToolCalls(toolCalls)
  509. } else if len(mediaContents) == 1 && mediaContents[0].Type == "text" {
  510. // 如果只有一个文本内容,直接设置字符串
  511. message.Content = mediaContents[0].Text
  512. } else if len(mediaContents) > 0 {
  513. // 如果有多个内容或包含媒体,设置为数组
  514. message.SetMediaContent(mediaContents)
  515. }
  516. // 只有当消息有内容或工具调用时才添加
  517. if len(message.ParseContent()) > 0 || len(message.ToolCalls) > 0 {
  518. messages = append(messages, message)
  519. }
  520. }
  521. openaiRequest.Messages = messages
  522. if geminiRequest.GenerationConfig.Temperature != nil {
  523. openaiRequest.Temperature = geminiRequest.GenerationConfig.Temperature
  524. }
  525. if geminiRequest.GenerationConfig.TopP > 0 {
  526. openaiRequest.TopP = geminiRequest.GenerationConfig.TopP
  527. }
  528. if geminiRequest.GenerationConfig.TopK > 0 {
  529. openaiRequest.TopK = int(geminiRequest.GenerationConfig.TopK)
  530. }
  531. if geminiRequest.GenerationConfig.MaxOutputTokens > 0 {
  532. openaiRequest.MaxTokens = geminiRequest.GenerationConfig.MaxOutputTokens
  533. }
  534. // gemini stop sequences 最多 5 个,openai stop 最多 4 个
  535. if len(geminiRequest.GenerationConfig.StopSequences) > 0 {
  536. openaiRequest.Stop = geminiRequest.GenerationConfig.StopSequences[:4]
  537. }
  538. if geminiRequest.GenerationConfig.CandidateCount > 0 {
  539. openaiRequest.N = geminiRequest.GenerationConfig.CandidateCount
  540. }
  541. // 转换工具调用
  542. if len(geminiRequest.GetTools()) > 0 {
  543. var tools []dto.ToolCallRequest
  544. for _, tool := range geminiRequest.GetTools() {
  545. if tool.FunctionDeclarations != nil {
  546. // 将 Gemini 的 FunctionDeclarations 转换为 OpenAI 的 ToolCallRequest
  547. functionDeclarations, ok := tool.FunctionDeclarations.([]dto.FunctionRequest)
  548. if ok {
  549. for _, function := range functionDeclarations {
  550. openAITool := dto.ToolCallRequest{
  551. Type: "function",
  552. Function: dto.FunctionRequest{
  553. Name: function.Name,
  554. Description: function.Description,
  555. Parameters: function.Parameters,
  556. },
  557. }
  558. tools = append(tools, openAITool)
  559. }
  560. }
  561. }
  562. }
  563. if len(tools) > 0 {
  564. openaiRequest.Tools = tools
  565. }
  566. }
  567. // gemini system instructions
  568. if geminiRequest.SystemInstructions != nil {
  569. // 将系统指令作为第一条消息插入
  570. systemMessage := dto.Message{
  571. Role: "system",
  572. Content: extractTextFromGeminiParts(geminiRequest.SystemInstructions.Parts),
  573. }
  574. openaiRequest.Messages = append([]dto.Message{systemMessage}, openaiRequest.Messages...)
  575. }
  576. return openaiRequest, nil
  577. }
  578. func convertGeminiRoleToOpenAI(geminiRole string) string {
  579. switch geminiRole {
  580. case "user":
  581. return "user"
  582. case "model":
  583. return "assistant"
  584. case "function":
  585. return "function"
  586. default:
  587. return "user"
  588. }
  589. }
  590. func extractTextFromGeminiParts(parts []dto.GeminiPart) string {
  591. var texts []string
  592. for _, part := range parts {
  593. if part.Text != "" {
  594. texts = append(texts, part.Text)
  595. }
  596. }
  597. return strings.Join(texts, "\n")
  598. }
  599. // ResponseOpenAI2Gemini 将 OpenAI 响应转换为 Gemini 格式
  600. func ResponseOpenAI2Gemini(openAIResponse *dto.OpenAITextResponse, info *relaycommon.RelayInfo) *dto.GeminiChatResponse {
  601. geminiResponse := &dto.GeminiChatResponse{
  602. Candidates: make([]dto.GeminiChatCandidate, 0, len(openAIResponse.Choices)),
  603. UsageMetadata: dto.GeminiUsageMetadata{
  604. PromptTokenCount: openAIResponse.PromptTokens,
  605. CandidatesTokenCount: openAIResponse.CompletionTokens,
  606. TotalTokenCount: openAIResponse.PromptTokens + openAIResponse.CompletionTokens,
  607. },
  608. }
  609. for _, choice := range openAIResponse.Choices {
  610. candidate := dto.GeminiChatCandidate{
  611. Index: int64(choice.Index),
  612. SafetyRatings: []dto.GeminiChatSafetyRating{},
  613. }
  614. // 设置结束原因
  615. var finishReason string
  616. switch choice.FinishReason {
  617. case "stop":
  618. finishReason = "STOP"
  619. case "length":
  620. finishReason = "MAX_TOKENS"
  621. case "content_filter":
  622. finishReason = "SAFETY"
  623. case "tool_calls":
  624. finishReason = "STOP"
  625. default:
  626. finishReason = "STOP"
  627. }
  628. candidate.FinishReason = &finishReason
  629. // 转换消息内容
  630. content := dto.GeminiChatContent{
  631. Role: "model",
  632. Parts: make([]dto.GeminiPart, 0),
  633. }
  634. // 处理工具调用
  635. toolCalls := choice.Message.ParseToolCalls()
  636. if len(toolCalls) > 0 {
  637. for _, toolCall := range toolCalls {
  638. // 解析参数
  639. var args map[string]interface{}
  640. if toolCall.Function.Arguments != "" {
  641. if err := json.Unmarshal([]byte(toolCall.Function.Arguments), &args); err != nil {
  642. args = map[string]interface{}{"arguments": toolCall.Function.Arguments}
  643. }
  644. } else {
  645. args = make(map[string]interface{})
  646. }
  647. part := dto.GeminiPart{
  648. FunctionCall: &dto.FunctionCall{
  649. FunctionName: toolCall.Function.Name,
  650. Arguments: args,
  651. },
  652. }
  653. content.Parts = append(content.Parts, part)
  654. }
  655. } else {
  656. // 处理文本内容
  657. textContent := choice.Message.StringContent()
  658. if textContent != "" {
  659. part := dto.GeminiPart{
  660. Text: textContent,
  661. }
  662. content.Parts = append(content.Parts, part)
  663. }
  664. }
  665. candidate.Content = content
  666. geminiResponse.Candidates = append(geminiResponse.Candidates, candidate)
  667. }
  668. return geminiResponse
  669. }
  670. // StreamResponseOpenAI2Gemini 将 OpenAI 流式响应转换为 Gemini 格式
  671. func StreamResponseOpenAI2Gemini(openAIResponse *dto.ChatCompletionsStreamResponse, info *relaycommon.RelayInfo) *dto.GeminiChatResponse {
  672. // 检查是否有实际内容或结束标志
  673. hasContent := false
  674. hasFinishReason := false
  675. for _, choice := range openAIResponse.Choices {
  676. if len(choice.Delta.GetContentString()) > 0 || (choice.Delta.ToolCalls != nil && len(choice.Delta.ToolCalls) > 0) {
  677. hasContent = true
  678. }
  679. if choice.FinishReason != nil {
  680. hasFinishReason = true
  681. }
  682. }
  683. // 如果没有实际内容且没有结束标志,跳过。主要针对 openai 流响应开头的空数据
  684. if !hasContent && !hasFinishReason {
  685. return nil
  686. }
  687. geminiResponse := &dto.GeminiChatResponse{
  688. Candidates: make([]dto.GeminiChatCandidate, 0, len(openAIResponse.Choices)),
  689. UsageMetadata: dto.GeminiUsageMetadata{
  690. PromptTokenCount: info.PromptTokens,
  691. CandidatesTokenCount: 0, // 流式响应中可能没有完整的 usage 信息
  692. TotalTokenCount: info.PromptTokens,
  693. },
  694. }
  695. for _, choice := range openAIResponse.Choices {
  696. candidate := dto.GeminiChatCandidate{
  697. Index: int64(choice.Index),
  698. SafetyRatings: []dto.GeminiChatSafetyRating{},
  699. }
  700. // 设置结束原因
  701. if choice.FinishReason != nil {
  702. var finishReason string
  703. switch *choice.FinishReason {
  704. case "stop":
  705. finishReason = "STOP"
  706. case "length":
  707. finishReason = "MAX_TOKENS"
  708. case "content_filter":
  709. finishReason = "SAFETY"
  710. case "tool_calls":
  711. finishReason = "STOP"
  712. default:
  713. finishReason = "STOP"
  714. }
  715. candidate.FinishReason = &finishReason
  716. }
  717. // 转换消息内容
  718. content := dto.GeminiChatContent{
  719. Role: "model",
  720. Parts: make([]dto.GeminiPart, 0),
  721. }
  722. // 处理工具调用
  723. if choice.Delta.ToolCalls != nil {
  724. for _, toolCall := range choice.Delta.ToolCalls {
  725. // 解析参数
  726. var args map[string]interface{}
  727. if toolCall.Function.Arguments != "" {
  728. if err := json.Unmarshal([]byte(toolCall.Function.Arguments), &args); err != nil {
  729. args = map[string]interface{}{"arguments": toolCall.Function.Arguments}
  730. }
  731. } else {
  732. args = make(map[string]interface{})
  733. }
  734. part := dto.GeminiPart{
  735. FunctionCall: &dto.FunctionCall{
  736. FunctionName: toolCall.Function.Name,
  737. Arguments: args,
  738. },
  739. }
  740. content.Parts = append(content.Parts, part)
  741. }
  742. } else {
  743. // 处理文本内容
  744. textContent := choice.Delta.GetContentString()
  745. if textContent != "" {
  746. part := dto.GeminiPart{
  747. Text: textContent,
  748. }
  749. content.Parts = append(content.Parts, part)
  750. }
  751. }
  752. candidate.Content = content
  753. geminiResponse.Candidates = append(geminiResponse.Candidates, candidate)
  754. }
  755. return geminiResponse
  756. }