| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
7037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018 |
- package dto
- import (
- "encoding/json"
- "fmt"
- "strings"
- "github.com/QuantumNous/new-api/common"
- "github.com/QuantumNous/new-api/types"
- "github.com/gin-gonic/gin"
- )
// ResponseFormat is the value of the "response_format" request field.
type ResponseFormat struct {
	// Type is serialized as "type" and omitted when empty.
	Type string `json:"type,omitempty"`
	// JsonSchema holds the "json_schema" payload as raw, undecoded JSON.
	JsonSchema json.RawMessage `json:"json_schema,omitempty"`
}
// FormatJsonSchema describes a named JSON schema. Name is always serialized;
// the remaining fields are omitted when empty.
type FormatJsonSchema struct {
	Description string `json:"description,omitempty"`
	Name        string `json:"name"`
	// Schema is left untyped so any JSON-encodable schema value can be carried.
	Schema any `json:"schema,omitempty"`
	// Strict is kept as raw JSON and forwarded without being decoded here.
	Strict json.RawMessage `json:"strict,omitempty"`
}
- // GeneralOpenAIRequest represents a general request structure for OpenAI-compatible APIs.
- // 参数增加规范:无引用的参数必须使用json.RawMessage类型,并添加omitempty标签
- type GeneralOpenAIRequest struct {
- Model string `json:"model,omitempty"`
- Messages []Message `json:"messages,omitempty"`
- Prompt any `json:"prompt,omitempty"`
- Prefix any `json:"prefix,omitempty"`
- Suffix any `json:"suffix,omitempty"`
- Stream bool `json:"stream,omitempty"`
- StreamOptions *StreamOptions `json:"stream_options,omitempty"`
- MaxTokens uint `json:"max_tokens,omitempty"`
- MaxCompletionTokens uint `json:"max_completion_tokens,omitempty"`
- ReasoningEffort string `json:"reasoning_effort,omitempty"`
- Verbosity json.RawMessage `json:"verbosity,omitempty"` // gpt-5
- Temperature *float64 `json:"temperature,omitempty"`
- TopP float64 `json:"top_p,omitempty"`
- TopK int `json:"top_k,omitempty"`
- Stop any `json:"stop,omitempty"`
- N int `json:"n,omitempty"`
- Input any `json:"input,omitempty"`
- Instruction string `json:"instruction,omitempty"`
- Size string `json:"size,omitempty"`
- Functions json.RawMessage `json:"functions,omitempty"`
- FrequencyPenalty float64 `json:"frequency_penalty,omitempty"`
- PresencePenalty float64 `json:"presence_penalty,omitempty"`
- ResponseFormat *ResponseFormat `json:"response_format,omitempty"`
- EncodingFormat json.RawMessage `json:"encoding_format,omitempty"`
- Seed float64 `json:"seed,omitempty"`
- ParallelTooCalls *bool `json:"parallel_tool_calls,omitempty"`
- Tools []ToolCallRequest `json:"tools,omitempty"`
- ToolChoice any `json:"tool_choice,omitempty"`
- User string `json:"user,omitempty"`
- LogProbs bool `json:"logprobs,omitempty"`
- TopLogProbs int `json:"top_logprobs,omitempty"`
- Dimensions int `json:"dimensions,omitempty"`
- Modalities json.RawMessage `json:"modalities,omitempty"`
- Audio json.RawMessage `json:"audio,omitempty"`
- // 安全标识符,用于帮助 OpenAI 检测可能违反使用政策的应用程序用户
- // 注意:此字段会向 OpenAI 发送用户标识信息,默认过滤以保护用户隐私
- SafetyIdentifier string `json:"safety_identifier,omitempty"`
- // Whether or not to store the output of this chat completion request for use in our model distillation or evals products.
- // 是否存储此次请求数据供 OpenAI 用于评估和优化产品
- // 注意:默认过滤此字段以保护用户隐私,但过滤后可能导致 Codex 无法正常使用
- Store json.RawMessage `json:"store,omitempty"`
- // Used by OpenAI to cache responses for similar requests to optimize your cache hit rates. Replaces the user field
- PromptCacheKey string `json:"prompt_cache_key,omitempty"`
- PromptCacheRetention json.RawMessage `json:"prompt_cache_retention,omitempty"`
- LogitBias json.RawMessage `json:"logit_bias,omitempty"`
- Metadata json.RawMessage `json:"metadata,omitempty"`
- Prediction json.RawMessage `json:"prediction,omitempty"`
- // gemini
- ExtraBody json.RawMessage `json:"extra_body,omitempty"`
- //xai
- SearchParameters json.RawMessage `json:"search_parameters,omitempty"`
- // claude
- WebSearchOptions *WebSearchOptions `json:"web_search_options,omitempty"`
- // OpenRouter Params
- Usage json.RawMessage `json:"usage,omitempty"`
- Reasoning json.RawMessage `json:"reasoning,omitempty"`
- // Ali Qwen Params
- VlHighResolutionImages json.RawMessage `json:"vl_high_resolution_images,omitempty"`
- EnableThinking json.RawMessage `json:"enable_thinking,omitempty"`
- ChatTemplateKwargs json.RawMessage `json:"chat_template_kwargs,omitempty"`
- EnableSearch json.RawMessage `json:"enable_search,omitempty"`
- // ollama Params
- Think json.RawMessage `json:"think,omitempty"`
- // baidu v2
- WebSearch json.RawMessage `json:"web_search,omitempty"`
- // doubao,zhipu_v4
- THINKING json.RawMessage `json:"thinking,omitempty"`
- // pplx Params
- SearchDomainFilter json.RawMessage `json:"search_domain_filter,omitempty"`
- SearchRecencyFilter string `json:"search_recency_filter,omitempty"`
- ReturnImages bool `json:"return_images,omitempty"`
- ReturnRelatedQuestions bool `json:"return_related_questions,omitempty"`
- SearchMode string `json:"search_mode,omitempty"`
- }
- // createFileSource 根据数据内容创建正确类型的 FileSource
- func createFileSource(data string) *types.FileSource {
- if strings.HasPrefix(data, "http://") || strings.HasPrefix(data, "https://") {
- return types.NewURLFileSource(data)
- }
- return types.NewBase64FileSource(data, "")
- }
- func (r *GeneralOpenAIRequest) GetTokenCountMeta() *types.TokenCountMeta {
- var tokenCountMeta types.TokenCountMeta
- var texts = make([]string, 0)
- var fileMeta = make([]*types.FileMeta, 0)
- if r.Prompt != nil {
- switch v := r.Prompt.(type) {
- case string:
- texts = append(texts, v)
- case []any:
- for _, item := range v {
- if str, ok := item.(string); ok {
- texts = append(texts, str)
- }
- }
- default:
- texts = append(texts, fmt.Sprintf("%v", r.Prompt))
- }
- }
- if r.Input != nil {
- inputs := r.ParseInput()
- texts = append(texts, inputs...)
- }
- if r.MaxCompletionTokens > r.MaxTokens {
- tokenCountMeta.MaxTokens = int(r.MaxCompletionTokens)
- } else {
- tokenCountMeta.MaxTokens = int(r.MaxTokens)
- }
- for _, message := range r.Messages {
- tokenCountMeta.MessagesCount++
- texts = append(texts, message.Role)
- if message.Content != nil {
- if message.Name != nil {
- tokenCountMeta.NameCount++
- texts = append(texts, *message.Name)
- }
- arrayContent := message.ParseContent()
- for _, m := range arrayContent {
- if m.Type == ContentTypeImageURL {
- imageUrl := m.GetImageMedia()
- if imageUrl != nil && imageUrl.Url != "" {
- source := createFileSource(imageUrl.Url)
- fileMeta = append(fileMeta, &types.FileMeta{
- FileType: types.FileTypeImage,
- Source: source,
- Detail: imageUrl.Detail,
- })
- }
- } else if m.Type == ContentTypeInputAudio {
- inputAudio := m.GetInputAudio()
- if inputAudio != nil && inputAudio.Data != "" {
- source := createFileSource(inputAudio.Data)
- fileMeta = append(fileMeta, &types.FileMeta{
- FileType: types.FileTypeAudio,
- Source: source,
- })
- }
- } else if m.Type == ContentTypeFile {
- file := m.GetFile()
- if file != nil && file.FileData != "" {
- source := createFileSource(file.FileData)
- fileMeta = append(fileMeta, &types.FileMeta{
- FileType: types.FileTypeFile,
- Source: source,
- })
- }
- } else if m.Type == ContentTypeVideoUrl {
- videoUrl := m.GetVideoUrl()
- if videoUrl != nil && videoUrl.Url != "" {
- source := createFileSource(videoUrl.Url)
- fileMeta = append(fileMeta, &types.FileMeta{
- FileType: types.FileTypeVideo,
- Source: source,
- })
- }
- } else {
- texts = append(texts, m.Text)
- }
- }
- }
- }
- if r.Tools != nil {
- openaiTools := r.Tools
- for _, tool := range openaiTools {
- tokenCountMeta.ToolsCount++
- texts = append(texts, tool.Function.Name)
- if tool.Function.Description != "" {
- texts = append(texts, tool.Function.Description)
- }
- if tool.Function.Parameters != nil {
- texts = append(texts, fmt.Sprintf("%v", tool.Function.Parameters))
- }
- }
- //toolTokens := CountTokenInput(countStr, request.Model)
- //tkm += 8
- //tkm += toolTokens
- }
- tokenCountMeta.CombineText = strings.Join(texts, "\n")
- tokenCountMeta.Files = fileMeta
- return &tokenCountMeta
- }
- func (r *GeneralOpenAIRequest) IsStream(c *gin.Context) bool {
- return r.Stream
- }
- func (r *GeneralOpenAIRequest) SetModelName(modelName string) {
- if modelName != "" {
- r.Model = modelName
- }
- }
- func (r *GeneralOpenAIRequest) ToMap() map[string]any {
- result := make(map[string]any)
- data, _ := common.Marshal(r)
- _ = common.Unmarshal(data, &result)
- return result
- }
- func (r *GeneralOpenAIRequest) GetSystemRoleName() string {
- if strings.HasPrefix(r.Model, "o") {
- if !strings.HasPrefix(r.Model, "o1-mini") && !strings.HasPrefix(r.Model, "o1-preview") {
- return "developer"
- }
- } else if strings.HasPrefix(r.Model, "gpt-5") {
- return "developer"
- }
- return "system"
- }
// CustomType is the literal type identifier "custom".
// NOTE(review): presumably the ToolCallRequest.Type value for custom tools — confirm against callers.
const CustomType = "custom"
- type ToolCallRequest struct {
- ID string `json:"id,omitempty"`
- Type string `json:"type"`
- Function FunctionRequest `json:"function,omitempty"`
- Custom json.RawMessage `json:"custom,omitempty"`
- }
// FunctionRequest describes the function part of a tool. Name is always
// serialized; the other fields are omitted when empty.
type FunctionRequest struct {
	Description string `json:"description,omitempty"`
	Name        string `json:"name"`
	// Parameters is left untyped so any JSON-encodable value can be carried.
	Parameters any    `json:"parameters,omitempty"`
	Arguments  string `json:"arguments,omitempty"`
}
// StreamOptions is the value of the "stream_options" request field.
type StreamOptions struct {
	// IncludeUsage is serialized as "include_usage" and omitted when false.
	IncludeUsage bool `json:"include_usage,omitempty"`
}
- func (r *GeneralOpenAIRequest) GetMaxTokens() uint {
- if r.MaxCompletionTokens != 0 {
- return r.MaxCompletionTokens
- }
- return r.MaxTokens
- }
- func (r *GeneralOpenAIRequest) ParseInput() []string {
- if r.Input == nil {
- return nil
- }
- var input []string
- switch r.Input.(type) {
- case string:
- input = []string{r.Input.(string)}
- case []any:
- input = make([]string, 0, len(r.Input.([]any)))
- for _, item := range r.Input.([]any) {
- if str, ok := item.(string); ok {
- input = append(input, str)
- }
- }
- }
- return input
- }
- type Message struct {
- Role string `json:"role"`
- Content any `json:"content"`
- Name *string `json:"name,omitempty"`
- Prefix *bool `json:"prefix,omitempty"`
- ReasoningContent string `json:"reasoning_content,omitempty"`
- Reasoning string `json:"reasoning,omitempty"`
- ToolCalls json.RawMessage `json:"tool_calls,omitempty"`
- ToolCallId string `json:"tool_call_id,omitempty"`
- parsedContent []MediaContent
- //parsedStringContent *string
- }
// MediaContent is one part of a multi-part message content. Type is always
// serialized; every other field is omitted when empty.
type MediaContent struct {
	Type string `json:"type"`
	Text string `json:"text,omitempty"`
	// The media fields are untyped; the Get* accessors accept either the
	// typed pointer or a decoded JSON object (map[string]any).
	ImageUrl   any `json:"image_url,omitempty"`
	InputAudio any `json:"input_audio,omitempty"`
	File       any `json:"file,omitempty"`
	VideoUrl   any `json:"video_url,omitempty"`
	// OpenRouter Params
	CacheControl json.RawMessage `json:"cache_control,omitempty"`
}
- func (m *MediaContent) GetImageMedia() *MessageImageUrl {
- if m.ImageUrl != nil {
- if _, ok := m.ImageUrl.(*MessageImageUrl); ok {
- return m.ImageUrl.(*MessageImageUrl)
- }
- if itemMap, ok := m.ImageUrl.(map[string]any); ok {
- out := &MessageImageUrl{
- Url: common.Interface2String(itemMap["url"]),
- Detail: common.Interface2String(itemMap["detail"]),
- MimeType: common.Interface2String(itemMap["mime_type"]),
- }
- return out
- }
- }
- return nil
- }
- func (m *MediaContent) GetInputAudio() *MessageInputAudio {
- if m.InputAudio != nil {
- if _, ok := m.InputAudio.(*MessageInputAudio); ok {
- return m.InputAudio.(*MessageInputAudio)
- }
- if itemMap, ok := m.InputAudio.(map[string]any); ok {
- out := &MessageInputAudio{
- Data: common.Interface2String(itemMap["data"]),
- Format: common.Interface2String(itemMap["format"]),
- }
- return out
- }
- }
- return nil
- }
- func (m *MediaContent) GetFile() *MessageFile {
- if m.File != nil {
- if _, ok := m.File.(*MessageFile); ok {
- return m.File.(*MessageFile)
- }
- if itemMap, ok := m.File.(map[string]any); ok {
- out := &MessageFile{
- FileName: common.Interface2String(itemMap["file_name"]),
- FileData: common.Interface2String(itemMap["file_data"]),
- FileId: common.Interface2String(itemMap["file_id"]),
- }
- return out
- }
- }
- return nil
- }
- func (m *MediaContent) GetVideoUrl() *MessageVideoUrl {
- if m.VideoUrl != nil {
- if _, ok := m.VideoUrl.(*MessageVideoUrl); ok {
- return m.VideoUrl.(*MessageVideoUrl)
- }
- if itemMap, ok := m.VideoUrl.(map[string]any); ok {
- out := &MessageVideoUrl{
- Url: common.Interface2String(itemMap["url"]),
- }
- return out
- }
- }
- return nil
- }
// MessageImageUrl is the typed form of an "image_url" content part.
type MessageImageUrl struct {
	Url    string `json:"url"`
	Detail string `json:"detail"`
	// MimeType has no JSON tag, so encoding/json serializes it under the key
	// "MimeType".
	MimeType string
}

// IsRemoteImage reports whether Url is an http:// or https:// URL, as opposed
// to inline data. The full scheme is required so that inline payloads that
// merely begin with the letters "http" are not mistaken for URLs.
func (m *MessageImageUrl) IsRemoteImage() bool {
	return strings.HasPrefix(m.Url, "http://") || strings.HasPrefix(m.Url, "https://")
}
// MessageInputAudio is the typed form of an "input_audio" content part.
type MessageInputAudio struct {
	Data   string `json:"data"` // base64
	Format string `json:"format"`
}
// MessageFile is the typed form of a "file" content part. All fields are
// omitted from JSON when empty.
type MessageFile struct {
	FileName string `json:"filename,omitempty"`
	FileData string `json:"file_data,omitempty"`
	FileId   string `json:"file_id,omitempty"`
}
// MessageVideoUrl is the typed form of a "video_url" content part.
type MessageVideoUrl struct {
	Url string `json:"url"`
}
// Values of the "type" field of a message content part.
const (
	ContentTypeText       = "text"
	ContentTypeImageURL   = "image_url"
	ContentTypeInputAudio = "input_audio"
	ContentTypeFile       = "file"
	ContentTypeVideoUrl   = "video_url" // Alibaba Bailian video recognition
	//ContentTypeAudioUrl = "audio_url"
)
- func (m *Message) GetPrefix() bool {
- if m.Prefix == nil {
- return false
- }
- return *m.Prefix
- }
- func (m *Message) SetPrefix(prefix bool) {
- m.Prefix = &prefix
- }
- func (m *Message) ParseToolCalls() []ToolCallRequest {
- if m.ToolCalls == nil {
- return nil
- }
- var toolCalls []ToolCallRequest
- if err := json.Unmarshal(m.ToolCalls, &toolCalls); err == nil {
- return toolCalls
- }
- return toolCalls
- }
- func (m *Message) SetToolCalls(toolCalls any) {
- toolCallsJson, _ := json.Marshal(toolCalls)
- m.ToolCalls = toolCallsJson
- }
- func (m *Message) StringContent() string {
- switch m.Content.(type) {
- case string:
- return m.Content.(string)
- case []any:
- var contentStr string
- for _, contentItem := range m.Content.([]any) {
- contentMap, ok := contentItem.(map[string]any)
- if !ok {
- continue
- }
- if contentMap["type"] == ContentTypeText {
- if subStr, ok := contentMap["text"].(string); ok {
- contentStr += subStr
- }
- }
- }
- return contentStr
- }
- return ""
- }
- func (m *Message) SetNullContent() {
- m.Content = nil
- m.parsedContent = nil
- }
- func (m *Message) SetStringContent(content string) {
- m.Content = content
- m.parsedContent = nil
- }
- func (m *Message) SetMediaContent(content []MediaContent) {
- m.Content = content
- m.parsedContent = content
- }
- func (m *Message) IsStringContent() bool {
- _, ok := m.Content.(string)
- if ok {
- return true
- }
- return false
- }
- func (m *Message) ParseContent() []MediaContent {
- if m.Content == nil {
- return nil
- }
- if len(m.parsedContent) > 0 {
- return m.parsedContent
- }
- var contentList []MediaContent
- // 先尝试解析为字符串
- content, ok := m.Content.(string)
- if ok {
- contentList = []MediaContent{{
- Type: ContentTypeText,
- Text: content,
- }}
- m.parsedContent = contentList
- return contentList
- }
- // 尝试解析为数组
- //var arrayContent []map[string]interface{}
- arrayContent, ok := m.Content.([]any)
- if !ok {
- return contentList
- }
- for _, contentItemAny := range arrayContent {
- mediaItem, ok := contentItemAny.(MediaContent)
- if ok {
- contentList = append(contentList, mediaItem)
- continue
- }
- contentItem, ok := contentItemAny.(map[string]any)
- if !ok {
- continue
- }
- contentType, ok := contentItem["type"].(string)
- if !ok {
- continue
- }
- switch contentType {
- case ContentTypeText:
- if text, ok := contentItem["text"].(string); ok {
- contentList = append(contentList, MediaContent{
- Type: ContentTypeText,
- Text: text,
- })
- }
- case ContentTypeImageURL:
- imageUrl := contentItem["image_url"]
- temp := &MessageImageUrl{
- Detail: "high",
- }
- switch v := imageUrl.(type) {
- case string:
- temp.Url = v
- case map[string]interface{}:
- url, ok1 := v["url"].(string)
- detail, ok2 := v["detail"].(string)
- if ok2 {
- temp.Detail = detail
- }
- if ok1 {
- temp.Url = url
- }
- }
- contentList = append(contentList, MediaContent{
- Type: ContentTypeImageURL,
- ImageUrl: temp,
- })
- case ContentTypeInputAudio:
- if audioData, ok := contentItem["input_audio"].(map[string]interface{}); ok {
- data, ok1 := audioData["data"].(string)
- format, ok2 := audioData["format"].(string)
- if ok1 && ok2 {
- temp := &MessageInputAudio{
- Data: data,
- Format: format,
- }
- contentList = append(contentList, MediaContent{
- Type: ContentTypeInputAudio,
- InputAudio: temp,
- })
- }
- }
- case ContentTypeFile:
- if fileData, ok := contentItem["file"].(map[string]interface{}); ok {
- fileId, ok3 := fileData["file_id"].(string)
- if ok3 {
- contentList = append(contentList, MediaContent{
- Type: ContentTypeFile,
- File: &MessageFile{
- FileId: fileId,
- },
- })
- } else {
- fileName, ok1 := fileData["filename"].(string)
- fileDataStr, ok2 := fileData["file_data"].(string)
- if ok1 && ok2 {
- contentList = append(contentList, MediaContent{
- Type: ContentTypeFile,
- File: &MessageFile{
- FileName: fileName,
- FileData: fileDataStr,
- },
- })
- }
- }
- }
- case ContentTypeVideoUrl:
- if videoUrl, ok := contentItem["video_url"].(string); ok {
- contentList = append(contentList, MediaContent{
- Type: ContentTypeVideoUrl,
- VideoUrl: &MessageVideoUrl{
- Url: videoUrl,
- },
- })
- }
- }
- }
- if len(contentList) > 0 {
- m.parsedContent = contentList
- }
- return contentList
- }
- // old code
- /*func (m *Message) StringContent() string {
- if m.parsedStringContent != nil {
- return *m.parsedStringContent
- }
- var stringContent string
- if err := json.Unmarshal(m.Content, &stringContent); err == nil {
- m.parsedStringContent = &stringContent
- return stringContent
- }
- contentStr := new(strings.Builder)
- arrayContent := m.ParseContent()
- for _, content := range arrayContent {
- if content.Type == ContentTypeText {
- contentStr.WriteString(content.Text)
- }
- }
- stringContent = contentStr.String()
- m.parsedStringContent = &stringContent
- return stringContent
- }
- func (m *Message) SetNullContent() {
- m.Content = nil
- m.parsedStringContent = nil
- m.parsedContent = nil
- }
- func (m *Message) SetStringContent(content string) {
- jsonContent, _ := json.Marshal(content)
- m.Content = jsonContent
- m.parsedStringContent = &content
- m.parsedContent = nil
- }
- func (m *Message) SetMediaContent(content []MediaContent) {
- jsonContent, _ := json.Marshal(content)
- m.Content = jsonContent
- m.parsedContent = nil
- m.parsedStringContent = nil
- }
- func (m *Message) IsStringContent() bool {
- if m.parsedStringContent != nil {
- return true
- }
- var stringContent string
- if err := json.Unmarshal(m.Content, &stringContent); err == nil {
- m.parsedStringContent = &stringContent
- return true
- }
- return false
- }
- func (m *Message) ParseContent() []MediaContent {
- if m.parsedContent != nil {
- return m.parsedContent
- }
- var contentList []MediaContent
- // 先尝试解析为字符串
- var stringContent string
- if err := json.Unmarshal(m.Content, &stringContent); err == nil {
- contentList = []MediaContent{{
- Type: ContentTypeText,
- Text: stringContent,
- }}
- m.parsedContent = contentList
- return contentList
- }
- // 尝试解析为数组
- var arrayContent []map[string]interface{}
- if err := json.Unmarshal(m.Content, &arrayContent); err == nil {
- for _, contentItem := range arrayContent {
- contentType, ok := contentItem["type"].(string)
- if !ok {
- continue
- }
- switch contentType {
- case ContentTypeText:
- if text, ok := contentItem["text"].(string); ok {
- contentList = append(contentList, MediaContent{
- Type: ContentTypeText,
- Text: text,
- })
- }
- case ContentTypeImageURL:
- imageUrl := contentItem["image_url"]
- temp := &MessageImageUrl{
- Detail: "high",
- }
- switch v := imageUrl.(type) {
- case string:
- temp.Url = v
- case map[string]interface{}:
- url, ok1 := v["url"].(string)
- detail, ok2 := v["detail"].(string)
- if ok2 {
- temp.Detail = detail
- }
- if ok1 {
- temp.Url = url
- }
- }
- contentList = append(contentList, MediaContent{
- Type: ContentTypeImageURL,
- ImageUrl: temp,
- })
- case ContentTypeInputAudio:
- if audioData, ok := contentItem["input_audio"].(map[string]interface{}); ok {
- data, ok1 := audioData["data"].(string)
- format, ok2 := audioData["format"].(string)
- if ok1 && ok2 {
- temp := &MessageInputAudio{
- Data: data,
- Format: format,
- }
- contentList = append(contentList, MediaContent{
- Type: ContentTypeInputAudio,
- InputAudio: temp,
- })
- }
- }
- case ContentTypeFile:
- if fileData, ok := contentItem["file"].(map[string]interface{}); ok {
- fileId, ok3 := fileData["file_id"].(string)
- if ok3 {
- contentList = append(contentList, MediaContent{
- Type: ContentTypeFile,
- File: &MessageFile{
- FileId: fileId,
- },
- })
- } else {
- fileName, ok1 := fileData["filename"].(string)
- fileDataStr, ok2 := fileData["file_data"].(string)
- if ok1 && ok2 {
- contentList = append(contentList, MediaContent{
- Type: ContentTypeFile,
- File: &MessageFile{
- FileName: fileName,
- FileData: fileDataStr,
- },
- })
- }
- }
- }
- case ContentTypeVideoUrl:
- if videoUrl, ok := contentItem["video_url"].(string); ok {
- contentList = append(contentList, MediaContent{
- Type: ContentTypeVideoUrl,
- VideoUrl: &MessageVideoUrl{
- Url: videoUrl,
- },
- })
- }
- }
- }
- }
- if len(contentList) > 0 {
- m.parsedContent = contentList
- }
- return contentList
- }*/
// WebSearchOptions is the value of the "web_search_options" request field.
type WebSearchOptions struct {
	SearchContextSize string `json:"search_context_size,omitempty"`
	// UserLocation is kept as raw JSON and forwarded without being decoded here.
	UserLocation json.RawMessage `json:"user_location,omitempty"`
}
- // https://platform.openai.com/docs/api-reference/responses/create
- type OpenAIResponsesRequest struct {
- Model string `json:"model"`
- Input json.RawMessage `json:"input,omitempty"`
- Include json.RawMessage `json:"include,omitempty"`
- Instructions json.RawMessage `json:"instructions,omitempty"`
- MaxOutputTokens uint `json:"max_output_tokens,omitempty"`
- Metadata json.RawMessage `json:"metadata,omitempty"`
- ParallelToolCalls json.RawMessage `json:"parallel_tool_calls,omitempty"`
- PreviousResponseID string `json:"previous_response_id,omitempty"`
- Reasoning *Reasoning `json:"reasoning,omitempty"`
- // 服务层级字段,用于指定 API 服务等级。允许透传可能导致实际计费高于预期,默认应过滤
- ServiceTier string `json:"service_tier,omitempty"`
- Store json.RawMessage `json:"store,omitempty"`
- PromptCacheKey json.RawMessage `json:"prompt_cache_key,omitempty"`
- PromptCacheRetention json.RawMessage `json:"prompt_cache_retention,omitempty"`
- Stream bool `json:"stream,omitempty"`
- Temperature *float64 `json:"temperature,omitempty"`
- Text json.RawMessage `json:"text,omitempty"`
- ToolChoice json.RawMessage `json:"tool_choice,omitempty"`
- Tools json.RawMessage `json:"tools,omitempty"` // 需要处理的参数很少,MCP 参数太多不确定,所以用 map
- TopP *float64 `json:"top_p,omitempty"`
- Truncation string `json:"truncation,omitempty"`
- User string `json:"user,omitempty"`
- MaxToolCalls uint `json:"max_tool_calls,omitempty"`
- Prompt json.RawMessage `json:"prompt,omitempty"`
- // qwen
- EnableThinking json.RawMessage `json:"enable_thinking,omitempty"`
- // perplexity
- Preset json.RawMessage `json:"preset,omitempty"`
- }
- func (r *OpenAIResponsesRequest) GetTokenCountMeta() *types.TokenCountMeta {
- var fileMeta = make([]*types.FileMeta, 0)
- var texts = make([]string, 0)
- if r.Input != nil {
- inputs := r.ParseInput()
- for _, input := range inputs {
- if input.Type == "input_image" {
- if input.ImageUrl != "" {
- fileMeta = append(fileMeta, &types.FileMeta{
- FileType: types.FileTypeImage,
- Source: createFileSource(input.ImageUrl),
- Detail: input.Detail,
- })
- }
- } else if input.Type == "input_file" {
- if input.FileUrl != "" {
- fileMeta = append(fileMeta, &types.FileMeta{
- FileType: types.FileTypeFile,
- Source: createFileSource(input.FileUrl),
- })
- }
- } else {
- texts = append(texts, input.Text)
- }
- }
- }
- if len(r.Instructions) > 0 {
- texts = append(texts, string(r.Instructions))
- }
- if len(r.Metadata) > 0 {
- texts = append(texts, string(r.Metadata))
- }
- if len(r.Text) > 0 {
- texts = append(texts, string(r.Text))
- }
- if len(r.ToolChoice) > 0 {
- texts = append(texts, string(r.ToolChoice))
- }
- if len(r.Prompt) > 0 {
- texts = append(texts, string(r.Prompt))
- }
- if len(r.Tools) > 0 {
- texts = append(texts, string(r.Tools))
- }
- return &types.TokenCountMeta{
- CombineText: strings.Join(texts, "\n"),
- Files: fileMeta,
- MaxTokens: int(r.MaxOutputTokens),
- }
- }
- func (r *OpenAIResponsesRequest) IsStream(c *gin.Context) bool {
- return r.Stream
- }
- func (r *OpenAIResponsesRequest) SetModelName(modelName string) {
- if modelName != "" {
- r.Model = modelName
- }
- }
- func (r *OpenAIResponsesRequest) GetToolsMap() []map[string]any {
- var toolsMap []map[string]any
- if len(r.Tools) > 0 {
- _ = common.Unmarshal(r.Tools, &toolsMap)
- }
- return toolsMap
- }
// Reasoning is the value of the Responses API "reasoning" request field.
// Both fields are omitted from JSON when empty.
type Reasoning struct {
	Effort  string `json:"effort,omitempty"`
	Summary string `json:"summary,omitempty"`
}
// Input is one element of a Responses API "input" array.
type Input struct {
	Type string `json:"type,omitempty"`
	Role string `json:"role,omitempty"`
	// Content is kept raw because it may be either a JSON string or an array
	// of parts; OpenAIResponsesRequest.ParseInput inspects its JSON type.
	Content json.RawMessage `json:"content,omitempty"`
}
// MediaInput is one normalized part of a Responses API input, as produced by
// OpenAIResponsesRequest.ParseInput.
type MediaInput struct {
	Type     string `json:"type"`
	Text     string `json:"text,omitempty"`
	FileUrl  string `json:"file_url,omitempty"`
	ImageUrl string `json:"image_url,omitempty"`
	Detail   string `json:"detail,omitempty"` // only meaningful for input_image
}
- // ParseInput parses the Responses API `input` field into a normalized slice of MediaInput.
- // Reference implementation mirrors Message.ParseContent:
- // - input can be a string, treated as an input_text item
- // - input can be an array of objects with a `type` field
- // supported types: input_text, input_image, input_file
- func (r *OpenAIResponsesRequest) ParseInput() []MediaInput {
- if r.Input == nil {
- return nil
- }
- var mediaInputs []MediaInput
- // Try string first
- // if str, ok := common.GetJsonType(r.Input); ok {
- // inputs = append(inputs, MediaInput{Type: "input_text", Text: str})
- // return inputs
- // }
- if common.GetJsonType(r.Input) == "string" {
- var str string
- _ = common.Unmarshal(r.Input, &str)
- mediaInputs = append(mediaInputs, MediaInput{Type: "input_text", Text: str})
- return mediaInputs
- }
- // Try array of parts
- if common.GetJsonType(r.Input) == "array" {
- var inputs []Input
- _ = common.Unmarshal(r.Input, &inputs)
- for _, input := range inputs {
- if common.GetJsonType(input.Content) == "string" {
- var str string
- _ = common.Unmarshal(input.Content, &str)
- mediaInputs = append(mediaInputs, MediaInput{Type: "input_text", Text: str})
- }
- if common.GetJsonType(input.Content) == "array" {
- var array []any
- _ = common.Unmarshal(input.Content, &array)
- for _, itemAny := range array {
- // Already parsed MediaContent
- if media, ok := itemAny.(MediaInput); ok {
- mediaInputs = append(mediaInputs, media)
- continue
- }
- // Generic map
- item, ok := itemAny.(map[string]any)
- if !ok {
- continue
- }
- typeVal, ok := item["type"].(string)
- if !ok {
- continue
- }
- switch typeVal {
- case "input_text":
- text, _ := item["text"].(string)
- mediaInputs = append(mediaInputs, MediaInput{Type: "input_text", Text: text})
- case "input_image":
- // image_url may be string or object with url field
- var imageUrl string
- switch v := item["image_url"].(type) {
- case string:
- imageUrl = v
- case map[string]any:
- if url, ok := v["url"].(string); ok {
- imageUrl = url
- }
- }
- mediaInputs = append(mediaInputs, MediaInput{Type: "input_image", ImageUrl: imageUrl})
- case "input_file":
- // file_url may be string or object with url field
- var fileUrl string
- switch v := item["file_url"].(type) {
- case string:
- fileUrl = v
- case map[string]any:
- if url, ok := v["url"].(string); ok {
- fileUrl = url
- }
- }
- mediaInputs = append(mediaInputs, MediaInput{Type: "input_file", FileUrl: fileUrl})
- }
- }
- }
- }
- }
- return mediaInputs
- }
|