AI
/
aiproxy
mirror de https://gitee.com/NovemberRain/aiproxy.git


			
				
					
						
						
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371
							package model

import (
	"github.com/labring/aiproxy/core/model"
)

// InputItemType identifies the kind of an input item.
// It is declared as an alias of string, so its values are interchangeable
// with plain strings without conversion.
type InputItemType = string

// Known InputItemType values.
const (
	InputItemTypeMessage            InputItemType = "message"
	InputItemTypeFunctionCall       InputItemType = "function_call"
	InputItemTypeFunctionCallOutput InputItemType = "function_call_output"
)

// InputContentType identifies the kind of a content part inside an input item.
// It is declared as an alias of string.
type InputContentType = string

// Known InputContentType values.
const (
	InputContentTypeInputText  InputContentType = "input_text"
	InputContentTypeOutputText InputContentType = "output_text"
)

// OutputContentType identifies the kind of a content part inside an output item.
// It is declared as an alias of string.
type OutputContentType = string

// Known OutputContentType values.
const (
	OutputContentTypeText       OutputContentType = "text"
	OutputContentTypeOutputText OutputContentType = "output_text"
)

// ResponseStatus is the lifecycle status string carried by a response or an
// output item. It is declared as an alias of string.
type ResponseStatus = string

// Known ResponseStatus values.
const (
	ResponseStatusInProgress ResponseStatus = "in_progress"
	ResponseStatusCompleted  ResponseStatus = "completed"
	ResponseStatusFailed     ResponseStatus = "failed"
	ResponseStatusIncomplete ResponseStatus = "incomplete"
	ResponseStatusCancelled  ResponseStatus = "cancelled"
)

// ResponseStreamEventType is the value of the "type" field of a response
// stream event. It is declared as an alias of string.
type ResponseStreamEventType = string

// Known ResponseStreamEventType values, grouped by the part of the response
// they describe.
const (
	// Response lifecycle events
	EventResponseCreated    ResponseStreamEventType = "response.created"
	EventResponseInProgress ResponseStreamEventType = "response.in_progress"
	EventResponseCompleted  ResponseStreamEventType = "response.completed"
	EventResponseFailed     ResponseStreamEventType = "response.failed"
	EventResponseIncomplete ResponseStreamEventType = "response.incomplete"
	EventResponseQueued     ResponseStreamEventType = "response.queued"
	EventResponseDone       ResponseStreamEventType = "response.done" // Legacy/compatibility

	// Output item events
	EventOutputItemAdded ResponseStreamEventType = "response.output_item.added"
	EventOutputItemDone  ResponseStreamEventType = "response.output_item.done"

	// Content part events
	EventContentPartAdded ResponseStreamEventType = "response.content_part.added"
	EventContentPartDone  ResponseStreamEventType = "response.content_part.done"

	// Text output events
	EventOutputTextDelta ResponseStreamEventType = "response.output_text.delta"
	EventOutputTextDone  ResponseStreamEventType = "response.output_text.done"

	// Refusal events
	EventRefusalDelta ResponseStreamEventType = "response.refusal.delta"
	EventRefusalDone  ResponseStreamEventType = "response.refusal.done"

	// Function call events
	EventFunctionCallArgumentsDelta ResponseStreamEventType = "response.function_call_arguments.delta"
	EventFunctionCallArgumentsDone  ResponseStreamEventType = "response.function_call_arguments.done"

	// Reasoning events (summary parts, summary text and raw reasoning text)
	EventReasoningSummaryPartAdded ResponseStreamEventType = "response.reasoning_summary_part.added"
	EventReasoningSummaryPartDone  ResponseStreamEventType = "response.reasoning_summary_part.done"
	EventReasoningSummaryTextDelta ResponseStreamEventType = "response.reasoning_summary_text.delta"
	EventReasoningSummaryTextDone  ResponseStreamEventType = "response.reasoning_summary_text.done"
	EventReasoningTextDelta        ResponseStreamEventType = "response.reasoning_text.delta"
	EventReasoningTextDone         ResponseStreamEventType = "response.reasoning_text.done"

	// Tool call events: file search
	EventFileSearchCallInProgress ResponseStreamEventType = "response.file_search_call.in_progress"
	EventFileSearchCallSearching  ResponseStreamEventType = "response.file_search_call.searching"
	EventFileSearchCallCompleted  ResponseStreamEventType = "response.file_search_call.completed"

	// Tool call events: web search
	EventWebSearchCallInProgress ResponseStreamEventType = "response.web_search_call.in_progress"
	EventWebSearchCallSearching  ResponseStreamEventType = "response.web_search_call.searching"
	EventWebSearchCallCompleted  ResponseStreamEventType = "response.web_search_call.completed"

	// Tool call events: code interpreter. Note that the code delta/done
	// events use the "code_interpreter_call_code" segment, not a sub-path of
	// "code_interpreter_call".
	EventCodeInterpreterCallInProgress   ResponseStreamEventType = "response.code_interpreter_call.in_progress"
	EventCodeInterpreterCallInterpreting ResponseStreamEventType = "response.code_interpreter_call.interpreting"
	EventCodeInterpreterCallCompleted    ResponseStreamEventType = "response.code_interpreter_call.completed"
	EventCodeInterpreterCallCodeDelta    ResponseStreamEventType = "response.code_interpreter_call_code.delta"
	EventCodeInterpreterCallCodeDone     ResponseStreamEventType = "response.code_interpreter_call_code.done"

	// Tool call events: image generation
	EventImageGenerationCallInProgress   ResponseStreamEventType = "response.image_generation_call.in_progress"
	EventImageGenerationCallGenerating   ResponseStreamEventType = "response.image_generation_call.generating"
	EventImageGenerationCallCompleted    ResponseStreamEventType = "response.image_generation_call.completed"
	EventImageGenerationCallPartialImage ResponseStreamEventType = "response.image_generation_call.partial_image"

	// Tool call events: MCP calls and MCP tool listing
	EventMCPCallInProgress      ResponseStreamEventType = "response.mcp_call.in_progress"
	EventMCPCallCompleted       ResponseStreamEventType = "response.mcp_call.completed"
	EventMCPCallFailed          ResponseStreamEventType = "response.mcp_call.failed"
	EventMCPCallArgumentsDelta  ResponseStreamEventType = "response.mcp_call_arguments.delta"
	EventMCPCallArgumentsDone   ResponseStreamEventType = "response.mcp_call_arguments.done"
	EventMCPListToolsInProgress ResponseStreamEventType = "response.mcp_list_tools.in_progress"
	EventMCPListToolsCompleted  ResponseStreamEventType = "response.mcp_list_tools.completed"
	EventMCPListToolsFailed     ResponseStreamEventType = "response.mcp_list_tools.failed"

	// Tool call events: custom tool input
	EventCustomToolCallInputDelta ResponseStreamEventType = "response.custom_tool_call_input.delta"
	EventCustomToolCallInputDone  ResponseStreamEventType = "response.custom_tool_call_input.done"

	// Annotation events
	EventOutputTextAnnotationAdded ResponseStreamEventType = "response.output_text.annotation.added"

	// Error event. Unlike every other event type it has no "response." prefix.
	EventError ResponseStreamEventType = "error"
)

// ResponseError describes an error attached to a response.
// Both fields are always serialized, even when empty.
type ResponseError struct {
	Code    string `json:"code"`
	Message string `json:"message"`
}

// ResponseTool represents a tool in the Responses API format.
// The structure is flattened: name, description and parameters sit directly
// on the tool object next to its type. Everything except Type is omitted from
// the JSON output when empty.
type ResponseTool struct {
	Type        string `json:"type"`
	Name        string `json:"name,omitempty"`
	Description string `json:"description,omitempty"`
	// Parameters is left untyped; presumably a JSON-schema object — confirm
	// against callers.
	Parameters any `json:"parameters,omitempty"`
}

// IncompleteDetails carries the reason a response is incomplete.
type IncompleteDetails struct {
	Reason string `json:"reason"`
}

// ResponseReasoning holds the reasoning settings reported on a response.
// Both fields are pointers without omitempty, so an unset value is serialized
// as JSON null rather than being dropped.
type ResponseReasoning struct {
	Effort  *string `json:"effort"`
	Summary *string `json:"summary"`
}

// ResponseTextFormat is the format descriptor nested inside ResponseText.
// Only the format type is modelled here.
type ResponseTextFormat struct {
	Type string `json:"type"`
}

// ResponseText is the text configuration of a request or response.
// It wraps a single ResponseTextFormat under the "format" key.
type ResponseText struct {
	Format ResponseTextFormat `json:"format"`
}

// OutputContent is one content part of an output item.
// Text and Annotations are omitted from the JSON output when empty.
type OutputContent struct {
	// Type is a plain string; the OutputContentType constants list known values.
	Type string `json:"type"`
	Text string `json:"text,omitempty"`
	// Annotations elements are left untyped and passed through as decoded.
	Annotations []any `json:"annotations,omitempty"`
}

// OutputItem is a single entry of a response's output list.
// One struct covers several item kinds; which optional fields are populated
// depends on Type (see the per-field comments). All optional fields are
// omitted from the JSON output when empty.
//
// NOTE(review): Summary is declared as []string, so a summary array whose
// elements are JSON objects would fail to unmarshal — confirm upstream
// reasoning items only ever carry plain strings here.
type OutputItem struct {
	ID        string          `json:"id"`
	Type      string          `json:"type"`
	Status    ResponseStatus  `json:"status,omitempty"`
	Role      string          `json:"role,omitempty"`
	Content   []OutputContent `json:"content,omitempty"`
	Arguments string          `json:"arguments,omitempty"` // For function_call type
	CallID    string          `json:"call_id,omitempty"`   // For function_call type
	Name      string          `json:"name,omitempty"`      // For function_call type
	Summary   []string        `json:"summary,omitempty"`   // For reasoning type
}

// InputContent is one content part of an input item.
// Besides plain text it can also carry function-call and function-result
// fields; everything except Type is omitted from the JSON output when empty.
type InputContent struct {
	// Type is a plain string; the InputContentType constants list known values.
	Type string `json:"type"`
	Text string `json:"text,omitempty"`
	// Fields for function_call type
	ID        string `json:"id,omitempty"`
	Name      string `json:"name,omitempty"`
	Arguments string `json:"arguments,omitempty"`
	// Fields for function result parts (presumably type "function_call_output")
	CallID string `json:"call_id,omitempty"`
	Output string `json:"output,omitempty"`
}

// InputItem is a single entry of a request's input list.
// One struct covers message, function-call and function-result items;
// everything except Type is omitted from the JSON output when empty.
//
// NOTE(review): Content only decodes from a JSON array of parts; a message
// whose "content" is a bare string would fail to unmarshal — confirm callers
// normalize such input before decoding into this type.
type InputItem struct {
	ID string `json:"id,omitempty"`
	// Type is a plain string; the InputItemType constants list known values.
	Type    string         `json:"type"`
	Role    string         `json:"role,omitempty"`
	Content []InputContent `json:"content,omitempty"`
	// Fields for function_call type
	Name      string `json:"name,omitempty"`
	Arguments string `json:"arguments,omitempty"`
	// Fields for function result items (presumably type "function_call_output")
	CallID string `json:"call_id,omitempty"`
	Output string `json:"output,omitempty"`
}

// ResponseUsageDetails holds the token breakdown counters.
// The same type backs both ResponseUsage.InputTokensDetails and
// ResponseUsage.OutputTokensDetails; zero counters are omitted from the JSON
// output.
type ResponseUsageDetails struct {
	CachedTokens    int64 `json:"cached_tokens,omitempty"`
	ReasoningTokens int64 `json:"reasoning_tokens,omitempty"`
}

// ResponseUsage is the token usage reported for a response.
// The three totals are always serialized; the detail blocks are optional
// pointers and are omitted when nil.
type ResponseUsage struct {
	InputTokens         int64                 `json:"input_tokens"`
	OutputTokens        int64                 `json:"output_tokens"`
	TotalTokens         int64                 `json:"total_tokens"`
	InputTokensDetails  *ResponseUsageDetails `json:"input_tokens_details,omitempty"`
	OutputTokensDetails *ResponseUsageDetails `json:"output_tokens_details,omitempty"`
}

// Response represents an OpenAI response object.
//
// No field uses omitempty, so every key is always present in the JSON output:
// nil pointers, nil slices and nil maps are serialized as null, and zero
// scalars are serialized as their zero value. Usage in particular is an
// optional pointer and may be nil.
type Response struct {
	ID                 string             `json:"id"`
	Object             string             `json:"object"`
	CreatedAt          int64              `json:"created_at"`
	Status             ResponseStatus     `json:"status"`
	Error              *ResponseError     `json:"error"`
	IncompleteDetails  *IncompleteDetails `json:"incomplete_details"`
	Instructions       *string            `json:"instructions"`
	MaxOutputTokens    *int               `json:"max_output_tokens"`
	Model              string             `json:"model"`
	Output             []OutputItem       `json:"output"`
	ParallelToolCalls  bool               `json:"parallel_tool_calls"`
	PreviousResponseID *string            `json:"previous_response_id"`
	Reasoning          ResponseReasoning  `json:"reasoning"`
	Store              bool               `json:"store"`
	Temperature        float64            `json:"temperature"`
	Text               ResponseText       `json:"text"`
	ToolChoice         any                `json:"tool_choice"`
	Tools              []ResponseTool     `json:"tools"`
	TopP               float64            `json:"top_p"`
	Truncation         string             `json:"truncation"`
	Usage              *ResponseUsage     `json:"usage"`
	User               *string            `json:"user"`
	Metadata           map[string]any     `json:"metadata"`
}

// CreateResponseRequest represents a request to create a response.
//
// Model and Input are always serialized. Every other field is optional and
// omitted when unset; most optional scalars are pointers so that an explicit
// zero value (e.g. temperature 0 or store=false) can be told apart from
// "not provided". Stream is a plain bool, so false is omitted.
//
// NOTE(review): Input is untyped; presumably either a plain string or a list
// of input items — confirm against callers.
type CreateResponseRequest struct {
	Model              string         `json:"model"`
	Input              any            `json:"input"`
	Background         *bool          `json:"background,omitempty"`
	Conversation       any            `json:"conversation,omitempty"` // string or object
	Include            []string       `json:"include,omitempty"`
	Instructions       *string        `json:"instructions,omitempty"`
	MaxOutputTokens    *int           `json:"max_output_tokens,omitempty"`
	MaxToolCalls       *int           `json:"max_tool_calls,omitempty"`
	Metadata           map[string]any `json:"metadata,omitempty"`
	ParallelToolCalls  *bool          `json:"parallel_tool_calls,omitempty"`
	PreviousResponseID *string        `json:"previous_response_id,omitempty"`
	PromptCacheKey     *string        `json:"prompt_cache_key,omitempty"`
	SafetyIdentifier   *string        `json:"safety_identifier,omitempty"`
	ServiceTier        *string        `json:"service_tier,omitempty"`
	Store              *bool          `json:"store,omitempty"`
	Stream             bool           `json:"stream,omitempty"`
	Temperature        *float64       `json:"temperature,omitempty"`
	Text               *ResponseText  `json:"text,omitempty"`
	ToolChoice         any            `json:"tool_choice,omitempty"`
	Tools              []ResponseTool `json:"tools,omitempty"`
	TopLogprobs        *int           `json:"top_logprobs,omitempty"`
	TopP               *float64       `json:"top_p,omitempty"`
	Truncation         *string        `json:"truncation,omitempty"`
	User               *string        `json:"user,omitempty"` // Deprecated, use prompt_cache_key
}

// InputItemList is a list envelope around input items.
// Alongside the items it carries the first and last item IDs and a flag
// telling whether more items exist. All fields are always serialized.
type InputItemList struct {
	Object  string      `json:"object"`
	Data    []InputItem `json:"data"`
	FirstID string      `json:"first_id"`
	LastID  string      `json:"last_id"`
	HasMore bool        `json:"has_more"`
}

// ResponseStreamEvent represents a server-sent event for response streaming.
//
// One struct covers every event kind: Type selects the kind (see the
// ResponseStreamEventType constants) and only the fields relevant to that
// kind are populated; all others are omitted from the JSON output.
// OutputIndex and ContentIndex are pointers so that index 0 is still
// serialized when set.
//
// NOTE(review): SequenceNumber is a plain int with omitempty, so a sequence
// number of 0 is dropped on marshal — confirm no producer relies on emitting 0.
// The same applies to an empty Delta, Text or Arguments string.
type ResponseStreamEvent struct {
	Type           string         `json:"type"`
	Response       *Response      `json:"response,omitempty"`
	OutputIndex    *int           `json:"output_index,omitempty"`
	Item           *OutputItem    `json:"item,omitempty"`
	ItemID         string         `json:"item_id,omitempty"`
	ContentIndex   *int           `json:"content_index,omitempty"`
	Part           *OutputContent `json:"part,omitempty"`      // For content_part events
	Delta          string         `json:"delta,omitempty"`     // For text.delta, function_call_arguments.delta
	Text           string         `json:"text,omitempty"`      // For text content
	Arguments      string         `json:"arguments,omitempty"` // For function_call_arguments.done
	SequenceNumber int            `json:"sequence_number,omitempty"`
}

// ToModelUsage converts ResponseUsage to model.Usage.
//
// Input, output and total token counts are always copied. Cached tokens are
// taken from InputTokensDetails and reasoning tokens from OutputTokensDetails
// when the respective detail block is present.
//
// A nil receiver yields a zero model.Usage instead of panicking, so the method
// can be called directly on an optional field such as Response.Usage.
func (u *ResponseUsage) ToModelUsage() model.Usage {
	if u == nil {
		return model.Usage{}
	}

	usage := model.Usage{
		InputTokens:  model.ZeroNullInt64(u.InputTokens),
		OutputTokens: model.ZeroNullInt64(u.OutputTokens),
		TotalTokens:  model.ZeroNullInt64(u.TotalTokens),
	}

	if in := u.InputTokensDetails; in != nil {
		usage.CachedTokens = model.ZeroNullInt64(in.CachedTokens)
	}

	if out := u.OutputTokensDetails; out != nil {
		usage.ReasoningTokens = model.ZeroNullInt64(out.ReasoningTokens)
	}

	return usage
}

// ToChatUsage converts ResponseUsage to ChatUsage (OpenAI Chat Completions format).
//
// Input, output and total token counts map to prompt, completion and total
// token counts. PromptTokensDetails and CompletionTokensDetails are attached
// only when the corresponding cached or reasoning count is positive;
// otherwise they are left unset.
//
// A nil receiver yields a zero ChatUsage instead of panicking, so the method
// can be called directly on an optional field such as Response.Usage.
func (u *ResponseUsage) ToChatUsage() ChatUsage {
	if u == nil {
		return ChatUsage{}
	}

	usage := ChatUsage{
		PromptTokens:     u.InputTokens,
		CompletionTokens: u.OutputTokens,
		TotalTokens:      u.TotalTokens,
	}

	if in := u.InputTokensDetails; in != nil && in.CachedTokens > 0 {
		usage.PromptTokensDetails = &PromptTokensDetails{
			CachedTokens: in.CachedTokens,
		}
	}

	if out := u.OutputTokensDetails; out != nil && out.ReasoningTokens > 0 {
		usage.CompletionTokensDetails = &CompletionTokensDetails{
			ReasoningTokens: out.ReasoningTokens,
		}
	}

	return usage
}

// ToClaudeUsage converts ResponseUsage to ClaudeUsage (Anthropic Claude format).
//
// Input and output token counts are copied as-is. CacheReadInputTokens is set
// from InputTokensDetails.CachedTokens only when that count is positive.
// TotalTokens and reasoning tokens are not carried over.
//
// A nil receiver yields a zero ClaudeUsage instead of panicking, so the method
// can be called directly on an optional field such as Response.Usage.
//
// NOTE(review): InputTokens is passed through unchanged while cached tokens
// are also reported in CacheReadInputTokens — confirm whether the Claude
// format expects cached tokens to be excluded from InputTokens.
func (u *ResponseUsage) ToClaudeUsage() ClaudeUsage {
	if u == nil {
		return ClaudeUsage{}
	}

	usage := ClaudeUsage{
		InputTokens:  u.InputTokens,
		OutputTokens: u.OutputTokens,
	}

	if in := u.InputTokensDetails; in != nil && in.CachedTokens > 0 {
		usage.CacheReadInputTokens = in.CachedTokens
	}

	return usage
}

// ToGeminiUsage converts ResponseUsage to GeminiUsageMetadata (Google Gemini format).
//
// Input, output and total token counts map to the prompt, candidates and
// total token counts. CachedContentTokenCount and ThoughtsTokenCount are set
// from the cached and reasoning token details only when those counts are
// positive.
//
// A nil receiver yields a zero GeminiUsageMetadata instead of panicking, so
// the method can be called directly on an optional field such as
// Response.Usage.
func (u *ResponseUsage) ToGeminiUsage() GeminiUsageMetadata {
	if u == nil {
		return GeminiUsageMetadata{}
	}

	usage := GeminiUsageMetadata{
		PromptTokenCount:     u.InputTokens,
		CandidatesTokenCount: u.OutputTokens,
		TotalTokenCount:      u.TotalTokens,
	}

	if in := u.InputTokensDetails; in != nil && in.CachedTokens > 0 {
		usage.CachedContentTokenCount = in.CachedTokens
	}

	if out := u.OutputTokensDetails; out != nil && out.ReasoningTokens > 0 {
		usage.ThoughtsTokenCount = out.ReasoningTokens
	}

	return usage
}