realtime.go 3.5 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586
  1. package dto
  // Realtime event type identifiers (first group). Each constant is the
  // literal string value of an event's "type" key.
  //
  // NOTE(review): apart from "error", these look like the event types a
  // client sends to the realtime endpoint — confirm against the upstream API.
  const (
  	RealtimeEventTypeError              = "error"
  	RealtimeEventTypeSessionUpdate      = "session.update"
  	RealtimeEventTypeConversationCreate = "conversation.item.create"
  	RealtimeEventTypeResponseCreate     = "response.create"
  	RealtimeEventInputAudioBufferAppend = "input_audio_buffer.append"
  )
  // Realtime event type identifiers (second group). Each constant is the
  // literal string value of an event's "type" key.
  //
  // NOTE(review): these look like notifications emitted by the server
  // (completed responses, session lifecycle, streaming deltas) — confirm
  // against the upstream API.
  const (
  	RealtimeEventTypeResponseDone                   = "response.done"
  	RealtimeEventTypeSessionUpdated                 = "session.updated"
  	RealtimeEventTypeSessionCreated                 = "session.created"
  	RealtimeEventResponseAudioDelta                 = "response.audio.delta"
  	RealtimeEventResponseAudioTranscriptionDelta    = "response.audio_transcript.delta"
  	RealtimeEventResponseFunctionCallArgumentsDelta = "response.function_call_arguments.delta"
  	RealtimeEventResponseFunctionCallArgumentsDone  = "response.function_call_arguments.done"
  	RealtimeEventConversationItemCreated            = "conversation.item.created"
  )
  19. type RealtimeEvent struct {
  20. EventId string `json:"event_id"`
  21. Type string `json:"type"`
  22. //PreviousItemId string `json:"previous_item_id"`
  23. Session *RealtimeSession `json:"session,omitempty"`
  24. Item *RealtimeItem `json:"item,omitempty"`
  25. Error *OpenAIError `json:"error,omitempty"`
  26. Response *RealtimeResponse `json:"response,omitempty"`
  27. Delta string `json:"delta,omitempty"`
  28. Audio string `json:"audio,omitempty"`
  29. }
  30. type RealtimeResponse struct {
  31. Usage *RealtimeUsage `json:"usage"`
  32. }
  33. type RealtimeUsage struct {
  34. TotalTokens int `json:"total_tokens"`
  35. InputTokens int `json:"input_tokens"`
  36. OutputTokens int `json:"output_tokens"`
  37. InputTokenDetails InputTokenDetails `json:"input_token_details"`
  38. OutputTokenDetails OutputTokenDetails `json:"output_token_details"`
  39. }
  40. type RealtimeSession struct {
  41. Modalities []string `json:"modalities"`
  42. Instructions string `json:"instructions"`
  43. Voice string `json:"voice"`
  44. InputAudioFormat string `json:"input_audio_format"`
  45. OutputAudioFormat string `json:"output_audio_format"`
  46. InputAudioTranscription InputAudioTranscription `json:"input_audio_transcription"`
  47. TurnDetection interface{} `json:"turn_detection"`
  48. Tools []RealTimeTool `json:"tools"`
  49. ToolChoice string `json:"tool_choice"`
  50. Temperature float64 `json:"temperature"`
  51. //MaxResponseOutputTokens int `json:"max_response_output_tokens"`
  52. }
  // InputAudioTranscription is the "input_audio_transcription" object of a
  // RealtimeSession. Its single field is the model name, encoded under the
  // "model" key (always present, even when empty).
  type InputAudioTranscription struct {
  	Model string `json:"model"`
  }
  // RealTimeTool is one entry of RealtimeSession.Tools. (Note the capital T in
  // "RealTime", unlike the other Realtime* types in this file.)
  //
  // Parameters is untyped and is encoded as whatever value it holds; a nil
  // value is written as JSON null because the field has no omitempty option.
  type RealTimeTool struct {
  	Type        string `json:"type"`
  	Name        string `json:"name"`
  	Description string `json:"description"`
  	Parameters  any    `json:"parameters"`
  }
  62. type RealtimeItem struct {
  63. Id string `json:"id"`
  64. Type string `json:"type"`
  65. Status string `json:"status"`
  66. Role string `json:"role"`
  67. Content []RealtimeContent `json:"content"`
  68. Name *string `json:"name,omitempty"`
  69. ToolCalls any `json:"tool_calls,omitempty"`
  70. CallId string `json:"call_id,omitempty"`
  71. }
  // RealtimeContent is one element of RealtimeItem.Content. Type is always
  // encoded; Text, Audio and Transcript are omitted from the JSON when empty.
  type RealtimeContent struct {
  	Type       string `json:"type"`
  	Text       string `json:"text,omitempty"`
  	Audio      string `json:"audio,omitempty"` // Base64-encoded audio bytes.
  	Transcript string `json:"transcript,omitempty"`
  }