realtime.go 3.8 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697
  1. package dto
  2. const (
  3. RealtimeEventTypeError = "error"
  4. RealtimeEventTypeSessionUpdate = "session.update"
  5. RealtimeEventTypeConversationCreate = "conversation.item.create"
  6. RealtimeEventTypeResponseCreate = "response.create"
  7. RealtimeEventInputAudioBufferAppend = "input_audio_buffer.append"
  8. )
  9. const (
  10. RealtimeEventTypeResponseDone = "response.done"
  11. RealtimeEventTypeSessionUpdated = "session.updated"
  12. RealtimeEventTypeSessionCreated = "session.created"
  13. RealtimeEventResponseAudioDelta = "response.audio.delta"
  14. RealtimeEventResponseAudioTranscriptionDelta = "response.audio_transcript.delta"
  15. RealtimeEventResponseFunctionCallArgumentsDelta = "response.function_call_arguments.delta"
  16. RealtimeEventResponseFunctionCallArgumentsDone = "response.function_call_arguments.done"
  17. RealtimeEventConversationItemCreated = "conversation.item.created"
  18. )
  19. type RealtimeEvent struct {
  20. EventId string `json:"event_id"`
  21. Type string `json:"type"`
  22. //PreviousItemId string `json:"previous_item_id"`
  23. Session *RealtimeSession `json:"session,omitempty"`
  24. Item *RealtimeItem `json:"item,omitempty"`
  25. Error *OpenAIError `json:"error,omitempty"`
  26. Response *RealtimeResponse `json:"response,omitempty"`
  27. Delta string `json:"delta,omitempty"`
  28. Audio string `json:"audio,omitempty"`
  29. }
  30. type RealtimeResponse struct {
  31. Usage *RealtimeUsage `json:"usage"`
  32. }
  33. type RealtimeUsage struct {
  34. TotalTokens int `json:"total_tokens"`
  35. InputTokens int `json:"input_tokens"`
  36. OutputTokens int `json:"output_tokens"`
  37. InputTokenDetails InputTokenDetails `json:"input_token_details"`
  38. OutputTokenDetails OutputTokenDetails `json:"output_token_details"`
  39. }
  40. type InputTokenDetails struct {
  41. CachedTokens int `json:"cached_tokens"`
  42. TextTokens int `json:"text_tokens"`
  43. AudioTokens int `json:"audio_tokens"`
  44. }
  45. type OutputTokenDetails struct {
  46. TextTokens int `json:"text_tokens"`
  47. AudioTokens int `json:"audio_tokens"`
  48. }
  49. type RealtimeSession struct {
  50. Modalities []string `json:"modalities"`
  51. Instructions string `json:"instructions"`
  52. Voice string `json:"voice"`
  53. InputAudioFormat string `json:"input_audio_format"`
  54. OutputAudioFormat string `json:"output_audio_format"`
  55. InputAudioTranscription InputAudioTranscription `json:"input_audio_transcription"`
  56. TurnDetection interface{} `json:"turn_detection"`
  57. Tools []RealTimeTool `json:"tools"`
  58. ToolChoice string `json:"tool_choice"`
  59. Temperature float64 `json:"temperature"`
  60. //MaxResponseOutputTokens int `json:"max_response_output_tokens"`
  61. }
  62. type InputAudioTranscription struct {
  63. Model string `json:"model"`
  64. }
  65. type RealTimeTool struct {
  66. Type string `json:"type"`
  67. Name string `json:"name"`
  68. Description string `json:"description"`
  69. Parameters any `json:"parameters"`
  70. }
  71. type RealtimeItem struct {
  72. Id string `json:"id"`
  73. Type string `json:"type"`
  74. Status string `json:"status"`
  75. Role string `json:"role"`
  76. Content []RealtimeContent `json:"content"`
  77. Name *string `json:"name,omitempty"`
  78. ToolCalls any `json:"tool_calls,omitempty"`
  79. CallId string `json:"call_id,omitempty"`
  80. }
  81. type RealtimeContent struct {
  82. Type string `json:"type"`
  83. Text string `json:"text,omitempty"`
  84. Audio string `json:"audio,omitempty"` // Base64-encoded audio bytes.
  85. Transcript string `json:"transcript,omitempty"`
  86. }