-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathmessages.go
More file actions
140 lines (125 loc) · 3.54 KB
/
messages.go
File metadata and controls
140 lines (125 loc) · 3.54 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
package vatel
import "encoding/json"
// Values of the "type" discriminator used by the message structs in this file.
const (
	// Types recognized by (*ServerMessage).ParseData.
	TypeSessionStarted       = "session_started"
	TypeSessionEnded         = "session_ended"
	TypeResponseAudio        = "response_audio"
	TypeResponseText         = "response_text"
	TypeInputAudioTranscript = "input_audio_transcript"
	TypeSpeechStarted        = "speech_started"
	TypeSpeechStopped        = "speech_stopped"
	TypeInterruption         = "interruption"
	TypeToolCall             = "tool_call"

	// Types stamped onto payloads built by NewInputAudioMessage and
	// NewToolCallOutputMessage respectively.
	TypeInputAudio     = "input_audio"
	TypeToolCallOutput = "tool_call_output"
)
// ServerMessage is the envelope of a server event: a Type discriminator plus
// the still-encoded payload. Inspect Type, then call ParseData to obtain the
// payload as its concrete Go type.
type ServerMessage struct {
	// Type is read from the "type" key and selects how Data is decoded.
	Type string `json:"type"`

	// Data holds the raw bytes of the "data" key; decoding is deferred to
	// ParseData. When marshaling, the key is omitted if Data is empty.
	Data json.RawMessage `json:"data,omitempty"`
}
// SessionStartedData is the payload ParseData returns for a
// TypeSessionStarted message.
type SessionStartedData struct {
	// ID is read from the "id" key.
	// NOTE(review): presumably the session identifier — confirm against the API.
	ID string `json:"id"`
}
// ResponseAudioData is the payload ParseData returns for a
// TypeResponseAudio message.
type ResponseAudioData struct {
	// TurnID is read from the "turn_id" key.
	TurnID string `json:"turn_id"`

	// Audio is read from the "audio" key and kept as the string received.
	// NOTE(review): likely base64-encoded audio, mirroring the audioBase64
	// argument of NewInputAudioMessage — confirm encoding and format.
	Audio string `json:"audio"`
}
// ResponseTextData is the payload ParseData returns for a
// TypeResponseText message.
type ResponseTextData struct {
	// TurnID is read from the "turn_id" key.
	TurnID string `json:"turn_id"`

	// Text is read from the "text" key.
	Text string `json:"text"`
}
// InputAudioTranscriptData is the payload ParseData returns for a
// TypeInputAudioTranscript message.
type InputAudioTranscriptData struct {
	// Transcript is read from the "transcript" key.
	Transcript string `json:"transcript"`
}
// SpeechStartedData is the payload ParseData returns for a
// TypeSpeechStarted message.
type SpeechStartedData struct {
	// Emulated is read from the "emulated" key.
	// NOTE(review): the meaning of "emulated" is not visible in this file —
	// confirm against the API documentation.
	Emulated bool `json:"emulated"`
}
// ToolCallArgument is one element of ToolCallData.Arguments.
//
// Value is untyped, so encoding/json decodes it with its default mapping
// (JSON numbers become float64, objects become map[string]interface{}, and
// so on).
//
// NOTE(review): how Type ("type") differs from DataType ("dataType") is not
// visible in this file — confirm against the API documentation.
type ToolCallArgument struct {
	Name        string      `json:"name"`
	Type        string      `json:"type"`
	DataType    string      `json:"dataType"`
	Description string      `json:"description"`
	Required    bool        `json:"required"`
	Value       interface{} `json:"value"`
}
// ToolCallData is the payload ParseData returns for a TypeToolCall message.
// ToolCallID uses the same "toolCallId" key that ToolCallOutputPayload
// carries in its data object.
type ToolCallData struct {
	ToolCallID string             `json:"toolCallId"`
	ToolName   string             `json:"toolName"`
	Arguments  []ToolCallArgument `json:"arguments"`
}
// InputAudioPayload is the message value produced by NewInputAudioMessage.
// It marshals to {"type": ..., "data": {"audio": ...}}.
type InputAudioPayload struct {
	// Type is the message discriminator; NewInputAudioMessage sets it to
	// TypeInputAudio.
	Type string `json:"type"`

	// Data wraps the audio string under the "data" key.
	Data struct {
		Audio string `json:"audio"`
	} `json:"data"`
}
// ToolCallOutputPayload is the message value produced by
// NewToolCallOutputMessage. It marshals to
// {"type": ..., "data": {"toolCallId": ..., "output": ...}}.
type ToolCallOutputPayload struct {
	// Type is the message discriminator; NewToolCallOutputMessage sets it to
	// TypeToolCallOutput.
	Type string `json:"type"`

	// Data pairs a tool call ID with that call's output string.
	Data struct {
		ToolCallID string `json:"toolCallId"`
		Output     string `json:"output"`
	} `json:"data"`
}
// NewInputAudioMessage returns an InputAudioPayload whose Type is
// TypeInputAudio and whose Data.Audio is audioBase64. The argument is stored
// as given; it is neither encoded nor validated here.
func NewInputAudioMessage(audioBase64 string) InputAudioPayload {
	var msg InputAudioPayload
	msg.Type = TypeInputAudio
	msg.Data.Audio = audioBase64
	return msg
}
// NewToolCallOutputMessage returns a ToolCallOutputPayload whose Type is
// TypeToolCallOutput and whose Data carries toolCallID and output unchanged.
func NewToolCallOutputMessage(toolCallID, output string) ToolCallOutputPayload {
	var msg ToolCallOutputPayload
	msg.Type = TypeToolCallOutput
	msg.Data.ToolCallID = toolCallID
	msg.Data.Output = output
	return msg
}
// ParseData decodes m.Data into the payload struct selected by m.Type and
// returns it by value (not as a pointer):
//
//   - TypeSessionStarted       -> SessionStartedData
//   - TypeResponseAudio        -> ResponseAudioData
//   - TypeResponseText         -> ResponseTextData
//   - TypeInputAudioTranscript -> InputAudioTranscriptData
//   - TypeSpeechStarted        -> SpeechStartedData
//   - TypeToolCall             -> ToolCallData
//
// For TypeSpeechStopped, TypeSessionEnded and TypeInterruption, Data is
// ignored and the result is (nil, nil). For any other Type the undecoded
// m.Data is returned as a json.RawMessage. If json.Unmarshal fails (which
// includes an empty Data for a type listed above), the result is (nil, err).
func (m *ServerMessage) ParseData() (interface{}, error) {
	var (
		payload interface{}
		err     error
	)

	switch m.Type {
	case TypeSessionStarted:
		var v SessionStartedData
		err = json.Unmarshal(m.Data, &v)
		payload = v
	case TypeResponseAudio:
		var v ResponseAudioData
		err = json.Unmarshal(m.Data, &v)
		payload = v
	case TypeResponseText:
		var v ResponseTextData
		err = json.Unmarshal(m.Data, &v)
		payload = v
	case TypeInputAudioTranscript:
		var v InputAudioTranscriptData
		err = json.Unmarshal(m.Data, &v)
		payload = v
	case TypeSpeechStarted:
		var v SpeechStartedData
		err = json.Unmarshal(m.Data, &v)
		payload = v
	case TypeToolCall:
		var v ToolCallData
		err = json.Unmarshal(m.Data, &v)
		payload = v
	case TypeSpeechStopped, TypeSessionEnded, TypeInterruption:
		// No payload for these events: payload stays a nil interface.
	default:
		// Unrecognized type: hand the raw bytes back to the caller.
		payload = m.Data
	}

	// A failed decode must not leak the partially filled struct.
	if err != nil {
		return nil, err
	}
	return payload, nil
}