-
-
Notifications
You must be signed in to change notification settings - Fork 6
Expand file tree
/
Copy pathperplexity_msg.go
More file actions
372 lines (320 loc) · 11 KB
/
Copy pathperplexity_msg.go
File metadata and controls
372 lines (320 loc) · 11 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
package perplexity
import (
"errors"
"fmt"
)
// ContentType identifies which kind of payload a Content part of a multimodal
// message carries. Its values are the strings emitted in the JSON "type" field
// of Content.
type ContentType string
// Supported ContentType values. AddMultimodalUserMessage rejects any Content
// whose Type is not one of these.
const (
// ContentTypeText marks a content part whose payload is plain text (Content.Text).
ContentTypeText ContentType = "text"
// ContentTypeImageURL marks a content part whose payload is an image reference (Content.ImageURL).
ContentTypeImageURL ContentType = "image_url"
// ContentTypeFileURL marks a content part whose payload is a file reference (Content.FileURL).
ContentTypeFileURL ContentType = "file_url"
)
// Content is one part of a multimodal message: text, an image, or a file.
//
// Type selects which of Text, ImageURL, or FileURL is expected to be set; the
// validate tags mark each of those fields as required only when Type has the
// matching value. Pointer fields that are nil are left out of the JSON
// encoding because of omitempty.
//
// NOTE(review): the validate tags are only declared here; the validator that
// enforces them is not visible in this file — confirm where it runs.
type Content struct {
// Type is the discriminator; the tag limits it to text, image_url, or file_url.
Type ContentType `json:"type" validate:"required,oneof=text image_url file_url"`
// Text is the payload for ContentTypeText parts.
Text *string `json:"text,omitempty" validate:"required_if=Type text"`
// ImageURL is the payload for ContentTypeImageURL parts.
ImageURL *ImageURL `json:"image_url,omitempty" validate:"required_if=Type image_url"`
// FileURL is the payload for ContentTypeFileURL parts.
FileURL *FileURL `json:"file_url,omitempty" validate:"required_if=Type file_url"`
// FileName is optional; NewFileURLContent sets it only when a non-empty name is supplied.
FileName *string `json:"file_name,omitempty"` // Optional filename for base64 encoded files
}
// ImageURL wraps the location of an image attached to a Content part.
// URL holds whatever string the caller supplies; NewImageFileContent stores
// the data URI it obtains from encoding a local file here.
type ImageURL struct {
// URL is tagged as required for validation and is always serialized as "url".
URL string `json:"url" validate:"required"`
}
// FileURL wraps the location of a file attached to a Content part.
// URL holds whatever string the caller supplies; NewFileFileContent stores a
// "data:MIME;base64,PAYLOAD" URI built from a local file here.
type FileURL struct {
// URL is tagged as required for validation and is always serialized as "url".
URL string `json:"url" validate:"required"`
}
// MultimodalMessage is a conversation message whose body is a list of Content
// parts (text, images, files) instead of a single string.
//
// NOTE(review): the validate tags are declarative only in this file; the code
// that enforces them is not visible here.
type MultimodalMessage struct {
// Role is tagged as one of "system", "user", or "assistant".
Role string `json:"role" validate:"required,oneof=system user assistant"`
// Content is tagged as needing at least one part; "dive" asks the validator to check each part too.
Content []Content `json:"content" validate:"required,min=1,dive"`
}
// NewTextContent builds a Content part of type ContentTypeText.
//
// The returned part's Text field points at a private copy of text; every other
// payload field is left nil.
func NewTextContent(text string) Content {
	part := Content{Type: ContentTypeText}
	part.Text = &text
	return part
}
// NewImageURLContent builds a Content part of type ContentTypeImageURL whose
// ImageURL payload carries url unchanged. No validation of url happens here.
func NewImageURLContent(url string) Content {
	image := ImageURL{URL: url}
	return Content{Type: ContentTypeImageURL, ImageURL: &image}
}
// NewImageFileContent builds an image Content part from a local file.
//
// The file at filepath is handed to an image processor's EncodeImageFromFile;
// the string it returns becomes the URL of the resulting image part. When
// encoding fails, the zero Content and the processor's error are returned
// unchanged.
func NewImageFileContent(filepath string) (Content, error) {
	encoder := NewImageProcessor()

	uri, err := encoder.EncodeImageFromFile(filepath)
	if err != nil {
		return Content{}, err
	}

	return NewImageURLContent(uri), nil
}
// NewFileURLContent builds a Content part of type ContentTypeFileURL whose
// FileURL payload carries url unchanged.
//
// fileName is optional: an empty string leaves FileName nil (so it is omitted
// from the JSON encoding); any other value is stored as given.
func NewFileURLContent(url string, fileName string) Content {
	var name *string
	if fileName != "" {
		name = &fileName
	}
	return Content{
		Type:     ContentTypeFileURL,
		FileURL:  &FileURL{URL: url},
		FileName: name,
	}
}
// NewFileFileContent builds a file Content part from a local file.
//
// The file at filepath is encoded by a file processor's EncodeFileFromPath,
// which also supplies the file name stored on the part. The part's URL is a
// data URI of the form "data:MIME;base64,PAYLOAD", where MIME is looked up
// from the format the processor derives from filepath. When encoding fails,
// the zero Content and the processor's error are returned unchanged.
func NewFileFileContent(filepath string) (Content, error) {
	fp := NewFileProcessor()

	payload, name, err := fp.EncodeFileFromPath(filepath)
	if err != nil {
		return Content{}, err
	}

	// The MIME type is resolved only after encoding succeeded.
	mimeType := fp.getFileMimeType(fp.getFileFormatFromPath(filepath))
	uri := fmt.Sprintf("data:%s;base64,%s", mimeType, payload)

	return NewFileURLContent(uri, name), nil
}
// Sentinel errors returned by the Messages Add* methods. They are plain
// errors.New values, so callers can compare against them directly.
var (
// ErrPrevMessageShouldBeAssistant is returned by AddUserMessage and
// AddMultimodalUserMessage when the last stored message is not an assistant message.
ErrPrevMessageShouldBeAssistant = errors.New("previous message should be an assistant message")
// ErrFirstMessageShouldBeUser is returned by AddAgentMessage and
// AddMultimodalAgentMessage when no message has been stored yet.
ErrFirstMessageShouldBeUser = errors.New("first message should be a user message")
// ErrPrevMessageShouldBeUser is returned by AddAgentMessage and
// AddMultimodalAgentMessage when the last stored message is not a user message.
ErrPrevMessageShouldBeUser = errors.New("previous message should be a user message")
// ErrMultimodalContentEmpty is returned when a multimodal Add* method is given no content parts.
ErrMultimodalContentEmpty = errors.New("multimodal message content cannot be empty")
// ErrMultimodalInvalidContentType is returned by AddMultimodalUserMessage when a
// content part's Type is not one of the ContentType constants.
ErrMultimodalInvalidContentType = errors.New("invalid content type in multimodal message")
)
// Message is a plain-text conversation message for the Perplexity API.
type Message struct {
// Role is tagged as one of "system", "user", or "assistant".
Role string `json:"role" validate:"required,oneof=system user assistant"`
// Content is the message text; it carries no validation tag, so it may be empty.
Content string `json:"content"`
}
// Messages accumulates a conversation for the Perplexity API.
//
// Plain-text and multimodal messages are kept in two separate slices; each
// Add* method checks turn order against its own slice only. The system
// message is stored separately and prepended by GetMessages and
// GetMultimodalMessages when it is non-empty.
type Messages struct {
systemMessage string // Optional system prompt; empty means none.
messages []Message // Plain-text user/assistant turns, in insertion order.
multimodalMessages []MultimodalMessage // Multimodal user/assistant turns, in insertion order.
useMultimodal bool // Set to true once any multimodal message has been added.
}
// NewMessages constructs a Messages value, starting from the zero value and
// applying each option in the order given.
func NewMessages(opts ...MessagesOption) Messages {
	var msgs Messages
	for i := range opts {
		opts[i](&msgs)
	}
	return msgs
}
// MessagesOption configures a Messages value while NewMessages is building
// it. NewMessages calls each option with a pointer to the value under
// construction.
type MessagesOption func(*Messages)
// WithSystemMessage returns an option that stores content as the system
// message, replacing any value set by an earlier option.
func WithSystemMessage(content string) MessagesOption {
	return func(target *Messages) {
		target.systemMessage = content
	}
}
// AddUserMessage appends a plain-text user turn to the conversation.
//
// A user turn may open the conversation or follow an assistant turn. If the
// most recent plain-text message is not from the assistant,
// ErrPrevMessageShouldBeAssistant is returned and nothing is stored.
func (m *Messages) AddUserMessage(content string) error {
	if n := len(m.messages); n > 0 && m.messages[n-1].Role != "assistant" {
		return ErrPrevMessageShouldBeAssistant
	}
	m.messages = append(m.messages, Message{Role: "user", Content: content})
	return nil
}
// AddAgentMessage appends a plain-text assistant turn to the conversation.
//
// An assistant turn must directly follow a user turn. It returns
// ErrFirstMessageShouldBeUser when no plain-text message exists yet and
// ErrPrevMessageShouldBeUser when the most recent one is not from the user;
// in both cases nothing is stored.
func (m *Messages) AddAgentMessage(content string) error {
	switch n := len(m.messages); {
	case n == 0:
		return ErrFirstMessageShouldBeUser
	case m.messages[n-1].Role != "user":
		return ErrPrevMessageShouldBeUser
	}
	m.messages = append(m.messages, Message{Role: "assistant", Content: content})
	return nil
}
// GetMessages returns the plain-text conversation as a fresh slice.
//
// When a system message is set it comes first, followed by the stored user
// and assistant turns in insertion order. The result is nil when there is
// neither a system message nor any stored turn.
func (m *Messages) GetMessages() []Message {
	var out []Message
	if sys := m.systemMessage; sys != "" {
		out = append(out, Message{Role: "system", Content: sys})
	}
	return append(out, m.messages...)
}
// GetSystemMessage returns the stored system message, or the empty string
// when none has been set.
func (m *Messages) GetSystemMessage() string {
	return m.systemMessage
}
// AddMultimodalUserMessage appends a user turn made of mixed content parts
// (text, images, files) to the multimodal conversation.
//
// Checks run in this order, and the first failure is returned without storing
// anything:
//   - ErrMultimodalContentEmpty when contents has no parts;
//   - ErrMultimodalInvalidContentType when any part's Type is not one of the
//     ContentType constants;
//   - ErrPrevMessageShouldBeAssistant when the most recent multimodal message
//     is not from the assistant.
//
// On success the message is stored and the conversation is flagged as
// multimodal. The contents slice is stored as passed, not copied.
func (m *Messages) AddMultimodalUserMessage(contents []Content) error {
	if len(contents) == 0 {
		return ErrMultimodalContentEmpty
	}

	for i := range contents {
		switch contents[i].Type {
		case ContentTypeText, ContentTypeImageURL, ContentTypeFileURL:
			// Supported type; keep scanning.
		default:
			return ErrMultimodalInvalidContentType
		}
	}

	if n := len(m.multimodalMessages); n > 0 && m.multimodalMessages[n-1].Role != "assistant" {
		return ErrPrevMessageShouldBeAssistant
	}

	m.multimodalMessages = append(m.multimodalMessages, MultimodalMessage{Role: "user", Content: contents})
	m.useMultimodal = true
	return nil
}
// AddUserMessageWithImage appends a multimodal user turn consisting of one
// text part followed by one image part that references imageURL.
//
// imageURL is first checked with an image processor's ValidateImageURL; a
// validation error is returned as is and nothing is stored. Otherwise the
// result of AddMultimodalUserMessage is returned.
func (m *Messages) AddUserMessageWithImage(text, imageURL string) error {
	validator := NewImageProcessor()
	if err := validator.ValidateImageURL(imageURL); err != nil {
		return err
	}

	return m.AddMultimodalUserMessage([]Content{
		NewTextContent(text),
		NewImageURLContent(imageURL),
	})
}
// AddUserMessageWithImageFile appends a multimodal user turn consisting of
// one text part followed by one image part built from the file at filepath.
//
// The image part comes from NewImageFileContent; if that fails its error is
// returned as is and nothing is stored. Otherwise the result of
// AddMultimodalUserMessage is returned.
func (m *Messages) AddUserMessageWithImageFile(text, filepath string) error {
	image, err := NewImageFileContent(filepath)
	if err != nil {
		return err
	}

	return m.AddMultimodalUserMessage([]Content{NewTextContent(text), image})
}
// AddUserMessageWithFile appends a multimodal user turn consisting of one
// text part followed by one file part that references fileURL.
//
// fileURL is first checked with a file processor's ValidateFileURL; a
// validation error is returned as is and nothing is stored. fileName is
// passed through to NewFileURLContent, which ignores it when empty. Otherwise
// the result of AddMultimodalUserMessage is returned.
func (m *Messages) AddUserMessageWithFile(text, fileURL, fileName string) error {
	validator := NewFileProcessor()
	if err := validator.ValidateFileURL(fileURL); err != nil {
		return err
	}

	return m.AddMultimodalUserMessage([]Content{
		NewTextContent(text),
		NewFileURLContent(fileURL, fileName),
	})
}
// AddUserMessageWithFileFromPath appends a multimodal user turn consisting of
// one text part followed by one file part built from the file at filepath.
//
// The file part comes from NewFileFileContent; if that fails its error is
// returned as is and nothing is stored. Otherwise the result of
// AddMultimodalUserMessage is returned.
func (m *Messages) AddUserMessageWithFileFromPath(text, filepath string) error {
	file, err := NewFileFileContent(filepath)
	if err != nil {
		return err
	}

	return m.AddMultimodalUserMessage([]Content{NewTextContent(text), file})
}
// AddMultimodalAgentMessage appends an assistant turn made of mixed content
// parts to the multimodal conversation.
//
// Checks run in this order, and the first failure is returned without storing
// anything:
//   - ErrMultimodalContentEmpty when contents has no parts;
//   - ErrFirstMessageShouldBeUser when no multimodal message exists yet;
//   - ErrPrevMessageShouldBeUser when the most recent multimodal message is
//     not from the user;
//   - ErrMultimodalInvalidContentType when any part's Type is not one of the
//     ContentType constants.
//
// On success the message is stored and the conversation is flagged as
// multimodal. The contents slice is stored as passed, not copied.
func (m *Messages) AddMultimodalAgentMessage(contents []Content) error {
	if len(contents) == 0 {
		return ErrMultimodalContentEmpty
	}

	n := len(m.multimodalMessages)
	if n == 0 {
		// First message should be a user message.
		return ErrFirstMessageShouldBeUser
	}
	if m.multimodalMessages[n-1].Role != "user" {
		return ErrPrevMessageShouldBeUser
	}

	// Apply the same content-type check AddMultimodalUserMessage performs, so
	// an unsupported type cannot be stored through the assistant path. It runs
	// after the ordering checks so that every input that was already rejected
	// keeps returning the same error as before.
	for i := range contents {
		switch contents[i].Type {
		case ContentTypeText, ContentTypeImageURL, ContentTypeFileURL:
			// Supported type; keep scanning.
		default:
			return ErrMultimodalInvalidContentType
		}
	}

	m.multimodalMessages = append(m.multimodalMessages, MultimodalMessage{
		Role:    "assistant",
		Content: contents,
	})
	m.useMultimodal = true
	return nil
}
// GetMultimodalMessages returns the multimodal conversation as a fresh slice.
//
// When a system message is set it comes first, wrapped as a single text part,
// followed by the stored multimodal turns in insertion order. Plain-text
// turns added through AddUserMessage or AddAgentMessage are not included.
// The result is nil when there is neither a system message nor any stored
// multimodal turn.
func (m *Messages) GetMultimodalMessages() []MultimodalMessage {
	var out []MultimodalMessage
	if m.systemMessage != "" {
		system := MultimodalMessage{
			Role:    "system",
			Content: []Content{NewTextContent(m.systemMessage)},
		}
		out = append(out, system)
	}
	return append(out, m.multimodalMessages...)
}
// IsMultimodal reports whether a multimodal message has been added, i.e.
// whether AddMultimodalUserMessage or AddMultimodalAgentMessage has succeeded
// at least once on this value.
func (m *Messages) IsMultimodal() bool {
	return m.useMultimodal
}
// HasImages reports whether any stored multimodal message contains a part of
// type ContentTypeImageURL. It is always false while the conversation is not
// flagged as multimodal.
func (m *Messages) HasImages() bool {
	if !m.useMultimodal {
		return false
	}
	for i := range m.multimodalMessages {
		parts := m.multimodalMessages[i].Content
		for j := range parts {
			if parts[j].Type == ContentTypeImageURL {
				return true
			}
		}
	}
	return false
}
// HasFiles reports whether any stored multimodal message contains a part of
// type ContentTypeFileURL. It is always false while the conversation is not
// flagged as multimodal.
func (m *Messages) HasFiles() bool {
	if !m.useMultimodal {
		return false
	}
	for i := range m.multimodalMessages {
		parts := m.multimodalMessages[i].Content
		for j := range parts {
			if parts[j].Type == ContentTypeFileURL {
				return true
			}
		}
	}
	return false
}