content.go

  1package message
  2
  3import (
  4	"encoding/base64"
  5	"errors"
  6	"slices"
  7	"strings"
  8	"time"
  9
 10	"github.com/charmbracelet/catwalk/pkg/catwalk"
 11	"github.com/charmbracelet/fantasy/ai"
 12	"github.com/charmbracelet/fantasy/anthropic"
 13)
 14
// MessageRole is the string-typed role stored in Message.Role. ToAIMessage
// switches on it to decide how a Message is converted.
type MessageRole string

// Roles a Message can carry. ToAIMessage has conversion branches for User,
// Assistant and Tool; it has no branch for System and returns nil for it.
const (
	Assistant MessageRole = "assistant"
	User      MessageRole = "user"
	System    MessageRole = "system"
	Tool      MessageRole = "tool"
)
 23
// FinishReason is the string tag stored in Finish.Reason and returned by
// Message.FinishReason. A message without a Finish part reports the empty
// string rather than any of the constants below.
type FinishReason string

// Finish reasons defined by this package.
const (
	FinishReasonEndTurn          FinishReason = "end_turn"
	FinishReasonMaxTokens        FinishReason = "max_tokens"
	FinishReasonToolUse          FinishReason = "tool_use"
	FinishReasonCanceled         FinishReason = "canceled"
	FinishReasonError            FinishReason = "error"
	FinishReasonPermissionDenied FinishReason = "permission_denied"

	// FinishReasonUnknown should never happen.
	FinishReasonUnknown FinishReason = "unknown"
)
 37
// ContentPart is the element type of Message.Parts. Because its only method,
// isPart, is unexported, only types declared in this package can implement
// it.
type ContentPart interface {
	isPart()
}
 41
 42type ReasoningContent struct {
 43	Thinking   string `json:"thinking"`
 44	Signature  string `json:"signature"`
 45	StartedAt  int64  `json:"started_at,omitempty"`
 46	FinishedAt int64  `json:"finished_at,omitempty"`
 47}
 48
 49func (tc ReasoningContent) String() string {
 50	return tc.Thinking
 51}
 52func (ReasoningContent) isPart() {}
 53
 54type TextContent struct {
 55	Text string `json:"text"`
 56}
 57
 58func (tc TextContent) String() string {
 59	return tc.Text
 60}
 61
 62func (TextContent) isPart() {}
 63
 64type ImageURLContent struct {
 65	URL    string `json:"url"`
 66	Detail string `json:"detail,omitempty"`
 67}
 68
 69func (iuc ImageURLContent) String() string {
 70	return iuc.URL
 71}
 72
 73func (ImageURLContent) isPart() {}
 74
 75type BinaryContent struct {
 76	Path     string
 77	MIMEType string
 78	Data     []byte
 79}
 80
 81func (bc BinaryContent) String(p catwalk.InferenceProvider) string {
 82	base64Encoded := base64.StdEncoding.EncodeToString(bc.Data)
 83	if p == catwalk.InferenceProviderOpenAI {
 84		return "data:" + bc.MIMEType + ";base64," + base64Encoded
 85	}
 86	return base64Encoded
 87}
 88
 89func (BinaryContent) isPart() {}
 90
// ToolCall is the message part that records one tool invocation.
//
//   - ID identifies the call; the Message tool-call helpers match on it.
//   - Name is the tool name.
//   - Input is the call input as a string; Message.AppendToolCallInput
//     extends it with deltas.
//   - ProviderExecuted is copied to ai.ToolCallPart.ProviderExecuted by
//     Message.ToAIMessage.
//   - Finished is set to true by Message.FinishToolCall.
type ToolCall struct {
	ID               string `json:"id"`
	Name             string `json:"name"`
	Input            string `json:"input"`
	ProviderExecuted bool   `json:"provider_executed"`
	Finished         bool   `json:"finished"`
}

// isPart marks ToolCall as a ContentPart.
func (ToolCall) isPart() {}
100
// ToolResult is the message part that records the outcome of a tool call.
//
//   - ToolCallID is copied to ai.ToolResultPart.ToolCallID by
//     Message.ToAIMessage.
//   - Content is the textual output; when IsError is true it becomes the
//     error message instead.
//   - Data and MIMEType describe a media output; ToAIMessage uses them only
//     when IsError is false and Data is non-empty.
//   - IsError marks the result as a failure.
//   - Name and Metadata are not read by the code visible in this file.
//     NOTE(review): presumably the tool name and caller-defined metadata;
//     confirm against the producers of ToolResult.
type ToolResult struct {
	ToolCallID string `json:"tool_call_id"`
	Name       string `json:"name"`
	Content    string `json:"content"`
	Data       string `json:"data"`
	MIMEType   string `json:"mime_type"`
	Metadata   string `json:"metadata"`
	IsError    bool   `json:"is_error"`
}

// isPart marks ToolResult as a ContentPart.
func (ToolResult) isPart() {}
112
// Finish is the message part that marks a message as finished.
//
//   - Reason says why the message finished.
//   - Time is a Unix time in seconds; Message.AddFinish sets it to the
//     current time.
//   - Message and Details are optional strings supplied by the caller of
//     Message.AddFinish; both are omitted from JSON when empty.
type Finish struct {
	Reason  FinishReason `json:"reason"`
	Time    int64        `json:"time"`
	Message string       `json:"message,omitempty"`
	Details string       `json:"details,omitempty"`
}

// isPart marks Finish as a ContentPart.
func (Finish) isPart() {}
121
// Message is a single conversation message made of an ordered list of
// content parts.
//
// Role selects the conversion performed by ToAIMessage, and Parts holds the
// text, reasoning, image, binary, tool-call, tool-result and finish parts
// that the accessor and mutator methods operate on.
//
// ID, SessionID, Model, Provider, CreatedAt and UpdatedAt are not interpreted
// by the methods in this file.
// NOTE(review): CreatedAt and UpdatedAt are presumably Unix timestamps, like
// the other int64 times in this package; confirm against the code that
// persists messages.
type Message struct {
	ID        string
	Role      MessageRole
	SessionID string
	Parts     []ContentPart
	Model     string
	Provider  string
	CreatedAt int64
	UpdatedAt int64
}
132
133func (m *Message) Content() TextContent {
134	for _, part := range m.Parts {
135		if c, ok := part.(TextContent); ok {
136			return c
137		}
138	}
139	return TextContent{}
140}
141
142func (m *Message) ReasoningContent() ReasoningContent {
143	for _, part := range m.Parts {
144		if c, ok := part.(ReasoningContent); ok {
145			return c
146		}
147	}
148	return ReasoningContent{}
149}
150
151func (m *Message) ImageURLContent() []ImageURLContent {
152	imageURLContents := make([]ImageURLContent, 0)
153	for _, part := range m.Parts {
154		if c, ok := part.(ImageURLContent); ok {
155			imageURLContents = append(imageURLContents, c)
156		}
157	}
158	return imageURLContents
159}
160
161func (m *Message) BinaryContent() []BinaryContent {
162	binaryContents := make([]BinaryContent, 0)
163	for _, part := range m.Parts {
164		if c, ok := part.(BinaryContent); ok {
165			binaryContents = append(binaryContents, c)
166		}
167	}
168	return binaryContents
169}
170
171func (m *Message) ToolCalls() []ToolCall {
172	toolCalls := make([]ToolCall, 0)
173	for _, part := range m.Parts {
174		if c, ok := part.(ToolCall); ok {
175			toolCalls = append(toolCalls, c)
176		}
177	}
178	return toolCalls
179}
180
181func (m *Message) ToolResults() []ToolResult {
182	toolResults := make([]ToolResult, 0)
183	for _, part := range m.Parts {
184		if c, ok := part.(ToolResult); ok {
185			toolResults = append(toolResults, c)
186		}
187	}
188	return toolResults
189}
190
191func (m *Message) IsFinished() bool {
192	for _, part := range m.Parts {
193		if _, ok := part.(Finish); ok {
194			return true
195		}
196	}
197	return false
198}
199
200func (m *Message) FinishPart() *Finish {
201	for _, part := range m.Parts {
202		if c, ok := part.(Finish); ok {
203			return &c
204		}
205	}
206	return nil
207}
208
209func (m *Message) FinishReason() FinishReason {
210	for _, part := range m.Parts {
211		if c, ok := part.(Finish); ok {
212			return c.Reason
213		}
214	}
215	return ""
216}
217
218func (m *Message) IsThinking() bool {
219	if m.ReasoningContent().Thinking != "" && m.Content().Text == "" && !m.IsFinished() {
220		return true
221	}
222	return false
223}
224
225func (m *Message) AppendContent(delta string) {
226	found := false
227	for i, part := range m.Parts {
228		if c, ok := part.(TextContent); ok {
229			m.Parts[i] = TextContent{Text: c.Text + delta}
230			found = true
231		}
232	}
233	if !found {
234		m.Parts = append(m.Parts, TextContent{Text: delta})
235	}
236}
237
238func (m *Message) AppendReasoningContent(delta string) {
239	found := false
240	for i, part := range m.Parts {
241		if c, ok := part.(ReasoningContent); ok {
242			m.Parts[i] = ReasoningContent{
243				Thinking:   c.Thinking + delta,
244				Signature:  c.Signature,
245				StartedAt:  c.StartedAt,
246				FinishedAt: c.FinishedAt,
247			}
248			found = true
249		}
250	}
251	if !found {
252		m.Parts = append(m.Parts, ReasoningContent{
253			Thinking:  delta,
254			StartedAt: time.Now().Unix(),
255		})
256	}
257}
258
259func (m *Message) AppendReasoningSignature(signature string) {
260	for i, part := range m.Parts {
261		if c, ok := part.(ReasoningContent); ok {
262			m.Parts[i] = ReasoningContent{
263				Thinking:   c.Thinking,
264				Signature:  c.Signature + signature,
265				StartedAt:  c.StartedAt,
266				FinishedAt: c.FinishedAt,
267			}
268			return
269		}
270	}
271	m.Parts = append(m.Parts, ReasoningContent{Signature: signature})
272}
273
274func (m *Message) FinishThinking() {
275	for i, part := range m.Parts {
276		if c, ok := part.(ReasoningContent); ok {
277			if c.FinishedAt == 0 {
278				m.Parts[i] = ReasoningContent{
279					Thinking:   c.Thinking,
280					Signature:  c.Signature,
281					StartedAt:  c.StartedAt,
282					FinishedAt: time.Now().Unix(),
283				}
284			}
285			return
286		}
287	}
288}
289
290func (m *Message) ThinkingDuration() time.Duration {
291	reasoning := m.ReasoningContent()
292	if reasoning.StartedAt == 0 {
293		return 0
294	}
295
296	endTime := reasoning.FinishedAt
297	if endTime == 0 {
298		endTime = time.Now().Unix()
299	}
300
301	return time.Duration(endTime-reasoning.StartedAt) * time.Second
302}
303
304func (m *Message) FinishToolCall(toolCallID string) {
305	for i, part := range m.Parts {
306		if c, ok := part.(ToolCall); ok {
307			if c.ID == toolCallID {
308				m.Parts[i] = ToolCall{
309					ID:       c.ID,
310					Name:     c.Name,
311					Input:    c.Input,
312					Finished: true,
313				}
314				return
315			}
316		}
317	}
318}
319
320func (m *Message) AppendToolCallInput(toolCallID string, inputDelta string) {
321	for i, part := range m.Parts {
322		if c, ok := part.(ToolCall); ok {
323			if c.ID == toolCallID {
324				m.Parts[i] = ToolCall{
325					ID:       c.ID,
326					Name:     c.Name,
327					Input:    c.Input + inputDelta,
328					Finished: c.Finished,
329				}
330				return
331			}
332		}
333	}
334}
335
336func (m *Message) AddToolCall(tc ToolCall) {
337	for i, part := range m.Parts {
338		if c, ok := part.(ToolCall); ok {
339			if c.ID == tc.ID {
340				m.Parts[i] = tc
341				return
342			}
343		}
344	}
345	m.Parts = append(m.Parts, tc)
346}
347
348func (m *Message) SetToolCalls(tc []ToolCall) {
349	// remove any existing tool call part it could have multiple
350	parts := make([]ContentPart, 0)
351	for _, part := range m.Parts {
352		if _, ok := part.(ToolCall); ok {
353			continue
354		}
355		parts = append(parts, part)
356	}
357	m.Parts = parts
358	for _, toolCall := range tc {
359		m.Parts = append(m.Parts, toolCall)
360	}
361}
362
363func (m *Message) AddToolResult(tr ToolResult) {
364	m.Parts = append(m.Parts, tr)
365}
366
367func (m *Message) SetToolResults(tr []ToolResult) {
368	for _, toolResult := range tr {
369		m.Parts = append(m.Parts, toolResult)
370	}
371}
372
373func (m *Message) AddFinish(reason FinishReason, message, details string) {
374	// remove any existing finish part
375	for i, part := range m.Parts {
376		if _, ok := part.(Finish); ok {
377			m.Parts = slices.Delete(m.Parts, i, i+1)
378			break
379		}
380	}
381	m.Parts = append(m.Parts, Finish{Reason: reason, Time: time.Now().Unix(), Message: message, Details: details})
382}
383
384func (m *Message) AddImageURL(url, detail string) {
385	m.Parts = append(m.Parts, ImageURLContent{URL: url, Detail: detail})
386}
387
388func (m *Message) AddBinary(mimeType string, data []byte) {
389	m.Parts = append(m.Parts, BinaryContent{MIMEType: mimeType, Data: data})
390}
391
392func (m *Message) ToAIMessage() []ai.Message {
393	var messages []ai.Message
394	switch m.Role {
395	case User:
396		var parts []ai.MessagePart
397		text := strings.TrimSpace(m.Content().Text)
398		if text != "" {
399			parts = append(parts, ai.TextPart{Text: text})
400		}
401		for _, content := range m.BinaryContent() {
402			parts = append(parts, ai.FilePart{
403				Filename:  content.Path,
404				Data:      content.Data,
405				MediaType: content.MIMEType,
406			})
407		}
408		messages = append(messages, ai.Message{
409			Role:    ai.MessageRoleUser,
410			Content: parts,
411		})
412	case Assistant:
413		var parts []ai.MessagePart
414		text := strings.TrimSpace(m.Content().Text)
415		if text != "" {
416			parts = append(parts, ai.TextPart{Text: text})
417		}
418		reasoning := m.ReasoningContent()
419		if reasoning.Thinking != "" {
420			reasoningPart := ai.ReasoningPart{Text: reasoning.Thinking, ProviderOptions: ai.ProviderOptions{}}
421			if reasoning.Signature != "" {
422				reasoningPart.ProviderOptions["anthropic"] = &anthropic.ReasoningOptionMetadata{
423					Signature: reasoning.Signature,
424				}
425			}
426			parts = append(parts, reasoningPart)
427		}
428		for _, call := range m.ToolCalls() {
429			parts = append(parts, ai.ToolCallPart{
430				ToolCallID:       call.ID,
431				ToolName:         call.Name,
432				Input:            call.Input,
433				ProviderExecuted: call.ProviderExecuted,
434			})
435		}
436		messages = append(messages, ai.Message{
437			Role:    ai.MessageRoleAssistant,
438			Content: parts,
439		})
440	case Tool:
441		var parts []ai.MessagePart
442		for _, result := range m.ToolResults() {
443			var content ai.ToolResultOutputContent
444			if result.IsError {
445				content = ai.ToolResultOutputContentError{
446					Error: errors.New(result.Content),
447				}
448			} else if result.Data != "" {
449				content = ai.ToolResultOutputContentMedia{
450					Data:      result.Data,
451					MediaType: result.MIMEType,
452				}
453			} else {
454				content = ai.ToolResultOutputContentText{
455					Text: result.Content,
456				}
457			}
458			parts = append(parts, ai.ToolResultPart{
459				ToolCallID: result.ToolCallID,
460				Output:     content,
461			})
462		}
463		messages = append(messages, ai.Message{
464			Role:    ai.MessageRoleTool,
465			Content: parts,
466		})
467	}
468	return messages
469}