mirror of
https://github.com/memohai/Memoh.git
synced 2026-04-27 07:16:19 +09:00
36d50738b5
- Extract ContainsMarkdown to shared channel package - Auto-detect markdown in normalizeOutboundMessage and MCP send tool - Apply markdown-to-HTML conversion during streaming deltas, not just on the final message - Remove resolveTelegramParseMode which incorrectly returned Telegram's native "Markdown" mode instead of converting to HTML - Fix all 14 Telegram send/edit paths for consistent parse mode handling - Reset parseMode for plain-text error messages to avoid HTML corruption
522 lines
14 KiB
Go
522 lines
14 KiB
Go
package telegram
|
|
|
|
import (
|
|
"context"
|
|
"errors"
|
|
"log/slog"
|
|
"strings"
|
|
"sync"
|
|
"sync/atomic"
|
|
"time"
|
|
|
|
tgbotapi "github.com/go-telegram-bot-api/telegram-bot-api/v5"
|
|
|
|
"github.com/memohai/memoh/internal/channel"
|
|
)
|
|
|
|
const (
|
|
telegramStreamEditThrottle = 5000 * time.Millisecond
|
|
telegramDraftThrottle = 300 * time.Millisecond
|
|
telegramStreamToolHintText = "Calling tools..."
|
|
telegramStreamPendingSuffix = "\n……"
|
|
)
|
|
|
|
var testEditFunc func(bot *tgbotapi.BotAPI, chatID int64, msgID int, text string, parseMode string) error
|
|
|
|
type telegramOutboundStream struct {
|
|
adapter *TelegramAdapter
|
|
cfg channel.ChannelConfig
|
|
target string
|
|
reply *channel.ReplyRef
|
|
parseMode string
|
|
isPrivateChat bool
|
|
draftID int
|
|
closed atomic.Bool
|
|
mu sync.Mutex
|
|
buf strings.Builder
|
|
streamChatID int64
|
|
streamMsgID int
|
|
lastEdited string
|
|
lastEditedAt time.Time
|
|
}
|
|
|
|
func (s *telegramOutboundStream) getBot(_ context.Context) (bot *tgbotapi.BotAPI, err error) {
|
|
telegramCfg, err := parseConfig(s.cfg.Credentials)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
bot, err = s.adapter.getOrCreateBot(telegramCfg, s.cfg.ID)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return bot, nil
|
|
}
|
|
|
|
func (s *telegramOutboundStream) getBotAndReply(ctx context.Context) (bot *tgbotapi.BotAPI, replyTo int, err error) {
|
|
bot, err = s.getBot(ctx)
|
|
if err != nil {
|
|
return nil, 0, err
|
|
}
|
|
replyTo = parseReplyToMessageID(s.reply)
|
|
return bot, replyTo, nil
|
|
}
|
|
|
|
func (s *telegramOutboundStream) refreshTypingAction(ctx context.Context) error {
|
|
// When ensureStreamMessage is called, always means that the message has not been completely generated
|
|
// so always refresh the "typing" action to improve the user experience
|
|
bot, err := s.getBot(ctx)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
action := tgbotapi.NewChatAction(s.streamChatID, tgbotapi.ChatTyping)
|
|
_, err = bot.Request(action)
|
|
return err
|
|
}
|
|
|
|
func (s *telegramOutboundStream) ensureStreamMessage(ctx context.Context, text string) error {
|
|
s.mu.Lock()
|
|
go func() {
|
|
if err := s.refreshTypingAction(ctx); err != nil {
|
|
if s.adapter != nil && s.adapter.logger != nil {
|
|
s.adapter.logger.Debug("refresh typing action failed", slog.Any("error", err))
|
|
}
|
|
}
|
|
}()
|
|
if s.streamMsgID != 0 {
|
|
s.mu.Unlock()
|
|
return nil
|
|
}
|
|
bot, replyTo, err := s.getBotAndReply(ctx)
|
|
if err != nil {
|
|
s.mu.Unlock()
|
|
return err
|
|
}
|
|
if strings.TrimSpace(text) == "" {
|
|
text = "..."
|
|
} else {
|
|
text = strings.TrimSpace(text) + telegramStreamPendingSuffix
|
|
}
|
|
chatID, msgID, err := sendTelegramTextReturnMessage(bot, s.target, text, replyTo, s.parseMode)
|
|
if err != nil {
|
|
s.mu.Unlock()
|
|
return err
|
|
}
|
|
s.streamChatID = chatID
|
|
s.streamMsgID = msgID
|
|
s.lastEdited = text
|
|
s.lastEditedAt = time.Now()
|
|
s.mu.Unlock()
|
|
return nil
|
|
}
|
|
|
|
func normalizeStreamComparableText(value string) string {
|
|
normalized := strings.TrimSpace(value)
|
|
normalized = strings.TrimSuffix(normalized, telegramStreamPendingSuffix)
|
|
return strings.TrimSpace(normalized)
|
|
}
|
|
|
|
func (s *telegramOutboundStream) editStreamMessage(ctx context.Context, text string) error {
|
|
s.mu.Lock()
|
|
chatID := s.streamChatID
|
|
msgID := s.streamMsgID
|
|
lastEdited := s.lastEdited
|
|
lastEditedAt := s.lastEditedAt
|
|
s.mu.Unlock()
|
|
if msgID == 0 {
|
|
return nil
|
|
}
|
|
if normalizeStreamComparableText(text) == normalizeStreamComparableText(lastEdited) {
|
|
return nil
|
|
}
|
|
text = strings.TrimSpace(text) + telegramStreamPendingSuffix
|
|
if time.Since(lastEditedAt) < telegramStreamEditThrottle {
|
|
return nil
|
|
}
|
|
bot, _, err := s.getBotAndReply(ctx)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
editErr := error(nil)
|
|
if testEditFunc != nil {
|
|
editErr = testEditFunc(bot, chatID, msgID, text, s.parseMode)
|
|
} else {
|
|
editErr = editTelegramMessageText(bot, chatID, msgID, text, s.parseMode)
|
|
}
|
|
if editErr != nil {
|
|
if isTelegramTooManyRequests(editErr) {
|
|
d := getTelegramRetryAfter(editErr)
|
|
if d <= 0 {
|
|
d = telegramStreamEditThrottle
|
|
}
|
|
s.mu.Lock()
|
|
s.lastEditedAt = time.Now().Add(d)
|
|
s.mu.Unlock()
|
|
return nil
|
|
}
|
|
return editErr
|
|
}
|
|
s.mu.Lock()
|
|
s.lastEdited = text
|
|
s.lastEditedAt = time.Now()
|
|
s.mu.Unlock()
|
|
return nil
|
|
}
|
|
|
|
const telegramFinalEditMaxRetries = 3
|
|
|
|
// editStreamMessageFinal edits the streamed message for the final content.
|
|
// Retries on 429 with server-provided backoff to ensure delivery.
|
|
func (s *telegramOutboundStream) editStreamMessageFinal(ctx context.Context, text string) error {
|
|
s.mu.Lock()
|
|
chatID := s.streamChatID
|
|
msgID := s.streamMsgID
|
|
lastEdited := s.lastEdited
|
|
s.mu.Unlock()
|
|
if msgID == 0 {
|
|
return nil
|
|
}
|
|
if strings.TrimSpace(text) == lastEdited {
|
|
return nil
|
|
}
|
|
bot, _, err := s.getBotAndReply(ctx)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
for attempt := range telegramFinalEditMaxRetries {
|
|
editErr := error(nil)
|
|
if testEditFunc != nil {
|
|
editErr = testEditFunc(bot, chatID, msgID, text, s.parseMode)
|
|
} else {
|
|
editErr = editTelegramMessageText(bot, chatID, msgID, text, s.parseMode)
|
|
}
|
|
if editErr == nil {
|
|
s.mu.Lock()
|
|
s.lastEdited = text
|
|
s.lastEditedAt = time.Now()
|
|
s.mu.Unlock()
|
|
return nil
|
|
}
|
|
if !isTelegramTooManyRequests(editErr) {
|
|
return editErr
|
|
}
|
|
d := getTelegramRetryAfter(editErr)
|
|
if d <= 0 {
|
|
d = time.Duration(attempt+1) * time.Second
|
|
}
|
|
select {
|
|
case <-ctx.Done():
|
|
return ctx.Err()
|
|
case <-time.After(d):
|
|
}
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// sendDraft sends a partial message via sendMessageDraft with throttling.
|
|
// Only used for private chats.
|
|
func (s *telegramOutboundStream) sendDraft(ctx context.Context, text string) error {
|
|
s.mu.Lock()
|
|
lastEditedAt := s.lastEditedAt
|
|
s.mu.Unlock()
|
|
|
|
if time.Since(lastEditedAt) < telegramDraftThrottle {
|
|
return nil
|
|
}
|
|
if strings.TrimSpace(text) == "" {
|
|
return nil
|
|
}
|
|
|
|
bot, err := s.getBot(ctx)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
draftErr := sendTelegramDraft(bot, s.streamChatID, s.draftID, text, s.parseMode)
|
|
if draftErr != nil {
|
|
if isTelegramTooManyRequests(draftErr) {
|
|
d := getTelegramRetryAfter(draftErr)
|
|
if d <= 0 {
|
|
d = telegramDraftThrottle
|
|
}
|
|
s.mu.Lock()
|
|
s.lastEditedAt = time.Now().Add(d)
|
|
s.mu.Unlock()
|
|
return nil
|
|
}
|
|
return draftErr
|
|
}
|
|
|
|
s.mu.Lock()
|
|
s.lastEditedAt = time.Now()
|
|
s.mu.Unlock()
|
|
return nil
|
|
}
|
|
|
|
// sendPermanentMessage sends a final, permanent message via sendMessage.
|
|
// Used in draft mode to commit text after streaming is complete for a phase.
|
|
func (s *telegramOutboundStream) sendPermanentMessage(ctx context.Context, text string, parseMode string) error {
|
|
if strings.TrimSpace(text) == "" {
|
|
return nil
|
|
}
|
|
bot, replyTo, err := s.getBotAndReply(ctx)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return sendTelegramText(bot, s.target, text, replyTo, parseMode)
|
|
}
|
|
|
|
// resetStreamState clears the streaming message state so a fresh message will
|
|
// be created on the next delta. Must be called without holding s.mu.
|
|
func (s *telegramOutboundStream) resetStreamState() {
|
|
s.mu.Lock()
|
|
s.streamMsgID = 0
|
|
if !s.isPrivateChat {
|
|
s.streamChatID = 0
|
|
}
|
|
s.lastEdited = ""
|
|
s.lastEditedAt = time.Time{}
|
|
s.buf.Reset()
|
|
s.mu.Unlock()
|
|
}
|
|
|
|
// deliverFinalText sends or edits the final text depending on chat mode.
|
|
func (s *telegramOutboundStream) deliverFinalText(ctx context.Context, text, parseMode string) error {
|
|
if s.isPrivateChat {
|
|
return s.sendPermanentMessage(ctx, text, parseMode)
|
|
}
|
|
if err := s.ensureStreamMessage(ctx, text); err != nil {
|
|
return err
|
|
}
|
|
return s.editStreamMessageFinal(ctx, text)
|
|
}
|
|
|
|
func (s *telegramOutboundStream) pushToolCallStart(ctx context.Context) error {
|
|
s.mu.Lock()
|
|
bufText := strings.TrimSpace(s.buf.String())
|
|
hasMsg := s.streamMsgID != 0
|
|
s.mu.Unlock()
|
|
if bufText != "" {
|
|
bufText = s.formatStreamContent(bufText)
|
|
}
|
|
if s.isPrivateChat {
|
|
// In draft mode, send buffered text as a permanent message before tool execution.
|
|
if bufText != "" {
|
|
if err := s.sendPermanentMessage(ctx, bufText, s.parseMode); err != nil {
|
|
if s.adapter != nil && s.adapter.logger != nil {
|
|
s.adapter.logger.Warn("telegram: draft permanent message failed", slog.Any("error", err))
|
|
}
|
|
}
|
|
}
|
|
} else if hasMsg && bufText != "" {
|
|
_ = s.editStreamMessageFinal(ctx, bufText)
|
|
}
|
|
s.resetStreamState()
|
|
return nil
|
|
}
|
|
|
|
func (s *telegramOutboundStream) pushAttachment(ctx context.Context, event channel.StreamEvent) error {
|
|
if len(event.Attachments) == 0 {
|
|
return nil
|
|
}
|
|
bot, replyTo, err := s.getBotAndReply(ctx)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
for _, att := range event.Attachments {
|
|
if sendErr := sendTelegramAttachmentWithAssets(ctx, bot, s.target, att, "", replyTo, "", s.adapter.assets); sendErr != nil {
|
|
if s.adapter != nil && s.adapter.logger != nil {
|
|
s.adapter.logger.Warn("telegram: stream attachment send failed",
|
|
slog.String("config_id", s.cfg.ID),
|
|
slog.String("type", string(att.Type)),
|
|
slog.Any("error", sendErr),
|
|
)
|
|
}
|
|
}
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (s *telegramOutboundStream) pushPhaseEnd(ctx context.Context, event channel.StreamEvent) error {
|
|
if event.Phase != channel.StreamPhaseText {
|
|
return nil
|
|
}
|
|
// In draft mode, skip phase-end finalization; StreamEventFinal sends the
|
|
// permanent formatted message.
|
|
if s.isPrivateChat {
|
|
return nil
|
|
}
|
|
s.mu.Lock()
|
|
finalText := strings.TrimSpace(s.buf.String())
|
|
s.mu.Unlock()
|
|
if finalText != "" {
|
|
finalText = s.formatStreamContent(finalText)
|
|
if err := s.ensureStreamMessage(ctx, finalText); err != nil {
|
|
return err
|
|
}
|
|
return s.editStreamMessageFinal(ctx, finalText)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (s *telegramOutboundStream) pushDelta(ctx context.Context, event channel.StreamEvent) error {
|
|
if event.Delta == "" || event.Phase == channel.StreamPhaseReasoning {
|
|
return nil
|
|
}
|
|
s.mu.Lock()
|
|
s.buf.WriteString(event.Delta)
|
|
content := s.buf.String()
|
|
s.mu.Unlock()
|
|
content = s.formatStreamContent(content)
|
|
if s.isPrivateChat {
|
|
return s.sendDraft(ctx, content)
|
|
}
|
|
if err := s.ensureStreamMessage(ctx, content); err != nil {
|
|
return err
|
|
}
|
|
return s.editStreamMessage(ctx, content)
|
|
}
|
|
|
|
func (s *telegramOutboundStream) pushFinal(ctx context.Context, event channel.StreamEvent) error {
|
|
// In draft mode, read and reset buffer atomically to prevent duplicate
|
|
// permanent messages when multiple StreamEventFinal events fire
|
|
// (one per assistant output in multi-tool-call responses).
|
|
s.mu.Lock()
|
|
bufText := strings.TrimSpace(s.buf.String())
|
|
if s.isPrivateChat {
|
|
s.buf.Reset()
|
|
}
|
|
s.mu.Unlock()
|
|
|
|
if event.Final == nil || event.Final.Message.IsEmpty() {
|
|
if bufText != "" {
|
|
bufText = s.formatStreamContent(bufText)
|
|
if err := s.deliverFinalText(ctx, bufText, s.parseMode); err != nil {
|
|
if s.adapter != nil && s.adapter.logger != nil {
|
|
s.adapter.logger.Warn("telegram: deliver buffered final text failed", slog.Any("error", err))
|
|
}
|
|
}
|
|
}
|
|
return nil
|
|
}
|
|
|
|
msg := event.Final.Message
|
|
finalText := bufText
|
|
if finalText == "" && !s.isPrivateChat {
|
|
finalText = strings.TrimSpace(msg.PlainText())
|
|
}
|
|
|
|
// Convert markdown to Telegram HTML for the final message.
|
|
formatted, pm := formatTelegramOutput(finalText, msg.Format)
|
|
if pm != "" {
|
|
s.mu.Lock()
|
|
s.parseMode = pm
|
|
s.mu.Unlock()
|
|
finalText = formatted
|
|
}
|
|
|
|
if err := s.deliverFinalText(ctx, finalText, s.parseMode); err != nil {
|
|
return err
|
|
}
|
|
|
|
if len(msg.Attachments) > 0 {
|
|
bot, err := s.getBot(ctx)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
replyTo := parseReplyToMessageID(s.reply)
|
|
parseMode := s.parseMode
|
|
for i, att := range msg.Attachments {
|
|
to := replyTo
|
|
if i > 0 {
|
|
to = 0
|
|
}
|
|
if err := sendTelegramAttachmentWithAssets(ctx, bot, s.target, att, "", to, parseMode, s.adapter.assets); err != nil && s.adapter.logger != nil {
|
|
s.adapter.logger.Error("stream final attachment failed", slog.String("config_id", s.cfg.ID), slog.Any("error", err))
|
|
}
|
|
}
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (s *telegramOutboundStream) pushError(ctx context.Context, event channel.StreamEvent) error {
|
|
errText := strings.TrimSpace(event.Error)
|
|
if errText == "" {
|
|
return nil
|
|
}
|
|
display := "Error: " + errText
|
|
// Error messages are plain text; reset parseMode so HTML-mode
|
|
// left over from earlier deltas does not corrupt the output.
|
|
s.mu.Lock()
|
|
s.parseMode = ""
|
|
s.mu.Unlock()
|
|
if s.isPrivateChat {
|
|
return s.sendPermanentMessage(ctx, display, "")
|
|
}
|
|
if err := s.ensureStreamMessage(ctx, display); err != nil {
|
|
return err
|
|
}
|
|
return s.editStreamMessage(ctx, display)
|
|
}
|
|
|
|
func (s *telegramOutboundStream) Push(ctx context.Context, event channel.StreamEvent) error {
|
|
if s == nil || s.adapter == nil {
|
|
return errors.New("telegram stream not configured")
|
|
}
|
|
if s.closed.Load() {
|
|
return errors.New("telegram stream is closed")
|
|
}
|
|
select {
|
|
case <-ctx.Done():
|
|
return ctx.Err()
|
|
default:
|
|
}
|
|
switch event.Type {
|
|
case channel.StreamEventToolCallStart:
|
|
return s.pushToolCallStart(ctx)
|
|
case channel.StreamEventToolCallEnd:
|
|
s.resetStreamState()
|
|
return nil
|
|
case channel.StreamEventAttachment:
|
|
return s.pushAttachment(ctx, event)
|
|
case channel.StreamEventPhaseEnd:
|
|
return s.pushPhaseEnd(ctx, event)
|
|
case channel.StreamEventDelta:
|
|
return s.pushDelta(ctx, event)
|
|
case channel.StreamEventFinal:
|
|
return s.pushFinal(ctx, event)
|
|
case channel.StreamEventError:
|
|
return s.pushError(ctx, event)
|
|
default:
|
|
return nil
|
|
}
|
|
}
|
|
|
|
// formatStreamContent applies markdown-to-HTML conversion for the accumulated
|
|
// stream buffer text and updates parseMode accordingly. Safe for incomplete
|
|
// markdown — unclosed constructs are left as plain text.
|
|
func (s *telegramOutboundStream) formatStreamContent(text string) string {
|
|
if channel.ContainsMarkdown(text) {
|
|
formatted, pm := formatTelegramOutput(text, channel.MessageFormatMarkdown)
|
|
if pm != "" {
|
|
s.mu.Lock()
|
|
s.parseMode = pm
|
|
s.mu.Unlock()
|
|
return formatted
|
|
}
|
|
}
|
|
return text
|
|
}
|
|
|
|
func (s *telegramOutboundStream) Close(ctx context.Context) error {
|
|
if s == nil {
|
|
return nil
|
|
}
|
|
select {
|
|
case <-ctx.Done():
|
|
return ctx.Err()
|
|
default:
|
|
}
|
|
s.closed.Store(true)
|
|
return nil
|
|
}
|