mirror of
https://github.com/memohai/Memoh.git
synced 2026-04-25 07:00:48 +09:00
d3bf6bc90a
* feat(channel): add DingTalk channel adapter - Add DingTalk channel adapter (`internal/channel/adapters/dingtalk/`) using dingtalk-stream-sdk-go, supporting inbound message receiving and outbound text/markdown reply - Register DingTalk adapter in cmd/agent and cmd/memoh - Add go.mod dependency: github.com/memohai/dingtalk-stream-sdk-go - Add Dingtalk and Wecom SVG icons and Vue components to @memohai/icon - Refactor existing icon components to remove redundant inline wrappers - Add `channelTypeDisplayName` util for consistent channel label resolution - Add DingTalk/WeCom i18n entries (en/zh) for types and typesShort - Extend channel-icon, bot-channels, channel-settings-panel to support dingtalk/wecom - Use channelTypeDisplayName in profile page to replace ad-hoc i18n lookup * fix(channel,attachment): channel quality refactor & attachment pipeline fixes Channel module: - Fix RemoveAdapter not cleaning connectionMeta (stale status leak) - Fix preparedAttachmentTypeFromMime misclassifying image/gif - Fix sleepWithContext time.After goroutine/timer leak - Export IsDataURL/IsHTTPURL/IsDataPath, dedup across packages - Cache OutboundPolicy in managerOutboundStream to avoid repeated lookups - Split OutboundAttachmentStore: extract ContainerAttachmentIngester interface - Add ManagerOption funcs (WithInboundQueueSize, WithInboundWorkers, WithRefreshInterval) - Add thread-safety docs on OutboundStream / managerOutboundStream - Add debug logs on successful send/edit paths - Expand outbound_prepare_test.go with 21 new cases - Convert no-receiver adapter helpers to package-level funcs; drop unused params DingTalk adapter: - Implement AttachmentResolver: download inbound media via /v1.0/robot/messageFiles/download - Fix pure-image inbound messages failing due to missing resolver Attachment pipeline: - Fix images invisible to LLM in pipeline (DCP) path: inject InlineImages into last user message when cfg.Query is empty - Fix public_url fallback: skip direct URL-to-LLM when ContentHash is set, always prefer inlined persisted asset - Inject path: carry ImageParts through agent.InjectMessage; inline persisted attachments in resolver inject goroutine so mid-stream images reach the model - Fix ResolveMime for images: prefer content-sniffed MIME over platform-declared MIME (fixes Feishu sending image/png header for actual JPEG content → API 400)
151 lines
4.3 KiB
Go
151 lines
4.3 KiB
Go
package agent
|
|
|
|
import (
|
|
"encoding/json"
|
|
"net/http"
|
|
"time"
|
|
|
|
sdk "github.com/memohai/twilight-ai/sdk"
|
|
)
|
|
|
|
// SessionContext carries request-scoped identity and routing information.
|
|
type SessionContext struct {
|
|
BotID string
|
|
ChatID string
|
|
SessionID string
|
|
ChannelIdentityID string
|
|
CurrentPlatform string
|
|
ReplyTarget string
|
|
ConversationType string
|
|
Timezone string
|
|
TimezoneLocation *time.Location
|
|
SessionToken string //nolint:gosec // carries session credential material at runtime
|
|
IsSubagent bool
|
|
}
|
|
|
|
// SkillEntry represents a skill loaded from the bot container.
|
|
type SkillEntry struct {
|
|
Name string
|
|
Description string
|
|
Content string
|
|
Metadata map[string]any
|
|
}
|
|
|
|
// Schedule represents a scheduled task definition.
|
|
type Schedule struct {
|
|
ID string `json:"id"`
|
|
Name string `json:"name"`
|
|
Description string `json:"description"`
|
|
Pattern string `json:"pattern"`
|
|
MaxCalls *int `json:"maxCalls,omitempty"`
|
|
Command string `json:"command"`
|
|
}
|
|
|
|
// LoopDetectionConfig controls loop detection behavior.
|
|
type LoopDetectionConfig struct {
|
|
Enabled bool
|
|
}
|
|
|
|
// InjectMessage carries a user message to be injected into a running agent
|
|
// stream between tool rounds via the PrepareStep hook.
|
|
type InjectMessage struct {
|
|
Text string
|
|
HeaderifiedText string
|
|
// ImageParts carries inline images (data URL or public URL) to attach
|
|
// alongside the injected text when the model supports vision input.
|
|
ImageParts []sdk.ImagePart
|
|
}
|
|
|
|
// RunConfig holds everything needed for a single agent invocation.
|
|
type RunConfig struct {
|
|
Model *sdk.Model
|
|
ReasoningEffort string
|
|
Messages []sdk.Message
|
|
Query string
|
|
System string
|
|
SessionType string
|
|
SupportsImageInput bool
|
|
SupportsToolCall bool
|
|
InlineImages []sdk.ImagePart
|
|
Identity SessionContext
|
|
Skills []SkillEntry
|
|
LoopDetection LoopDetectionConfig
|
|
|
|
// InjectCh receives user messages to inject between tool rounds.
|
|
// When non-nil, a PrepareStep hook drains this channel and appends
|
|
// user messages to the conversation before the next LLM call.
|
|
InjectCh <-chan InjectMessage
|
|
|
|
// InjectedRecorder is called each time a message is injected via
|
|
// PrepareStep, recording the headerified text and the number of SDK
|
|
// output messages that preceded the injection. Used by the resolver
|
|
// to interleave injected messages at the correct position in storeRound.
|
|
InjectedRecorder func(headerifiedText string, insertAfter int)
|
|
}
|
|
|
|
// GenerateResult holds the result of a non-streaming agent invocation.
|
|
type GenerateResult struct {
|
|
Messages []sdk.Message
|
|
Text string
|
|
Attachments []FileAttachment
|
|
Reactions []ReactionItem
|
|
Speeches []SpeechItem
|
|
Usage *sdk.Usage
|
|
}
|
|
|
|
// FileAttachment represents a file reference extracted from agent output.
|
|
type FileAttachment struct {
|
|
Type string `json:"type"`
|
|
Path string `json:"path,omitempty"`
|
|
URL string `json:"url,omitempty"`
|
|
Mime string `json:"mime,omitempty"`
|
|
Name string `json:"name,omitempty"`
|
|
ContentHash string `json:"content_hash,omitempty"`
|
|
Size int64 `json:"size,omitempty"`
|
|
Metadata map[string]any `json:"metadata,omitempty"`
|
|
}
|
|
|
|
// ReactionItem represents an emoji reaction extracted from agent output.
|
|
type ReactionItem struct {
|
|
Emoji string `json:"emoji"`
|
|
}
|
|
|
|
// SpeechItem represents a TTS request extracted from agent output.
|
|
type SpeechItem struct {
|
|
Text string `json:"text"`
|
|
}
|
|
|
|
// SystemFile is a file loaded from the bot container for prompt generation.
|
|
type SystemFile struct {
|
|
Filename string
|
|
Content string
|
|
}
|
|
|
|
// ModelConfig holds provider and model information resolved from DB.
|
|
type ModelConfig struct {
|
|
ModelID string
|
|
ClientType string
|
|
APIKey string //nolint:gosec // carries provider credential material at runtime
|
|
CodexAccountID string
|
|
BaseURL string
|
|
HTTPClient *http.Client
|
|
ReasoningConfig *ReasoningConfig
|
|
}
|
|
|
|
// ReasoningConfig controls extended thinking/reasoning behavior.
|
|
type ReasoningConfig struct {
|
|
Enabled bool
|
|
Effort string
|
|
}
|
|
|
|
func mustMarshal(v any) json.RawMessage {
|
|
data, err := json.Marshal(v)
|
|
if err != nil {
|
|
return nil
|
|
}
|
|
return data
|
|
}
|
|
|
|
// TimeNow is a hook for testing. Defaults to time.Now.
|
|
var TimeNow = time.Now
|