Files
Memoh/internal/providers/service.go
T
Acbox Liu b88ca96064 refactor: provider & models (#277)
* refactor: move client_type to provider, replace model fields with config JSONB

- Move `client_type` from `models` to `llm_providers` table
- Add `icon` field to `llm_providers`
- Replace `dimensions`, `input_modalities`, `supports_reasoning` on `models`
  with a single `config` JSONB column containing `dimensions`,
  `compatibilities` (vision, tool-call, image-output, reasoning),
  and `context_window`
- Auto-imported models default to vision + tool-call + reasoning
- Update all backend consumers (agent, flow resolver, handlers, memory)
- Regenerate sqlc, swagger, and TypeScript SDK
- Update frontend forms, display, and i18n for new schema

* ui: show provider icon avatar in sidebar and detail header, remove icon input

* feat: add built-in provider registry with YAML definitions and enable toggle

- Add `enable` column to llm_providers (default true, backward-compatible)
- Create internal/registry package to load YAML provider/model definitions
  on startup and upsert into database (new providers disabled by default)
- Add conf/providers/ with OpenAI, Anthropic, Google YAML definitions
- Add RegistryConfig to TOML config (providers_dir, default conf/providers)
- Model listing APIs and conversation flow now filter by enabled providers
- Frontend: enable switch in provider form, green status dot in sidebar,
  enabled providers sorted to top

* fix: make 0041 migration idempotent for fresh databases

Guard data migration steps with column-existence checks so the
migration succeeds on databases created from the updated init schema.
2026-03-22 17:24:45 +08:00

331 lines
8.4 KiB
Go

package providers
import (
"context"
"encoding/json"
"fmt"
"io"
"log/slog"
"net/http"
"strings"
"time"
"github.com/jackc/pgx/v5/pgtype"
sdk "github.com/memohai/twilight-ai/sdk"
"github.com/memohai/memoh/internal/db"
"github.com/memohai/memoh/internal/db/sqlc"
"github.com/memohai/memoh/internal/models"
)
// Service handles provider operations.
type Service struct {
queries *sqlc.Queries
logger *slog.Logger
}
// NewService creates a new provider service.
func NewService(log *slog.Logger, queries *sqlc.Queries) *Service {
return &Service{
queries: queries,
logger: log.With(slog.String("service", "providers")),
}
}
// Create creates a new LLM provider.
func (s *Service) Create(ctx context.Context, req CreateRequest) (GetResponse, error) {
// Marshal metadata
metadataJSON, err := json.Marshal(req.Metadata)
if err != nil {
return GetResponse{}, fmt.Errorf("marshal metadata: %w", err)
}
clientType := req.ClientType
if clientType == "" {
clientType = string(models.ClientTypeOpenAICompletions)
}
var icon pgtype.Text
if req.Icon != "" {
icon = pgtype.Text{String: req.Icon, Valid: true}
}
provider, err := s.queries.CreateLlmProvider(ctx, sqlc.CreateLlmProviderParams{
Name: req.Name,
BaseUrl: req.BaseURL,
ApiKey: req.APIKey,
ClientType: clientType,
Icon: icon,
Enable: true,
Metadata: metadataJSON,
})
if err != nil {
return GetResponse{}, fmt.Errorf("create provider: %w", err)
}
return s.toGetResponse(provider), nil
}
// Get retrieves a provider by ID.
func (s *Service) Get(ctx context.Context, id string) (GetResponse, error) {
providerID, err := db.ParseUUID(id)
if err != nil {
return GetResponse{}, err
}
provider, err := s.queries.GetLlmProviderByID(ctx, providerID)
if err != nil {
return GetResponse{}, fmt.Errorf("get provider: %w", err)
}
return s.toGetResponse(provider), nil
}
// GetByName retrieves a provider by name.
func (s *Service) GetByName(ctx context.Context, name string) (GetResponse, error) {
provider, err := s.queries.GetLlmProviderByName(ctx, name)
if err != nil {
return GetResponse{}, fmt.Errorf("get provider by name: %w", err)
}
return s.toGetResponse(provider), nil
}
// List retrieves all providers.
func (s *Service) List(ctx context.Context) ([]GetResponse, error) {
providers, err := s.queries.ListLlmProviders(ctx)
if err != nil {
return nil, fmt.Errorf("list providers: %w", err)
}
results := make([]GetResponse, 0, len(providers))
for _, p := range providers {
results = append(results, s.toGetResponse(p))
}
return results, nil
}
// Update updates an existing provider.
func (s *Service) Update(ctx context.Context, id string, req UpdateRequest) (GetResponse, error) {
providerID, err := db.ParseUUID(id)
if err != nil {
return GetResponse{}, err
}
// Get existing provider
existing, err := s.queries.GetLlmProviderByID(ctx, providerID)
if err != nil {
return GetResponse{}, fmt.Errorf("get provider: %w", err)
}
// Apply updates
name := existing.Name
if req.Name != nil {
name = *req.Name
}
baseURL := existing.BaseUrl
if req.BaseURL != nil {
baseURL = *req.BaseURL
}
apiKey := resolveUpdatedAPIKey(existing.ApiKey, req.APIKey)
clientType := existing.ClientType
if req.ClientType != nil {
clientType = *req.ClientType
}
icon := existing.Icon
if req.Icon != nil {
icon = pgtype.Text{String: *req.Icon, Valid: *req.Icon != ""}
}
enable := existing.Enable
if req.Enable != nil {
enable = *req.Enable
}
metadata := existing.Metadata
if req.Metadata != nil {
metadataJSON, err := json.Marshal(req.Metadata)
if err != nil {
return GetResponse{}, fmt.Errorf("marshal metadata: %w", err)
}
metadata = metadataJSON
}
// Update provider
updated, err := s.queries.UpdateLlmProvider(ctx, sqlc.UpdateLlmProviderParams{
ID: providerID,
Name: name,
BaseUrl: baseURL,
ApiKey: apiKey,
ClientType: clientType,
Icon: icon,
Enable: enable,
Metadata: metadata,
})
if err != nil {
return GetResponse{}, fmt.Errorf("update provider: %w", err)
}
return s.toGetResponse(updated), nil
}
// Delete deletes a provider by ID.
func (s *Service) Delete(ctx context.Context, id string) error {
providerID, err := db.ParseUUID(id)
if err != nil {
return err
}
if err := s.queries.DeleteLlmProvider(ctx, providerID); err != nil {
return fmt.Errorf("delete provider: %w", err)
}
return nil
}
// Count returns the total count of providers.
func (s *Service) Count(ctx context.Context) (int64, error) {
count, err := s.queries.CountLlmProviders(ctx)
if err != nil {
return 0, fmt.Errorf("count providers: %w", err)
}
return count, nil
}
const probeTimeout = 5 * time.Second
// Test probes the provider using the Twilight AI SDK to check
// reachability and authentication.
func (s *Service) Test(ctx context.Context, id string) (TestResponse, error) {
providerID, err := db.ParseUUID(id)
if err != nil {
return TestResponse{}, err
}
provider, err := s.queries.GetLlmProviderByID(ctx, providerID)
if err != nil {
return TestResponse{}, fmt.Errorf("get provider: %w", err)
}
baseURL := strings.TrimRight(provider.BaseUrl, "/")
clientType := models.ClientType(provider.ClientType)
sdkProvider := models.NewSDKProvider(baseURL, provider.ApiKey, clientType, probeTimeout)
start := time.Now()
result := sdkProvider.Test(ctx)
latency := time.Since(start).Milliseconds()
return TestResponse{
Reachable: result.Status != sdk.ProviderStatusUnreachable,
LatencyMs: latency,
Message: result.Message,
}, nil
}
// FetchRemoteModels fetches models from the provider's /v1/models endpoint.
func (s *Service) FetchRemoteModels(ctx context.Context, id string) ([]RemoteModel, error) {
providerID, err := db.ParseUUID(id)
if err != nil {
return nil, err
}
provider, err := s.queries.GetLlmProviderByID(ctx, providerID)
if err != nil {
return nil, fmt.Errorf("get provider: %w", err)
}
baseURL := strings.TrimRight(provider.BaseUrl, "/")
modelsURL := fmt.Sprintf("%s/models", baseURL)
ctx, cancel := context.WithTimeout(ctx, probeTimeout)
defer cancel()
req, err := http.NewRequestWithContext(ctx, http.MethodGet, modelsURL, nil)
if err != nil {
return nil, fmt.Errorf("create request: %w", err)
}
if provider.ApiKey != "" {
req.Header.Set("Authorization", fmt.Sprintf("Bearer %s", provider.ApiKey))
}
resp, err := http.DefaultClient.Do(req) //nolint:gosec // G704: URL is from operator-configured LLM provider base URL
if err != nil {
return nil, fmt.Errorf("execute request: %w", err)
}
defer func() { _ = resp.Body.Close() }()
if resp.StatusCode != http.StatusOK {
body, _ := io.ReadAll(resp.Body)
return nil, fmt.Errorf("unexpected status code: %d, body: %s", resp.StatusCode, string(body))
}
var fetchResp FetchModelsResponse
if err := json.NewDecoder(resp.Body).Decode(&fetchResp); err != nil {
return nil, fmt.Errorf("decode response: %w", err)
}
return fetchResp.Data, nil
}
// toGetResponse converts a database provider to a response.
func (s *Service) toGetResponse(provider sqlc.LlmProvider) GetResponse {
var metadata map[string]any
if len(provider.Metadata) > 0 {
if err := json.Unmarshal(provider.Metadata, &metadata); err != nil {
if s.logger != nil {
s.logger.Warn("provider metadata unmarshal failed", slog.String("id", provider.ID.String()), slog.Any("error", err))
}
}
}
// Mask API key (show only first 8 characters)
maskedAPIKey := maskAPIKey(provider.ApiKey)
var icon string
if provider.Icon.Valid {
icon = provider.Icon.String
}
return GetResponse{
ID: provider.ID.String(),
Name: provider.Name,
BaseURL: provider.BaseUrl,
APIKey: maskedAPIKey,
ClientType: provider.ClientType,
Icon: icon,
Enable: provider.Enable,
Metadata: metadata,
CreatedAt: provider.CreatedAt.Time,
UpdatedAt: provider.UpdatedAt.Time,
}
}
// maskAPIKey masks an API key for security.
func maskAPIKey(apiKey string) string {
if apiKey == "" {
return ""
}
if len(apiKey) <= 8 {
return strings.Repeat("*", len(apiKey))
}
return apiKey[:8] + strings.Repeat("*", len(apiKey)-8)
}
// resolveUpdatedAPIKey keeps the original key when the request value matches the masked version.
// This prevents masked placeholder values from overwriting the real stored credential.
func resolveUpdatedAPIKey(existing string, updated *string) string {
if updated == nil {
return existing
}
if *updated == maskAPIKey(existing) {
return existing
}
return *updated
}