feat: embedding router

This commit is contained in:
Ran
2026-01-26 05:10:53 +07:00
parent c332ce7749
commit 3ff0e2c4dd
22 changed files with 2572 additions and 392 deletions
+136
View File
@@ -0,0 +1,136 @@
package handlers
import (
"net/http"
"strings"
"time"
"github.com/labstack/echo/v4"
"github.com/memohai/memoh/internal/db/sqlc"
"github.com/memohai/memoh/internal/embeddings"
"github.com/memohai/memoh/internal/models"
)
// DefaultEmbeddingTimeout is the timeout value handed to
// embeddings.NewResolver when NewEmbeddingsHandler builds its resolver.
const DefaultEmbeddingTimeout time.Duration = 10 * time.Second
// EmbeddingsHandler serves the POST /embeddings endpoint by delegating the
// actual embedding work to an embeddings.Resolver.
type EmbeddingsHandler struct {
// resolver is invoked by Embed for every request; it is created in
// NewEmbeddingsHandler.
resolver *embeddings.Resolver
}
// EmbeddingsRequest is the JSON payload bound by EmbeddingsHandler.Embed.
//
// Embed trims and lower-cases Type and Provider, trims Model, and forwards
// Dimensions unchanged to the resolver. The handler performs no further
// validation of these fields itself.
type EmbeddingsRequest struct {
// Type selects the kind of embedding; compared case-insensitively because
// the handler lower-cases it before use.
Type string `json:"type"`
// Provider optionally names the embedding provider (lower-cased by the handler).
Provider string `json:"provider,omitempty"`
// Model optionally names the embedding model (whitespace-trimmed by the handler).
Model string `json:"model,omitempty"`
// Dimensions is passed through to the resolver as-is.
Dimensions int `json:"dimensions,omitempty"`
// Input carries the content to embed.
Input EmbeddingsInput `json:"input"`
}
// EmbeddingsInput holds the content of an EmbeddingsRequest. Embed trims
// surrounding whitespace from every field before handing them to the
// resolver; it does not check which fields are populated.
type EmbeddingsInput struct {
// Text is the textual input, if any.
Text string `json:"text,omitempty"`
// ImageURL is the image input reference, if any.
ImageURL string `json:"image_url,omitempty"`
// VideoURL is the video input reference, if any.
VideoURL string `json:"video_url,omitempty"`
}
// EmbeddingsResponse is the JSON body written by EmbeddingsHandler.Embed.
//
// It is used for successful responses (populated from the resolver result)
// and for the 501 "provider not implemented" response, where the request's
// own values are echoed back, Embedding is an empty slice, and Message is set.
type EmbeddingsResponse struct {
Type string `json:"type"`
Provider string `json:"provider"`
Model string `json:"model"`
Dimensions int `json:"dimensions"`
// Embedding is the resulting vector. It has no omitempty tag, so it is
// always present in the encoded output.
Embedding []float32 `json:"embedding"`
// NOTE(review): with encoding/json, omitempty never omits a struct-typed
// field, so "usage" is always emitted (as {} when every counter is zero).
// Making this a pointer would honor omitempty but changes the field type
// for callers.
Usage EmbeddingsUsage `json:"usage,omitempty"`
// Message is only set by Embed on the 501 response.
Message string `json:"message,omitempty"`
}
// EmbeddingsUsage reports the token counts that Embed copies from the
// resolver result. Each counter is tagged omitempty, so zero values are left
// out of the encoded JSON.
type EmbeddingsUsage struct {
InputTokens int `json:"input_tokens,omitempty"`
ImageTokens int `json:"image_tokens,omitempty"`
VideoTokens int `json:"video_tokens,omitempty"`
}
// NewEmbeddingsHandler returns an EmbeddingsHandler whose resolver is built
// from modelsService and queries using DefaultEmbeddingTimeout.
func NewEmbeddingsHandler(modelsService *models.Service, queries *sqlc.Queries) *EmbeddingsHandler {
	resolver := embeddings.NewResolver(modelsService, queries, DefaultEmbeddingTimeout)
	return &EmbeddingsHandler{resolver: resolver}
}
// Register mounts the handler's routes on e: POST /embeddings is served by
// Embed.
func (h *EmbeddingsHandler) Register(e *echo.Echo) {
	const route = "/embeddings"
	e.POST(route, h.Embed)
}
// Embed binds an EmbeddingsRequest, normalizes its string fields, and asks
// the resolver for an embedding. Resolver errors are translated to HTTP
// statuses by embeddingErrorStatus; an unimplemented provider is reported as
// a 501 carrying an EmbeddingsResponse body instead of an error payload.
//
// Embed godoc
// @Summary Create embeddings
// @Description Create text or multimodal embeddings
// @Tags embeddings
// @Param payload body EmbeddingsRequest true "Embeddings request"
// @Success 200 {object} EmbeddingsResponse
// @Failure 400 {object} ErrorResponse
// @Failure 404 {object} ErrorResponse
// @Failure 500 {object} ErrorResponse
// @Failure 501 {object} EmbeddingsResponse
// @Router /embeddings [post]
func (h *EmbeddingsHandler) Embed(c echo.Context) error {
	var req EmbeddingsRequest
	if err := c.Bind(&req); err != nil {
		return echo.NewHTTPError(http.StatusBadRequest, err.Error())
	}

	// Type and provider are matched case-insensitively; the remaining string
	// fields only have surrounding whitespace removed.
	req.Type = normalizeEmbeddingValue(req.Type)
	req.Provider = normalizeEmbeddingValue(req.Provider)
	req.Model = strings.TrimSpace(req.Model)
	req.Input.Text = strings.TrimSpace(req.Input.Text)
	req.Input.ImageURL = strings.TrimSpace(req.Input.ImageURL)
	req.Input.VideoURL = strings.TrimSpace(req.Input.VideoURL)

	result, err := h.resolver.Embed(c.Request().Context(), embeddings.Request{
		Type:       req.Type,
		Provider:   req.Provider,
		Model:      req.Model,
		Dimensions: req.Dimensions,
		Input: embeddings.Input{
			Text:     req.Input.Text,
			ImageURL: req.Input.ImageURL,
			VideoURL: req.Input.VideoURL,
		},
	})
	if err != nil {
		message := err.Error()
		status := embeddingErrorStatus(message)
		if status == http.StatusNotImplemented {
			// Echo the normalized request back with an empty (non-nil)
			// embedding so the body keeps the EmbeddingsResponse shape.
			return c.JSON(status, EmbeddingsResponse{
				Type:       req.Type,
				Provider:   req.Provider,
				Model:      req.Model,
				Dimensions: req.Dimensions,
				Embedding:  []float32{},
				Message:    "embeddings provider not implemented",
			})
		}
		return echo.NewHTTPError(status, message)
	}

	return c.JSON(http.StatusOK, EmbeddingsResponse{
		Type:       result.Type,
		Provider:   result.Provider,
		Model:      result.Model,
		Dimensions: result.Dimensions,
		Embedding:  result.Embedding,
		Usage: EmbeddingsUsage{
			InputTokens: result.Usage.InputTokens,
			ImageTokens: result.Usage.ImageTokens,
			VideoTokens: result.Usage.VideoTokens,
		},
	})
}

// embeddingErrorStatus maps a resolver error message to the HTTP status Embed
// responds with. Exact messages are checked first; any other message that
// mentions "required" or "invalid" is treated as a client error, and
// everything else as an internal error.
func embeddingErrorStatus(message string) int {
	switch {
	case message == "no embedding models available":
		return http.StatusNotFound
	case message == "embedding model not found":
		return http.StatusBadRequest
	case message == "provider not implemented":
		return http.StatusNotImplemented
	case strings.Contains(message, "required"), strings.Contains(message, "invalid"):
		return http.StatusBadRequest
	default:
		return http.StatusInternalServerError
	}
}
// normalizeEmbeddingValue strips surrounding whitespace from value and
// lower-cases what remains.
func normalizeEmbeddingValue(value string) string {
	trimmed := strings.TrimSpace(value)
	return strings.ToLower(trimmed)
}
+32
View File
@@ -22,6 +22,7 @@ func NewMemoryHandler(service *memory.Service) *MemoryHandler {
func (h *MemoryHandler) Register(e *echo.Echo) {
group := e.Group("/memory")
group.POST("/add", h.Add)
group.POST("/embed", h.EmbedUpsert)
group.POST("/search", h.Search)
group.POST("/update", h.Update)
group.GET("/memories/:memoryId", h.Get)
@@ -30,6 +31,37 @@ func (h *MemoryHandler) Register(e *echo.Echo) {
group.DELETE("/memories", h.DeleteAll)
}
// EmbedUpsert obtains the caller's user ID via requireUserID (returning its
// error unchanged), binds a memory.EmbedUpsertRequest, and forwards it to the
// memory service. A request that names a different user is rejected with 403;
// otherwise the request's UserID is set to the caller's ID before the call.
//
// EmbedUpsert godoc
// @Summary Embed and upsert memory
// @Description Embed text or multimodal input and upsert into memory store
// @Tags memory
// @Param payload body memory.EmbedUpsertRequest true "Embed upsert request"
// @Success 200 {object} memory.EmbedUpsertResponse
// @Failure 400 {object} ErrorResponse
// @Failure 403 {object} ErrorResponse
// @Failure 500 {object} ErrorResponse
// @Router /memory/embed [post]
func (h *MemoryHandler) EmbedUpsert(c echo.Context) error {
	userID, err := h.requireUserID(c)
	if err != nil {
		return err
	}

	var req memory.EmbedUpsertRequest
	if err := c.Bind(&req); err != nil {
		return echo.NewHTTPError(http.StatusBadRequest, err.Error())
	}

	// A body may omit user_id, but it may not act on behalf of another user.
	if req.UserID != "" && req.UserID != userID {
		return echo.NewHTTPError(http.StatusForbidden, "user mismatch")
	}
	req.UserID = userID

	resp, err := h.service.EmbedUpsert(c.Request().Context(), req)
	if err != nil {
		return echo.NewHTTPError(http.StatusInternalServerError, err.Error())
	}
	return c.JSON(http.StatusOK, resp)
}
// Add godoc
// @Summary Add memory
// @Description Add memory for a user via memory