feat(model-registry): models.dev updater + admin endpoints

This commit is contained in:
zenfun
2025-12-17 23:59:34 +08:00
parent 96e1fe41a5
commit b2d2df18c5
8 changed files with 1223 additions and 103 deletions

View File

@@ -2,16 +2,14 @@ package service
import (
"context"
"crypto/sha256"
"encoding/hex"
"fmt"
"sort"
"strings"
"time"
"github.com/ez-api/ez-api/internal/model"
groupx "github.com/ez-api/foundation/group"
"github.com/ez-api/foundation/jsoncodec"
"github.com/ez-api/foundation/modelcap"
"github.com/ez-api/foundation/routing"
"github.com/ez-api/foundation/tokenhash"
"github.com/redis/go-redis/v9"
@@ -120,17 +118,17 @@ func (s *SyncService) SyncProvider(provider *model.Provider) error {
// SyncModel writes a single model metadata record.
func (s *SyncService) SyncModel(m *model.Model) error {
ctx := context.Background()
snap := modelSnapshot{
snap := modelcap.Model{
Name: m.Name,
Kind: normalizeModelKind(m.Kind),
Kind: string(modelcap.NormalizeKind(m.Kind)),
ContextWindow: m.ContextWindow,
CostPerToken: m.CostPerToken,
SupportsVision: m.SupportsVision,
SupportsFunction: m.SupportsFunctions,
SupportsToolChoice: m.SupportsToolChoice,
SupportsFIM: m.SupportsFIM,
SupportsFim: m.SupportsFIM,
MaxOutputTokens: m.MaxOutputTokens,
}
}.Normalized()
if err := s.hsetJSON(ctx, "meta:models", snap.Name, snap); err != nil {
return err
}
@@ -159,18 +157,6 @@ type providerSnapshot struct {
// keySnapshot is no longer needed as we write directly to auth:token:*
type modelSnapshot struct {
Name string `json:"name"`
Kind string `json:"kind"`
ContextWindow int `json:"context_window"`
CostPerToken float64 `json:"cost_per_token"`
SupportsVision bool `json:"supports_vision"`
SupportsFunction bool `json:"supports_functions"`
SupportsToolChoice bool `json:"supports_tool_choice"`
SupportsFIM bool `json:"supports_fim"`
MaxOutputTokens int `json:"max_output_tokens"`
}
// SyncAll rebuilds Redis hashes from the database; use for cold starts or forced refreshes.
func (s *SyncService) SyncAll(db *gorm.DB) error {
ctx := context.Background()
@@ -194,6 +180,7 @@ func (s *SyncService) SyncAll(db *gorm.DB) error {
if err := db.Find(&models).Error; err != nil {
return fmt.Errorf("load models: %w", err)
}
var modelsPayloads map[string]string
var bindings []model.Binding
if err := db.Find(&bindings).Error; err != nil {
@@ -292,29 +279,35 @@ func (s *SyncService) SyncAll(db *gorm.DB) error {
}
for _, m := range models {
snap := modelSnapshot{
snap := modelcap.Model{
Name: m.Name,
Kind: normalizeModelKind(m.Kind),
Kind: string(modelcap.NormalizeKind(m.Kind)),
ContextWindow: m.ContextWindow,
CostPerToken: m.CostPerToken,
SupportsVision: m.SupportsVision,
SupportsFunction: m.SupportsFunctions,
SupportsToolChoice: m.SupportsToolChoice,
SupportsFIM: m.SupportsFIM,
SupportsFim: m.SupportsFIM,
MaxOutputTokens: m.MaxOutputTokens,
}
}.Normalized()
payload, err := jsoncodec.Marshal(snap)
if err != nil {
return fmt.Errorf("marshal model %s: %w", m.Name, err)
}
// Capture payloads so we can compute deterministic checksum for meta:models_meta.
if modelsPayloads == nil {
modelsPayloads = make(map[string]string, len(models))
}
modelsPayloads[snap.Name] = string(payload)
pipe.HSet(ctx, "meta:models", snap.Name, payload)
}
if err := writeModelsMeta(ctx, pipe, modelsMetaInput{
Source: "db",
Version: fmt.Sprintf("%d", time.Now().Unix()),
UpdatedAtSec: time.Now().Unix(),
Models: models,
now := time.Now().Unix()
if err := writeModelsMeta(ctx, pipe, modelcap.Meta{
Version: fmt.Sprintf("%d", now),
UpdatedAt: fmt.Sprintf("%d", now),
Source: "db",
Checksum: modelcap.ChecksumFromPayloads(modelsPayloads),
}); err != nil {
return err
}
@@ -469,36 +462,6 @@ func normalizeStatus(status string) string {
}
}
func normalizeModelKind(kind string) string {
k := strings.ToLower(strings.TrimSpace(kind))
if k == "" {
return "chat"
}
switch k {
case "chat", "embedding", "rerank", "other":
return k
default:
return "other"
}
}
func checksumModelPayloads(payloads map[string]string) string {
keys := make([]string, 0, len(payloads))
for k := range payloads {
keys = append(keys, k)
}
sort.Strings(keys)
h := sha256.New()
for _, k := range keys {
_, _ = h.Write([]byte(k))
_, _ = h.Write([]byte{'\n'})
_, _ = h.Write([]byte(payloads[k]))
_, _ = h.Write([]byte{'\n'})
}
return hex.EncodeToString(h.Sum(nil))
}
func (s *SyncService) refreshModelsMetaFromRedis(ctx context.Context, source string) error {
raw, err := s.rdb.HGetAll(ctx, "meta:models").Result()
if err != nil {
@@ -509,7 +472,7 @@ func (s *SyncService) refreshModelsMetaFromRedis(ctx context.Context, source str
"version": fmt.Sprintf("%d", now),
"updated_at": fmt.Sprintf("%d", now),
"source": source,
"checksum": checksumModelPayloads(raw),
"checksum": modelcap.ChecksumFromPayloads(raw),
}
if err := s.rdb.HSet(ctx, "meta:models_meta", meta).Err(); err != nil {
return fmt.Errorf("write meta:models_meta: %w", err)
@@ -517,47 +480,33 @@ func (s *SyncService) refreshModelsMetaFromRedis(ctx context.Context, source str
return nil
}
type modelsMetaInput struct {
Source string
Version string
UpdatedAtSec int64
Models []model.Model
}
func writeModelsMeta(ctx context.Context, pipe redis.Pipeliner, in modelsMetaInput) error {
payloads := make(map[string]string, len(in.Models))
for _, m := range in.Models {
snap := modelSnapshot{
Name: m.Name,
Kind: normalizeModelKind(m.Kind),
ContextWindow: m.ContextWindow,
CostPerToken: m.CostPerToken,
SupportsVision: m.SupportsVision,
SupportsFunction: m.SupportsFunctions,
SupportsToolChoice: m.SupportsToolChoice,
SupportsFIM: m.SupportsFIM,
MaxOutputTokens: m.MaxOutputTokens,
func writeModelsMeta(ctx context.Context, pipe redis.Pipeliner, meta modelcap.Meta) error {
fields := map[string]string{
"version": strings.TrimSpace(meta.Version),
"updated_at": strings.TrimSpace(meta.UpdatedAt),
"source": strings.TrimSpace(meta.Source),
"checksum": strings.TrimSpace(meta.Checksum),
"upstream_url": strings.TrimSpace(meta.UpstreamURL),
"upstream_ref": strings.TrimSpace(meta.UpstreamRef),
}
for k, v := range fields {
if v == "" {
delete(fields, k)
}
b, err := jsoncodec.Marshal(snap)
if err != nil {
return fmt.Errorf("marshal model %s for meta: %w", m.Name, err)
}
payloads[snap.Name] = string(b)
}
meta := map[string]string{
"version": strings.TrimSpace(in.Version),
"updated_at": fmt.Sprintf("%d", in.UpdatedAtSec),
"source": strings.TrimSpace(in.Source),
"checksum": checksumModelPayloads(payloads),
if fields["version"] == "" {
fields["version"] = fmt.Sprintf("%d", time.Now().Unix())
}
if strings.TrimSpace(meta["version"]) == "" {
meta["version"] = fmt.Sprintf("%d", time.Now().Unix())
if fields["updated_at"] == "" {
fields["updated_at"] = fmt.Sprintf("%d", time.Now().Unix())
}
if strings.TrimSpace(meta["source"]) == "" {
meta["source"] = "db"
if fields["source"] == "" {
fields["source"] = "db"
}
if err := pipe.HSet(ctx, "meta:models_meta", meta).Err(); err != nil {
if fields["checksum"] == "" {
fields["checksum"] = "unknown"
}
if err := pipe.HSet(ctx, "meta:models_meta", fields).Err(); err != nil {
return fmt.Errorf("write meta:models_meta: %w", err)
}
return nil