mirror of
https://github.com/EZ-Api/ez-api.git
synced 2026-01-13 17:47:51 +00:00
feat(model-registry): models.dev updater + admin endpoints
This commit is contained in:
@@ -2,16 +2,14 @@ package service
|
||||
|
||||
import (
|
||||
"context"
|
||||
"crypto/sha256"
|
||||
"encoding/hex"
|
||||
"fmt"
|
||||
"sort"
|
||||
"strings"
|
||||
"time"
|
||||
|
||||
"github.com/ez-api/ez-api/internal/model"
|
||||
groupx "github.com/ez-api/foundation/group"
|
||||
"github.com/ez-api/foundation/jsoncodec"
|
||||
"github.com/ez-api/foundation/modelcap"
|
||||
"github.com/ez-api/foundation/routing"
|
||||
"github.com/ez-api/foundation/tokenhash"
|
||||
"github.com/redis/go-redis/v9"
|
||||
@@ -120,17 +118,17 @@ func (s *SyncService) SyncProvider(provider *model.Provider) error {
|
||||
// SyncModel writes a single model metadata record.
|
||||
func (s *SyncService) SyncModel(m *model.Model) error {
|
||||
ctx := context.Background()
|
||||
snap := modelSnapshot{
|
||||
snap := modelcap.Model{
|
||||
Name: m.Name,
|
||||
Kind: normalizeModelKind(m.Kind),
|
||||
Kind: string(modelcap.NormalizeKind(m.Kind)),
|
||||
ContextWindow: m.ContextWindow,
|
||||
CostPerToken: m.CostPerToken,
|
||||
SupportsVision: m.SupportsVision,
|
||||
SupportsFunction: m.SupportsFunctions,
|
||||
SupportsToolChoice: m.SupportsToolChoice,
|
||||
SupportsFIM: m.SupportsFIM,
|
||||
SupportsFim: m.SupportsFIM,
|
||||
MaxOutputTokens: m.MaxOutputTokens,
|
||||
}
|
||||
}.Normalized()
|
||||
if err := s.hsetJSON(ctx, "meta:models", snap.Name, snap); err != nil {
|
||||
return err
|
||||
}
|
||||
@@ -159,18 +157,6 @@ type providerSnapshot struct {
|
||||
|
||||
// keySnapshot is no longer needed as we write directly to auth:token:*
|
||||
|
||||
type modelSnapshot struct {
|
||||
Name string `json:"name"`
|
||||
Kind string `json:"kind"`
|
||||
ContextWindow int `json:"context_window"`
|
||||
CostPerToken float64 `json:"cost_per_token"`
|
||||
SupportsVision bool `json:"supports_vision"`
|
||||
SupportsFunction bool `json:"supports_functions"`
|
||||
SupportsToolChoice bool `json:"supports_tool_choice"`
|
||||
SupportsFIM bool `json:"supports_fim"`
|
||||
MaxOutputTokens int `json:"max_output_tokens"`
|
||||
}
|
||||
|
||||
// SyncAll rebuilds Redis hashes from the database; use for cold starts or forced refreshes.
|
||||
func (s *SyncService) SyncAll(db *gorm.DB) error {
|
||||
ctx := context.Background()
|
||||
@@ -194,6 +180,7 @@ func (s *SyncService) SyncAll(db *gorm.DB) error {
|
||||
if err := db.Find(&models).Error; err != nil {
|
||||
return fmt.Errorf("load models: %w", err)
|
||||
}
|
||||
var modelsPayloads map[string]string
|
||||
|
||||
var bindings []model.Binding
|
||||
if err := db.Find(&bindings).Error; err != nil {
|
||||
@@ -292,29 +279,35 @@ func (s *SyncService) SyncAll(db *gorm.DB) error {
|
||||
}
|
||||
|
||||
for _, m := range models {
|
||||
snap := modelSnapshot{
|
||||
snap := modelcap.Model{
|
||||
Name: m.Name,
|
||||
Kind: normalizeModelKind(m.Kind),
|
||||
Kind: string(modelcap.NormalizeKind(m.Kind)),
|
||||
ContextWindow: m.ContextWindow,
|
||||
CostPerToken: m.CostPerToken,
|
||||
SupportsVision: m.SupportsVision,
|
||||
SupportsFunction: m.SupportsFunctions,
|
||||
SupportsToolChoice: m.SupportsToolChoice,
|
||||
SupportsFIM: m.SupportsFIM,
|
||||
SupportsFim: m.SupportsFIM,
|
||||
MaxOutputTokens: m.MaxOutputTokens,
|
||||
}
|
||||
}.Normalized()
|
||||
payload, err := jsoncodec.Marshal(snap)
|
||||
if err != nil {
|
||||
return fmt.Errorf("marshal model %s: %w", m.Name, err)
|
||||
}
|
||||
// Capture payloads so we can compute deterministic checksum for meta:models_meta.
|
||||
if modelsPayloads == nil {
|
||||
modelsPayloads = make(map[string]string, len(models))
|
||||
}
|
||||
modelsPayloads[snap.Name] = string(payload)
|
||||
pipe.HSet(ctx, "meta:models", snap.Name, payload)
|
||||
}
|
||||
|
||||
if err := writeModelsMeta(ctx, pipe, modelsMetaInput{
|
||||
Source: "db",
|
||||
Version: fmt.Sprintf("%d", time.Now().Unix()),
|
||||
UpdatedAtSec: time.Now().Unix(),
|
||||
Models: models,
|
||||
now := time.Now().Unix()
|
||||
if err := writeModelsMeta(ctx, pipe, modelcap.Meta{
|
||||
Version: fmt.Sprintf("%d", now),
|
||||
UpdatedAt: fmt.Sprintf("%d", now),
|
||||
Source: "db",
|
||||
Checksum: modelcap.ChecksumFromPayloads(modelsPayloads),
|
||||
}); err != nil {
|
||||
return err
|
||||
}
|
||||
@@ -469,36 +462,6 @@ func normalizeStatus(status string) string {
|
||||
}
|
||||
}
|
||||
|
||||
func normalizeModelKind(kind string) string {
|
||||
k := strings.ToLower(strings.TrimSpace(kind))
|
||||
if k == "" {
|
||||
return "chat"
|
||||
}
|
||||
switch k {
|
||||
case "chat", "embedding", "rerank", "other":
|
||||
return k
|
||||
default:
|
||||
return "other"
|
||||
}
|
||||
}
|
||||
|
||||
func checksumModelPayloads(payloads map[string]string) string {
|
||||
keys := make([]string, 0, len(payloads))
|
||||
for k := range payloads {
|
||||
keys = append(keys, k)
|
||||
}
|
||||
sort.Strings(keys)
|
||||
|
||||
h := sha256.New()
|
||||
for _, k := range keys {
|
||||
_, _ = h.Write([]byte(k))
|
||||
_, _ = h.Write([]byte{'\n'})
|
||||
_, _ = h.Write([]byte(payloads[k]))
|
||||
_, _ = h.Write([]byte{'\n'})
|
||||
}
|
||||
return hex.EncodeToString(h.Sum(nil))
|
||||
}
|
||||
|
||||
func (s *SyncService) refreshModelsMetaFromRedis(ctx context.Context, source string) error {
|
||||
raw, err := s.rdb.HGetAll(ctx, "meta:models").Result()
|
||||
if err != nil {
|
||||
@@ -509,7 +472,7 @@ func (s *SyncService) refreshModelsMetaFromRedis(ctx context.Context, source str
|
||||
"version": fmt.Sprintf("%d", now),
|
||||
"updated_at": fmt.Sprintf("%d", now),
|
||||
"source": source,
|
||||
"checksum": checksumModelPayloads(raw),
|
||||
"checksum": modelcap.ChecksumFromPayloads(raw),
|
||||
}
|
||||
if err := s.rdb.HSet(ctx, "meta:models_meta", meta).Err(); err != nil {
|
||||
return fmt.Errorf("write meta:models_meta: %w", err)
|
||||
@@ -517,47 +480,33 @@ func (s *SyncService) refreshModelsMetaFromRedis(ctx context.Context, source str
|
||||
return nil
|
||||
}
|
||||
|
||||
type modelsMetaInput struct {
|
||||
Source string
|
||||
Version string
|
||||
UpdatedAtSec int64
|
||||
Models []model.Model
|
||||
}
|
||||
|
||||
func writeModelsMeta(ctx context.Context, pipe redis.Pipeliner, in modelsMetaInput) error {
|
||||
payloads := make(map[string]string, len(in.Models))
|
||||
for _, m := range in.Models {
|
||||
snap := modelSnapshot{
|
||||
Name: m.Name,
|
||||
Kind: normalizeModelKind(m.Kind),
|
||||
ContextWindow: m.ContextWindow,
|
||||
CostPerToken: m.CostPerToken,
|
||||
SupportsVision: m.SupportsVision,
|
||||
SupportsFunction: m.SupportsFunctions,
|
||||
SupportsToolChoice: m.SupportsToolChoice,
|
||||
SupportsFIM: m.SupportsFIM,
|
||||
MaxOutputTokens: m.MaxOutputTokens,
|
||||
func writeModelsMeta(ctx context.Context, pipe redis.Pipeliner, meta modelcap.Meta) error {
|
||||
fields := map[string]string{
|
||||
"version": strings.TrimSpace(meta.Version),
|
||||
"updated_at": strings.TrimSpace(meta.UpdatedAt),
|
||||
"source": strings.TrimSpace(meta.Source),
|
||||
"checksum": strings.TrimSpace(meta.Checksum),
|
||||
"upstream_url": strings.TrimSpace(meta.UpstreamURL),
|
||||
"upstream_ref": strings.TrimSpace(meta.UpstreamRef),
|
||||
}
|
||||
for k, v := range fields {
|
||||
if v == "" {
|
||||
delete(fields, k)
|
||||
}
|
||||
b, err := jsoncodec.Marshal(snap)
|
||||
if err != nil {
|
||||
return fmt.Errorf("marshal model %s for meta: %w", m.Name, err)
|
||||
}
|
||||
payloads[snap.Name] = string(b)
|
||||
}
|
||||
|
||||
meta := map[string]string{
|
||||
"version": strings.TrimSpace(in.Version),
|
||||
"updated_at": fmt.Sprintf("%d", in.UpdatedAtSec),
|
||||
"source": strings.TrimSpace(in.Source),
|
||||
"checksum": checksumModelPayloads(payloads),
|
||||
if fields["version"] == "" {
|
||||
fields["version"] = fmt.Sprintf("%d", time.Now().Unix())
|
||||
}
|
||||
if strings.TrimSpace(meta["version"]) == "" {
|
||||
meta["version"] = fmt.Sprintf("%d", time.Now().Unix())
|
||||
if fields["updated_at"] == "" {
|
||||
fields["updated_at"] = fmt.Sprintf("%d", time.Now().Unix())
|
||||
}
|
||||
if strings.TrimSpace(meta["source"]) == "" {
|
||||
meta["source"] = "db"
|
||||
if fields["source"] == "" {
|
||||
fields["source"] = "db"
|
||||
}
|
||||
if err := pipe.HSet(ctx, "meta:models_meta", meta).Err(); err != nil {
|
||||
if fields["checksum"] == "" {
|
||||
fields["checksum"] = "unknown"
|
||||
}
|
||||
if err := pipe.HSet(ctx, "meta:models_meta", fields).Err(); err != nil {
|
||||
return fmt.Errorf("write meta:models_meta: %w", err)
|
||||
}
|
||||
return nil
|
||||
|
||||
Reference in New Issue
Block a user