feat(api): add internal alerts reporting endpoint with deduplication

Add ReportAlerts endpoint for Data Plane to report alerts to Control Plane
with fingerprint-based deduplication using a 5-minute cooldown period.

Changes:
- Add POST /internal/alerts/report endpoint with validation
- Add Fingerprint field to Alert model for deduplication
- Extend GetAPIKeyStatsSummary with optional time range filtering
  using since/until query parameters to query from log records
This commit is contained in:
zenfun
2025-12-31 14:18:09 +08:00
parent 71f7578c7b
commit bfba16bbd4
4 changed files with 208 additions and 1 deletions

View File

@@ -1,6 +1,7 @@
package api
import (
"fmt"
"net/http"
"strings"
"time"
@@ -251,3 +252,131 @@ func (h *InternalHandler) FlushAPIKeyStats(c *gin.Context) {
c.JSON(http.StatusOK, gin.H{"updated": updated, "groups_updated": groupsUpdated})
}
// Alert reporting types

// reportAlertEntry is the JSON shape of a single alert inside a report
// request. Type, Severity and Title carry a "required" binding tag; the
// remaining fields are optional.
type reportAlertEntry struct {
	// Classification and headline of the alert.
	Type     string `json:"type" binding:"required"`
	Severity string `json:"severity" binding:"required"`
	Title    string `json:"title" binding:"required"`
	Message  string `json:"message"`

	// Optional reference to the entity the alert is about.
	RelatedID   uint   `json:"related_id"`
	RelatedType string `json:"related_type"`
	RelatedName string `json:"related_name"`

	// Fingerprint is the deduplication key supplied by the reporter.
	Fingerprint string `json:"fingerprint"`
	// Metadata is carried as an opaque string.
	Metadata string `json:"metadata"`
}
// reportAlertsRequest is the JSON body accepted by ReportAlerts: a batch of
// alert entries under the "alerts" key, which must be present.
type reportAlertsRequest struct {
	Alerts []reportAlertEntry `json:"alerts" binding:"required"`
}
// reportAlertsResponse is the JSON body returned by ReportAlerts. It tallies
// how the entries of the batch were handled.
type reportAlertsResponse struct {
	// Accepted is the number of alerts that were stored.
	Accepted int `json:"accepted"`
	// Deduplicated is the number of alerts skipped as duplicates.
	Deduplicated int `json:"deduplicated"`
	// Errors holds one message per entry that was rejected or failed.
	Errors []string `json:"errors"`
}
// alertDeduplicationCooldown is the look-back window used for alert
// deduplication: an active alert with the same fingerprint created within
// this window makes a newly reported alert count as a duplicate.
const alertDeduplicationCooldown time.Duration = 5 * time.Minute
// ReportAlerts godoc
//
// ReportAlerts stores a batch of alerts reported by the Data Plane. Entries
// are processed independently: an entry with an unknown type or severity, an
// empty title, or a database failure is recorded in the response's "errors"
// list and does not abort the rest of the batch. An entry whose fingerprint
// matches an active alert created within alertDeduplicationCooldown is
// counted as deduplicated and not stored. When no fingerprint is supplied
// and related_type is set, a fingerprint of the form
// "<type>:<related_type>:<related_id>" is derived.
//
// The handler answers 500 when no database is configured, 400 when the body
// cannot be bound, and 200 with a reportAlertsResponse otherwise.
//
// @Summary Report alerts from DP
// @Description Internal endpoint for Data Plane to report alerts to Control Plane
// @Tags internal
// @Accept json
// @Produce json
// @Param request body reportAlertsRequest true "Alerts to report"
// @Success 200 {object} reportAlertsResponse
// @Failure 400 {object} gin.H
// @Failure 500 {object} gin.H
// @Router /internal/alerts/report [post]
func (h *InternalHandler) ReportAlerts(c *gin.Context) {
	if h == nil || h.db == nil {
		c.JSON(http.StatusInternalServerError, gin.H{"error": "database not configured"})
		return
	}

	var req reportAlertsRequest
	if err := c.ShouldBindJSON(&req); err != nil {
		c.JSON(http.StatusBadRequest, gin.H{"error": "invalid request body", "details": err.Error()})
		return
	}

	// Start from an empty, non-nil slice so "errors" is always encoded as a
	// JSON array (never null), on every response path.
	errs := []string{}

	if len(req.Alerts) == 0 {
		c.JSON(http.StatusOK, reportAlertsResponse{Accepted: 0, Deduplicated: 0, Errors: errs})
		return
	}

	// Valid alert types and severities
	validTypes := map[string]bool{
		"rate_limit": true, "error_spike": true, "quota_exceeded": true,
		"key_disabled": true, "key_expired": true, "provider_down": true,
	}
	validSeverities := map[string]bool{"info": true, "warning": true, "critical": true}

	accepted := 0
	deduplicated := 0

	// Alerts created before this instant no longer suppress new reports.
	cooldownTime := time.Now().UTC().Add(-alertDeduplicationCooldown)

	for i, entry := range req.Alerts {
		// Validate type
		if !validTypes[entry.Type] {
			errs = append(errs, fmt.Sprintf("alert %d: invalid type '%s'", i, entry.Type))
			continue
		}

		// Validate severity
		if !validSeverities[entry.Severity] {
			errs = append(errs, fmt.Sprintf("alert %d: invalid severity '%s'", i, entry.Severity))
			continue
		}

		// The "required" binding tag on the entry's title is not applied to
		// slice elements (the request field has no "dive" tag), so enforce
		// it here, per entry, like the other validations.
		title := strings.TrimSpace(entry.Title)
		if title == "" {
			errs = append(errs, fmt.Sprintf("alert %d: title is required", i))
			continue
		}

		// Trim once and use the same value for both the stored column and
		// the derived fingerprint, so they can never disagree.
		relatedType := strings.TrimSpace(entry.RelatedType)

		// Generate fingerprint if not provided
		fingerprint := strings.TrimSpace(entry.Fingerprint)
		if fingerprint == "" && relatedType != "" {
			fingerprint = fmt.Sprintf("%s:%s:%d", entry.Type, relatedType, entry.RelatedID)
		}

		// Check for deduplication if fingerprint is present
		if fingerprint != "" {
			var existingCount int64
			err := h.db.Model(&model.Alert{}).
				Where("fingerprint = ? AND status = ? AND created_at >= ?", fingerprint, model.AlertStatusActive, cooldownTime).
				Count(&existingCount).Error
			if err != nil {
				// Without a reliable count we cannot tell whether this is a
				// duplicate; report the failure instead of inserting blindly.
				errs = append(errs, fmt.Sprintf("alert %d: failed to check for duplicates - %s", i, err.Error()))
				continue
			}
			if existingCount > 0 {
				deduplicated++
				continue
			}
		}

		// Create the alert
		alert := model.Alert{
			Type:        model.AlertType(entry.Type),
			Severity:    model.AlertSeverity(entry.Severity),
			Status:      model.AlertStatusActive,
			Title:       title,
			Message:     strings.TrimSpace(entry.Message),
			RelatedID:   entry.RelatedID,
			RelatedType: relatedType,
			RelatedName: strings.TrimSpace(entry.RelatedName),
			Fingerprint: fingerprint,
			Metadata:    entry.Metadata,
		}
		if err := h.db.Create(&alert).Error; err != nil {
			errs = append(errs, fmt.Sprintf("alert %d: failed to create - %s", i, err.Error()))
			continue
		}
		accepted++
	}

	c.JSON(http.StatusOK, reportAlertsResponse{
		Accepted:     accepted,
		Deduplicated: deduplicated,
		Errors:       errs,
	})
}