feat(alerts): Health-Alarme via Webhook + Email-SMTP

Sidebar → System → Alarme.

Migration 0021: alert_channels (kind=webhook|email, target, settings,
active) + alert_events (kind, severity=info/warning/error/critical,
subject, message, sent_to JSONB).

internal/services/alerts/:
  - Fire(kind, severity, subject, message) — broadcastet an alle
    aktiven Channels + persistiert Event mit per-Channel-Result
    (ok/error) in sent_to.
  - Webhook-Sender: POST JSON {kind, severity, subject, message,
    content, text, fired_at}. Slack/Discord/Teams akzeptieren das
    out-of-the-box ohne Adapter (content + text-Felder gleichzeitig).
  - Email-Sender: net/smtp + STARTTLS optional. Settings (smtp_host,
    smtp_port, username/password, from, use_tls) liegen in
    channel.settings JSONB.

internal/handlers/alerts.go: CRUD + POST /alerts/test + GET
/alerts/events (history).

Scheduler-Trigger:
  - cert.expiring  — TLS-Cert <14 Tage Restzeit (12h-dedupe pro cert)
                     severity warning, <3 Tage → error
  - cert.renew_failed       — Renewer-Cycle hat fails
  - cert.renewer.run_failed — Renewer-Cycle abgebrochen
  - backup.failed  — Scheduled Backup error
  - license.invalid — License-Server liefert valid=false

In-process Dedupe (12h TTL, map[key]time.Time) verhindert dass
identische Alerts in Schleifen feuern.

UI (pages/Alerts): Tabs Channels (CRUD-Tabelle, Add-Modal mit
conditional-Email-Fields) + History (200 letzte Events mit
severity-Tag + per-Channel-Delivery-Status). Header-Button
„Test-Alert" feuert einen Test-Event in alle aktiven Channels.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
This commit is contained in:
Debian
2026-05-13 15:57:05 +02:00
parent 4a34629023
commit 81a8217493
13 changed files with 1012 additions and 14 deletions

134
internal/handlers/alerts.go Normal file
View File

@@ -0,0 +1,134 @@
package handlers
import (
"errors"
"strconv"
"github.com/gin-gonic/gin"
"git.netcell-it.de/projekte/edgeguard-native/internal/handlers/response"
"git.netcell-it.de/projekte/edgeguard-native/internal/services/alerts"
"git.netcell-it.de/projekte/edgeguard-native/internal/services/audit"
)
// AlertsHandler exposes:
//
// GET /api/v1/alerts/channels
// POST /api/v1/alerts/channels
// PUT /api/v1/alerts/channels/:id
// DELETE /api/v1/alerts/channels/:id
// POST /api/v1/alerts/test — Test-Event in alle aktiven Channels
// GET /api/v1/alerts/events?limit=N — History
type AlertsHandler struct {
Service *alerts.Service
Audit *audit.Repo
NodeID string
}
func NewAlertsHandler(s *alerts.Service, a *audit.Repo, nodeID string) *AlertsHandler {
return &AlertsHandler{Service: s, Audit: a, NodeID: nodeID}
}
func (h *AlertsHandler) Register(rg *gin.RouterGroup) {
g := rg.Group("/alerts")
g.GET("/channels", h.ListChannels)
g.POST("/channels", h.CreateChannel)
g.PUT("/channels/:id", h.UpdateChannel)
g.DELETE("/channels/:id", h.DeleteChannel)
g.POST("/test", h.TestFire)
g.GET("/events", h.ListEvents)
}
func (h *AlertsHandler) ListChannels(c *gin.Context) {
out, err := h.Service.ListChannels(c.Request.Context())
if err != nil {
response.Internal(c, err)
return
}
response.OK(c, gin.H{"channels": out})
}
func (h *AlertsHandler) CreateChannel(c *gin.Context) {
var req alerts.Channel
if err := c.ShouldBindJSON(&req); err != nil {
response.BadRequest(c, err)
return
}
out, err := h.Service.CreateChannel(c.Request.Context(), req)
if err != nil {
response.Internal(c, err)
return
}
_ = h.Audit.Log(c.Request.Context(), actorOf(c), "alert.channel.create",
out.Name, out, h.NodeID)
response.Created(c, out)
}
func (h *AlertsHandler) UpdateChannel(c *gin.Context) {
id, ok := parseID(c)
if !ok {
return
}
var req alerts.Channel
if err := c.ShouldBindJSON(&req); err != nil {
response.BadRequest(c, err)
return
}
out, err := h.Service.UpdateChannel(c.Request.Context(), id, req)
if err != nil {
if errors.Is(err, alerts.ErrNotFound) {
response.NotFound(c, err)
return
}
response.Internal(c, err)
return
}
_ = h.Audit.Log(c.Request.Context(), actorOf(c), "alert.channel.update",
out.Name, out, h.NodeID)
response.OK(c, out)
}
func (h *AlertsHandler) DeleteChannel(c *gin.Context) {
id, ok := parseID(c)
if !ok {
return
}
if err := h.Service.DeleteChannel(c.Request.Context(), id); err != nil {
if errors.Is(err, alerts.ErrNotFound) {
response.NotFound(c, err)
return
}
response.Internal(c, err)
return
}
_ = h.Audit.Log(c.Request.Context(), actorOf(c), "alert.channel.delete",
strconv.FormatInt(id, 10), gin.H{"id": id}, h.NodeID)
response.NoContent(c)
}
func (h *AlertsHandler) TestFire(c *gin.Context) {
ev, err := h.Service.Fire(c.Request.Context(), "test", alerts.SeverityInfo,
"EdgeGuard-Test-Alert",
"Dies ist ein Test-Event. Wenn du das siehst, funktionieren deine Alert-Channels.")
if err != nil {
response.Internal(c, err)
return
}
_ = h.Audit.Log(c.Request.Context(), actorOf(c), "alert.test", "test", ev, h.NodeID)
response.OK(c, ev)
}
func (h *AlertsHandler) ListEvents(c *gin.Context) {
limit := 100
if v := c.Query("limit"); v != "" {
if n, err := strconv.Atoi(v); err == nil {
limit = n
}
}
out, err := h.Service.ListEvents(c.Request.Context(), limit)
if err != nil {
response.Internal(c, err)
return
}
response.OK(c, gin.H{"events": out})
}