Add two complementary features to reduce remote revision cache staleness:

1. Smart local cache: When the current system revision matches the cached remote revision, force an immediate cache refresh to check for newer revisions.
2. NATS integration: Share cache updates across hosts via NATS pub/sub. Hosts publish revision updates when they fetch new data, and subscribe to receive updates from other hosts.

Features include:
- Auto-reconnect with infinite retries
- Graceful fallback when NATS is unavailable
- Filtering by flake URL and hostname

New CLI flags:
- --flake.nats.enable
- --flake.nats.url
- --flake.nats.subject
- --flake.nats.credentials-file

New NixOS module options under services.prometheus.exporters.nixos.flake.nats

Bumps version to 0.3.0.

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
101 lines
2.7 KiB
Go
101 lines
2.7 KiB
Go
package main
|
|
|
|
import (
|
|
"context"
|
|
"log/slog"
|
|
"net/http"
|
|
"os"
|
|
"os/signal"
|
|
"syscall"
|
|
"time"
|
|
|
|
"git.t-juice.club/torjus/nixos-exporter/collector"
|
|
"git.t-juice.club/torjus/nixos-exporter/config"
|
|
"github.com/prometheus/client_golang/prometheus"
|
|
"github.com/prometheus/client_golang/prometheus/promhttp"
|
|
)
|
|
|
|
// version is the exporter's version string; main includes it in the
// "Starting server" log line.
const version = "0.3.0"
|
|
|
|
func main() {
|
|
cfg, err := config.Parse()
|
|
if err != nil {
|
|
slog.Error("Failed to parse config", "error", err)
|
|
os.Exit(1)
|
|
}
|
|
|
|
// Register generation collector
|
|
genCollector := collector.NewGenerationCollector()
|
|
prometheus.MustRegister(genCollector)
|
|
slog.Info("Registered generation collector")
|
|
|
|
// Register flake collector if enabled
|
|
var flakeCollector *collector.FlakeCollector
|
|
if cfg.FlakeCollector {
|
|
var err error
|
|
flakeCollector, err = collector.NewFlakeCollectorWithNATS(collector.FlakeCollectorConfig{
|
|
FlakeURL: cfg.FlakeURL,
|
|
CheckInterval: cfg.FlakeCheckInterval,
|
|
NATSEnabled: cfg.FlakeNATSEnable,
|
|
NATSURL: cfg.FlakeNATSURL,
|
|
NATSSubject: cfg.FlakeNATSSubject,
|
|
NATSCredentialsFile: cfg.FlakeNATSCredentialsFile,
|
|
})
|
|
if err != nil {
|
|
slog.Error("Failed to create flake collector", "error", err)
|
|
os.Exit(1)
|
|
}
|
|
prometheus.MustRegister(flakeCollector)
|
|
slog.Info("Registered flake collector", "url", cfg.FlakeURL, "check_interval", cfg.FlakeCheckInterval, "nats_enabled", cfg.FlakeNATSEnable)
|
|
}
|
|
|
|
mux := http.NewServeMux()
|
|
mux.Handle("/metrics", promhttp.Handler())
|
|
mux.HandleFunc("/", func(w http.ResponseWriter, r *http.Request) {
|
|
_, _ = w.Write([]byte(`<html>
|
|
<head><title>NixOS Exporter</title></head>
|
|
<body>
|
|
<h1>NixOS Exporter</h1>
|
|
<p><a href="/metrics">Metrics</a></p>
|
|
</body>
|
|
</html>`))
|
|
})
|
|
|
|
server := &http.Server{
|
|
Addr: cfg.ListenAddr,
|
|
Handler: mux,
|
|
ReadTimeout: 10 * time.Second,
|
|
WriteTimeout: 10 * time.Second,
|
|
IdleTimeout: 60 * time.Second,
|
|
}
|
|
|
|
// Handle shutdown gracefully
|
|
ctx, stop := signal.NotifyContext(context.Background(), syscall.SIGINT, syscall.SIGTERM)
|
|
defer stop()
|
|
|
|
go func() {
|
|
slog.Info("Starting server", "version", version, "addr", cfg.ListenAddr)
|
|
if err := server.ListenAndServe(); err != nil && err != http.ErrServerClosed {
|
|
slog.Error("Server error", "error", err)
|
|
os.Exit(1)
|
|
}
|
|
}()
|
|
|
|
<-ctx.Done()
|
|
slog.Info("Shutting down server")
|
|
|
|
// Close flake collector (NATS connection)
|
|
if flakeCollector != nil {
|
|
if err := flakeCollector.Close(); err != nil {
|
|
slog.Error("Failed to close flake collector", "error", err)
|
|
}
|
|
}
|
|
|
|
shutdownCtx, cancel := context.WithTimeout(context.Background(), 5*time.Second)
|
|
defer cancel()
|
|
|
|
if err := server.Shutdown(shutdownCtx); err != nil {
|
|
slog.Error("Failed to shutdown server", "error", err)
|
|
}
|
|
}
|