fix(tui): bump Subtle ANSI fallback from "8" to "7"

Bright black ("8") plus Faint made PENDING status and dividers nearly invisible in 16-color terminals. White ("7") with Faint renders as a readable dim gray while still sitting below Muted in the hierarchy.
feat(tui): add monochrome emphasis attributes for SSH readability
2026-06-19 17:27:54 -04:00 · 2026-06-19 17:27:54 -04:00 · 2026-06-19 17:27:54 -04:00 · 2026-06-17 17:26:16 -04:00 · 2026-06-17 14:00:05 -04:00 · 2026-06-16 20:32:41 -04:00
79 changed files with 4181 additions and 2455 deletions
@@ -10,3 +10,5 @@ vendor/
 *.local
 .env
 .github/
 dist/
 uptop
@@ -65,7 +65,7 @@ jobs:
          go-version: "1.26"
      - name: Install govulncheck
-        run: go install golang.org/x/vuln/cmd/govulncheck@latest
+        run: go install golang.org/x/vuln/cmd/govulncheck@v1.1.4
      - name: Run govulncheck
        run: govulncheck ./...
@@ -3,7 +3,7 @@ name: Release Binaries
 on:
  push:
    tags:
-      - "[0-9]*"
+      - "v[0-9]*"
 jobs:
  release:
@@ -13,7 +13,7 @@ jobs:
        shell: sh
    steps:
      - name: Install build tools
-        run: apk add --no-cache git gcc musl-dev
+        run: apk add --no-cache git
      - uses: actions/checkout@v4
        with:
@@ -33,8 +33,8 @@ jobs:
      - name: Install git-cliff
        run: |
-          apk add --no-cache curl jq
+          apk add --no-cache curl
-          VERSION=$(curl -sS https://api.github.com/repos/orhun/git-cliff/releases/latest | jq -r '.tag_name' | sed 's/^v//')
+          VERSION=2.13.1
          curl -sSL "https://github.com/orhun/git-cliff/releases/download/v${VERSION}/git-cliff-${VERSION}-x86_64-unknown-linux-musl.tar.gz" | tar xz -C /tmp
          mv /tmp/git-cliff-*/git-cliff /usr/local/bin/
          git-cliff --version
@@ -49,6 +49,11 @@ jobs:
          version: "~> v2"
          args: release --clean --release-notes=/tmp/release-notes.md
        env:
          GORELEASER_CURRENT_TAG: ${{ github.ref_name }}
          GORELEASER_FORCE_TOKEN: gitea
          GITEA_TOKEN: ${{ secrets.RELEASE_TOKEN }}
          GITEA_API_URL: http://gitea:3000/api/v1
      # GitHub release relaying is handled by .github/workflows/mirror-release.yml,
      # which runs on GitHub Actions when the push mirror delivers the tag and
      # copies this run's Gitea release assets — no PAT needed on this side.
@@ -3,11 +3,11 @@ name: Release Docker
 on:
  push:
    tags:
-      - "[0-9]*"
+      - "v[0-9]*"
  workflow_dispatch:
    inputs:
      tag:
-        description: "Image tag (e.g. 2026.06.1). Defaults to latest commit SHA."
+        description: "Image tag (e.g. 1.0.0, no v prefix). Defaults to latest commit SHA."
        required: false
 jobs:
@@ -27,10 +27,23 @@ jobs:
              TAG="${{ github.sha }}"
            fi
          else
            # Docker convention: git tag v1.2.3 -> image tag 1.2.3
            TAG="${{ github.ref_name }}"
            TAG="${TAG#v}"
          fi
          echo "tag=$TAG" >> "$GITHUB_OUTPUT"
          TAGS="lerkolabs/uptop:${TAG}"
          TAGS="${TAGS},lerkolabs/uptop:sha-${SHORT_SHA}"
          # :latest only for real releases — rc rehearsal tags must not move it
          if [ "${{ github.ref_type }}" = "tag" ]; then
            case "$TAG" in
              *-*) ;;
              *) TAGS="${TAGS},lerkolabs/uptop:latest" ;;
            esac
          fi
          echo "tags=$TAGS" >> "$GITHUB_OUTPUT"
      - name: Set up QEMU
        uses: docker/setup-qemu-action@v3
@@ -43,6 +56,26 @@ jobs:
          username: ${{ secrets.DOCKERHUB_USERNAME }}
          password: ${{ secrets.DOCKERHUB_TOKEN }}
      # Scan must gate the push: build amd64 locally, scan it, and only then run
      # the multi-arch push (amd64 layers come from the builder cache, so the
      # second build only adds the arm64 work).
      - name: Build for scan (amd64, local)
        uses: docker/build-push-action@v5
        with:
          context: .
          load: true
          platforms: linux/amd64
          tags: uptop-scan:${{ steps.meta.outputs.tag }}
          build-args: |
            VERSION=${{ steps.meta.outputs.tag }}
            COMMIT=${{ github.sha }}
            BUILD_DATE=${{ github.event.head_commit.timestamp }}
      - name: Scan image for CVEs
        run: |
          curl -sSfL https://raw.githubusercontent.com/anchore/grype/main/install.sh | sh -s -- -b /usr/local/bin v0.114.0
          grype uptop-scan:${{ steps.meta.outputs.tag }} --fail-on critical --output table
      - name: Build and push
        uses: docker/build-push-action@v5
        with:
@@ -51,20 +84,12 @@ jobs:
          platforms: linux/amd64,linux/arm64
          sbom: true
          provenance: mode=max
-          tags: |
+          tags: ${{ steps.meta.outputs.tags }}
            lerkolabs/uptop:${{ steps.meta.outputs.tag }}
            lerkolabs/uptop:latest
            lerkolabs/uptop:sha-${{ steps.meta.outputs.short_sha }}
          build-args: |
            VERSION=${{ steps.meta.outputs.tag }}
            COMMIT=${{ github.sha }}
            BUILD_DATE=${{ github.event.head_commit.timestamp }}
      - name: Scan image for CVEs
        run: |
          curl -sSfL https://raw.githubusercontent.com/anchore/grype/main/install.sh | sh -s -- -b /usr/local/bin
          grype lerkolabs/uptop:${{ steps.meta.outputs.tag }} --fail-on critical --output table || echo "::warning::CVE scan found critical issues — review output above"
      - name: Update Docker Hub description
        uses: peter-evans/dockerhub-description@v4
        with:
@@ -75,5 +100,7 @@ jobs:
      - name: Cleanup Docker artifacts
        if: always()
        run: |
          # the scan image is tagged, so image prune won't catch it
          docker image rm "uptop-scan:${{ steps.meta.outputs.tag }}" 2>/dev/null || true
          docker image prune -f
          docker builder prune -f --keep-storage=2GB
@@ -3,7 +3,7 @@ name: Mirror Release to GitHub
 on:
  push:
    tags:
-      - "[0-9]*"
+      - "v[0-9]*"
 permissions:
  contents: write
@@ -19,26 +19,35 @@ jobs:
        run: |
          API="https://gitea.lerkolabs.com/api/v1/repos/lerkolabs/uptop/releases/tags/${TAG}"
-          for i in $(seq 1 20); do
+          # 40 x 30s = 20 min: the Gitea release can queue behind the ~18-min
          # Docker job on the single runner. Asset count must hold steady for
          # two consecutive polls — GoReleaser uploads one file at a time, and
          # mirroring mid-upload would publish a partial asset set.
          PREV_COUNT=0
          ASSET_COUNT=0
          for i in $(seq 1 40); do
            if RESPONSE=$(curl -sf "$API" 2>/dev/null); then
              ASSET_COUNT=$(echo "$RESPONSE" | jq '.assets | length')
-              if [ "$ASSET_COUNT" -gt 0 ]; then
+              if [ "$ASSET_COUNT" -gt 0 ] && [ "$ASSET_COUNT" -eq "$PREV_COUNT" ]; then
-                echo "Found release with $ASSET_COUNT assets"
+                echo "Found release with $ASSET_COUNT assets (stable)"
                break
              fi
-              echo "Release exists but no assets yet... attempt $i/20"
+              echo "Release has $ASSET_COUNT assets (was $PREV_COUNT)... attempt $i/40"
              PREV_COUNT="$ASSET_COUNT"
            else
-              echo "Waiting for Gitea release... attempt $i/20"
+              echo "Waiting for Gitea release... attempt $i/40"
            fi
            sleep 30
          done
          if [ -z "$RESPONSE" ] || [ "$ASSET_COUNT" -eq 0 ]; then
-            echo "::error::Gitea release for ${TAG} not found or has no assets after 10 minutes"
+            echo "::error::Gitea release for ${TAG} not found or has no assets after 20 minutes"
            exit 1
          fi
-          echo "$RESPONSE" | jq -r '.body // empty' > /tmp/release-notes.md
+          # select() so an empty-string body produces an empty file — `// empty`
          # treats "" as truthy and wrote a blank line, defeating this fallback.
          echo "$RESPONSE" | jq -r '.body | select(. != null and . != "")' > /tmp/release-notes.md
          if [ ! -s /tmp/release-notes.md ]; then
            echo "Release ${TAG} from [Gitea](https://gitea.lerkolabs.com/lerkolabs/uptop/releases/tag/${TAG})" > /tmp/release-notes.md
@@ -62,8 +71,11 @@ jobs:
          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
          TAG: ${{ github.ref_name }}
        run: |
          PRERELEASE=""
          case "$TAG" in *-*) PRERELEASE="--prerelease" ;; esac
          gh release create "$TAG" \
            --repo "$GITHUB_REPOSITORY" \
            --title "$TAG" \
            --notes-file /tmp/release-notes.md \
            $PRERELEASE \
            /tmp/assets/*
@@ -8,16 +8,20 @@ release:
  gitea:
    owner: lerkolabs
    name: uptop
  prerelease: auto
 builds:
-  - main: ./cmd/uptop/main.go
+  - main: ./cmd/uptop
    binary: uptop
    env:
-      - CGO_ENABLED=1
+      - CGO_ENABLED=0
    goos:
      - linux
      - darwin
      - windows
    goarch:
      - amd64
      - arm64
    ldflags:
      - -s -w
      - -X main.version={{ .Version }}
@@ -29,6 +33,9 @@ builds:
 archives:
  - formats: [tar.gz]
    name_template: "{{ .ProjectName }}_{{ .Os }}_{{ .Arch }}"
    format_overrides:
      - goos: windows
        formats: [zip]
 checksum:
  name_template: checksums.txt
@@ -52,22 +59,7 @@ nfpms:
        dst: /usr/share/doc/uptop/LICENSE
        type: doc
-homebrew_casks:
+# Changelog generation must stay enabled: the --release-notes flag is consumed
-  - name: uptop
+# by the changelog pipe, so disabling it silently drops the git-cliff notes
-    homepage: https://gitea.lerkolabs.com/lerkolabs/uptop
+# (empty release body on v0.1.0-rc.1). With --release-notes set, GoReleaser
-    description: Self-hosted uptime monitoring with a TUI over SSH
+# skips its own generation and uses the file.
    directory: Casks
    skip_upload: true
    commit_msg_template: "update uptop to {{ .Tag }}"
    url:
      template: "https://gitea.lerkolabs.com/lerkolabs/uptop/releases/download/{{ .Tag }}/{{ .ArtifactName }}"
    repository:
      owner: lerkolabs
      name: homebrew-tap
      git:
        url: "ssh://git@gitea.lerkolabs.com:2222/lerkolabs/homebrew-tap.git"
        private_key: "{{ if index .Env \"TAP_SSH_KEY\" }}{{ .Env.TAP_SSH_KEY }}{{ end }}"
        ssh_command: "ssh -o StrictHostKeyChecking=accept-new"
 changelog:
  disable: true
@@ -0,0 +1,11 @@
 ignore:
  # SCP path traversal in charmbracelet/wish — same flaw, two ids: grype has
  # matched it as CVE-2026-41589 and as GHSA-xjvp-7243-rg9h depending on db
  # version, and ignore matching is exact-id, so both stay listed.
  # We only import wish/bubbletea for the SSH TUI server — the vulnerable
  # scp.Middleware / scp.NewFileSystemHandler symbols are never compiled in
  # (govulncheck reachability agrees). No fix for wish v1; v2
  # (charm.land/wish/v2 >= 2.0.1) requires the bubbletea-v2 stack migration,
  # tracked in issue #126. Remove both entries when that lands.
  - vulnerability: CVE-2026-41589
  - vulnerability: GHSA-xjvp-7243-rg9h
@@ -1,129 +1,183 @@
 # Changelog
-## [2026.06.2] — 2026-06-02 (infrastructure)
+## [Unreleased]
 ### Added
 - initial commit — uptime monitor (forked from go-upkeep)
 - enhanced dashboard with lipgloss tables, huh forms, mouse support, and animations
 - upgrade users tab with lipgloss table, edit support, role select
 - upgrade alerts tab with lipgloss table, click zones, colored types
 - widen Site struct and DB schema for ping, port, dns, group monitor types
 - add ping, port, and DNS check routines
 - add ntfy notification provider with TUI support
 - add Uptime Kuma backup converter with CLI and API
 - add mouse wheel scrolling for all tabs
 - add per-site pause, fix viewport, polish status page
 - add monitor groups with collapse/expand and tree view
 - add Telegram, PagerDuty, Pushover, Gotify providers
 - add Prometheus /metrics endpoint
 - expose HTTP method and accepted status codes in monitor form
 - add config-as-code YAML import/export
 - add distributed probing foundation — schema, models, and probe APIs
 - add probe execution mode, check extraction, and result aggregation
 - add region affinity, Nodes TUI tab, and probe metrics
 - add status bar, tab badges, and detail panel
 - bordered modals, welcome state, and dynamic name width
 - DOWN-first sort, health pulse, and site filter
 - split available width evenly between NAME and HISTORY columns
 - add type icons to sites table
 - persist logs to DB, load on startup
 - add incident management and maintenance windows
 - zebra striping, detail breadcrumb, sparkline stats, collapse persistence
 - add --version flag with build metadata injection
 - add theme system with 4 curated palettes
 - swap light theme for Tokyo Night and Gruvbox
 - seed SSH users from env var and authorized_keys file (#31)
 - show error reason when monitors go DOWN
 - proper push monitor lifecycle — PENDING, LATE, DOWN states
 - logs tab overhaul — severity tags, filtering, recovery durations
 - alert channel health indicator + test alerts
 - add GitHub release relay workflow
 - classify error reasons on DOWN monitors
 - add state change history view with outage duration
 - add Opsgenie provider
 - add STALE state for push monitors
 - add SLA reporting view
 - overhaul latency sparkline scaling, color, and layout
 - auto-prune expired maintenance windows
 - click-to-inspect sparkline tooltips in detail view
 ### Changed
- Split release pipeline into separate binary and Docker workflows (#45)
+
- Pin Docker base images by digest (#45)
+- replace database ID column with row counter
- Add GitHub release relay — mirrors Gitea releases to GitHub (#49)
+- unify SQLite and Postgres into dialect-based SQLStore
- Add Grype CVE scanning to Docker pipeline (#45)
+- add error returns to all Store interface methods
- Make CVE scan non-blocking for non-exploitable wish SCP vulnerability (#48)
+- remove store global singleton, thread store explicitly
 - extract shared HTTPProvider for webhook-based alerts
 - extract shared table rendering, fix cursor bounds
 - encapsulate engine state, add graceful shutdown and tests
 - split release pipeline, add nfpm/homebrew/git-cliff
 - decompose god files into single-concern modules
 - consistent chrome across all views
 - status icons, clean STATUS column, relative time
 - extract magic numbers into named constants
 - check all discarded errors in sqlstore_test.go
 - overhaul tab bar — consistent counts, active highlight, colored alerts
 - responsive column hiding — 3-tier priority-based layout
 - swap mattn/go-sqlite3 for modernc.org/sqlite
 - propagate context.Context through all Store methods
 - typed Status constants with IsBroken() predicate
 - schema_version migration table + DeleteAlert FK fix
 - shared storetest.BaseMock replaces 5 duplicated mocks
 - consolidate env parsing into appConfig struct
 - extract Server type with named handler methods
 - split Site into SiteConfig + SiteState
 - unify logging with log/slog
 - restructure site form to 2 type-aware pages
 ### Fixed
 - git-cliff install in CI — resolve download URL dynamically, extract to /tmp (#46, #47)
-## [2026.06.1] — 2026-06-01
+- forward all msg types to huh forms, improve row selection UX
 - harden TLS, timeouts, validation, logging, and token generation
 - add delete confirm, input validation, XSS fix, history persistence
 - correctness and robustness fixes across all subsystems
 - make status bar and tab badges visible
 - use stable sort to prevent site list shuffling each tick
 - sort children by ID before status to prevent map-order shuffling
 - sparkline now spans full column width
 - sparkline right-aligned — current time at right edge, dots fill left
 - increase history buffer to 60 so sparkline fills completely
 - compute uptime from windowed statuses, not running counters
 - seed status and latency from DB history on startup
 - strip push tokens from /status/json response
 - correct viewport sizing and dynamic chrome calculation
 - constrain form height to terminal and forward resize events
 - skip children in maintenance when computing group status
 - exclude maintenance'd monitors from down count and pulse
 - group selection highlight, layout constants, group history graphs
 - stable monitor count and universal group icons
 - replace panic with error return, handle unmarshal errors
 - add context to Provider.Send, log alert failures
 - constant-time secret comparison, request size limits
 - graceful shutdown for HTTP, SSH servers and database
 - add jitter to check intervals and stagger startup
 - use sh instead of bash for runner compatibility
 - enable CGO for race detector, use lint-action v7
 - install gcc for race detector support
 - skip irrelevant field validation by monitor type
 - guard max retries validator for group type
 - tighten zebra row contrast for Tokyo Night and Gruvbox
 - phase 1 critical fixes for public release
 - phase 2 high-severity hardening
 - phase 3 medium reliability and hardening
 - phase 4 code quality and low-severity fixes
 - rename GITEA_TOKEN to RELEASE_TOKEN
 - remove explicit container, use sh shell
 - bump golang.org/x/crypto v0.47.0 → v0.52.0
 - install git and gcc for GoReleaser in release pipeline
 - use internal Gitea URL for GoReleaser API calls
 - use docker-builder runner for Docker image builds
 - patch Docker Scout CVEs and remove unused openssh-client (#41)
 - non-root user, supply chain attestations, build cleanup
 - move SSH host key path into /data for non-root user
 - create .ssh dir explicitly, ensure entrypoint is executable
 - resolve git-cliff download URL dynamically
 - extract git-cliff to /tmp to avoid dirty worktree
 - make Grype CVE scan non-blocking for known wish vuln
 - bump Go 1.26.3 → 1.26.4
 - remove error truncation from detail panel
 - classify safedial "failed to connect" as TCP
 - resolve staticcheck lint errors in history view
 - trigger immediate recheck after site config edit
 - broken tick chain after form/dialog + retries off-by-one
 - wire up [e] edit key in detail panel
 - show push token and URL in detail panel
 - show correct push heartbeat curl command in detail panel
 - propagate STALE/LATE child status to group
 - quick wins batch — version footer, column widths, zebra, sparkline
 - logs tab use viewport for scrollable content
 - pin footer to bottom of terminal
 - normalize content whitespace for consistent footer position
 - clip overflowing content to keep footer pinned
 - remove extra blank lines above footer
 - expand log viewport to fill content area
 - log STALE recovery in push heartbeat handler
 - check fmt.Sscanf return value (errcheck lint)
 - inject time into ComputeDailyBreakdown for testability
 - cascade delete related rows when removing a site
 - merge check results into live state, never overwrite
 - serialize DB writes through a single drained writer
 - close XFF bypass and three secret-leak paths
 - move blocking DB IO out of Update/View into tea.Cmds
 - move theme styles onto the Model to end cross-session races
 - finish moving keypress DB reads into tea.Cmds
 - move all store writes out of Update into tea.Cmds
 - mask alert secrets in the TUI detail panel and table
 - serve /status/json through a public DTO
 - make SSH key revocation fail closed
 - six correctness fixes for the state machine
 - migrate Postgres timestamps to TIMESTAMPTZ
 - seven quick-win bug fixes across engine, server, TUI, CLI
 - SSRF guard gaps + DNS port restriction + metrics auth
 - track selection by site ID + q means back everywhere
 - apply convergence + push/group check history
 - Kuma import tokens/paused, Docker hardening, migrate-secrets idempotency
 - six small fixes — rate limiter leak, DST SLA, probe sort, TUI cleanup
 - seven fixes — token scan, variadic cleanup, TUI layout, compose secrets
 - chmod SQLite DB files to 0600 on open
 - close DNS-rebind TOCTOU on ping/port checks
 - API import no longer replaces user accounts
 - email send respects context deadline
 - rename X-Upkeep-Secret header to X-Uptop-Secret
 - apply log filter to full log list, not viewport window
 - repair pipeline defects found in v0.1.0-rc.1 rehearsal
 - suppress wish GHSA alias in grype, fold rc tags into launch notes
 - scan gates docker push, rc tags spare :latest, mirror waits for stable assets
 - remove tagged scan image in cleanup step
 - exclude rc tags from cliff tag_pattern so launch notes span full history
 - fall back to embedded build info when ldflags absent
 - drop body-grep Security grouping, map polish type in cliff
 - sync selectedID on click so refreshLive doesn't revert cursor
 - resolve 4 tag-blocking issues for v0.1.0
 ### Changed
 - Container runs as non-root user `uptop` (UID/GID 1000) instead of root (#44)
 - SSH host key relocated to `/data/.ssh/id_ed25519` for non-root compatibility (#44)
 - Release workflow prunes dangling images and build cache after Docker push (#44)
 ### Added
 - SBOM and provenance attestations on Docker images for supply chain compliance (#44)
 - Entrypoint script with volume writability check and migration guidance (#44)
 ### Breaking
 - Existing Docker volumes with root-owned files require migration before upgrading:
  `docker run --rm -v <volume>:/data alpine chown -R 1000:1000 /data`
 ## [2026.05.6] — 2026-05-30 (infrastructure)
 ### Changed
 - Sync README to Docker Hub on release (#43)
 ### Security
 - Patch Docker Scout CVEs, remove unused openssh-client (#41)
 ## [2026.05.5] — 2026-05-29
 ### Added
 - Error reason display when monitors go DOWN (#33)
 - Push monitor lifecycle — PENDING, LATE, DOWN states (#34)
 - Logs tab overhaul — severity tags, filtering, recovery durations (#35)
 - Alert channel health indicator and test alerts (#36)
 - TUI screenshots in `assets/` (#32)
 - CI status badge in README
 ### Changed
 - Visual polish — detail sections, column headers, alert detail (#37)
 - README rewritten with hero image, badges, collapsible install sections (#32)
 - Changelog rewritten to match actual CalVer tag history
 - Migrated to `lerkolabs` org namespace (#38)
 - Docker-compose files moved to `deploy/`
 ## [2026.05.4] — 2026-05-27
 ### Added
 - SSH user seeding from `UPTOP_ADMIN_KEY` env var and `UPTOP_KEYS` file (#31)
 - GoReleaser for binary releases
 - govulncheck in CI pipeline
 - Multi-arch Docker builds (amd64 + arm64)
 ### Changed
 - CI overhaul — Go 1.26, build caching, streamlined pipeline (#30)
 - Bumped golang.org/x/crypto v0.47.0 → v0.52.0
 - Bumped Alpine 3.21 → 3.23
 ### Security
 - Phase 1: SSRF protection, input validation, safe dial (#26)
 - Phase 2: TLS hardening, auth bypass fixes, rate limiting (#27)
 - Phase 3: Graceful degradation, connection limits, timeout enforcement (#28)
 - Phase 4: Code quality, error handling, linter fixes (#29)
 ## [2026.05.3] — 2026-05-25
 ### Added
 - Theme system with 5 dark palettes — Default, Dracula, Nord, Tokyo Night, Gruvbox (#24)
 - `--version` flag with build metadata injection
 - Gitea Actions CI pipeline — test + lint (#20)
 - golangci-lint configuration
 - Comprehensive test suite — 94 tests across monitor, server, cluster (#19)
 - CONTRIBUTING.md and SECURITY.md
 ### Changed
 - Renamed project from go-upkeep to uptop (#25)
 - Updated LICENSE with dual copyright for independent fork
 ### Fixed
 - Form validators scoped to relevant monitor types (#23)
 - Graceful shutdown for HTTP, SSH servers and database (#19)
 - Constant-time secret comparison, request size limits (#19)
 - Check interval jitter to prevent thundering herd (#19)
 - TUI visual polish — zebra striping, group icons, sparkline stats (#18)
 ## [2026.05.2] — 2026-05-22
 ### Added
 - Incident management and maintenance windows (#17)
 - Production docker-compose.yml
 ### Fixed
 - Viewport sizing and dynamic chrome calculation (#16)
 - Form height constrained to terminal with resize forwarding
 - Maintenance'd monitors excluded from down count and pulse
 - Group status correctly skips children in maintenance
 ## [2026.05.1] — 2026-05-16
 ### Added
 - Distributed probing with leader + probe nodes
 - Config-as-code — YAML apply/export with dry-run and prune
 - TUI polish — status bar, tab badges, detail panel, modals
 - DOWN-first sort, health pulse, site filter
 - Type icons in sites table
 - Sparkline history graphs
 - Persistent state — uptime, status, latency, and logs survive restarts
 - Push token stripping from /status/json response
 ## [2026.04.1] — 2026-04-01
 ### Added
 - SSH-accessible TUI built on Bubble Tea + Wish
 - 6 check types — HTTP, Push, Ping, Port, DNS, Group
 - 9 alert providers — Discord, Slack, Email, Ntfy, Telegram, PagerDuty, Pushover, Gotify, Webhook
 - SQLite and PostgreSQL support
 - HA clustering with automatic failover
 - Prometheus /metrics endpoint
 - Public status page (HTML + JSON)
 - Uptime Kuma backup import
@@ -3,7 +3,7 @@
 ## Development
 ```sh
-go run cmd/uptop/main.go -demo  # starts with sample data
+go run ./cmd/uptop -demo        # starts with sample data
 ssh -p 23234 localhost              # connect to TUI
 ```
@@ -1,18 +1,17 @@
 # --- Stage 1: Builder ---
-FROM golang:1.26-alpine3.23@sha256:91eda9776261207ea25fd06b5b7fed8d397dd2c0a283e77f2ab6e91bfa71079d AS builder
+FROM golang:1.26.4-alpine3.23@sha256:f23e8b227fb4493eabe03bede4d5a32d04092da71962f1fb79b5f7d1e6c2a17f AS builder
 RUN apk add --no-cache gcc musl-dev
 WORKDIR /app
 COPY go.mod go.sum ./
 RUN --mount=type=cache,target=/go/pkg/mod \
    go mod download
 COPY . .
-ENV CGO_ENABLED=1
+ENV CGO_ENABLED=0
 ARG VERSION=dev
 ARG COMMIT=none
 ARG BUILD_DATE=unknown
 RUN --mount=type=cache,target=/go/pkg/mod \
    --mount=type=cache,target=/root/.cache/go-build \
-    go build -trimpath -ldflags="-s -w -X main.version=${VERSION} -X main.commit=${COMMIT} -X main.date=${BUILD_DATE}" -o uptop ./cmd/uptop/main.go
+    go build -trimpath -ldflags="-s -w -X main.version=${VERSION} -X main.commit=${COMMIT} -X main.date=${BUILD_DATE}" -o uptop ./cmd/uptop
 # --- Stage 2: Runner ---
 FROM alpine:3.23@sha256:5b10f432ef3da1b8d4c7eb6c487f2f5a8f096bc91145e68878dd4a5019afde11
@@ -32,6 +31,8 @@ ENV UPTOP_SSH_HOST_KEY=/data/.ssh/id_ed25519
 ENV UPTOP_PORT=23234
 EXPOSE 23234
 HEALTHCHECK --interval=30s --timeout=5s --start-period=10s --retries=3 \
  CMD wget -qO- http://localhost:8080/api/health || exit 1
 USER uptop
 ENTRYPOINT ["docker-entrypoint.sh"]
 CMD ["./uptop"]
@@ -19,6 +19,8 @@ An uptime monitor you manage entirely from the terminal. It runs as a server, ex
 Built on [RDGames/go-upkeep](https://github.com/RDGames/go-upkeep). Rewritten for clustering, config-as-code, and a proper dashboard.
 Canonical repo: [gitea.lerkolabs.com/lerkolabs/uptop](https://gitea.lerkolabs.com/lerkolabs/uptop) — [GitHub](https://github.com/lerkolabs/uptop) is a mirror; releases are published to both.
 ## Features
 - **6 check types** — HTTP, Push (heartbeat), Ping, Port, DNS, Groups
@@ -30,6 +32,8 @@ Built on [RDGames/go-upkeep](https://github.com/RDGames/go-upkeep). Rewritten fo
 - **SQLite or Postgres** — SQLite for single-node, Postgres for production
 - **Uptime Kuma import** — migrate from Kuma with one command
 > Group monitors roll up child status for display but don't fire their own alerts yet — attach alerts to the children.
 ## Screenshots
 <table>
@@ -49,14 +53,14 @@ Built on [RDGames/go-upkeep](https://github.com/RDGames/go-upkeep). Rewritten fo
 ## Quick start
 ```bash
-go run cmd/uptop/main.go
+UPTOP_ADMIN_KEY="$(cat ~/.ssh/id_ed25519.pub)" go run ./cmd/uptop
 ssh -p 23234 localhost
 ```
 Want some data to look at first:
 ```bash
-go run cmd/uptop/main.go -demo
+UPTOP_ADMIN_KEY="$(cat ~/.ssh/id_ed25519.pub)" go run ./cmd/uptop -demo
 ```
 ## Install
@@ -79,16 +83,20 @@ services:
      # - UPTOP_ADMIN_KEY=ssh-ed25519 AAAA... you@host
    volumes:
      - ./data:/data
    sysctls:
      - net.ipv4.ping_group_range=0 2147483647
 ```
-First run: set `UPTOP_ADMIN_KEY` to your SSH public key, or attach to the container and add it in the Users tab.
+First run: set `UPTOP_ADMIN_KEY` to your SSH public key.
 The `sysctls` line enables unprivileged ICMP inside the container — without it, ping monitors get no response and silently report DOWN.
 </details>
 <details>
-<summary><strong>Binary (Linux amd64)</strong></summary>
+<summary><strong>Binary (Linux, macOS, Windows)</strong></summary>
-Download from [Releases](https://github.com/lerkolabs/uptop/releases).
+Download from [Releases](https://github.com/lerkolabs/uptop/releases) — amd64 and arm64 tarballs (zip for Windows), plus `.deb`/`.rpm` packages and `checksums.txt`.
 </details>
@@ -162,6 +170,19 @@ Set `UPTOP_ENCRYPTION_KEY` to encrypt alert credentials (SMTP passwords, webhook
 Without this, credentials are stored as plaintext in the database. uptop warns on startup if unset. To encrypt credentials on an existing install, run `uptop migrate-secrets` with the key set.
 ### Data retention
 uptop prunes its own history in the background — no external cleanup jobs needed:
 | Data | Kept |
 |---|---|
 | Check history | newest 1,000 checks per monitor |
 | State changes (UP/DOWN transitions) | newest 5,000 per monitor |
 | Logs | newest 200 entries |
 | Maintenance windows | 7 days after they end (configurable) |
 Sparklines, uptime percentages, and SLA reports are computed from these windows, so very long-horizon stats aren't retained. Export to Prometheus via `/metrics` if you need unlimited history.
 ## Clustering
 uptop supports three modes: **leader** (default single node), **follower** (HA failover — takes over if the leader goes down), and **probe** (stateless distributed checks from multiple regions).
@@ -174,7 +195,7 @@ Export your Kuma backup JSON, then:
 ```bash
 curl -X POST http://localhost:8080/api/import/kuma \
-  -H "X-Upkeep-Secret: your-secret" \
+  -H "X-Uptop-Secret: your-secret" \
  -H "Content-Type: application/json" \
  -d @kuma-backup.json
 ```
@@ -23,7 +23,13 @@ filter_unconventional = true
 split_commits = false
 protect_breaking_commits = false
 filter_commits = false
-tag_pattern = "[0-9]*"
+# Only final tags count as releases — rc rehearsal tags must not become
 # section boundaries, or the final tag's notes would cover only
 # commits-since-last-rc (v0.1.0 rendered 0 commits with ignore_tags, which
 # drops rc-tagged commits instead of folding them forward). With rc tags
 # outside the pattern, finals render the full span and rc tags render
 # [Unreleased] with everything pending. Verified empirically on both.
 tag_pattern = 'v[0-9]+\.[0-9]+\.[0-9]+$'
 topo_order = false
 sort_commits = "oldest"
@@ -33,7 +39,7 @@ commit_parsers = [
    { message = "^perf", group = "Changed" },
    { message = "^refactor", group = "Changed" },
    { message = "^security", group = "Security" },
-    { body = ".*security", group = "Security" },
+    { message = "^polish", group = "Changed" },
    { body = "BREAKING", group = "Breaking" },
    { footer = "BREAKING.CHANGE", group = "Breaking" },
    { message = "^docs", skip = true },
@@ -0,0 +1,133 @@
 package main
 import (
 	"net"
 	"os"
 	"strconv"
 	"time"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/server"
 )
 // appConfig collects the settings the serve command runs with. parseConfig
 // fills it from built-in defaults overridden by UPTOP_* environment variables.
 type appConfig struct {
 	// SSH listener port (UPTOP_PORT) and host key (UPTOP_SSH_HOST_KEY).
 	Port       int
 	SSHHostKey string
 	// Database backend (UPTOP_DB_TYPE) and its DSN (UPTOP_DB_DSN).
 	DBType string
 	DBDSN  string
 	// HTTP port (UPTOP_HTTP_PORT) and TLS settings (UPTOP_TLS_CERT, UPTOP_TLS_KEY).
 	HTTPPort int
 	TLSCert  string
 	TLSKey   string
 	// Status page switch (UPTOP_STATUS_ENABLED) and title (UPTOP_STATUS_TITLE).
 	StatusEnabled bool
 	StatusTitle   string
 	// Cluster settings: mode (UPTOP_CLUSTER_MODE, default "leader"), shared
 	// secret (UPTOP_CLUSTER_SECRET) and peer URL (UPTOP_PEER_URL).
 	ClusterMode   string
 	ClusterSecret string
 	PeerURL       string
 	// Node identity (UPTOP_NODE_ID, UPTOP_NODE_NAME, UPTOP_NODE_REGION).
 	NodeID        string
 	NodeName      string
 	NodeRegion    string
 	// Monitoring engine options: UPTOP_AGG_STRATEGY,
 	// UPTOP_ALLOW_PRIVATE_TARGETS, UPTOP_INSECURE_SKIP_VERIFY,
 	// UPTOP_MAINT_RETENTION (default 7 days) and UPTOP_ENCRYPTION_KEY.
 	AggStrategy         string
 	AllowPrivateTargets bool
 	InsecureSkipVerify  bool
 	MaintRetention      time.Duration
 	EncryptionKey       string
 	// HTTP server options: UPTOP_METRICS_PUBLIC, UPTOP_CORS_ORIGIN and the
 	// parsed CIDR list from UPTOP_TRUSTED_PROXIES.
 	MetricsPublic  bool
 	CORSOrigin     string
 	TrustedProxies []*net.IPNet
 	// Raw values of UPTOP_ADMIN_KEY and UPTOP_KEYS.
 	AdminKey string
 	KeysFile string
 }
 // parseConfig builds the effective appConfig: built-in defaults first, then
 // any UPTOP_* environment overrides. Boolean switches are on only when the
 // variable is exactly "true". Integer and duration values that fail to parse
 // (and non-positive retention values) leave the default in place.
 func parseConfig() appConfig {
 	// isTrue reports whether the variable holds exactly "true".
 	isTrue := func(key string) bool { return os.Getenv(key) == "true" }
 	// overrideString replaces *dst only when the variable is non-empty.
 	overrideString := func(key string, dst *string) {
 		if val := os.Getenv(key); val != "" {
 			*dst = val
 		}
 	}
 	// overrideInt replaces *dst only when the variable parses as an integer.
 	overrideInt := func(key string, dst *int) {
 		val := os.Getenv(key)
 		if val == "" {
 			return
 		}
 		if parsed, err := strconv.Atoi(val); err == nil {
 			*dst = parsed
 		}
 	}
 	cfg := appConfig{
 		Port:                23234,
 		SSHHostKey:          envOrDefault("UPTOP_SSH_HOST_KEY", ".ssh/id_ed25519"),
 		DBType:              "sqlite",
 		DBDSN:               "uptop.db",
 		HTTPPort:            8080,
 		TLSCert:             os.Getenv("UPTOP_TLS_CERT"),
 		TLSKey:              os.Getenv("UPTOP_TLS_KEY"),
 		StatusEnabled:       isTrue("UPTOP_STATUS_ENABLED"),
 		StatusTitle:         "System Status",
 		ClusterMode:         "leader",
 		ClusterSecret:       os.Getenv("UPTOP_CLUSTER_SECRET"),
 		PeerURL:             os.Getenv("UPTOP_PEER_URL"),
 		NodeID:              os.Getenv("UPTOP_NODE_ID"),
 		NodeName:            os.Getenv("UPTOP_NODE_NAME"),
 		NodeRegion:          os.Getenv("UPTOP_NODE_REGION"),
 		AggStrategy:         os.Getenv("UPTOP_AGG_STRATEGY"),
 		AllowPrivateTargets: isTrue("UPTOP_ALLOW_PRIVATE_TARGETS"),
 		InsecureSkipVerify:  isTrue("UPTOP_INSECURE_SKIP_VERIFY"),
 		MaintRetention:      7 * 24 * time.Hour,
 		EncryptionKey:       os.Getenv("UPTOP_ENCRYPTION_KEY"),
 		MetricsPublic:       isTrue("UPTOP_METRICS_PUBLIC"),
 		CORSOrigin:          os.Getenv("UPTOP_CORS_ORIGIN"),
 		TrustedProxies:      parseTrustedProxies(os.Getenv("UPTOP_TRUSTED_PROXIES")),
 		AdminKey:            os.Getenv("UPTOP_ADMIN_KEY"),
 		KeysFile:            os.Getenv("UPTOP_KEYS"),
 	}
 	overrideInt("UPTOP_PORT", &cfg.Port)
 	overrideString("UPTOP_DB_TYPE", &cfg.DBType)
 	overrideString("UPTOP_DB_DSN", &cfg.DBDSN)
 	overrideInt("UPTOP_HTTP_PORT", &cfg.HTTPPort)
 	overrideString("UPTOP_STATUS_TITLE", &cfg.StatusTitle)
 	overrideString("UPTOP_CLUSTER_MODE", &cfg.ClusterMode)
 	// An unset variable yields "", which ParseDuration rejects, so the
 	// default survives both "unset" and "malformed".
 	keep, err := time.ParseDuration(os.Getenv("UPTOP_MAINT_RETENTION"))
 	if err == nil && keep > 0 {
 		cfg.MaintRetention = keep
 	}
 	return cfg
 }
 // serverConfig copies the HTTP-facing subset of the configuration into a
 // server.ServerConfig. quietHTTPLog is passed through as QuietHTTPLog.
 func (c appConfig) serverConfig(quietHTTPLog bool) server.ServerConfig {
 	var sc server.ServerConfig
 	sc.Port = c.HTTPPort
 	sc.EnableStatus = c.StatusEnabled
 	sc.Title = c.StatusTitle
 	sc.ClusterKey = c.ClusterSecret
 	sc.TLSCert = c.TLSCert
 	sc.TLSKey = c.TLSKey
 	sc.ClusterMode = c.ClusterMode
 	sc.MetricsPublic = c.MetricsPublic
 	sc.CORSOrigin = c.CORSOrigin
 	sc.TrustedProxies = c.TrustedProxies
 	sc.QuietHTTPLog = quietHTTPLog
 	return sc
 }
@@ -0,0 +1,115 @@
 package main
 import (
 	"context"
 	"crypto/ed25519"
 	"crypto/rand"
 	"errors"
 	"testing"
 	"time"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/store/storetest"
 	"github.com/charmbracelet/ssh"
 	gossh "golang.org/x/crypto/ssh"
 )
 // kcMockStore is the store double used by the key-cache tests. It inherits
 // BaseMock's default no-ops and replaces only GetAllUsers, which replays the
 // users/err fields so a test can change the outcome between calls.
 type kcMockStore struct {
 	storetest.BaseMock
 	users []models.User
 	err   error
 }
 // GetAllUsers returns whatever the test currently holds in users and err.
 func (m *kcMockStore) GetAllUsers(_ context.Context) ([]models.User, error) {
 	return m.users, m.err
 }
 // testKey generates a fresh ed25519 key and returns its public half in two
 // forms: the authorized_keys line and the parsed SSH public key. Any failure
 // aborts the calling test.
 func testKey(t *testing.T) (string, ssh.PublicKey) {
 	t.Helper()
 	rawPub, _, genErr := ed25519.GenerateKey(rand.Reader)
 	if genErr != nil {
 		t.Fatal(genErr)
 	}
 	sshPub, convErr := gossh.NewPublicKey(rawPub)
 	if convErr != nil {
 		t.Fatal(convErr)
 	}
 	authorizedLine := gossh.MarshalAuthorizedKey(sshPub)
 	return string(authorizedLine), sshPub
 }
 // TestKeyCache_AllowsKnownDeniesUnknown checks the basic contract: a key
 // present in the user table is accepted, any other key is rejected.
 func TestKeyCache_AllowsKnownDeniesUnknown(t *testing.T) {
 	line, enrolled := testKey(t)
 	_, stranger := testKey(t)
 	db := &kcMockStore{users: []models.User{{PublicKey: line}}}
 	cache := newKeyCache(db)
 	if ok := cache.IsAllowed(enrolled); !ok {
 		t.Error("known key denied")
 	}
 	if ok := cache.IsAllowed(stranger); ok {
 		t.Error("unknown key allowed")
 	}
 }
 // TestKeyCache_RetainsKeysOnRefreshError verifies that a failed refresh of a
 // stale cache keeps the previously loaded keys in effect.
 func TestKeyCache_RetainsKeysOnRefreshError(t *testing.T) {
 	line, enrolled := testKey(t)
 	db := &kcMockStore{users: []models.User{{PublicKey: line}}}
 	cache := newKeyCache(db)
 	if ok := cache.IsAllowed(enrolled); !ok {
 		t.Fatal("known key denied on first refresh")
 	}
 	// Simulate an outage plus an expired cache: back-date the timestamp by an
 	// hour so the next lookup has to attempt a refresh, which will fail.
 	db.err = errors.New("db down")
 	func() {
 		cache.mu.Lock()
 		defer cache.mu.Unlock()
 		cache.updated = time.Now().Add(-time.Hour)
 	}()
 	// A transient error must not lock every admin out.
 	if ok := cache.IsAllowed(enrolled); !ok {
 		t.Error("transient refresh error locked out a previously valid key")
 	}
 }
 // TestKeyCache_FailsClosedAfterInvalidate verifies that once Invalidate has
 // run, a key is not honoured from stale state while the store is failing.
 func TestKeyCache_FailsClosedAfterInvalidate(t *testing.T) {
 	line, enrolled := testKey(t)
 	db := &kcMockStore{users: []models.User{{PublicKey: line}}}
 	cache := newKeyCache(db)
 	if ok := cache.IsAllowed(enrolled); !ok {
 		t.Fatal("known key denied on first refresh")
 	}
 	// A revocation (Invalidate) lands while the DB cannot be re-read: the
 	// revoked key must not keep working off the old cache contents.
 	db.err = errors.New("db down")
 	cache.Invalidate()
 	if ok := cache.IsAllowed(enrolled); ok {
 		t.Error("revoked key still allowed while DB is down — fails open")
 	}
 }
 // TestUserInvalidatingStore_DeleteDropsKeyCache verifies that deleting a user
 // through the wrapping store empties the key cache, so the key is rejected
 // even if the store becomes unreachable right afterwards.
 func TestUserInvalidatingStore_DeleteDropsKeyCache(t *testing.T) {
 	line, enrolled := testKey(t)
 	db := &kcMockStore{users: []models.User{{PublicKey: line}}}
 	cache := newKeyCache(db)
 	wrapped := &userInvalidatingStore{Store: db, kc: cache}
 	if ok := cache.IsAllowed(enrolled); !ok {
 		t.Fatal("known key denied on first refresh")
 	}
 	// Revoke the user; the cached key must be gone as soon as this returns.
 	delErr := wrapped.DeleteUser(context.Background(), 1)
 	if delErr != nil {
 		t.Fatal(delErr)
 	}
 	// The DB goes away immediately after the delete.
 	db.users, db.err = nil, errors.New("db down")
 	if ok := cache.IsAllowed(enrolled); ok {
 		t.Error("deleted user's key still allowed from stale cache")
 	}
 }
@@ -6,13 +6,13 @@ import (
 	"errors"
 	"flag"
 	"fmt"
-	"log"
+	"log/slog"
 	"net"
 	"net/url"
 	"os"
 	"os/signal"
 	"path/filepath"
-	"strconv"
+	"runtime/debug"
 	"strings"
 	"sync"
 	"syscall"
@@ -40,8 +40,34 @@ var (
 	date    = "unknown"
 )
 // Release builds get version/commit/date stamped by GoReleaser through
 // ldflags. A plain `go install module@tag` skips that step and would report
 // "dev", so in that case recover the values from the build info embedded in
 // the binary: the main module version and the vcs.* settings.
 func init() {
 	if version != "dev" {
 		// Already stamped at link time; nothing to recover.
 		return
 	}
 	build, found := debug.ReadBuildInfo()
 	if !found {
 		return
 	}
 	switch moduleVersion := build.Main.Version; moduleVersion {
 	case "", "(devel)":
 		// No usable module version; keep reporting "dev".
 	default:
 		version = strings.TrimPrefix(moduleVersion, "v")
 	}
 	for _, setting := range build.Settings {
 		if setting.Key == "vcs.revision" {
 			commit = setting.Value
 		} else if setting.Key == "vcs.time" {
 			date = setting.Value
 		}
 	}
 }
 func main() {
-	log.SetOutput(os.Stderr)
+	slog.SetDefault(slog.New(slog.NewTextHandler(os.Stderr, &slog.HandlerOptions{
 		Level: slog.LevelInfo,
 	})))
 	if len(os.Args) >= 2 {
 		switch os.Args[1] {
@@ -63,11 +89,18 @@ func main() {
 }
 func printVersion() {
-	if version == "dev" {
+	out := "uptop " + version
-		fmt.Println("uptop dev")
+	var meta []string
-	} else {
+	if commit != "none" {
-		fmt.Printf("uptop %s (%s, %s)\n", version, commit, date)
+		meta = append(meta, commit)
 	}
 	if date != "unknown" {
 		meta = append(meta, date)
 	}
 	if len(meta) > 0 {
 		out += " (" + strings.Join(meta, ", ") + ")"
 	}
 	fmt.Println(out)
 }
 func envOrDefault(key, fallback string) string {
@@ -111,7 +144,7 @@ func parseTrustedProxies(raw string) []*net.IPNet {
 		}
 		_, ipnet, err := net.ParseCIDR(part)
 		if err != nil {
-			fmt.Fprintf(os.Stderr, "WARNING: ignoring invalid UPTOP_TRUSTED_PROXIES entry %q: %v\n", part, err)
+			slog.Warn("ignoring invalid UPTOP_TRUSTED_PROXIES entry", "entry", part, "err", err) //nolint:gosec // structured slog, not format string
 			continue
 		}
 		cidrs = append(cidrs, ipnet)
@@ -128,21 +161,21 @@ func openStore(dbType, dsn string) store.Store {
 		ss, err = store.NewSQLiteStore(dsn)
 	}
 	if err != nil {
-		fmt.Fprintf(os.Stderr, "database error: %v\n", err)
+		slog.Error("database connection failed", "err", err)
 		os.Exit(1)
 	}
 	if encKey := os.Getenv("UPTOP_ENCRYPTION_KEY"); encKey != "" {
 		enc, err := store.NewEncryptor(encKey)
 		if err != nil {
-			fmt.Fprintf(os.Stderr, "encryption key error: %v\n", err)
+			slog.Error("encryption key invalid", "err", err)
 			os.Exit(1)
 		}
 		ss.SetEncryptor(enc)
 	} else {
-		fmt.Println("WARNING: No UPTOP_ENCRYPTION_KEY set. Alert credentials stored unencrypted.")
+		slog.Warn("no UPTOP_ENCRYPTION_KEY set, alert credentials stored unencrypted")
 	}
-	if err := ss.Init(); err != nil {
+	if err := ss.Init(context.Background()); err != nil {
-		fmt.Fprintf(os.Stderr, "database init error: %v\n", err)
+		slog.Error("database init failed", "err", err)
 		os.Exit(1)
 	}
 	return ss
@@ -167,16 +200,16 @@ func runApply(args []string) {
 	f, err := config.LoadFile(*filePath)
 	if err != nil {
-		fmt.Fprintf(os.Stderr, "error: %v\n", err)
+		slog.Error("config load failed", "err", err)
 		os.Exit(1)
 	}
-	changes, err := config.Apply(s, f, config.ApplyOpts{
+	changes, err := config.Apply(context.Background(), s, f, config.ApplyOpts{
 		DryRun: *dryRun,
 		Prune:  *prune,
 	})
 	if err != nil {
-		fmt.Fprintf(os.Stderr, "error: %v\n", err)
+		slog.Error("config apply failed", "err", err)
 		os.Exit(1)
 	}
@@ -192,14 +225,14 @@ func runExport(args []string) {
 	s := openStore(*dbType, *dsn)
-	f, err := config.Export(s)
+	f, err := config.Export(context.Background(), s)
 	if err != nil {
-		fmt.Fprintf(os.Stderr, "error: %v\n", err)
+		slog.Error("export failed", "err", err)
 		os.Exit(1)
 	}
 	if err := config.WriteFile(f, *outPath); err != nil {
-		fmt.Fprintf(os.Stderr, "error: %v\n", err)
+		slog.Error("export write failed", "err", err)
 		os.Exit(1)
 	}
 }
@@ -217,7 +250,7 @@ func runMigrateSecrets(args []string) {
 	}
 	enc, err := store.NewEncryptor(encKey)
 	if err != nil {
-		fmt.Fprintf(os.Stderr, "error: %v\n", err)
+		slog.Error("encryption key invalid", "err", err)
 		os.Exit(1)
 	}
@@ -228,25 +261,25 @@ func runMigrateSecrets(args []string) {
 		ss, err = store.NewSQLiteStore(*dsn)
 	}
 	if err != nil {
-		fmt.Fprintf(os.Stderr, "database error: %v\n", err)
+		slog.Error("database connection failed", "err", err)
 		os.Exit(1)
 	}
-	if err := ss.Init(); err != nil {
+	if err := ss.Init(context.Background()); err != nil {
-		fmt.Fprintf(os.Stderr, "database init error: %v\n", err)
+		slog.Error("database init failed", "err", err)
 		os.Exit(1)
 	}
 	alerts, err := ss.GetAllAlerts()
 	if err != nil {
 		fmt.Fprintf(os.Stderr, "error loading alerts: %v\n", err)
 		os.Exit(1)
 	}
 	ss.SetEncryptor(enc)
 	alerts, err := ss.GetAllAlerts(context.Background())
 	if err != nil {
 		slog.Error("failed to load alerts", "err", err)
 		os.Exit(1)
 	}
 	migrated := 0
 	for _, a := range alerts {
-		if err := ss.UpdateAlert(a.ID, a.Name, a.Type, a.Settings); err != nil {
+		if err := ss.UpdateAlert(context.Background(), a.ID, a.Name, a.Type, a.Settings); err != nil {
-			fmt.Fprintf(os.Stderr, "error migrating alert %q: %v\n", a.Name, err)
+			slog.Error("alert migration failed", "alert", a.Name, "err", err)
 			os.Exit(1)
 		}
 		migrated++
@@ -255,64 +288,19 @@ func runMigrateSecrets(args []string) {
 }
 func runServe(args []string) {
-	portVal := 23234
+	cfg := parseConfig()
 	dbType := "sqlite"
 	dbDSN := "uptop.db"
 	httpPort := 8080
 	enableStatus := false
 	statusTitle := "System Status"
 	clusterMode := "leader"
 	clusterPeer := ""
 	clusterKey := ""
-	if v := os.Getenv("UPTOP_PORT"); v != "" {
+	if cfg.ClusterMode == "probe" {
-		if p, err := strconv.Atoi(v); err == nil {
+		if cfg.NodeID == "" {
 			portVal = p
 		}
 	}
 	if v := os.Getenv("UPTOP_DB_TYPE"); v != "" {
 		dbType = v
 	}
 	if v := os.Getenv("UPTOP_DB_DSN"); v != "" {
 		dbDSN = v
 	}
 	if v := os.Getenv("UPTOP_HTTP_PORT"); v != "" {
 		if p, err := strconv.Atoi(v); err == nil {
 			httpPort = p
 		}
 	}
 	if v := os.Getenv("UPTOP_STATUS_ENABLED"); v == "true" {
 		enableStatus = true
 	}
 	if v := os.Getenv("UPTOP_STATUS_TITLE"); v != "" {
 		statusTitle = v
 	}
 	if v := os.Getenv("UPTOP_CLUSTER_MODE"); v != "" {
 		clusterMode = v
 	}
 	if v := os.Getenv("UPTOP_PEER_URL"); v != "" {
 		clusterPeer = v
 	}
 	if v := os.Getenv("UPTOP_CLUSTER_SECRET"); v != "" {
 		clusterKey = v
 	}
 	nodeID := os.Getenv("UPTOP_NODE_ID")
 	nodeName := os.Getenv("UPTOP_NODE_NAME")
 	nodeRegion := os.Getenv("UPTOP_NODE_REGION")
 	aggStrategy := os.Getenv("UPTOP_AGG_STRATEGY")
 	if clusterMode == "probe" {
 		if nodeID == "" {
 			fmt.Fprintln(os.Stderr, "UPTOP_NODE_ID is required for probe mode")
 			os.Exit(1)
 		}
-		if clusterPeer == "" {
+		if cfg.PeerURL == "" {
 			fmt.Fprintln(os.Stderr, "UPTOP_PEER_URL is required for probe mode")
 			os.Exit(1)
 		}
-		fmt.Printf("Cluster: Running as PROBE (node=%s, region=%s)\n", nodeID, nodeRegion)
+		fmt.Printf("Cluster: Running as PROBE (node=%s, region=%s)\n", cfg.NodeID, cfg.NodeRegion)
 		ctx, cancel := context.WithCancel(context.Background())
 		defer cancel()
@@ -323,29 +311,28 @@ func runServe(args []string) {
 			cancel()
 		}()
-		probeAllowPrivate := os.Getenv("UPTOP_ALLOW_PRIVATE_TARGETS") == "true"
+		if cfg.AllowPrivateTargets {
-		if probeAllowPrivate {
+			slog.Warn("private target blocking disabled, monitor URLs can reach internal networks")
 			fmt.Println("WARNING: Private target blocking disabled. Monitor URLs can reach internal networks.")
 		}
 		if err := cluster.RunProbe(ctx, cluster.ProbeConfig{
-			NodeID:              nodeID,
+			NodeID:              cfg.NodeID,
-			NodeName:            nodeName,
+			NodeName:            cfg.NodeName,
-			Region:              nodeRegion,
+			Region:              cfg.NodeRegion,
-			LeaderURL:           clusterPeer,
+			LeaderURL:           cfg.PeerURL,
-			SharedKey:           clusterKey,
+			SharedKey:           cfg.ClusterSecret,
 			Interval:            30,
-			AllowPrivateTargets: probeAllowPrivate,
+			AllowPrivateTargets: cfg.AllowPrivateTargets,
 		}); err != nil {
-			fmt.Fprintf(os.Stderr, "Probe error: %v\n", err)
+			slog.Error("probe failed", "err", err)
 		}
 		return
 	}
 	fs := flag.NewFlagSet("serve", flag.ExitOnError)
-	port := fs.Int("port", portVal, "SSH Port")
+	port := fs.Int("port", cfg.Port, "SSH Port")
-	flagDBType := fs.String("db-type", dbType, "Database type")
+	flagDBType := fs.String("db-type", cfg.DBType, "Database type")
-	flagDSN := fs.String("dsn", dbDSN, "Database DSN")
+	flagDSN := fs.String("dsn", cfg.DBDSN, "Database DSN")
 	demo := fs.Bool("demo", false, "Seed demo data")
 	importKuma := fs.String("import-kuma", "", "Import Uptime Kuma backup JSON file")
 	_ = fs.Parse(args) // ExitOnError: parse errors exit before returning
@@ -354,31 +341,32 @@ func runServe(args []string) {
 	var dbErr error
 	if *flagDBType == "postgres" {
 		ss, dbErr = store.NewPostgresStore(*flagDSN)
-		fmt.Printf("Using PostgreSQL: %s\n", redactDSN(*flagDSN))
+		slog.Info("database connected", "type", "postgres", "dsn", redactDSN(*flagDSN))
 	} else {
 		ss, dbErr = store.NewSQLiteStore(*flagDSN)
-		fmt.Printf("Using SQLite: %s\n", *flagDSN)
+		slog.Info("database connected", "type", "sqlite", "dsn", *flagDSN)
 	}
 	if dbErr != nil {
-		fmt.Fprintf(os.Stderr, "database connection error: %v\n", dbErr)
+		slog.Error("database connection failed", "err", dbErr)
 		os.Exit(1)
 	}
 	defer ss.Close()
-	if encKey := os.Getenv("UPTOP_ENCRYPTION_KEY"); encKey != "" {
+	if cfg.EncryptionKey != "" {
-		enc, err := store.NewEncryptor(encKey)
+		enc, err := store.NewEncryptor(cfg.EncryptionKey)
 		if err != nil {
-			fmt.Fprintf(os.Stderr, "encryption key error: %v\n", err)
+			slog.Error("encryption key invalid", "err", err)
 			os.Exit(1)
 		}
 		ss.SetEncryptor(enc)
 	} else {
-		fmt.Println("WARNING: No UPTOP_ENCRYPTION_KEY set. Alert credentials stored unencrypted.")
+		slog.Warn("no UPTOP_ENCRYPTION_KEY set, alert credentials stored unencrypted")
 	}
-	var s store.Store = ss
+	kc := newKeyCache(ss)
-	if err := s.Init(); err != nil {
+	var s store.Store = &userInvalidatingStore{Store: ss, kc: kc}
-		fmt.Fprintf(os.Stderr, "database init error: %v\n", err)
+	if err := s.Init(context.Background()); err != nil {
 		slog.Error("database init failed", "err", err)
 		os.Exit(1)
 	}
 	if *demo {
@@ -390,34 +378,29 @@ func runServe(args []string) {
 	if *importKuma != "" {
 		kb, err := importer.LoadKumaFile(*importKuma)
 		if err != nil {
-			fmt.Fprintf(os.Stderr, "kuma import error: %v\n", err)
+			slog.Error("kuma import failed", "err", err)
 			os.Exit(1)
 		}
 		backup := importer.ConvertKuma(kb)
-		if err := s.ImportData(backup); err != nil {
+		if err := s.ImportData(context.Background(), backup); err != nil {
-			fmt.Fprintf(os.Stderr, "import failed: %v\n", err)
+			slog.Error("import failed", "err", err)
 			os.Exit(1)
 		}
 		fmt.Printf("Imported %d monitors and %d alerts from Uptime Kuma v%s\n", len(backup.Sites), len(backup.Alerts), kb.Version)
 	}
-	allowPrivate := os.Getenv("UPTOP_ALLOW_PRIVATE_TARGETS") == "true"
+	if cfg.AllowPrivateTargets {
-	if allowPrivate {
+		slog.Warn("private target blocking disabled, monitor URLs can reach internal networks")
 		fmt.Println("WARNING: Private target blocking disabled. Monitor URLs can reach internal networks.")
 	}
-	eng := monitor.NewEngineWithOpts(s, allowPrivate)
+	eng := monitor.NewEngineWithOpts(s, cfg.AllowPrivateTargets)
-	if os.Getenv("UPTOP_INSECURE_SKIP_VERIFY") == "true" {
+	if cfg.InsecureSkipVerify {
 		eng.SetInsecureSkipVerify(true)
 	}
-	if aggStrategy != "" {
+	if cfg.AggStrategy != "" {
-		eng.SetAggStrategy(monitor.AggregationStrategy(aggStrategy))
+		eng.SetAggStrategy(monitor.AggregationStrategy(cfg.AggStrategy))
 	}
 	if v := os.Getenv("UPTOP_MAINT_RETENTION"); v != "" {
 		if d, err := time.ParseDuration(v); err == nil && d > 0 {
 			eng.SetMaintRetention(d)
 		}
 	}
 	eng.SetMaintRetention(cfg.MaintRetention)
 	ctx, cancel := context.WithCancel(context.Background())
 	defer cancel()
@@ -427,35 +410,22 @@ func runServe(args []string) {
 	eng.InitAlertHealth()
 	eng.Start(ctx)
-	tlsCert := os.Getenv("UPTOP_TLS_CERT")
+	localTUI := isatty.IsTerminal(os.Stdout.Fd()) || isatty.IsCygwinTerminal(os.Stdout.Fd())
 	tlsKey := os.Getenv("UPTOP_TLS_KEY")
-	httpSrv := server.Start(server.ServerConfig{
+	httpSrv := server.Start(cfg.serverConfig(localTUI), s, eng)
 		Port:           httpPort,
 		EnableStatus:   enableStatus,
 		Title:          statusTitle,
 		ClusterKey:     clusterKey,
 		TLSCert:        tlsCert,
 		TLSKey:         tlsKey,
 		ClusterMode:    clusterMode,
 		MetricsPublic:  os.Getenv("UPTOP_METRICS_PUBLIC") == "true",
 		CORSOrigin:     os.Getenv("UPTOP_CORS_ORIGIN"),
 		TrustedProxies: parseTrustedProxies(os.Getenv("UPTOP_TRUSTED_PROXIES")),
 	}, s, eng)
 	cluster.Start(ctx, cluster.Config{
-		Mode:      clusterMode,
+		Mode:      cfg.ClusterMode,
-		PeerURL:   clusterPeer,
+		PeerURL:   cfg.PeerURL,
-		SharedKey: clusterKey,
+		SharedKey: cfg.ClusterSecret,
 	}, eng)
 	kc := newKeyCache(s)
 	sshSrv := startSSHServer(*port, s, eng, kc)
-	if isatty.IsTerminal(os.Stdout.Fd()) || isatty.IsCygwinTerminal(os.Stdout.Fd()) {
+	if localTUI {
 		p := tea.NewProgram(tui.InitialModel(true, s, eng, version), tea.WithAltScreen(), tea.WithMouseCellMotion())
 		if _, err := p.Run(); err != nil {
-			fmt.Fprintf(os.Stderr, "error: %v\n", err)
+			slog.Error("TUI failed", "err", err)
 		}
 	} else {
 		fmt.Println("uptop running in HEADLESS mode")
@@ -466,20 +436,18 @@ func runServe(args []string) {
 	}
 	cancel()
 	// Drain pending DB writes before the deferred ss.Close() runs, so no
 	// write races a closed database.
 	eng.Stop()
 	shutdownCtx, shutdownCancel := context.WithTimeout(context.Background(), 30*time.Second)
 	defer shutdownCancel()
 	if httpSrv != nil {
 		if err := httpSrv.Shutdown(shutdownCtx); err != nil {
-			log.Printf("HTTP shutdown error: %v", err)
+			slog.Error("HTTP shutdown failed", "err", err)
 		}
 	}
 	if sshSrv != nil {
 		if err := sshSrv.Shutdown(shutdownCtx); err != nil {
-			log.Printf("SSH shutdown error: %v", err)
+			slog.Error("SSH shutdown failed", "err", err)
 		}
 	}
 }
@@ -498,48 +466,49 @@ func startSSHServer(port int, db store.Store, eng *monitor.Engine, kc *keyCache)
 		),
 	)
 	if err != nil {
-		fmt.Fprintf(os.Stderr, "SSH server error: %v\n", err)
+		slog.Error("SSH server failed", "err", err)
 		return nil
 	}
 	go func() {
 		if err := s.ListenAndServe(); err != nil && !errors.Is(err, ssh.ErrServerClosed) {
-			log.Printf("SSH server error: %v", err)
+			slog.Error("SSH server failed", "err", err)
 		}
 	}()
 	return s
 }
 func seedDemoData(s store.Store) {
-	existing, _ := s.GetSites()
+	ctx := context.Background()
 	existing, _ := s.GetSites(ctx)
 	if len(existing) > 0 {
 		return
 	}
 	fmt.Println("Seeding demo data...")
-	if err := s.AddAlert("Discord Ops", "discord", map[string]string{"url": "https://discord.com/api/webhooks/demo/token"}); err != nil {
+	if err := s.AddAlert(ctx, "Discord Ops", "discord", map[string]string{"url": "https://discord.com/api/webhooks/demo/token"}); err != nil {
-		log.Printf("demo seed: add alert: %v", err)
+		slog.Error("demo seed failed", "step", "add alert", "err", err)
 		return
 	}
-	if err := s.AddAlert("Slack Infra", "slack", map[string]string{"url": "https://hooks.slack.com/services/DEMO/WEBHOOK"}); err != nil {
+	if err := s.AddAlert(ctx, "Slack Infra", "slack", map[string]string{"url": "https://hooks.slack.com/services/DEMO/WEBHOOK"}); err != nil {
-		log.Printf("demo seed: add alert: %v", err)
+		slog.Error("demo seed failed", "step", "add alert", "err", err)
 		return
 	}
-	if err := s.AddAlert("Email Oncall", "email", map[string]string{
+	if err := s.AddAlert(ctx, "Email Oncall", "email", map[string]string{
 		"host": "smtp.example.com", "port": "587",
 		"user": "oncall@example.com", "pass": "replace-me",
 		"from": "oncall@example.com", "to": "team@example.com",
 	}); err != nil {
-		log.Printf("demo seed: add alert: %v", err)
+		slog.Error("demo seed failed", "step", "add alert", "err", err)
 		return
 	}
-	alerts, _ := s.GetAllAlerts()
+	alerts, _ := s.GetAllAlerts(ctx)
 	alertID := 0
 	if len(alerts) > 0 {
 		alertID = alerts[0].ID
 	}
-	demoSites := []models.Site{
+	demoSites := []models.SiteConfig{
 		{Name: "Google", URL: "https://www.google.com", Type: "http", Interval: 30, AlertID: alertID, CheckSSL: true, ExpiryThreshold: 14, MaxRetries: 2},
 		{Name: "GitHub", URL: "https://github.com", Type: "http", Interval: 30, AlertID: alertID, CheckSSL: true, ExpiryThreshold: 7, MaxRetries: 3},
 		{Name: "Cloudflare DNS", URL: "https://1.1.1.1", Type: "http", Interval: 60, AlertID: alertID, ExpiryThreshold: 7, MaxRetries: 1},
@@ -552,8 +521,8 @@ func seedDemoData(s store.Store) {
 		{Name: "SSH Server", Type: "port", Interval: 60, AlertID: alertID, Hostname: "10.0.0.1", Port: 22, Timeout: 5, ExpiryThreshold: 7},
 	}
 	for _, site := range demoSites {
-		if err := s.AddSite(site); err != nil {
+		if err := s.AddSite(ctx, site); err != nil {
-			log.Printf("demo seed: add site %q: %v", site.Name, err)
+			slog.Error("demo seed failed", "step", "add site", "site", site.Name, "err", err)
 		}
 	}
 }
@@ -571,8 +540,12 @@ func newKeyCache(db store.Store) *keyCache {
 }
 func (c *keyCache) refresh() {
-	users, err := c.db.GetAllUsers()
+	users, err := c.db.GetAllUsers(context.Background())
 	if err != nil {
 		// Keep the previous key set: a transient DB error must not lock every
 		// admin out. Revocation still fails closed because Invalidate clears
 		// the set immediately.
 		slog.Error("SSH key cache refresh failed", "err", err)
 		return
 	}
 	keys := make([]ssh.PublicKey, 0, len(users))
@@ -589,8 +562,13 @@ func (c *keyCache) refresh() {
 	c.mu.Unlock()
 }
 // Invalidate empties the cached key set and resets the refresh timestamp to
 // the zero time. Dropping the keys, not only the timestamp, is deliberate:
 // if the refresh that follows a user revocation fails, auth fails closed
 // (everyone re-authenticates after the next successful refresh) rather than
 // the revoked key continuing to work off the stale cache.
 func (c *keyCache) Invalidate() {
 	c.mu.Lock()
 	defer c.mu.Unlock()
 	c.keys, c.updated = nil, time.Time{}
 }
@@ -614,7 +592,41 @@ func (c *keyCache) IsAllowed(incomingKey ssh.PublicKey) bool {
 	return false
 }
 // userInvalidatingStore wraps a store.Store and invalidates the SSH key cache
 // after every call that can change the user table (AddUser, UpdateUser,
 // DeleteUser, ImportData). A revocation therefore takes effect on the next
 // connection attempt instead of after the cache TTL, and fails closed if the
 // DB is unreachable when that attempt re-reads the table.
 type userInvalidatingStore struct {
 	store.Store
 	kc *keyCache
 }
 // dropCache invalidates the key cache and hands err back unchanged. Callers
 // pass the wrapped store call as the argument, so the store operation always
 // completes before the cache is cleared, whether or not it succeeded.
 func (s *userInvalidatingStore) dropCache(err error) error {
 	s.kc.Invalidate()
 	return err
 }
 // AddUser forwards to the wrapped store, then invalidates the key cache.
 func (s *userInvalidatingStore) AddUser(ctx context.Context, username, publicKey, role string) error {
 	return s.dropCache(s.Store.AddUser(ctx, username, publicKey, role))
 }
 // UpdateUser forwards to the wrapped store, then invalidates the key cache.
 func (s *userInvalidatingStore) UpdateUser(ctx context.Context, id int, username, publicKey, role string) error {
 	return s.dropCache(s.Store.UpdateUser(ctx, id, username, publicKey, role))
 }
 // DeleteUser forwards to the wrapped store, then invalidates the key cache.
 func (s *userInvalidatingStore) DeleteUser(ctx context.Context, id int) error {
 	return s.dropCache(s.Store.DeleteUser(ctx, id))
 }
 // ImportData forwards to the wrapped store, then invalidates the key cache.
 func (s *userInvalidatingStore) ImportData(ctx context.Context, data models.Backup) error {
 	return s.dropCache(s.Store.ImportData(ctx, data))
 }
 func seedKeysFromEnv(s store.Store) {
 	ctx := context.Background()
 	var keys []string
 	if v := os.Getenv("UPTOP_ADMIN_KEY"); v != "" {
@@ -623,7 +635,9 @@ func seedKeysFromEnv(s store.Store) {
 	if path := os.Getenv("UPTOP_KEYS"); path != "" {
 		f, err := os.Open(filepath.Clean(path))
-		if err == nil {
+		if err != nil {
 			slog.Warn("failed to open UPTOP_KEYS file", "path", path, "err", err) //nolint:gosec // structured slog, not format string
 		} else {
 			scanner := bufio.NewScanner(f)
 			for scanner.Scan() {
 				line := strings.TrimSpace(scanner.Text())
@@ -640,9 +654,9 @@ func seedKeysFromEnv(s store.Store) {
 		return
 	}
-	existing, err := s.GetAllUsers()
+	existing, err := s.GetAllUsers(ctx)
 	if err != nil {
-		fmt.Fprintf(os.Stderr, "warning: could not check existing users: %v\n", err)
+		slog.Warn("could not check existing users", "err", err)
 		return
 	}
@@ -658,8 +672,8 @@ func seedKeysFromEnv(s store.Store) {
 		}
 		username := usernameFromKey(key, i, len(existing)+added)
-		if err := s.AddUser(username, key, "admin"); err != nil {
+		if err := s.AddUser(ctx, username, key, "admin"); err != nil {
-			fmt.Fprintf(os.Stderr, "warning: failed to seed user %q: %v\n", username, err)
+			slog.Warn("failed to seed user", "user", username, "err", err) //nolint:gosec // structured slog, not format string
 			continue
 		}
 		fmt.Printf("Seeded admin user %q from %s\n", username, seedSource(i, len(keys), os.Getenv("UPTOP_ADMIN_KEY") != ""))
@@ -3,7 +3,7 @@ services:
  # LEADER NODE
  # -------------------------
  leader:
-    build: .
+    image: lerkolabs/uptop:latest
    container_name: uptop-leader
    ports:
      - "23234:23234" # SSH
@@ -18,7 +18,7 @@ services:
      # Cluster Config
      - UPTOP_CLUSTER_MODE=leader
-      - UPTOP_CLUSTER_SECRET=mysecret
+      - UPTOP_CLUSTER_SECRET=mysecret  # EXAMPLE ONLY — rotate before use
    depends_on:
      - leader-db
    stdin_open: true
@@ -38,7 +38,7 @@ services:
  # FOLLOWER NODE
  # -------------------------
  follower:
-    build: .
+    image: lerkolabs/uptop:latest
    container_name: uptop-follower
    ports:
      - "23233:23234" # SSH (Mapped to different host port)
@@ -53,7 +53,7 @@ services:
      # Cluster Config
      - UPTOP_CLUSTER_MODE=follower
-      - UPTOP_CLUSTER_SECRET=mysecret
+      - UPTOP_CLUSTER_SECRET=mysecret  # EXAMPLE ONLY — rotate before use
      # IMPORTANT: Uses the Service Name "leader" to connect internally
      - UPTOP_PEER_URL=http://leader:8080
    depends_on:
@@ -1,8 +1,8 @@
 services:
  # The Application
  app:
-    build: 
+    build:
-      context: .
+      context: ..
      dockerfile: Dockerfile
    container_name: uptop-dev
    ports:
@@ -1,9 +1,9 @@
 services:
  leader:
-    build: .
+    image: lerkolabs/uptop:latest
    environment:
      - UPTOP_CLUSTER_MODE=leader
-      - UPTOP_CLUSTER_SECRET=changeme
+      - UPTOP_CLUSTER_SECRET=changeme  # EXAMPLE ONLY — rotate before use
      - UPTOP_AGG_STRATEGY=any-down
      - UPTOP_STATUS_ENABLED=true
    ports:
@@ -11,25 +11,25 @@ services:
      - "23234:23234"
  probe-us-east:
-    build: .
+    image: lerkolabs/uptop:latest
    environment:
      - UPTOP_CLUSTER_MODE=probe
      - UPTOP_NODE_ID=us-east-1
      - UPTOP_NODE_NAME=US East Probe
      - UPTOP_NODE_REGION=us-east
      - UPTOP_PEER_URL=http://leader:8080
-      - UPTOP_CLUSTER_SECRET=changeme
+      - UPTOP_CLUSTER_SECRET=changeme  # EXAMPLE ONLY — rotate before use
    depends_on:
      - leader
  probe-eu-west:
-    build: .
+    image: lerkolabs/uptop:latest
    environment:
      - UPTOP_CLUSTER_MODE=probe
      - UPTOP_NODE_ID=eu-west-1
      - UPTOP_NODE_NAME=EU West Probe
      - UPTOP_NODE_REGION=eu-west
      - UPTOP_PEER_URL=http://leader:8080
-      - UPTOP_CLUSTER_SECRET=changeme
+      - UPTOP_CLUSTER_SECRET=changeme  # EXAMPLE ONLY — rotate before use
    depends_on:
      - leader
@@ -1,10 +1,15 @@
 services:
  app:
-    build:
+    image: lerkolabs/uptop:latest
      context: .
      dockerfile: Dockerfile
    container_name: uptop
    restart: unless-stopped
    read_only: true
    cap_drop:
      - ALL
    security_opt:
      - no-new-privileges:true
    tmpfs:
      - /tmp
    ports:
      - "23234:23234"
      - "8080:8080"
@@ -16,6 +16,11 @@ A follower is a standby replica that takes over if the leader goes down.
 - When the leader recovers, the follower detects it and goes back to standby
 - Both nodes have their own database — they do not share state
 **Limitations:**
 - During a network partition where both nodes are healthy, both will run checks and fire alerts independently. There is no leader fencing — the follower has no way to confirm the leader is actually down vs. unreachable from its perspective. This window lasts until the partition heals, at which point the follower detects the leader and steps down.
 - Expect duplicate alerts and doubled check history entries during a split-brain event. Alerts are idempotent for most providers (a second "site is down" notification is noisy but not harmful).
 - Failover takeover time is ~15 seconds (3 missed polls × 5 second interval). This is not configurable.
 **Required env vars:**
 | Node | Variable | Value |
@@ -76,5 +81,5 @@ Set via `UPTOP_AGG_STRATEGY` on the leader.
 ## Security
 - Set `UPTOP_CLUSTER_SECRET` on all nodes. Without it, cluster API endpoints are unauthenticated.
- Secrets are sent in HTTP headers (`X-Upkeep-Secret`). Use TLS or a reverse proxy for production.
+- Secrets are sent in HTTP headers (`X-Uptop-Secret`). Use TLS or a reverse proxy for production.
 - uptop warns on startup if the cluster secret is missing or if cluster mode is active without TLS.
@@ -122,7 +122,7 @@ Groups can't nest inside other groups. A group is healthy when all its children
 ## Alert types
-All 9 providers work in the YAML. The `settings` map is different per type.
+All 10 providers work in the YAML. The `settings` map is different per type.
 ```yaml
 # Discord / Slack / Generic Webhook — just a URL
@@ -149,6 +149,9 @@ All 9 providers work in the YAML. The `settings` map is different per type.
    url: https://ntfy.sh
    topic: my-alerts
    priority: "4"
    # for protected topics:
    # username: user
    # password: pass
 # Telegram
 - name: Telegram Ops
@@ -178,6 +181,14 @@ All 9 providers work in the YAML. The `settings` map is different per type.
    url: https://gotify.example.com
    token: app-token
    priority: "8"
 # Opsgenie
 - name: Opsgenie
  type: opsgenie
  settings:
    api_key: your-api-key
    priority: P2        # P1–P5, default P3
    # eu: "true"        # use the EU API endpoint
 ```
 ## Commands
@@ -224,7 +235,25 @@ Monitors and alerts are matched by **name**. Names must be unique across the ent
 Apply is idempotent: run it twice with the same file and the second run changes nothing.
-If something fails mid-apply, just fix the issue and run it again. It picks up where it left off.
+Apply is **not atomic** — items are written one at a time, so an error mid-apply (bad value, lost DB connection, ctrl-C) leaves the items already written in place. That's safe to recover from: apply diffs against the database by name, so fix the issue and run it again — it converges the rest. Just don't run two applies against the same database at once.
 ## Backups and secrets
 `uptop export` writes alert credentials (SMTP passwords, API tokens, webhook URLs) into the YAML in clear text — that's what makes the file restorable. Treat it like a secrets file.
 The HTTP export endpoint redacts those same fields **by default**:
 ```bash
 # secrets show as ***REDACTED*** — fine for sharing or review
 curl -H "X-Uptop-Secret: your-secret" \
  "http://localhost:8080/api/backup/export"
 # full backup you can actually restore from
 curl -H "X-Uptop-Secret: your-secret" \
  "http://localhost:8080/api/backup/export?redact_secrets=false"
 ```
 Restoring a redacted export imports the literal string `***REDACTED***` as your credentials. For real backups, pass `redact_secrets=false` or run `uptop export` on the host.
 ## Typical workflow
@@ -13,10 +13,11 @@ require (
 	github.com/lib/pq v1.11.1
 	github.com/lrstanley/bubblezone v1.0.0
 	github.com/mattn/go-isatty v0.0.20
 	github.com/mattn/go-sqlite3 v1.14.33
 	github.com/miekg/dns v1.1.72
 	github.com/prometheus-community/pro-bing v0.8.0
 	golang.org/x/crypto v0.52.0
 	gopkg.in/yaml.v3 v3.0.1
 	modernc.org/sqlite v1.52.0
 )
 require (
@@ -48,9 +49,10 @@ require (
 	github.com/muesli/ansi v0.0.0-20230316100256-276c6243b2f6 // indirect
 	github.com/muesli/cancelreader v0.2.2 // indirect
 	github.com/muesli/termenv v0.16.0 // indirect
 	github.com/ncruces/go-strftime v1.0.0 // indirect
 	github.com/remyoudompheng/bigfft v0.0.0-20230129092748-24d4a6f8daec // indirect
 	github.com/rivo/uniseg v0.4.7 // indirect
 	github.com/xo/terminfo v0.0.0-20220910002029-abceb7e1c41e // indirect
 	golang.org/x/crypto v0.52.0 // indirect
 	golang.org/x/exp v0.0.0-20240719175910-8a7402abbf56 // indirect
 	golang.org/x/mod v0.35.0 // indirect
 	golang.org/x/net v0.55.0 // indirect
@@ -58,4 +60,7 @@ require (
 	golang.org/x/sys v0.45.0 // indirect
 	golang.org/x/text v0.37.0 // indirect
 	golang.org/x/tools v0.44.0 // indirect
 	modernc.org/libc v1.72.3 // indirect
 	modernc.org/mathutil v1.7.1 // indirect
 	modernc.org/memory v1.11.0 // indirect
 )
@@ -64,8 +64,12 @@ github.com/go-logfmt/logfmt v0.6.0 h1:wGYYu3uicYdqXVgoYbvnkrPVXkuLM1p1ifugDMEdRi
 github.com/go-logfmt/logfmt v0.6.0/go.mod h1:WYhtIu8zTZfxdn5+rREduYbwxfcBr/Vr6KEVveWlfTs=
 github.com/google/go-cmp v0.7.0 h1:wk8382ETsv4JYUZwIsn6YpYiWiBsYLSJiTsyBybVuN8=
 github.com/google/go-cmp v0.7.0/go.mod h1:pXiqmnSA92OHEEa9HXL2W4E7lf9JzCmGVUdgjX3N/iU=
 github.com/google/pprof v0.0.0-20250317173921-a4b03ec1a45e h1:ijClszYn+mADRFY17kjQEVQ1XRhq2/JR1M3sGqeJoxs=
 github.com/google/pprof v0.0.0-20250317173921-a4b03ec1a45e/go.mod h1:boTsfXsheKC2y+lKOCMpSfarhxDeIzfZG1jqGcPl3cA=
 github.com/google/uuid v1.6.0 h1:NIvaJDMOsjHA8n1jAhLSgzrAzy1Hgr+hNrb57e+94F0=
 github.com/google/uuid v1.6.0/go.mod h1:TIyPZe4MgqvfeYDBFedMoGGpEw/LqOeaOT+nhxU+yHo=
 github.com/hashicorp/golang-lru/v2 v2.0.7 h1:a+bsQ5rvGLjzHuww6tVxozPZFVghXaHOwFs4luLUK2k=
 github.com/hashicorp/golang-lru/v2 v2.0.7/go.mod h1:QeFd9opnmA6QUJc5vARoKUSoFhyfM2/ZepoAG6RGpeM=
 github.com/lib/pq v1.11.1 h1:wuChtj2hfsGmmx3nf1m7xC2XpK6OtelS2shMY+bGMtI=
 github.com/lib/pq v1.11.1/go.mod h1:/p+8NSbOcwzAEI7wiMXFlgydTwcgTr3OSKMsD2BitpA=
 github.com/lrstanley/bubblezone v1.0.0 h1:bIpUaBilD42rAQwlg/4u5aTqVAt6DSRKYZuSdmkr8UA=
@@ -78,8 +82,6 @@ github.com/mattn/go-localereader v0.0.1 h1:ygSAOl7ZXTx4RdPYinUpg6W99U8jWvWi9Ye2J
 github.com/mattn/go-localereader v0.0.1/go.mod h1:8fBrzywKY7BI3czFoHkuzRoWE9C+EiG4R1k4Cjx5p88=
 github.com/mattn/go-runewidth v0.0.16 h1:E5ScNMtiwvlvB5paMFdw9p4kSQzbXFikJ5SQO6TULQc=
 github.com/mattn/go-runewidth v0.0.16/go.mod h1:Jdepj2loyihRzMpdS35Xk/zdY8IAYHsh153qUoGf23w=
 github.com/mattn/go-sqlite3 v1.14.33 h1:A5blZ5ulQo2AtayQ9/limgHEkFreKj1Dv226a1K73s0=
 github.com/mattn/go-sqlite3 v1.14.33/go.mod h1:Uh1q+B4BYcTPb+yiD3kU8Ct7aC0hY9fxUwlHK0RXw+Y=
 github.com/miekg/dns v1.1.72 h1:vhmr+TF2A3tuoGNkLDFK9zi36F2LS+hKTRW0Uf8kbzI=
 github.com/miekg/dns v1.1.72/go.mod h1:+EuEPhdHOsfk6Wk5TT2CzssZdqkmFhf8r+aVyDEToIs=
 github.com/mitchellh/hashstructure/v2 v2.0.2 h1:vGKWl0YJqUNxE8d+h8f6NJLcCJrgbhC4NcD46KavDd4=
@@ -90,10 +92,14 @@ github.com/muesli/cancelreader v0.2.2 h1:3I4Kt4BQjOR54NavqnDogx/MIoWBFa0StPA8ELU
 github.com/muesli/cancelreader v0.2.2/go.mod h1:3XuTXfFS2VjM+HTLZY9Ak0l6eUKfijIfMUZ4EgX0QYo=
 github.com/muesli/termenv v0.16.0 h1:S5AlUN9dENB57rsbnkPyfdGuWIlkmzJjbFf0Tf5FWUc=
 github.com/muesli/termenv v0.16.0/go.mod h1:ZRfOIKPFDYQoDFF4Olj7/QJbW60Ol/kL1pU3VfY/Cnk=
 github.com/ncruces/go-strftime v1.0.0 h1:HMFp8mLCTPp341M/ZnA4qaf7ZlsbTc+miZjCLOFAw7w=
 github.com/ncruces/go-strftime v1.0.0/go.mod h1:Fwc5htZGVVkseilnfgOVb9mKy6w1naJmn9CehxcKcls=
 github.com/pmezard/go-difflib v1.0.0 h1:4DBwDE0NGyQoBHbLQYPwSUPoCMWR5BEzIk/f1lZbAQM=
 github.com/pmezard/go-difflib v1.0.0/go.mod h1:iKH77koFhYxTK1pcRnkKkqfTogsbg7gZNVY4sRDYZ/4=
 github.com/prometheus-community/pro-bing v0.8.0 h1:CEY/g1/AgERRDjxw5P32ikcOgmrSuXs7xon7ovx6mNc=
 github.com/prometheus-community/pro-bing v0.8.0/go.mod h1:Idyxz8raDO6TgkUN6ByiEGvWJNyQd40kN9ZUeho3lN0=
 github.com/remyoudompheng/bigfft v0.0.0-20230129092748-24d4a6f8daec h1:W09IVJc94icq4NjY3clb7Lk8O1qJ8BdBEF8z0ibU0rE=
 github.com/remyoudompheng/bigfft v0.0.0-20230129092748-24d4a6f8daec/go.mod h1:qqbHyh8v60DhA7CoWK5oRCqLrMHRGoxYCSS9EjAz6Eo=
 github.com/rivo/uniseg v0.2.0/go.mod h1:J6wj4VEh+S6ZtnVlnTBMWIodfgj8LQOQFoIToxlJtxc=
 github.com/rivo/uniseg v0.4.7 h1:WUdvkW8uEhrYfLC4ZzdpI2ztxP1I582+49Oc5Mq64VQ=
 github.com/rivo/uniseg v0.4.7/go.mod h1:FN3SvrM+Zdj16jyLfmOkMNblXMcoc8DfTHruCPUcx88=
@@ -125,3 +131,31 @@ gopkg.in/check.v1 v0.0.0-20161208181325-20d25e280405 h1:yhCVgyC4o1eVCa2tZl7eS0r+
 gopkg.in/check.v1 v0.0.0-20161208181325-20d25e280405/go.mod h1:Co6ibVJAznAaIkqp8huTwlJQCZ016jof/cbN4VW5Yz0=
 gopkg.in/yaml.v3 v3.0.1 h1:fxVm/GzAzEWqLHuvctI91KS9hhNmmWOoWu0XTYJS7CA=
 gopkg.in/yaml.v3 v3.0.1/go.mod h1:K4uyk7z7BCEPqu6E+C64Yfv1cQ7kz7rIZviUmN+EgEM=
 modernc.org/cc/v4 v4.28.2 h1:3tQ0lf2ADtoby2EtSP+J7IE2SHwEJdP8ioR59wx7XpY=
 modernc.org/cc/v4 v4.28.2/go.mod h1:OnovgIhbbMXMu1aISnJ0wvVD1KnW+cAUJkIrAWh+kVI=
 modernc.org/ccgo/v4 v4.34.0 h1:yRLPFZieg532OT4rp4JFNIVcquwalMX26G95WQDqwCQ=
 modernc.org/ccgo/v4 v4.34.0/go.mod h1:AS5WYMyBakQ+fhsHhtP8mWB82KTGPkNNJDGfGQCe0/A=
 modernc.org/fileutil v1.4.0 h1:j6ZzNTftVS054gi281TyLjHPp6CPHr2KCxEXjEbD6SM=
 modernc.org/fileutil v1.4.0/go.mod h1:EqdKFDxiByqxLk8ozOxObDSfcVOv/54xDs/DUHdvCUU=
 modernc.org/gc/v2 v2.6.5 h1:nyqdV8q46KvTpZlsw66kWqwXRHdjIlJOhG6kxiV/9xI=
 modernc.org/gc/v2 v2.6.5/go.mod h1:YgIahr1ypgfe7chRuJi2gD7DBQiKSLMPgBQe9oIiito=
 modernc.org/gc/v3 v3.1.2 h1:ZtDCnhonXSZexk/AYsegNRV1lJGgaNZJuKjJSWKyEqo=
 modernc.org/gc/v3 v3.1.2/go.mod h1:HFK/6AGESC7Ex+EZJhJ2Gni6cTaYpSMmU/cT9RmlfYY=
 modernc.org/goabi0 v0.2.0 h1:HvEowk7LxcPd0eq6mVOAEMai46V+i7Jrj13t4AzuNks=
 modernc.org/goabi0 v0.2.0/go.mod h1:CEFRnnJhKvWT1c1JTI3Avm+tgOWbkOu5oPA8eH8LnMI=
 modernc.org/libc v1.72.3 h1:ZnDF4tXn4NBXFutMMQC4vtbTFSXhhKzR73fv0beZEAU=
 modernc.org/libc v1.72.3/go.mod h1:dn0dZNnnn1clLyvRxLxYExxiKRZIRENOfqQ8XEeg4Qs=
 modernc.org/mathutil v1.7.1 h1:GCZVGXdaN8gTqB1Mf/usp1Y/hSqgI2vAGGP4jZMCxOU=
 modernc.org/mathutil v1.7.1/go.mod h1:4p5IwJITfppl0G4sUEDtCr4DthTaT47/N3aT6MhfgJg=
 modernc.org/memory v1.11.0 h1:o4QC8aMQzmcwCK3t3Ux/ZHmwFPzE6hf2Y5LbkRs+hbI=
 modernc.org/memory v1.11.0/go.mod h1:/JP4VbVC+K5sU2wZi9bHoq2MAkCnrt2r98UGeSK7Mjw=
 modernc.org/opt v0.2.0 h1:tGyef5ApycA7FSEOMraay9SaTk5zmbx7Tu+cJs4QKZg=
 modernc.org/opt v0.2.0/go.mod h1:03fq9lsNfvkYSfxrfUhZCWPk1lm4cq4N+Bh//bEtgns=
 modernc.org/sortutil v1.2.1 h1:+xyoGf15mM3NMlPDnFqrteY07klSFxLElE2PVuWIJ7w=
 modernc.org/sortutil v1.2.1/go.mod h1:7ZI3a3REbai7gzCLcotuw9AC4VZVpYMjDzETGsSMqJE=
 modernc.org/sqlite v1.52.0 h1:p4dhYh2tXZCiyaqHwRVJDjIGKWyXayiQpThxgDzJaxo=
 modernc.org/sqlite v1.52.0/go.mod h1:tcNzv5p84E0skkmJn038y+hWJbLQXQqEnQfeh5r2JLM=
 modernc.org/strutil v1.2.1 h1:UneZBkQA+DX2Rp35KcM69cSsNES9ly8mQWD71HKlOA0=
 modernc.org/strutil v1.2.1/go.mod h1:EHkiggD70koQxjVdSBM3JKM7k6L0FbGE5eymy9i3B9A=
 modernc.org/token v1.1.0 h1:Xl7Ap9dKaEs5kLoOQeQmPWevfnk/DM5qcLcYlA8ys6Y=
 modernc.org/token v1.1.0/go.mod h1:UGzOrNV1mAFSEB63lOFHIpNRUVMvYTc6yu1SMY/XTDM=
@@ -3,9 +3,11 @@ package alert
 import (
 	"bytes"
 	"context"
 	"crypto/tls"
 	"encoding/json"
 	"errors"
 	"fmt"
 	"net"
 	"net/http"
 	"net/smtp"
 	"net/url"
@@ -244,7 +246,6 @@ func (e *EmailProvider) Send(ctx context.Context, title, message string) error {
 		return ctx.Err()
 	default:
 	}
 	auth := smtp.PlainAuth("", e.User, e.Pass, e.Host)
 	to := sanitizeHeader(e.To)
 	from := sanitizeHeader(e.From)
 	subject := sanitizeHeader(title)
@@ -256,7 +257,67 @@ func (e *EmailProvider) Send(ctx context.Context, title, message string) error {
 		"Content-Type: text/plain; charset=utf-8\r\n" +
 		"\r\n" +
 		body + "\r\n")
-	return smtp.SendMail(e.Host+":"+e.Port, auth, from, []string{to}, msg)
+	return sendMailContext(ctx, e.Host, e.Port, e.User, e.Pass, from, []string{to}, msg)
 }
 // sendMailContext is a ctx-aware replacement for smtp.SendMail.
 // smtp.SendMail ignores context entirely — a blackholed SMTP server hangs for
 // the OS TCP timeout (minutes). This dials with the context, applies the
 // context deadline (when there is one) to the connection, and closes the
 // connection as soon as the context is done, so both deadline expiry and
 // plain cancellation abort an in-flight SMTP exchange.
 //
 // The server is reached at host:port. STARTTLS is negotiated when the server
 // advertises it, and PLAIN auth is attempted only when user or pass is
 // non-empty. msg is written verbatim as the DATA payload for every address in
 // rcpt. Each failure is wrapped with the SMTP stage that produced it.
 func sendMailContext(ctx context.Context, host, port, user, pass, from string, rcpt []string, msg []byte) error {
 	addr := host + ":" + port
 	dialer := net.Dialer{}
 	conn, err := dialer.DialContext(ctx, "tcp", addr)
 	if err != nil {
 		return fmt.Errorf("smtp dial: %w", err)
 	}
 	if deadline, ok := ctx.Deadline(); ok {
 		// Best effort: if this fails, the watcher below still closes the
 		// connection once the context expires.
 		_ = conn.SetDeadline(deadline)
 	}
 	// A context cancelled without a deadline would otherwise leave the
 	// exchange blocked on network I/O. Closing the socket unblocks every
 	// pending read/write; the watcher exits when this function returns.
 	finished := make(chan struct{})
 	defer close(finished)
 	go func() {
 		select {
 		case <-ctx.Done():
 			_ = conn.Close()
 		case <-finished:
 		}
 	}()
 	c, err := smtp.NewClient(conn, host)
 	if err != nil {
 		_ = conn.Close()
 		return fmt.Errorf("smtp client: %w", err)
 	}
 	defer c.Close()
 	if ok, _ := c.Extension("STARTTLS"); ok {
 		if err := c.StartTLS(&tls.Config{ServerName: host}); err != nil {
 			return fmt.Errorf("smtp starttls: %w", err)
 		}
 	}
 	if user != "" || pass != "" {
 		auth := smtp.PlainAuth("", user, pass, host)
 		if err := c.Auth(auth); err != nil {
 			return fmt.Errorf("smtp auth: %w", err)
 		}
 	}
 	if err := c.Mail(from); err != nil {
 		return fmt.Errorf("smtp mail: %w", err)
 	}
 	for _, r := range rcpt {
 		if err := c.Rcpt(r); err != nil {
 			return fmt.Errorf("smtp rcpt: %w", err)
 		}
 	}
 	w, err := c.Data()
 	if err != nil {
 		return fmt.Errorf("smtp data: %w", err)
 	}
 	if _, err := w.Write(msg); err != nil {
 		return fmt.Errorf("smtp write: %w", err)
 	}
 	if err := w.Close(); err != nil {
 		return fmt.Errorf("smtp data close: %w", err)
 	}
 	return c.Quit()
 }
 type NtfyProvider struct {
@@ -1,14 +1,18 @@
 package alert
 import (
 	"bufio"
 	"context"
 	"encoding/json"
 	"errors"
 	"fmt"
 	"net"
 	"net/http"
 	"net/http/httptest"
 	"net/url"
 	"strings"
 	"testing"
 	"time"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 )
@@ -330,3 +334,116 @@ func TestSanitizeError(t *testing.T) {
 		t.Error("nil should stay nil")
 	}
 }
 // TestEmailProvider_ContextTimeout checks that EmailProvider.Send returns an
 // error shortly after its context deadline when the SMTP server accepts the
 // connection but never sends a greeting.
 func TestEmailProvider_ContextTimeout(t *testing.T) {
 	// Listener that accepts but never speaks — simulates a blackholed SMTP server.
 	ln, err := net.Listen("tcp", "127.0.0.1:0")
 	if err != nil {
 		t.Fatal(err)
 	}
 	defer ln.Close()
 	// Closed when the test returns so the connection holders exit right away
 	// instead of lingering for 30 seconds after the test has finished.
 	done := make(chan struct{})
 	defer close(done)
 	go func() {
 		for {
 			conn, err := ln.Accept()
 			if err != nil {
 				return
 			}
 			// Hold connection open, never send banner.
 			go func(c net.Conn) {
 				defer c.Close()
 				select {
 				case <-done:
 				case <-time.After(30 * time.Second):
 				}
 			}(conn)
 		}
 	}()
 	_, portStr, err := net.SplitHostPort(ln.Addr().String())
 	if err != nil {
 		t.Fatal(err)
 	}
 	provider := &EmailProvider{
 		Host: "127.0.0.1", Port: portStr,
 		From: "test@test.com", To: "dest@test.com",
 	}
 	ctx, cancel := context.WithTimeout(context.Background(), 200*time.Millisecond)
 	defer cancel()
 	start := time.Now()
 	err = provider.Send(ctx, "test", "body")
 	elapsed := time.Since(start)
 	if err == nil {
 		t.Fatal("expected error from stalled SMTP")
 	}
 	// Generous bound: the deadline is 200ms, anything near seconds means the
 	// context was ignored.
 	if elapsed > 2*time.Second {
 		t.Errorf("Send took %v — context deadline not respected", elapsed)
 	}
 }
 // TestSendMailContext_HappyPath runs sendMailContext against a single-shot,
 // in-process fake SMTP server and verifies that the message body is delivered.
 func TestSendMailContext_HappyPath(t *testing.T) {
 	listener, listenErr := net.Listen("tcp", "127.0.0.1:0")
 	if listenErr != nil {
 		t.Fatal(listenErr)
 	}
 	defer listener.Close()
 	// Capacity 1: the server hands over the captured body without blocking.
 	received := make(chan string, 1)
 	go func() {
 		conn, acceptErr := listener.Accept()
 		if acceptErr != nil {
 			return
 		}
 		defer conn.Close()
 		fmt.Fprintf(conn, "220 localhost ESMTP\r\n")
 		var (
 			captured strings.Builder
 			inData   bool
 		)
 		for lines := bufio.NewScanner(conn); lines.Scan(); {
 			line := lines.Text()
 			// Between DATA and the lone "." every line is message content.
 			if inData {
 				if line != "." {
 					captured.WriteString(line + "\n")
 					continue
 				}
 				inData = false
 				fmt.Fprintf(conn, "250 OK\r\n")
 				continue
 			}
 			switch {
 			case line == "QUIT":
 				fmt.Fprintf(conn, "221 Bye\r\n")
 				received <- captured.String()
 				return
 			case line == "DATA":
 				fmt.Fprintf(conn, "354 Go ahead\r\n")
 				inData = true
 			case strings.HasPrefix(line, "EHLO"):
 				fmt.Fprintf(conn, "250-localhost\r\n250 OK\r\n")
 			default:
 				// MAIL FROM, RCPT TO and anything unrecognized are simply accepted.
 				fmt.Fprintf(conn, "250 OK\r\n")
 			}
 		}
 	}()
 	_, port, _ := net.SplitHostPort(listener.Addr().String())
 	ctx, cancel := context.WithTimeout(context.Background(), 5*time.Second)
 	defer cancel()
 	message := []byte("Subject: test\r\n\r\nhello")
 	if sendErr := sendMailContext(ctx, "127.0.0.1", port, "", "", "from@test.com", []string{"to@test.com"}, message); sendErr != nil {
 		t.Fatalf("sendMailContext: %v", sendErr)
 	}
 	select {
 	case <-time.After(5 * time.Second):
 		t.Fatal("timed out waiting for fake SMTP to receive message")
 	case body := <-received:
 		if !strings.Contains(body, "hello") {
 			t.Errorf("expected body to contain 'hello', got: %s", body)
 		}
 	}
 }
@@ -52,7 +52,7 @@ func runFollowerLoop(ctx context.Context, cfg Config, eng *monitor.Engine) {
 		req, _ := http.NewRequest("GET", cfg.PeerURL+"/api/health", nil)
 		if cfg.SharedKey != "" {
-			req.Header.Set("X-Upkeep-Secret", cfg.SharedKey)
+			req.Header.Set("X-Uptop-Secret", cfg.SharedKey)
 		}
 		resp, err := client.Do(req)
@@ -12,76 +12,13 @@ import (
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/monitor"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/store/storetest"
 )
 // --- Mock Store (minimal, for monitor.NewEngine) ---
 type mockStore struct {
-	sites []models.Site
+	storetest.BaseMock
 }
 func (m *mockStore) Init() error                                              { return nil }
 func (m *mockStore) GetSites() ([]models.Site, error)                         { return m.sites, nil }
 func (m *mockStore) AddSite(models.Site) error                                { return nil }
 func (m *mockStore) UpdateSite(models.Site) error                             { return nil }
 func (m *mockStore) UpdateSitePaused(int, bool) error                         { return nil }
 func (m *mockStore) DeleteSite(int) error                                     { return nil }
 func (m *mockStore) GetAllAlerts() ([]models.AlertConfig, error)              { return nil, nil }
 func (m *mockStore) GetAlert(int) (models.AlertConfig, error)                 { return models.AlertConfig{}, nil }
 func (m *mockStore) AddAlert(string, string, map[string]string) error         { return nil }
 func (m *mockStore) UpdateAlert(int, string, string, map[string]string) error { return nil }
 func (m *mockStore) DeleteAlert(int) error                                    { return nil }
 func (m *mockStore) GetAllUsers() ([]models.User, error)                      { return nil, nil }
 func (m *mockStore) AddUser(string, string, string) error                     { return nil }
 func (m *mockStore) UpdateUser(int, string, string, string) error             { return nil }
 func (m *mockStore) DeleteUser(int) error                                     { return nil }
 func (m *mockStore) SaveCheck(int, int64, bool) error                         { return nil }
 func (m *mockStore) SaveCheckFromNode(int, string, int64, bool) error         { return nil }
 func (m *mockStore) LoadAllHistory(int) (map[int][]models.CheckRecord, error) { return nil, nil }
 func (m *mockStore) ExportData() (models.Backup, error)                       { return models.Backup{}, nil }
 func (m *mockStore) ImportData(models.Backup) error                           { return nil }
 func (m *mockStore) GetSiteByName(string) (models.Site, error)                { return models.Site{}, nil }
 func (m *mockStore) GetAlertByName(string) (models.AlertConfig, error) {
 	return models.AlertConfig{}, nil
 }
 func (m *mockStore) AddSiteReturningID(models.Site) (int, error) { return 0, nil }
 func (m *mockStore) AddAlertReturningID(string, string, map[string]string) (int, error) {
 	return 0, nil
 }
 func (m *mockStore) RegisterNode(models.ProbeNode) error      { return nil }
 func (m *mockStore) GetNode(string) (models.ProbeNode, error) { return models.ProbeNode{}, nil }
 func (m *mockStore) GetAllNodes() ([]models.ProbeNode, error) { return nil, nil }
 func (m *mockStore) UpdateNodeLastSeen(string) error          { return nil }
 func (m *mockStore) DeleteNode(string) error                  { return nil }
 func (m *mockStore) LoadAlertHealth() (map[int]models.AlertHealthRecord, error) {
 	return nil, nil
 }
 func (m *mockStore) SaveAlertHealth(models.AlertHealthRecord) error { return nil }
 func (m *mockStore) SaveLog(string) error                           { return nil }
 func (m *mockStore) PruneLogs() error                               { return nil }
 func (m *mockStore) PruneCheckHistory() error                       { return nil }
 func (m *mockStore) PruneStateChanges() error                       { return nil }
 func (m *mockStore) LoadLogs(int) ([]string, error)                 { return nil, nil }
 func (m *mockStore) GetActiveMaintenanceWindows() ([]models.MaintenanceWindow, error) {
 	return nil, nil
 }
 func (m *mockStore) GetAllMaintenanceWindows(int) ([]models.MaintenanceWindow, error) {
 	return nil, nil
 }
 func (m *mockStore) AddMaintenanceWindow(models.MaintenanceWindow) error         { return nil }
 func (m *mockStore) EndMaintenanceWindow(int) error                              { return nil }
 func (m *mockStore) DeleteMaintenanceWindow(int) error                           { return nil }
 func (m *mockStore) PruneExpiredMaintenanceWindows(time.Duration) (int64, error) { return 0, nil }
 func (m *mockStore) IsMonitorInMaintenance(int) (bool, error)                    { return false, nil }
 func (m *mockStore) GetPreference(string) (string, error)                        { return "", nil }
 func (m *mockStore) SetPreference(string, string) error                          { return nil }
 func (m *mockStore) SaveStateChange(int, string, string, string) error           { return nil }
 func (m *mockStore) GetStateChanges(int, int) ([]models.StateChange, error)      { return nil, nil }
 func (m *mockStore) GetStateChangesSince(int, time.Time) ([]models.StateChange, error) {
 	return nil, nil
 }
 func (m *mockStore) Close() error { return nil }
 // --- Cluster Start Tests ---
 func TestStart_LeaderMode(t *testing.T) {
@@ -176,7 +113,7 @@ func TestFollowerLoop_SendsSecret(t *testing.T) {
 	var receivedSecret string
 	srv := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
 		mu.Lock()
-		receivedSecret = r.Header.Get("X-Upkeep-Secret")
+		receivedSecret = r.Header.Get("X-Uptop-Secret")
 		mu.Unlock()
 		w.WriteHeader(200)
 		w.Write([]byte("OK"))
@@ -266,7 +203,7 @@ func TestProbeRegister_Failure(t *testing.T) {
 func TestProbeFetchAssignments_Success(t *testing.T) {
 	srv := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
 		json.NewEncoder(w).Encode(map[string][]models.Site{
-			"sites": {{ID: 1, Name: "s1", Type: "http", URL: "http://example.com"}},
+			"sites": {{SiteConfig: models.SiteConfig{ID: 1, Name: "s1", Type: "http", URL: "http://example.com"}}},
 		})
 	}))
 	defer srv.Close()
@@ -303,8 +240,8 @@ func TestProbeExecuteChecks(t *testing.T) {
 	defer srv.Close()
 	sites := []models.Site{
-		{ID: 1, Type: "http", URL: srv.URL},
+		{SiteConfig: models.SiteConfig{ID: 1, Type: "http", URL: srv.URL}},
-		{ID: 2, Type: "http", URL: srv.URL},
+		{SiteConfig: models.SiteConfig{ID: 2, Type: "http", URL: srv.URL}},
 	}
 	strict := &http.Client{}
@@ -340,7 +277,7 @@ func TestProbeExecuteChecks_Concurrency(t *testing.T) {
 	var sites []models.Site
 	for i := 0; i < 20; i++ {
-		sites = append(sites, models.Site{ID: i + 1, Type: "http", URL: srv.URL})
+		sites = append(sites, models.Site{SiteConfig: models.SiteConfig{ID: i + 1, Type: "http", URL: srv.URL}})
 	}
 	results := probeExecuteChecks(context.Background(), sites, &http.Client{}, &http.Client{}, true)
@@ -6,7 +6,7 @@ import (
 	"crypto/tls"
 	"encoding/json"
 	"fmt"
-	"log"
+	"log/slog"
 	"net/http"
 	"net/url"
 	"sync"
@@ -47,7 +47,7 @@ func RunProbe(ctx context.Context, cfg ProbeConfig) error {
 	}
 	if err := probeRegister(ctx, apiClient, cfg); err != nil {
-		log.Printf("Probe: initial registration failed: %v (will retry)", err)
+		slog.Error("probe initial registration failed", "err", err)
 	}
 	for {
@@ -59,7 +59,7 @@ func RunProbe(ctx context.Context, cfg ProbeConfig) error {
 		sites, err := probeFetchAssignments(ctx, apiClient, cfg)
 		if err != nil {
-			log.Printf("Probe: failed to fetch assignments: %v", err)
+			slog.Error("probe failed to fetch assignments", "err", err)
 			sleepCtx(ctx, 10*time.Second)
 			continue
 		}
@@ -73,7 +73,7 @@ func RunProbe(ctx context.Context, cfg ProbeConfig) error {
 		if len(results) > 0 {
 			if err := probeReportResults(ctx, apiClient, cfg, results); err != nil {
-				log.Printf("Probe: failed to report results: %v", err)
+				slog.Error("probe failed to report results", "err", err)
 			}
 		}
@@ -90,7 +90,7 @@ func probeRegister(ctx context.Context, client *http.Client, cfg ProbeConfig) er
 		return err
 	}
 	req.Header.Set("Content-Type", "application/json")
-	req.Header.Set("X-Upkeep-Secret", cfg.SharedKey)
+	req.Header.Set("X-Uptop-Secret", cfg.SharedKey)
 	resp, err := client.Do(req)
 	if err != nil {
 		return err
@@ -108,7 +108,7 @@ func probeFetchAssignments(ctx context.Context, client *http.Client, cfg ProbeCo
 	if err != nil {
 		return nil, err
 	}
-	req.Header.Set("X-Upkeep-Secret", cfg.SharedKey)
+	req.Header.Set("X-Uptop-Secret", cfg.SharedKey)
 	resp, err := client.Do(req)
 	if err != nil {
 		return nil, err
@@ -152,12 +152,12 @@ loop:
 			defer wg.Done()
 			defer func() { <-sem }()
-			cr := monitor.RunCheck(s, strict, insecure, false, allowPrivate)
+			cr := monitor.RunCheck(ctx, s.SiteConfig, strict, insecure, false, allowPrivate)
 			mu.Lock()
 			results = append(results, probeResultItem{
 				SiteID:      s.ID,
 				LatencyNs:   cr.LatencyNs,
-				IsUp:        cr.Status == "UP",
+				IsUp:        cr.Status == string(models.StatusUp),
 				ErrorReason: cr.ErrorReason,
 			})
 			mu.Unlock()
@@ -180,7 +180,7 @@ func probeReportResults(ctx context.Context, client *http.Client, cfg ProbeConfi
 		return err
 	}
 	req.Header.Set("Content-Type", "application/json")
-	req.Header.Set("X-Upkeep-Secret", cfg.SharedKey)
+	req.Header.Set("X-Uptop-Secret", cfg.SharedKey)
 	resp, err := client.Do(req)
 	if err != nil {
 		return err
@@ -189,7 +189,7 @@ func probeReportResults(ctx context.Context, client *http.Client, cfg ProbeConfi
 	if resp.StatusCode != 200 {
 		return fmt.Errorf("results returned %d", resp.StatusCode)
 	}
-	fmt.Printf("Probe: reported %d check results\n", len(results))
+	slog.Info("probe reported check results", "count", len(results))
 	return nil
 }
@@ -1,11 +1,13 @@
 package config
 import (
 	"context"
 	"fmt"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/store"
 	"reflect"
 	"strings"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/store"
 )
 type ApplyOpts struct {
@@ -20,17 +22,17 @@ type Change struct {
 	Details string
 }
-func Apply(s store.Store, f *File, opts ApplyOpts) ([]Change, error) {
+func Apply(ctx context.Context, s store.Store, f *File, opts ApplyOpts) ([]Change, error) {
 	if err := Validate(f); err != nil {
 		return nil, err
 	}
-	existingAlerts, err := s.GetAllAlerts()
+	existingAlerts, err := s.GetAllAlerts(ctx)
 	if err != nil {
 		return nil, fmt.Errorf("load alerts: %w", err)
 	}
-	existingSites, err := s.GetSites()
+	existingSites, err := s.GetSites(ctx)
 	if err != nil {
 		return nil, fmt.Errorf("load sites: %w", err)
 	}
@@ -40,7 +42,7 @@ func Apply(s store.Store, f *File, opts ApplyOpts) ([]Change, error) {
 		existingAlertsByName[a.Name] = a
 	}
-	existingSitesByName := make(map[string]models.Site, len(existingSites))
+	existingSitesByName := make(map[string]models.SiteConfig, len(existingSites))
 	for _, s := range existingSites {
 		existingSitesByName[s.Name] = s
 	}
@@ -52,6 +54,7 @@ func Apply(s store.Store, f *File, opts ApplyOpts) ([]Change, error) {
 		alertMap[ea.Name] = ea.ID
 	}
 	nextPlaceholderID := -1
 	desiredAlertNames := make(map[string]bool, len(f.Alerts))
 	for _, a := range f.Alerts {
 		desiredAlertNames[a.Name] = true
@@ -59,18 +62,21 @@ func Apply(s store.Store, f *File, opts ApplyOpts) ([]Change, error) {
 		if !exists {
 			changes = append(changes, Change{Action: "create", Kind: "alert", Name: a.Name, Details: a.Type})
 			if !opts.DryRun {
-				id, err := s.AddAlertReturningID(a.Name, a.Type, a.Settings)
+				id, err := s.AddAlertReturningID(ctx, a.Name, a.Type, a.Settings)
 				if err != nil {
 					return changes, fmt.Errorf("create alert %q: %w", a.Name, err)
 				}
 				alertMap[a.Name] = id
 			} else {
 				alertMap[a.Name] = nextPlaceholderID
 				nextPlaceholderID--
 			}
 		} else {
 			alertMap[a.Name] = existing.ID
 			if diff := diffAlert(existing, a); diff != "" {
 				changes = append(changes, Change{Action: "update", Kind: "alert", Name: a.Name, Details: diff})
 				if !opts.DryRun {
-					if err := s.UpdateAlert(existing.ID, a.Name, a.Type, a.Settings); err != nil {
+					if err := s.UpdateAlert(ctx, existing.ID, a.Name, a.Type, a.Settings); err != nil {
 						return changes, fmt.Errorf("update alert %q: %w", a.Name, err)
 					}
 				}
@@ -102,11 +108,14 @@ func Apply(s store.Store, f *File, opts ApplyOpts) ([]Change, error) {
 		if !exists {
 			changes = append(changes, Change{Action: "create", Kind: "monitor", Name: g.Name, Details: "group"})
 			if !opts.DryRun {
-				id, err := s.AddSiteReturningID(site)
+				id, err := s.AddSiteReturningID(ctx, site)
 				if err != nil {
 					return changes, fmt.Errorf("create group %q: %w", g.Name, err)
 				}
 				groupMap[g.Name] = id
 			} else {
 				groupMap[g.Name] = nextPlaceholderID
 				nextPlaceholderID--
 			}
 		} else {
 			groupMap[g.Name] = existing.ID
@@ -114,7 +123,7 @@ func Apply(s store.Store, f *File, opts ApplyOpts) ([]Change, error) {
 			if diff := diffSite(normalizeSite(existing), site); diff != "" {
 				changes = append(changes, Change{Action: "update", Kind: "monitor", Name: g.Name, Details: diff})
 				if !opts.DryRun {
-					if err := s.UpdateSite(site); err != nil {
+					if err := s.UpdateSite(ctx, site); err != nil {
 						return changes, fmt.Errorf("update group %q: %w", g.Name, err)
 					}
 				}
@@ -125,7 +134,7 @@ func Apply(s store.Store, f *File, opts ApplyOpts) ([]Change, error) {
 	for _, g := range groups {
 		parentID := groupMap[g.Name]
 		for _, child := range g.Monitors {
-			c, err := applyMonitor(s, child, alertMap, existingSitesByName, parentID, opts.DryRun)
+			c, err := applyMonitor(ctx, s, child, alertMap, existingSitesByName, parentID, opts.DryRun)
 			if err != nil {
 				return changes, err
 			}
@@ -134,7 +143,7 @@ func Apply(s store.Store, f *File, opts ApplyOpts) ([]Change, error) {
 	}
 	for _, m := range topLevel {
-		c, err := applyMonitor(s, m, alertMap, existingSitesByName, 0, opts.DryRun)
+		c, err := applyMonitor(ctx, s, m, alertMap, existingSitesByName, 0, opts.DryRun)
 		if err != nil {
 			return changes, err
 		}
@@ -155,7 +164,7 @@ func Apply(s store.Store, f *File, opts ApplyOpts) ([]Change, error) {
 				childDeletes = append(childDeletes, c)
 			}
 			if !opts.DryRun {
-				if err := s.DeleteSite(es.ID); err != nil {
+				if err := s.DeleteSite(ctx, es.ID); err != nil {
 					return changes, fmt.Errorf("delete monitor %q: %w", es.Name, err)
 				}
 			}
@@ -169,7 +178,7 @@ func Apply(s store.Store, f *File, opts ApplyOpts) ([]Change, error) {
 			}
 			changes = append(changes, Change{Action: "delete", Kind: "alert", Name: ea.Name, Details: ea.Type})
 			if !opts.DryRun {
-				if err := s.DeleteAlert(ea.ID); err != nil {
+				if err := s.DeleteAlert(ctx, ea.ID); err != nil {
 					return changes, fmt.Errorf("delete alert %q: %w", ea.Name, err)
 				}
 			}
@@ -179,7 +188,7 @@ func Apply(s store.Store, f *File, opts ApplyOpts) ([]Change, error) {
 	return changes, nil
 }
-func applyMonitor(s store.Store, m Monitor, alertMap map[string]int, existing map[string]models.Site, parentID int, dryRun bool) ([]Change, error) {
+func applyMonitor(ctx context.Context, s store.Store, m Monitor, alertMap map[string]int, existing map[string]models.SiteConfig, parentID int, dryRun bool) ([]Change, error) {
 	alertID, err := resolveAlertID(alertMap, m.Alert)
 	if err != nil {
 		return nil, fmt.Errorf("monitor %q: %w", m.Name, err)
@@ -191,7 +200,7 @@ func applyMonitor(s store.Store, m Monitor, alertMap map[string]int, existing ma
 	if !exists {
 		changes = append(changes, Change{Action: "create", Kind: "monitor", Name: m.Name, Details: m.Type})
 		if !dryRun {
-			if _, err := s.AddSiteReturningID(site); err != nil {
+			if _, err := s.AddSiteReturningID(ctx, site); err != nil {
 				return changes, fmt.Errorf("create monitor %q: %w", m.Name, err)
 			}
 		}
@@ -200,7 +209,7 @@ func applyMonitor(s store.Store, m Monitor, alertMap map[string]int, existing ma
 		if diff := diffSite(normalizeSite(ex), site); diff != "" {
 			changes = append(changes, Change{Action: "update", Kind: "monitor", Name: m.Name, Details: diff})
 			if !dryRun {
-				if err := s.UpdateSite(site); err != nil {
+				if err := s.UpdateSite(ctx, site); err != nil {
 					return changes, fmt.Errorf("update monitor %q: %w", m.Name, err)
 				}
 			}
@@ -220,8 +229,8 @@ func resolveAlertID(alertMap map[string]int, name string) (int, error) {
 	return id, nil
 }
-func monitorToSite(m Monitor, alertID, parentID int) models.Site {
+func monitorToSite(m Monitor, alertID, parentID int) models.SiteConfig {
-	s := models.Site{
+	s := models.SiteConfig{
 		Name:     m.Name,
 		Type:     m.Type,
 		URL:      m.URL,
@@ -267,7 +276,7 @@ func collectMonitorNames(monitors []Monitor, names map[string]bool) {
 	}
 }
-func normalizeSite(s models.Site) models.Site {
+func normalizeSite(s models.SiteConfig) models.SiteConfig {
 	if s.Method == "" {
 		s.Method = "GET"
 	}
@@ -291,7 +300,7 @@ func diffAlert(existing models.AlertConfig, desired Alert) string {
 	return strings.Join(diffs, ", ")
 }
-func diffSite(existing, desired models.Site) string {
+func diffSite(existing, desired models.SiteConfig) string {
 	var diffs []string
 	if existing.URL != desired.URL {
 		diffs = append(diffs, fmt.Sprintf("url: %s -> %s", existing.URL, desired.URL))
@@ -1,10 +1,12 @@
 package config
 import (
-	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
+	"context"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/store"
 	"strings"
 	"testing"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/store"
 )
 func newTestStore(t *testing.T) store.Store {
@@ -13,7 +15,7 @@ func newTestStore(t *testing.T) store.Store {
 	if err != nil {
 		t.Fatalf("NewSQLiteStore: %v", err)
 	}
-	if err := s.Init(); err != nil {
+	if err := s.Init(context.Background()); err != nil {
 		t.Fatalf("Init: %v", err)
 	}
 	return s
@@ -31,7 +33,7 @@ func TestApplyCreateFromScratch(t *testing.T) {
 		},
 	}
-	changes, err := Apply(s, f, ApplyOpts{})
+	changes, err := Apply(context.Background(), s, f, ApplyOpts{})
 	if err != nil {
 		t.Fatalf("Apply: %v", err)
 	}
@@ -46,12 +48,12 @@ func TestApplyCreateFromScratch(t *testing.T) {
 		t.Fatalf("expected 3 creates, got %d", creates)
 	}
-	sites, _ := s.GetSites()
+	sites, _ := s.GetSites(context.Background())
 	if len(sites) != 2 {
 		t.Fatalf("expected 2 sites, got %d", len(sites))
 	}
-	alerts, _ := s.GetAllAlerts()
+	alerts, _ := s.GetAllAlerts(context.Background())
 	if len(alerts) != 1 {
 		t.Fatalf("expected 1 alert, got %d", len(alerts))
 	}
@@ -68,11 +70,11 @@ func TestApplyIdempotent(t *testing.T) {
 		},
 	}
-	if _, err := Apply(s, f, ApplyOpts{}); err != nil {
+	if _, err := Apply(context.Background(), s, f, ApplyOpts{}); err != nil {
 		t.Fatalf("first Apply: %v", err)
 	}
-	changes, err := Apply(s, f, ApplyOpts{})
+	changes, err := Apply(context.Background(), s, f, ApplyOpts{})
 	if err != nil {
 		t.Fatalf("second Apply: %v", err)
 	}
@@ -90,12 +92,12 @@ func TestApplyUpdate(t *testing.T) {
 		},
 	}
-	if _, err := Apply(s, f, ApplyOpts{}); err != nil {
+	if _, err := Apply(context.Background(), s, f, ApplyOpts{}); err != nil {
 		t.Fatalf("first Apply: %v", err)
 	}
 	f.Monitors[0].Interval = 60
-	changes, err := Apply(s, f, ApplyOpts{})
+	changes, err := Apply(context.Background(), s, f, ApplyOpts{})
 	if err != nil {
 		t.Fatalf("second Apply: %v", err)
 	}
@@ -104,7 +106,7 @@ func TestApplyUpdate(t *testing.T) {
 		t.Fatalf("expected 1 update, got %+v", changes)
 	}
-	sites, _ := s.GetSites()
+	sites, _ := s.GetSites(context.Background())
 	if sites[0].Interval != 60 {
 		t.Fatalf("expected interval 60, got %d", sites[0].Interval)
 	}
@@ -112,8 +114,8 @@ func TestApplyUpdate(t *testing.T) {
 func TestApplyPrune(t *testing.T) {
 	s := newTestStore(t)
-	s.AddSite(models.Site{Name: "Keep", URL: "https://keep.com", Type: "http", Interval: 30, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
+	s.AddSite(context.Background(), models.SiteConfig{Name: "Keep", URL: "https://keep.com", Type: "http", Interval: 30, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
-	s.AddSite(models.Site{Name: "Remove", URL: "https://remove.com", Type: "http", Interval: 30, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
+	s.AddSite(context.Background(), models.SiteConfig{Name: "Remove", URL: "https://remove.com", Type: "http", Interval: 30, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
 	f := &File{
 		Monitors: []Monitor{
@@ -121,7 +123,7 @@ func TestApplyPrune(t *testing.T) {
 		},
 	}
-	changes, err := Apply(s, f, ApplyOpts{Prune: true})
+	changes, err := Apply(context.Background(), s, f, ApplyOpts{Prune: true})
 	if err != nil {
 		t.Fatalf("Apply: %v", err)
 	}
@@ -136,7 +138,7 @@ func TestApplyPrune(t *testing.T) {
 		t.Fatalf("expected 1 delete, got %d", deleteCount)
 	}
-	sites, _ := s.GetSites()
+	sites, _ := s.GetSites(context.Background())
 	if len(sites) != 1 || sites[0].Name != "Keep" {
 		t.Fatalf("expected only 'Keep', got %+v", sites)
 	}
@@ -150,7 +152,7 @@ func TestApplyDryRun(t *testing.T) {
 		},
 	}
-	changes, err := Apply(s, f, ApplyOpts{DryRun: true})
+	changes, err := Apply(context.Background(), s, f, ApplyOpts{DryRun: true})
 	if err != nil {
 		t.Fatalf("Apply: %v", err)
 	}
@@ -159,7 +161,7 @@ func TestApplyDryRun(t *testing.T) {
 		t.Fatalf("expected 1 create in dry-run, got %+v", changes)
 	}
-	sites, _ := s.GetSites()
+	sites, _ := s.GetSites(context.Background())
 	if len(sites) != 0 {
 		t.Fatalf("expected 0 sites after dry-run, got %d", len(sites))
 	}
@@ -179,7 +181,7 @@ func TestApplyGroupHierarchy(t *testing.T) {
 		},
 	}
-	changes, err := Apply(s, f, ApplyOpts{})
+	changes, err := Apply(context.Background(), s, f, ApplyOpts{})
 	if err != nil {
 		t.Fatalf("Apply: %v", err)
 	}
@@ -188,8 +190,8 @@ func TestApplyGroupHierarchy(t *testing.T) {
 		t.Fatalf("expected 3 creates, got %d", len(changes))
 	}
-	sites, _ := s.GetSites()
+	sites, _ := s.GetSites(context.Background())
-	var group models.Site
+	var group models.SiteConfig
 	for _, s := range sites {
 		if s.Type == "group" {
 			group = s
@@ -223,12 +225,12 @@ func TestApplyAlertReference(t *testing.T) {
 		},
 	}
-	if _, err := Apply(s, f, ApplyOpts{}); err != nil {
+	if _, err := Apply(context.Background(), s, f, ApplyOpts{}); err != nil {
 		t.Fatalf("Apply: %v", err)
 	}
-	sites, _ := s.GetSites()
+	sites, _ := s.GetSites(context.Background())
-	alerts, _ := s.GetAllAlerts()
+	alerts, _ := s.GetAllAlerts(context.Background())
 	if sites[0].AlertID != alerts[0].ID {
 		t.Fatalf("expected alert_id %d, got %d", alerts[0].ID, sites[0].AlertID)
@@ -243,7 +245,7 @@ func TestApplyInvalidAlertRef(t *testing.T) {
 		},
 	}
-	_, err := Apply(s, f, ApplyOpts{})
+	_, err := Apply(context.Background(), s, f, ApplyOpts{})
 	if err == nil || !strings.Contains(err.Error(), "not found") {
 		t.Fatalf("expected alert not found error, got %v", err)
 	}
@@ -258,15 +260,83 @@ func TestApplyDuplicateNames(t *testing.T) {
 		},
 	}
-	_, err := Apply(s, f, ApplyOpts{})
+	_, err := Apply(context.Background(), s, f, ApplyOpts{})
 	if err == nil || !strings.Contains(err.Error(), "duplicate") {
 		t.Fatalf("expected duplicate error, got %v", err)
 	}
 }
 // TestApplyDryRunNewAlertAndMonitor verifies that a dry-run Apply of a file
 // declaring a new alert plus a monitor referencing that alert succeeds,
 // reports two "create" changes, and leaves no sites or alerts in the store.
 func TestApplyDryRunNewAlertAndMonitor(t *testing.T) {
 	ctx := context.Background()
 	s := newTestStore(t)
 	f := &File{
 		Alerts: []Alert{
 			{Name: "Discord", Type: "discord", Settings: map[string]string{"url": "https://example.com"}},
 		},
 		Monitors: []Monitor{
 			{Name: "Web", Type: "http", URL: "https://example.com", Interval: 30, Alert: "Discord"},
 		},
 	}
 	changes, err := Apply(ctx, s, f, ApplyOpts{DryRun: true})
 	if err != nil {
 		t.Fatalf("dry-run with new alert+monitor should not error: %v", err)
 	}
 	creates := 0
 	for _, c := range changes {
 		if c.Action == "create" {
 			creates++
 		}
 	}
 	if creates != 2 {
 		t.Fatalf("expected 2 creates (alert+monitor), got %d: %+v", creates, changes)
 	}
 	// Check the read errors explicitly: if a read fails, the returned slice
 	// cannot be trusted, and a nil slice has length 0, which would let the
 	// "nothing persisted" assertions below pass without proving anything.
 	sites, err := s.GetSites(ctx)
 	if err != nil {
 		t.Fatalf("GetSites: %v", err)
 	}
 	alerts, err := s.GetAllAlerts(ctx)
 	if err != nil {
 		t.Fatalf("GetAllAlerts: %v", err)
 	}
 	if len(sites) != 0 {
 		t.Fatalf("dry-run should not persist sites, got %d", len(sites))
 	}
 	if len(alerts) != 0 {
 		t.Fatalf("dry-run should not persist alerts, got %d", len(alerts))
 	}
 }
 // TestApplyDryRunNewGroupWithChildren checks that a dry-run Apply of a new
 // alert, a new group referencing it, and one child monitor inside the group
 // returns no error and reports exactly three "create" changes.
 func TestApplyDryRunNewGroupWithChildren(t *testing.T) {
 	st := newTestStore(t)
 	child := Monitor{Name: "API", Type: "http", URL: "https://api.example.com", Interval: 15, Alert: "Slack"}
 	group := Monitor{Name: "Prod", Type: "group", Alert: "Slack", Monitors: []Monitor{child}}
 	slack := Alert{Name: "Slack", Type: "slack", Settings: map[string]string{"url": "https://hooks.example.com"}}
 	desired := &File{
 		Alerts:   []Alert{slack},
 		Monitors: []Monitor{group},
 	}
 	changes, err := Apply(context.Background(), st, desired, ApplyOpts{DryRun: true})
 	if err != nil {
 		t.Fatalf("dry-run with new group+alert should not error: %v", err)
 	}
 	// Tally only the create actions; other action kinds are ignored here.
 	var creates int
 	for i := range changes {
 		if changes[i].Action == "create" {
 			creates++
 		}
 	}
 	if creates != 3 {
 		t.Fatalf("expected 3 creates (alert+group+child), got %d: %+v", creates, changes)
 	}
 }
 func TestApplyExistingAlertReference(t *testing.T) {
 	s := newTestStore(t)
-	s.AddAlert("Existing", "webhook", map[string]string{"url": "https://example.com"})
+	s.AddAlert(context.Background(), "Existing", "webhook", map[string]string{"url": "https://example.com"})
 	f := &File{
 		Monitors: []Monitor{
@@ -274,7 +344,7 @@ func TestApplyExistingAlertReference(t *testing.T) {
 		},
 	}
-	changes, err := Apply(s, f, ApplyOpts{})
+	changes, err := Apply(context.Background(), s, f, ApplyOpts{})
 	if err != nil {
 		t.Fatalf("Apply: %v", err)
 	}
@@ -283,7 +353,7 @@ func TestApplyExistingAlertReference(t *testing.T) {
 		t.Fatalf("expected 1 create, got %+v", changes)
 	}
-	sites, _ := s.GetSites()
+	sites, _ := s.GetSites(context.Background())
 	if sites[0].AlertID == 0 {
 		t.Fatal("expected non-zero alert_id for existing alert reference")
 	}
@@ -1,6 +1,7 @@
 package config
 import (
 	"context"
 	"fmt"
 	"os"
 	"sort"
@@ -11,13 +12,13 @@ import (
 	"gopkg.in/yaml.v3"
 )
-func Export(s store.Store) (*File, error) {
+func Export(ctx context.Context, s store.Store) (*File, error) {
-	dbAlerts, err := s.GetAllAlerts()
+	dbAlerts, err := s.GetAllAlerts(ctx)
 	if err != nil {
 		return nil, fmt.Errorf("load alerts: %w", err)
 	}
-	dbSites, err := s.GetSites()
+	dbSites, err := s.GetSites(ctx)
 	if err != nil {
 		return nil, fmt.Errorf("load sites: %w", err)
 	}
@@ -33,9 +34,9 @@ func Export(s store.Store) (*File, error) {
 		})
 	}
-	groups := make(map[int]models.Site)
+	groups := make(map[int]models.SiteConfig)
-	children := make(map[int][]models.Site)
+	children := make(map[int][]models.SiteConfig)
-	var topLevel []models.Site
+	var topLevel []models.SiteConfig
 	for _, s := range dbSites {
 		switch {
@@ -75,7 +76,7 @@ func Export(s store.Store) (*File, error) {
 	return &File{Alerts: yamlAlerts, Monitors: yamlMonitors}, nil
 }
-func siteToMonitor(s models.Site, alertIDToName map[int]string) Monitor {
+func siteToMonitor(s models.SiteConfig, alertIDToName map[int]string) Monitor {
 	m := Monitor{
 		Name:     s.Name,
 		Type:     s.Type,
@@ -1,13 +1,15 @@
 package config
 import (
-	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
+	"context"
 	"testing"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 )
 func TestExportEmpty(t *testing.T) {
 	s := newTestStore(t)
-	f, err := Export(s)
+	f, err := Export(context.Background(), s)
 	if err != nil {
 		t.Fatalf("Export: %v", err)
 	}
@@ -18,11 +20,11 @@ func TestExportEmpty(t *testing.T) {
 func TestExportAlertNames(t *testing.T) {
 	s := newTestStore(t)
-	s.AddAlert("Discord", "discord", map[string]string{"url": "https://example.com"})
+	s.AddAlert(context.Background(), "Discord", "discord", map[string]string{"url": "https://example.com"})
-	alerts, _ := s.GetAllAlerts()
+	alerts, _ := s.GetAllAlerts(context.Background())
-	s.AddSite(models.Site{Name: "Web", URL: "https://example.com", Type: "http", Interval: 30, AlertID: alerts[0].ID, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
+	s.AddSite(context.Background(), models.SiteConfig{Name: "Web", URL: "https://example.com", Type: "http", Interval: 30, AlertID: alerts[0].ID, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
-	f, err := Export(s)
+	f, err := Export(context.Background(), s)
 	if err != nil {
 		t.Fatalf("Export: %v", err)
 	}
@@ -37,11 +39,11 @@ func TestExportAlertNames(t *testing.T) {
 func TestExportGroupHierarchy(t *testing.T) {
 	s := newTestStore(t)
-	groupID, _ := s.AddSiteReturningID(models.Site{Name: "Prod", Type: "group", ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
+	groupID, _ := s.AddSiteReturningID(context.Background(), models.SiteConfig{Name: "Prod", Type: "group", ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
-	s.AddSite(models.Site{Name: "Prod Web", URL: "https://prod.example.com", Type: "http", Interval: 15, ParentID: groupID, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
+	s.AddSite(context.Background(), models.SiteConfig{Name: "Prod Web", URL: "https://prod.example.com", Type: "http", Interval: 15, ParentID: groupID, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
-	s.AddSite(models.Site{Name: "Top Level", URL: "https://example.com", Type: "http", Interval: 30, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
+	s.AddSite(context.Background(), models.SiteConfig{Name: "Top Level", URL: "https://example.com", Type: "http", Interval: 30, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
-	f, err := Export(s)
+	f, err := Export(context.Background(), s)
 	if err != nil {
 		t.Fatalf("Export: %v", err)
 	}
@@ -70,12 +72,12 @@ func TestExportGroupHierarchy(t *testing.T) {
 func TestExportOmitsDefaults(t *testing.T) {
 	s := newTestStore(t)
-	s.AddSite(models.Site{
+	s.AddSite(context.Background(), models.SiteConfig{
 		Name: "Web", URL: "https://example.com", Type: "http", Interval: 30,
 		Method: "GET", AcceptedCodes: "200-299", ExpiryThreshold: 7,
 	})
-	f, err := Export(s)
+	f, err := Export(context.Background(), s)
 	if err != nil {
 		t.Fatalf("Export: %v", err)
 	}
@@ -94,18 +96,18 @@ func TestExportOmitsDefaults(t *testing.T) {
 func TestExportRoundTrip(t *testing.T) {
 	s1 := newTestStore(t)
-	s1.AddAlert("Discord", "discord", map[string]string{"url": "https://example.com"})
+	s1.AddAlert(context.Background(), "Discord", "discord", map[string]string{"url": "https://example.com"})
-	alerts, _ := s1.GetAllAlerts()
+	alerts, _ := s1.GetAllAlerts(context.Background())
-	s1.AddSite(models.Site{Name: "Web", URL: "https://example.com", Type: "http", Interval: 30, AlertID: alerts[0].ID, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
+	s1.AddSite(context.Background(), models.SiteConfig{Name: "Web", URL: "https://example.com", Type: "http", Interval: 30, AlertID: alerts[0].ID, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
-	s1.AddSite(models.Site{Name: "Ping", Type: "ping", Hostname: "10.0.0.1", Interval: 60, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
+	s1.AddSite(context.Background(), models.SiteConfig{Name: "Ping", Type: "ping", Hostname: "10.0.0.1", Interval: 60, ExpiryThreshold: 7, Method: "GET", AcceptedCodes: "200-299"})
-	exported, err := Export(s1)
+	exported, err := Export(context.Background(), s1)
 	if err != nil {
 		t.Fatalf("Export: %v", err)
 	}
 	s2 := newTestStore(t)
-	changes, err := Apply(s2, exported, ApplyOpts{})
+	changes, err := Apply(context.Background(), s2, exported, ApplyOpts{})
 	if err != nil {
 		t.Fatalf("Apply: %v", err)
 	}
@@ -120,7 +122,7 @@ func TestExportRoundTrip(t *testing.T) {
 		t.Fatalf("expected 3 creates, got %d", creates)
 	}
-	reexported, err := Export(s2)
+	reexported, err := Export(context.Background(), s2)
 	if err != nil {
 		t.Fatalf("re-Export: %v", err)
 	}
@@ -1,11 +1,14 @@
 package importer
 import (
 	"crypto/rand"
 	"encoding/hex"
 	"encoding/json"
 	"fmt"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"os"
 	"strings"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 )
 type KumaBackup struct {
@@ -80,7 +83,7 @@ func ConvertKuma(kb *KumaBackup) models.Backup {
 		}
 	}
-	var sites []models.Site
+	var sites []models.SiteConfig
 	for _, m := range kb.MonitorList {
 		site := convertKumaMonitor(m, kumaToUpkeepAlert)
 		sites = append(sites, site)
@@ -132,8 +135,8 @@ func convertKumaNotifications(entries []KumaNotifEntry) map[int]models.AlertConf
 	return result
 }
-func convertKumaMonitor(m KumaMonitor, alertMap map[int]int) models.Site {
+func convertKumaMonitor(m KumaMonitor, alertMap map[int]int) models.SiteConfig {
-	site := models.Site{
+	site := models.SiteConfig{
 		ID:          m.ID,
 		Name:        m.Name,
 		Description: m.Description,
@@ -155,10 +158,18 @@ func convertKumaMonitor(m KumaMonitor, alertMap map[int]int) models.Site {
 	site.DNSResolveType = m.DNSResolveType
 	site.DNSServer = m.DNSResolveServer
 	site.Paused = !m.Active
 	switch m.Type {
 	case "http":
 		site.URL = m.URL
 		site.CheckSSL = m.ExpiryNotif
 	case "push":
 		site.Type = "push"
 		b := make([]byte, 16)
 		if _, err := rand.Read(b); err == nil {
 			site.Token = hex.EncodeToString(b)
 		}
 	case "ping":
 		if m.Hostname != "" {
 			site.Hostname = m.Hostname
@@ -0,0 +1,210 @@
 package importer
 import (
 	"os"
 	"path/filepath"
 	"strings"
 	"testing"
 )
 // writeTemp writes content to a file named "backup.json" inside a fresh
 // per-test temporary directory (mode 0o600) and returns the file's path.
 // It fails the test immediately if the write does not succeed.
 func writeTemp(t *testing.T, content string) string {
 	t.Helper()
 	dir := t.TempDir()
 	target := filepath.Join(dir, "backup.json")
 	err := os.WriteFile(target, []byte(content), 0o600)
 	if err != nil {
 		t.Fatal(err)
 	}
 	return target
 }
 // TestLoadKumaFileMissingFile asserts that LoadKumaFile returns an error
 // when pointed at a path that does not exist.
 func TestLoadKumaFileMissingFile(t *testing.T) {
 	missing := filepath.Join(t.TempDir(), "nope.json")
 	if _, err := LoadKumaFile(missing); err == nil {
 		t.Fatal("expected error for missing file")
 	}
 }
 func TestLoadKumaFileMalformedInput(t *testing.T) {
 	cases := []struct {
 		name string
 		body string
 	}{
 		{"empty file", ""},
 		{"truncated JSON", `{"version": "1.23", "monitorList": [`},
 		{"not JSON", "definitely not json"},
 		{"wrong root type", `[1, 2, 3]`},
 		{"monitorList wrong type", `{"monitorList": {"a": 1}}`},
 		{"monitor field wrong type", `{"monitorList": [{"id": "not-an-int"}]}`},
 		{"notificationList wrong type", `{"notificationList": "oops"}`},
 	}
 	for _, tc := range cases {
 		t.Run(tc.name, func(t *testing.T) {
 			_, err := LoadKumaFile(writeTemp(t, tc.body))
 			if err == nil {
 				t.Fatalf("expected parse error for %s", tc.name)
 			}
 			if !strings.Contains(err.Error(), "parse JSON") {
 				t.Fatalf("expected wrapped parse error, got: %v", err)
 			}
 		})
 	}
 }
 func TestLoadKumaFileNullLists(t *testing.T) {
 	kb, err := LoadKumaFile(writeTemp(t, `{"version": "1.23", "monitorList": null, "notificationList": null}`))
 	if err != nil {
 		t.Fatal(err)
 	}
 	backup := ConvertKuma(kb)
 	if len(backup.Sites) != 0 || len(backup.Alerts) != 0 {
 		t.Fatalf("expected empty backup, got %d sites %d alerts", len(backup.Sites), len(backup.Alerts))
 	}
 }
 func TestConvertKumaSkipsMalformedNotificationConfig(t *testing.T) {
 	kb := &KumaBackup{
 		NotificationList: []KumaNotifEntry{
 			{ID: 1, Name: "broken", Config: "{not json"},
 			{ID: 2, Name: "good", Config: `{"type": "discord", "ntfyserverurl": "https://example.com/hook"}`},
 		},
 		MonitorList: []KumaMonitor{
 			{ID: 10, Name: "site", Type: "http", URL: "https://example.com", NotificationIDs: map[string]bool{"1": true}},
 		},
 	}
 	backup := ConvertKuma(kb)
 	if len(backup.Alerts) != 1 {
 		t.Fatalf("expected broken notification skipped, got %d alerts", len(backup.Alerts))
 	}
 	if backup.Alerts[0].Type != "discord" {
 		t.Fatalf("expected discord alert, got %q", backup.Alerts[0].Type)
 	}
 	if backup.Sites[0].AlertID != 0 {
 		t.Fatalf("site referencing skipped notification should keep AlertID 0, got %d", backup.Sites[0].AlertID)
 	}
 }
 func TestConvertKumaNtfyNotification(t *testing.T) {
 	kb := &KumaBackup{
 		NotificationList: []KumaNotifEntry{
 			{ID: 3, Name: "ntfy", Config: `{
 				"type": "ntfy",
 				"ntfyserverurl": "https://ntfy.example.com/",
 				"ntfytopic": "uptime",
 				"ntfyPriority": 4,
 				"ntfyAuthenticationMethod": "usernamePassword",
 				"ntfyusername": "u",
 				"ntfypassword": "p"
 			}`},
 		},
 	}
 	backup := ConvertKuma(kb)
 	if len(backup.Alerts) != 1 {
 		t.Fatalf("expected 1 alert, got %d", len(backup.Alerts))
 	}
 	a := backup.Alerts[0]
 	if a.Type != "ntfy" {
 		t.Fatalf("expected ntfy, got %q", a.Type)
 	}
 	if a.Settings["url"] != "https://ntfy.example.com" {
 		t.Fatalf("expected trailing slash trimmed, got %q", a.Settings["url"])
 	}
 	if a.Settings["topic"] != "uptime" || a.Settings["priority"] != "4" {
 		t.Fatalf("unexpected settings: %v", a.Settings)
 	}
 	if a.Settings["username"] != "u" || a.Settings["password"] != "p" {
 		t.Fatalf("expected credentials mapped, got %v", a.Settings)
 	}
 }
 func TestConvertKumaUnknownNotificationFallsBackToWebhook(t *testing.T) {
 	kb := &KumaBackup{
 		NotificationList: []KumaNotifEntry{
 			{ID: 4, Name: "matrix", Config: `{"type": "matrix", "ntfyserverurl": "https://example.com/hook"}`},
 		},
 	}
 	backup := ConvertKuma(kb)
 	if len(backup.Alerts) != 1 || backup.Alerts[0].Type != "webhook" {
 		t.Fatalf("expected webhook fallback, got %+v", backup.Alerts)
 	}
 }
 func TestConvertKumaHTTPMonitor(t *testing.T) {
 	kb := &KumaBackup{
 		NotificationList: []KumaNotifEntry{
 			{ID: 1, Name: "hook", Config: `{"type": "slack", "ntfyserverurl": "https://example.com/hook"}`},
 		},
 		MonitorList: []KumaMonitor{{
 			ID:              7,
 			Name:            "web",
 			Type:            "http",
 			URL:             "https://example.com",
 			Interval:        60,
 			Timeout:         30,
 			MaxRetries:      2,
 			Method:          "GET",
 			AcceptedCodes:   []string{"200", "301"},
 			IgnoreTLS:       true,
 			ExpiryNotif:     true,
 			Active:          false,
 			NotificationIDs: map[string]bool{"1": true},
 		}},
 	}
 	backup := ConvertKuma(kb)
 	if len(backup.Sites) != 1 {
 		t.Fatalf("expected 1 site, got %d", len(backup.Sites))
 	}
 	s := backup.Sites[0]
 	if s.URL != "https://example.com" || !s.CheckSSL || !s.IgnoreTLS {
 		t.Fatalf("http fields not mapped: %+v", s)
 	}
 	if !s.Paused {
 		t.Fatal("inactive monitor should import paused")
 	}
 	if s.AcceptedCodes != "200,301" {
 		t.Fatalf("expected joined accepted codes, got %q", s.AcceptedCodes)
 	}
 	if s.AlertID != 1 {
 		t.Fatalf("expected alert mapped, got %d", s.AlertID)
 	}
 }
 func TestConvertKumaPushMonitorGetsToken(t *testing.T) {
 	kb := &KumaBackup{
 		MonitorList: []KumaMonitor{{ID: 1, Name: "push", Type: "push", Active: true}},
 	}
 	backup := ConvertKuma(kb)
 	token := backup.Sites[0].Token
 	if len(token) != 32 {
 		t.Fatalf("expected 32-char hex token, got %q", token)
 	}
 }
 func TestConvertKumaNonNumericNotificationID(t *testing.T) {
 	kb := &KumaBackup{
 		MonitorList: []KumaMonitor{{
 			ID:              1,
 			Name:            "site",
 			Type:            "http",
 			NotificationIDs: map[string]bool{"abc": true},
 		}},
 	}
 	backup := ConvertKuma(kb)
 	if backup.Sites[0].AlertID != 0 {
 		t.Fatalf("non-numeric notification ID should not map, got %d", backup.Sites[0].AlertID)
 	}
 }
 func TestConvertKumaGroupAndChildren(t *testing.T) {
 	kb := &KumaBackup{
 		MonitorList: []KumaMonitor{
 			{ID: 1, Name: "grp", Type: "group", Active: true},
 			{ID: 2, Name: "ping", Type: "ping", Hostname: "10.0.0.1", Parent: 1, Active: true},
 		},
 	}
 	backup := ConvertKuma(kb)
 	if backup.Sites[0].Type != "group" {
 		t.Fatalf("expected group type, got %q", backup.Sites[0].Type)
 	}
 	if backup.Sites[1].ParentID != 1 || backup.Sites[1].Hostname != "10.0.0.1" {
 		t.Fatalf("child not mapped: %+v", backup.Sites[1])
 	}
 }
@@ -2,11 +2,12 @@ package metrics
 import (
 	"fmt"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/monitor"
 	"net/http"
 	"sort"
 	"strings"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/monitor"
 )
 func Handler(eng *monitor.Engine) http.HandlerFunc {
@@ -19,7 +20,7 @@ func Handler(eng *monitor.Engine) http.HandlerFunc {
 		writeHelp(&b, "uptop_monitor_up", "gauge", "Whether the monitor is up (1) or down (0).")
 		for _, s := range sites {
 			val := 0
-			if s.Status == "UP" {
+			if s.Status == models.StatusUp {
 				val = 1
 			}
 			writeGauge(&b, "uptop_monitor_up", labels(s), float64(val))
@@ -10,79 +10,21 @@ import (
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/monitor"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/store/storetest"
 )
 type mockStore struct {
-	sites []models.Site
+	storetest.BaseMock
 	sites []models.SiteConfig
 }
-func (m *mockStore) Init() error                                              { return nil }
+func (m *mockStore) GetSites(_ context.Context) ([]models.SiteConfig, error) {
-func (m *mockStore) GetSites() ([]models.Site, error)                         { return m.sites, nil }
+	return m.sites, nil
 func (m *mockStore) AddSite(models.Site) error                                { return nil }
 func (m *mockStore) UpdateSite(models.Site) error                             { return nil }
 func (m *mockStore) UpdateSitePaused(int, bool) error                         { return nil }
 func (m *mockStore) DeleteSite(int) error                                     { return nil }
 func (m *mockStore) GetAllAlerts() ([]models.AlertConfig, error)              { return nil, nil }
 func (m *mockStore) GetAlert(int) (models.AlertConfig, error)                 { return models.AlertConfig{}, nil }
 func (m *mockStore) AddAlert(string, string, map[string]string) error         { return nil }
 func (m *mockStore) UpdateAlert(int, string, string, map[string]string) error { return nil }
 func (m *mockStore) DeleteAlert(int) error                                    { return nil }
 func (m *mockStore) GetAllUsers() ([]models.User, error)                      { return nil, nil }
 func (m *mockStore) AddUser(string, string, string) error                     { return nil }
 func (m *mockStore) UpdateUser(int, string, string, string) error             { return nil }
 func (m *mockStore) DeleteUser(int) error                                     { return nil }
 func (m *mockStore) SaveCheck(int, int64, bool) error                         { return nil }
 func (m *mockStore) LoadAllHistory(int) (map[int][]models.CheckRecord, error) {
 	return nil, nil
 }
 func (m *mockStore) ExportData() (models.Backup, error)        { return models.Backup{}, nil }
 func (m *mockStore) ImportData(models.Backup) error            { return nil }
 func (m *mockStore) GetSiteByName(string) (models.Site, error) { return models.Site{}, nil }
 func (m *mockStore) GetAlertByName(string) (models.AlertConfig, error) {
 	return models.AlertConfig{}, nil
 }
 func (m *mockStore) AddSiteReturningID(models.Site) (int, error) { return 0, nil }
 func (m *mockStore) AddAlertReturningID(string, string, map[string]string) (int, error) {
 	return 0, nil
 }
 func (m *mockStore) SaveCheckFromNode(int, string, int64, bool) error { return nil }
 func (m *mockStore) RegisterNode(models.ProbeNode) error              { return nil }
 func (m *mockStore) GetNode(string) (models.ProbeNode, error)         { return models.ProbeNode{}, nil }
 func (m *mockStore) GetAllNodes() ([]models.ProbeNode, error)         { return nil, nil }
 func (m *mockStore) UpdateNodeLastSeen(string) error                  { return nil }
 func (m *mockStore) DeleteNode(string) error                          { return nil }
 func (m *mockStore) LoadAlertHealth() (map[int]models.AlertHealthRecord, error) {
 	return nil, nil
 }
 func (m *mockStore) SaveAlertHealth(models.AlertHealthRecord) error { return nil }
 func (m *mockStore) SaveLog(string) error                           { return nil }
 func (m *mockStore) PruneLogs() error                               { return nil }
 func (m *mockStore) PruneCheckHistory() error                       { return nil }
 func (m *mockStore) PruneStateChanges() error                       { return nil }
 func (m *mockStore) LoadLogs(int) ([]string, error)                 { return nil, nil }
 func (m *mockStore) GetActiveMaintenanceWindows() ([]models.MaintenanceWindow, error) {
 	return nil, nil
 }
 func (m *mockStore) GetAllMaintenanceWindows(int) ([]models.MaintenanceWindow, error) {
 	return nil, nil
 }
 func (m *mockStore) AddMaintenanceWindow(models.MaintenanceWindow) error         { return nil }
 func (m *mockStore) EndMaintenanceWindow(int) error                              { return nil }
 func (m *mockStore) DeleteMaintenanceWindow(int) error                           { return nil }
 func (m *mockStore) PruneExpiredMaintenanceWindows(time.Duration) (int64, error) { return 0, nil }
 func (m *mockStore) IsMonitorInMaintenance(int) (bool, error)                    { return false, nil }
 func (m *mockStore) GetPreference(string) (string, error)                        { return "", nil }
 func (m *mockStore) SetPreference(string, string) error                          { return nil }
 func (m *mockStore) SaveStateChange(int, string, string, string) error           { return nil }
 func (m *mockStore) GetStateChanges(int, int) ([]models.StateChange, error)      { return nil, nil }
 func (m *mockStore) GetStateChangesSince(int, time.Time) ([]models.StateChange, error) {
 	return nil, nil
 }
 func (m *mockStore) Close() error { return nil }
 func TestMetricsHandler(t *testing.T) {
 	ms := &mockStore{
-		sites: []models.Site{
+		sites: []models.SiteConfig{
 			{ID: 1, Name: "Example", URL: "https://example.com", Type: "http", Interval: 30},
 			{ID: 2, Name: "DNS Check", Type: "dns", Interval: 60},
 		},
@@ -2,7 +2,7 @@ package models
 import "time"
-type Site struct {
+type SiteConfig struct {
 	ID              int
 	Name            string
 	URL             string
@@ -26,9 +26,11 @@ type Site struct {
 	IgnoreTLS      bool
 	Paused         bool
 	Regions        string
 }
 type SiteState struct {
 	FailureCount    int
-	Status          string
+	Status          Status
 	StatusCode      int
 	Latency         time.Duration
 	CertExpiry      time.Time
@@ -40,6 +42,11 @@ type Site struct {
 	LastSuccessAt   time.Time
 }
 // Site is the combined view of a monitor: it embeds both SiteConfig and
 // SiteState, so the fields of each are promoted onto Site.
 type Site struct {
 	SiteConfig
 	SiteState
 }
 type StateChange struct {
 	ID          int
 	SiteID      int
@@ -103,7 +110,7 @@ type MaintenanceWindow struct {
 }
 type Backup struct {
-	Sites              []Site              `json:"sites"`
+	Sites              []SiteConfig        `json:"sites"`
 	Alerts             []AlertConfig       `json:"alerts"`
 	Users              []User              `json:"users"`
 	MaintenanceWindows []MaintenanceWindow `json:"maintenance_windows,omitempty"`
@@ -0,0 +1,36 @@
 package models
 // safeAlertSettingKeys is the per-provider allowlist of alert setting keys
 // that are not secret and may be shown or exported in the clear. Any key not
 // listed here is redacted. Providers with no entry (discord, slack, webhook,
 // pushover) keep their secret in a field a denylist would miss (the webhook
 // URL, the pushover token/user), so every one of their settings is redacted.
 var safeAlertSettingKeys = map[string]map[string]bool{
 	"email": {
 		"host": true,
 		"port": true,
 		"to":   true,
 		"from": true,
 	},
 	"ntfy": {
 		"topic":    true,
 		"priority": true,
 	},
 	"telegram":  {"chat_id": true},
 	"pagerduty": {"severity": true},
 	"gotify":    {"priority": true},
 	"opsgenie": {
 		"priority": true,
 		"eu":       true,
 	},
 }
 // RedactAlertSettings returns a new map with the same keys as settings.
 // Empty values and values under keys allowlisted for alertType are copied
 // unchanged; every other value becomes "***REDACTED***". Because this is an
 // allowlist, unknown alert types and newly added keys are redacted by
 // default rather than leaked. The input map is not modified. The policy is
 // shared by the backup export path and the TUI alert detail panel.
 func RedactAlertSettings(alertType string, settings map[string]string) map[string]string {
 	allowed := safeAlertSettingKeys[alertType]
 	out := make(map[string]string, len(settings))
 	for key, value := range settings {
 		// Indexing a nil allowlist yields false, so unknown types redact everything.
 		if value == "" || allowed[key] {
 			out[key] = value
 			continue
 		}
 		out[key] = "***REDACTED***"
 	}
 	return out
 }
@@ -0,0 +1,18 @@
 package models
 // Status is a string-typed state label for a monitor.
 type Status string
 // The status values defined by this package; each constant's string form is
 // the literal on its right-hand side.
 const (
 	StatusUp      Status = "UP"
 	StatusDown    Status = "DOWN"
 	StatusPending Status = "PENDING"
 	StatusLate    Status = "LATE"
 	StatusStale   Status = "STALE"
 	StatusSSLExp  Status = "SSL EXP"
 )
 // IsBroken reports whether s is StatusDown or StatusSSLExp.
 func (s Status) IsBroken() bool {
 	switch s {
 	case StatusDown, StatusSSLExp:
 		return true
 	default:
 		return false
 	}
 }
 // String returns the underlying string value of s.
 func (s Status) String() string {
 	return string(s)
 }
@@ -3,6 +3,7 @@ package monitor
 import (
 	"context"
 	"fmt"
 	"io"
 	"net"
 	"net/http"
 	"strconv"
@@ -35,52 +36,57 @@ type CheckResult struct {
 	ErrorReason string
 }
 // RunCheck executes one check for site and reports the outcome as a CheckResult.
 //
 // For every type except "http" and "dns", and only when allowPrivate is false,
 // the target (site.Hostname, falling back to site.URL) is resolved here once:
 // a lookup error or any private address yields a DOWN result, otherwise the
 // first resolved address is pinned and handed to the ping/port check. The
 // check itself is selected by site.Type; an unrecognized type yields DOWN
 // with "unsupported monitor type".
 //
 // NOTE(review): the pre-check uses net.LookupIP, which does not take ctx, and
 // ips[0] relies on the lookup never returning an empty slice with a nil error
 // — confirm both are acceptable.
-func RunCheck(site models.Site, strict, insecure *http.Client, globalInsecure bool, allowPrivate ...bool) CheckResult {
+func RunCheck(ctx context.Context, site models.SiteConfig, strict, insecure *http.Client, globalInsecure, allowPrivate bool) CheckResult {
-	private := len(allowPrivate) > 0 && allowPrivate[0]
+	// Resolve + validate once for non-HTTP types to prevent DNS-rebind TOCTOU:
-
+	// a second resolve in the check function could return a different (private) IP.
-	if site.Type != "http" && site.Type != "dns" && !private {
+	// HTTP is safe — SafeDialContext resolves and validates at dial time.
 	var pinnedIP net.IP
 	if site.Type != "http" && site.Type != "dns" && !allowPrivate {
 		host := site.Hostname
 		if host == "" {
 			host = site.URL
 		}
 		if host != "" {
-			if ips, err := net.LookupIP(host); err == nil {
+			ips, err := net.LookupIP(host)
-				for _, ip := range ips {
+			if err != nil {
-					if isPrivateIP(ip) {
+				return CheckResult{SiteID: site.ID, Status: string(models.StatusDown), ErrorReason: "resolve failed: " + err.Error()}
-						return CheckResult{SiteID: site.ID, Status: "DOWN", ErrorReason: "target resolves to private IP"}
+			}
-					}
+			for _, ip := range ips {
 				if isPrivateIP(ip) {
 					return CheckResult{SiteID: site.ID, Status: string(models.StatusDown), ErrorReason: "target resolves to private IP"}
 				}
 			}
 			pinnedIP = ips[0]
 		}
 	}
 	switch site.Type {
 	case "http":
-		return runHTTPCheck(site, strict, insecure, globalInsecure)
+		return runHTTPCheck(ctx, site, strict, insecure, globalInsecure)
 	case "ping":
-		return runPingCheck(site)
+		return runPingCheck(ctx, site, pinnedIP)
 	case "port":
-		return runPortCheck(site)
+		return runPortCheck(ctx, site, pinnedIP)
 	case "dns":
-		return runDNSCheck(site)
+		return runDNSCheck(ctx, site, allowPrivate)
 	default:
-		return CheckResult{SiteID: site.ID, Status: "DOWN", ErrorReason: "unsupported monitor type: " + site.Type}
+		return CheckResult{SiteID: site.ID, Status: string(models.StatusDown), ErrorReason: "unsupported monitor type: " + site.Type}
 	}
 }
-func runHTTPCheck(site models.Site, strict, insecure *http.Client, globalInsecure bool) CheckResult {
+func runHTTPCheck(ctx context.Context, site models.SiteConfig, strict, insecure *http.Client, globalInsecure bool) CheckResult {
 	method := site.Method
 	if method == "" {
 		method = "GET"
 	}
 	timeout := siteTimeout(site)
-	ctx, cancel := context.WithTimeout(context.Background(), timeout)
+	ctx, cancel := context.WithTimeout(ctx, timeout)
 	defer cancel()
 	req, err := http.NewRequestWithContext(ctx, method, site.URL, nil)
 	if err != nil {
-		return CheckResult{SiteID: site.ID, Status: "DOWN", ErrorReason: "invalid request: " + err.Error()}
+		return CheckResult{SiteID: site.ID, Status: string(models.StatusDown), ErrorReason: "invalid request: " + err.Error()}
 	}
 	client := strict
@@ -94,20 +100,23 @@ func runHTTPCheck(site models.Site, strict, insecure *http.Client, globalInsecur
 	result := CheckResult{
 		SiteID:    site.ID,
-		Status:    "UP",
+		Status:    string(models.StatusUp),
 		LatencyNs: latency.Nanoseconds(),
 	}
 	if err != nil {
-		result.Status = "DOWN"
+		result.Status = string(models.StatusDown)
 		result.ErrorReason = truncateError(err.Error(), maxErrorLength)
 		return result
 	}
-	defer resp.Body.Close()
+	defer func() {
 		_, _ = io.Copy(io.Discard, resp.Body)
 		_ = resp.Body.Close()
 	}()
 	result.StatusCode = resp.StatusCode
 	if !isCodeAccepted(resp.StatusCode, site.AcceptedCodes) {
-		result.Status = "DOWN"
+		result.Status = string(models.StatusDown)
 		expected := site.AcceptedCodes
 		if expected == "" {
 			expected = defaultAcceptedCodes
@@ -120,7 +129,7 @@ func runHTTPCheck(site models.Site, strict, insecure *http.Client, globalInsecur
 		cert := resp.TLS.PeerCertificates[0]
 		result.CertExpiry = cert.NotAfter
 		if time.Now().After(cert.NotAfter) {
-			result.Status = "SSL EXP"
+			result.Status = string(models.StatusSSLExp)
 			result.ErrorReason = "SSL certificate expired"
 		}
 	}
@@ -128,7 +137,7 @@ func runHTTPCheck(site models.Site, strict, insecure *http.Client, globalInsecur
 	return result
 }
-func runPingCheck(site models.Site) CheckResult {
+func runPingCheck(_ context.Context, site models.SiteConfig, pinnedIP net.IP) CheckResult {
 	host := site.Hostname
 	if host == "" {
 		host = site.URL
@@ -136,7 +145,10 @@ func runPingCheck(site models.Site) CheckResult {
 	pinger, err := probing.NewPinger(host)
 	if err != nil {
-		return CheckResult{SiteID: site.ID, Status: "DOWN", ErrorReason: "ping setup: " + err.Error()}
+		return CheckResult{SiteID: site.ID, Status: string(models.StatusDown), ErrorReason: "ping setup: " + err.Error()}
 	}
 	if pinnedIP != nil {
 		pinger.SetIPAddr(&net.IPAddr{IP: pinnedIP})
 	}
 	pinger.Count = 1
 	pinger.Timeout = siteTimeout(site)
@@ -147,21 +159,24 @@ func runPingCheck(site models.Site) CheckResult {
 	latency := time.Since(start)
 	if err != nil {
-		return CheckResult{SiteID: site.ID, Status: "DOWN", LatencyNs: latency.Nanoseconds(), ErrorReason: "ping failed: " + err.Error()}
+		return CheckResult{SiteID: site.ID, Status: string(models.StatusDown), LatencyNs: latency.Nanoseconds(), ErrorReason: "ping failed: " + err.Error()}
 	}
 	if pinger.Statistics().PacketsRecv == 0 {
-		return CheckResult{SiteID: site.ID, Status: "DOWN", LatencyNs: latency.Nanoseconds(), ErrorReason: "no ICMP response"}
+		return CheckResult{SiteID: site.ID, Status: string(models.StatusDown), LatencyNs: latency.Nanoseconds(), ErrorReason: "no ICMP response"}
 	}
 	stats := pinger.Statistics()
-	return CheckResult{SiteID: site.ID, Status: "UP", LatencyNs: stats.AvgRtt.Nanoseconds()}
+	return CheckResult{SiteID: site.ID, Status: string(models.StatusUp), LatencyNs: stats.AvgRtt.Nanoseconds()}
 }
-func runPortCheck(site models.Site) CheckResult {
+func runPortCheck(_ context.Context, site models.SiteConfig, pinnedIP net.IP) CheckResult {
 	host := site.Hostname
 	if host == "" {
 		host = site.URL
 	}
 	if pinnedIP != nil {
 		host = pinnedIP.String()
 	}
 	addr := net.JoinHostPort(host, strconv.Itoa(site.Port))
 	timeout := siteTimeout(site)
@@ -170,13 +185,13 @@ func runPortCheck(site models.Site) CheckResult {
 	latency := time.Since(start)
 	if err != nil {
-		return CheckResult{SiteID: site.ID, Status: "DOWN", LatencyNs: latency.Nanoseconds(), ErrorReason: truncateError(err.Error(), maxErrorLength)}
+		return CheckResult{SiteID: site.ID, Status: string(models.StatusDown), LatencyNs: latency.Nanoseconds(), ErrorReason: truncateError(err.Error(), maxErrorLength)}
 	}
 	_ = conn.Close()
-	return CheckResult{SiteID: site.ID, Status: "UP", LatencyNs: latency.Nanoseconds()}
+	return CheckResult{SiteID: site.ID, Status: string(models.StatusUp), LatencyNs: latency.Nanoseconds()}
 }
-func runDNSCheck(site models.Site) CheckResult {
+func runDNSCheck(_ context.Context, site models.SiteConfig, allowPrivate bool) CheckResult {
 	host := site.Hostname
 	if host == "" {
 		host = site.URL
@@ -186,9 +201,24 @@ func runDNSCheck(site models.Site) CheckResult {
 	if server == "" {
 		server = defaultDNSServer
 	}
-	if _, _, err := net.SplitHostPort(server); err != nil {
+	serverHost, serverPort, err := net.SplitHostPort(server)
-		server = net.JoinHostPort(server, defaultDNSPort)
+	if err != nil {
 		serverHost = server
 		serverPort = defaultDNSPort
 	}
 	if !allowPrivate {
 		if serverPort != defaultDNSPort {
 			return CheckResult{SiteID: site.ID, Status: string(models.StatusDown), ErrorReason: "DNS server port must be 53"}
 		}
 		if ips, err := net.LookupIP(serverHost); err == nil {
 			for _, ip := range ips {
 				if isPrivateIP(ip) {
 					return CheckResult{SiteID: site.ID, Status: string(models.StatusDown), ErrorReason: "DNS server resolves to private address"}
 				}
 			}
 		}
 	}
 	server = net.JoinHostPort(serverHost, serverPort)
 	qtype := dns.TypeA
 	switch site.DNSResolveType {
@@ -221,15 +251,15 @@ func runDNSCheck(site models.Site) CheckResult {
 	latency := time.Since(start)
 	if err != nil {
-		return CheckResult{SiteID: site.ID, Status: "DOWN", LatencyNs: latency.Nanoseconds(), ErrorReason: "DNS query failed: " + err.Error()}
+		return CheckResult{SiteID: site.ID, Status: string(models.StatusDown), LatencyNs: latency.Nanoseconds(), ErrorReason: "DNS query failed: " + err.Error()}
 	}
 	if r.Rcode != dns.RcodeSuccess {
-		return CheckResult{SiteID: site.ID, Status: "DOWN", StatusCode: r.Rcode, LatencyNs: latency.Nanoseconds(), ErrorReason: "DNS RCODE: " + dns.RcodeToString[r.Rcode]}
+		return CheckResult{SiteID: site.ID, Status: string(models.StatusDown), StatusCode: r.Rcode, LatencyNs: latency.Nanoseconds(), ErrorReason: "DNS RCODE: " + dns.RcodeToString[r.Rcode]}
 	}
-	return CheckResult{SiteID: site.ID, Status: "UP", LatencyNs: latency.Nanoseconds()}
+	return CheckResult{SiteID: site.ID, Status: string(models.StatusUp), LatencyNs: latency.Nanoseconds()}
 }
-func siteTimeout(site models.Site) time.Duration {
+func siteTimeout(site models.SiteConfig) time.Duration {
 	if site.Timeout > 0 {
 		return time.Duration(site.Timeout) * time.Second
 	}
@@ -1,6 +1,7 @@
 package monitor
 import (
 	"context"
 	"crypto/tls"
 	"net"
 	"net/http"
@@ -18,8 +19,8 @@ func TestRunCheck_HTTP_Success(t *testing.T) {
 	}))
 	defer srv.Close()
-	site := models.Site{ID: 1, Type: "http", URL: srv.URL}
+	site := models.SiteConfig{ID: 1, Type: "http", URL: srv.URL}
-	result := RunCheck(site, http.DefaultClient, http.DefaultClient, false)
+	result := RunCheck(context.Background(), site, http.DefaultClient, http.DefaultClient, false, false)
 	if result.Status != "UP" {
 		t.Errorf("expected UP, got %s", result.Status)
@@ -38,8 +39,8 @@ func TestRunCheck_HTTP_ServerError(t *testing.T) {
 	}))
 	defer srv.Close()
-	site := models.Site{ID: 1, Type: "http", URL: srv.URL}
+	site := models.SiteConfig{ID: 1, Type: "http", URL: srv.URL}
-	result := RunCheck(site, http.DefaultClient, http.DefaultClient, false)
+	result := RunCheck(context.Background(), site, http.DefaultClient, http.DefaultClient, false, false)
 	if result.Status != "DOWN" {
 		t.Errorf("expected DOWN, got %s", result.Status)
@@ -59,8 +60,8 @@ func TestRunCheck_HTTP_CustomAcceptedCodes(t *testing.T) {
 		return http.ErrUseLastResponse
 	}}
-	site := models.Site{ID: 1, Type: "http", URL: srv.URL, AcceptedCodes: "200-399"}
+	site := models.SiteConfig{ID: 1, Type: "http", URL: srv.URL, AcceptedCodes: "200-399"}
-	result := RunCheck(site, client, client, false)
+	result := RunCheck(context.Background(), site, client, client, false, false)
 	if result.Status != "UP" {
 		t.Errorf("expected UP with accepted 200-399, got %s", result.Status)
@@ -75,8 +76,8 @@ func TestRunCheck_HTTP_MethodRespected(t *testing.T) {
 	}))
 	defer srv.Close()
-	site := models.Site{ID: 1, Type: "http", URL: srv.URL, Method: "HEAD"}
+	site := models.SiteConfig{ID: 1, Type: "http", URL: srv.URL, Method: "HEAD"}
-	RunCheck(site, http.DefaultClient, http.DefaultClient, false)
+	RunCheck(context.Background(), site, http.DefaultClient, http.DefaultClient, false, false)
 	if receivedMethod != "HEAD" {
 		t.Errorf("expected HEAD, got %s", receivedMethod)
@@ -90,8 +91,8 @@ func TestRunCheck_HTTP_Timeout(t *testing.T) {
 	}))
 	defer srv.Close()
-	site := models.Site{ID: 1, Type: "http", URL: srv.URL, Timeout: 1}
+	site := models.SiteConfig{ID: 1, Type: "http", URL: srv.URL, Timeout: 1}
-	result := RunCheck(site, http.DefaultClient, http.DefaultClient, false)
+	result := RunCheck(context.Background(), site, http.DefaultClient, http.DefaultClient, false, false)
 	if result.Status != "DOWN" {
 		t.Errorf("expected DOWN on timeout, got %s", result.Status)
@@ -108,8 +109,8 @@ func TestRunCheck_HTTP_SSLFields(t *testing.T) {
 		Transport: &http.Transport{TLSClientConfig: &tls.Config{InsecureSkipVerify: true}},
 	}
-	site := models.Site{ID: 1, Type: "http", URL: srv.URL, CheckSSL: true, IgnoreTLS: true}
+	site := models.SiteConfig{ID: 1, Type: "http", URL: srv.URL, CheckSSL: true, IgnoreTLS: true}
-	result := RunCheck(site, http.DefaultClient, insecureClient, false)
+	result := RunCheck(context.Background(), site, http.DefaultClient, insecureClient, false, false)
 	if result.Status != "UP" {
 		t.Errorf("expected UP, got %s", result.Status)
@@ -132,8 +133,8 @@ func TestRunCheck_Port_Open(t *testing.T) {
 	_, portStr, _ := net.SplitHostPort(ln.Addr().String())
 	port, _ := strconv.Atoi(portStr)
-	site := models.Site{ID: 1, Type: "port", Hostname: "127.0.0.1", Port: port, Timeout: 2}
+	site := models.SiteConfig{ID: 1, Type: "port", Hostname: "127.0.0.1", Port: port, Timeout: 2}
-	result := RunCheck(site, nil, nil, false, true)
+	result := RunCheck(context.Background(), site, nil, nil, false, true)
 	if result.Status != "UP" {
 		t.Errorf("expected UP, got %s", result.Status)
@@ -152,14 +153,51 @@ func TestRunCheck_Port_Closed(t *testing.T) {
 	port, _ := strconv.Atoi(portStr)
 	ln.Close()
-	site := models.Site{ID: 1, Type: "port", Hostname: "127.0.0.1", Port: port, Timeout: 1}
+	site := models.SiteConfig{ID: 1, Type: "port", Hostname: "127.0.0.1", Port: port, Timeout: 1}
-	result := RunCheck(site, nil, nil, false, true)
+	result := RunCheck(context.Background(), site, nil, nil, false, true)
 	if result.Status != "DOWN" {
 		t.Errorf("expected DOWN, got %s", result.Status)
 	}
 }
 func TestRunPortCheck_UsesPinnedIP(t *testing.T) {
 	ln, err := net.Listen("tcp", "127.0.0.1:0")
 	if err != nil {
 		t.Fatal(err)
 	}
 	defer ln.Close()
 	_, portStr, _ := net.SplitHostPort(ln.Addr().String())
 	port, _ := strconv.Atoi(portStr)
 	// Pass a pinned IP — runPortCheck should dial it instead of resolving Hostname.
 	site := models.SiteConfig{ID: 1, Type: "port", Hostname: "will-not-resolve.invalid", Port: port, Timeout: 2}
 	result := runPortCheck(context.Background(), site, net.ParseIP("127.0.0.1"))
 	if result.Status != "UP" {
 		t.Errorf("expected UP when pinned IP used, got %s: %s", result.Status, result.ErrorReason)
 	}
 }
 func TestRunPortCheck_NilPinnedIP_UsesHostname(t *testing.T) {
 	ln, err := net.Listen("tcp", "127.0.0.1:0")
 	if err != nil {
 		t.Fatal(err)
 	}
 	defer ln.Close()
 	_, portStr, _ := net.SplitHostPort(ln.Addr().String())
 	port, _ := strconv.Atoi(portStr)
 	site := models.SiteConfig{ID: 1, Type: "port", Hostname: "127.0.0.1", Port: port, Timeout: 2}
 	result := runPortCheck(context.Background(), site, nil)
 	if result.Status != "UP" {
 		t.Errorf("expected UP with nil pinnedIP fallback, got %s: %s", result.Status, result.ErrorReason)
 	}
 }
 func TestRunCheck_Port_BlocksPrivateByDefault(t *testing.T) {
 	ln, err := net.Listen("tcp", "127.0.0.1:0")
 	if err != nil {
@@ -170,8 +208,8 @@ func TestRunCheck_Port_BlocksPrivateByDefault(t *testing.T) {
 	_, portStr, _ := net.SplitHostPort(ln.Addr().String())
 	port, _ := strconv.Atoi(portStr)
-	site := models.Site{ID: 1, Type: "port", Hostname: "127.0.0.1", Port: port, Timeout: 2}
+	site := models.SiteConfig{ID: 1, Type: "port", Hostname: "127.0.0.1", Port: port, Timeout: 2}
-	result := RunCheck(site, nil, nil, false)
+	result := RunCheck(context.Background(), site, nil, nil, false, false)
 	if result.Status != "DOWN" {
 		t.Errorf("expected DOWN when private targets blocked, got %s", result.Status)
@@ -179,8 +217,8 @@ func TestRunCheck_Port_BlocksPrivateByDefault(t *testing.T) {
 }
 func TestRunCheck_UnknownType(t *testing.T) {
-	site := models.Site{ID: 1, Type: "invalid"}
+	site := models.SiteConfig{ID: 1, Type: "invalid"}
-	result := RunCheck(site, nil, nil, false)
+	result := RunCheck(context.Background(), site, nil, nil, false, false)
 	if result.Status != "DOWN" {
 		t.Errorf("expected DOWN for unknown type, got %s", result.Status)
@@ -213,10 +251,10 @@ func TestIsCodeAccepted(t *testing.T) {
 }
 // TestSiteTimeout checks that siteTimeout returns the 5s default when
 // Timeout is 0 and Timeout seconds (10s for Timeout: 10) when it is positive.
 func TestSiteTimeout(t *testing.T) {
-	if got := siteTimeout(models.Site{Timeout: 0}); got != 5*time.Second {
+	if got := siteTimeout(models.SiteConfig{Timeout: 0}); got != 5*time.Second {
 		t.Errorf("expected 5s default, got %v", got)
 	}
-	if got := siteTimeout(models.Site{Timeout: 10}); got != 10*time.Second {
+	if got := siteTimeout(models.SiteConfig{Timeout: 10}); got != 10*time.Second {
 		t.Errorf("expected 10s, got %v", got)
 	}
 }
@@ -1,6 +1,8 @@
 package monitor
 import (
 	"context"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/store"
 )
@@ -10,14 +12,14 @@ import (
 // serializing all writes through one connection and surfacing errors instead of
 // discarding them. desc names the write for diagnostics on drop/failure.
 type dbWrite interface {
-	exec(s store.Store) error
+	exec(ctx context.Context, s store.Store) error
 	desc() string
 }
 type writeLog struct{ message string }
-func (w writeLog) exec(s store.Store) error { return s.SaveLog(w.message) }
+func (w writeLog) exec(ctx context.Context, s store.Store) error { return s.SaveLog(ctx, w.message) }
-func (w writeLog) desc() string             { return "log" }
+func (w writeLog) desc() string                                  { return "log" }
 type writeCheck struct {
 	siteID    int
@@ -25,8 +27,10 @@ type writeCheck struct {
 	isUp      bool
 }
-func (w writeCheck) exec(s store.Store) error { return s.SaveCheck(w.siteID, w.latencyNs, w.isUp) }
+func (w writeCheck) exec(ctx context.Context, s store.Store) error {
-func (w writeCheck) desc() string             { return "check" }
+	return s.SaveCheck(ctx, w.siteID, w.latencyNs, w.isUp)
 }
 func (w writeCheck) desc() string { return "check" }
 type writeStateChange struct {
 	siteID     int
@@ -35,12 +39,26 @@ type writeStateChange struct {
 	reason     string
 }
-func (w writeStateChange) exec(s store.Store) error {
+func (w writeStateChange) exec(ctx context.Context, s store.Store) error {
-	return s.SaveStateChange(w.siteID, w.fromStatus, w.toStatus, w.reason)
+	return s.SaveStateChange(ctx, w.siteID, w.fromStatus, w.toStatus, w.reason)
 }
 func (w writeStateChange) desc() string { return "state-change" }
 type writeAlertHealth struct{ rec models.AlertHealthRecord }
-func (w writeAlertHealth) exec(s store.Store) error { return s.SaveAlertHealth(w.rec) }
+func (w writeAlertHealth) exec(ctx context.Context, s store.Store) error {
-func (w writeAlertHealth) desc() string             { return "alert-health" }
+	return s.SaveAlertHealth(ctx, w.rec)
 }
 func (w writeAlertHealth) desc() string { return "alert-health" }
 // writeProbeCheck is a dbWrite that stores one check result attributed to a
 // specific node.
 type writeProbeCheck struct {
 	siteID    int
 	nodeID    string
 	latencyNs int64
 	isUp      bool
 }
 // exec persists the result through Store.SaveCheckFromNode.
 func (w writeProbeCheck) exec(ctx context.Context, s store.Store) error {
 	return s.SaveCheckFromNode(ctx, w.siteID, w.nodeID, w.latencyNs, w.isUp)
 }
 // desc names this write kind for the writer's failure log messages.
 func (w writeProbeCheck) desc() string { return "probe-check" }
@@ -1,6 +1,9 @@
 package monitor
-import "time"
+import (
 	"context"
 	"time"
 )
 const maxHistoryLen = 60
@@ -12,7 +15,7 @@ type SiteHistory struct {
 }
 func (e *Engine) InitHistory() {
-	all, err := e.db.LoadAllHistory(maxHistoryLen)
+	all, err := e.db.LoadAllHistory(context.Background(), maxHistoryLen)
 	if err != nil {
 		e.AddLog("Failed to load check history: " + err.Error())
 		return
@@ -60,6 +60,9 @@ type Engine struct {
 	recheckMu sync.RWMutex
 	recheck   map[int]chan struct{}
 	maintCacheMu sync.RWMutex
 	maintCache   map[int]bool
 	db                  store.Store
 	insecureSkipVerify  bool
 	allowPrivateTargets bool
@@ -67,10 +70,11 @@ type Engine struct {
 	strictClient        *http.Client
 	insecureClient      *http.Client
-	dbWrites chan dbWrite
+	dbWrites  chan dbWrite
-	writerWG sync.WaitGroup
+	writerWG  sync.WaitGroup
-	cancel   context.CancelFunc
+	checkerWG sync.WaitGroup
-	stopOnce sync.Once
+	cancel    context.CancelFunc
 	stopOnce  sync.Once
 }
 func NewEngine(s store.Store) *Engine {
@@ -111,10 +115,14 @@ func newEngine(s store.Store, allowPrivateTargets bool) *Engine {
 	}
 }
 // SetInsecureSkipVerify sets the engine-wide flag that checkByID forwards to
 // RunCheck as its globalInsecure argument. It must be called before Start:
 // the field is read by checker goroutines without synchronization.
 func (e *Engine) SetInsecureSkipVerify(skip bool) {
 	e.insecureSkipVerify = skip
 }
 // SetMaintRetention sets the retention duration that pruneMaintenanceWindows
 // passes to the store's PruneExpiredMaintenanceWindows. It must be called
 // before Start: the field is read by the maintenance prune goroutine without
 // synchronization.
 func (e *Engine) SetMaintRetention(d time.Duration) {
 	e.maintRetention = d
 }
@@ -181,16 +189,16 @@ func (e *Engine) dbWriter(ctx context.Context) {
 	pruneTicker := time.NewTicker(dbPruneInterval)
 	defer pruneTicker.Stop()
-	e.prune()
+	e.prune(ctx)
 	for {
 		select {
 		case w := <-e.dbWrites:
-			if err := w.exec(e.db); err != nil {
+			if err := w.exec(ctx, e.db); err != nil {
 				e.appendLog(fmt.Sprintf("db %s write failed: %v", w.desc(), err))
 			}
 		case <-pruneTicker.C:
-			e.prune()
+			e.prune(ctx)
 		case <-ctx.Done():
 			e.drainWrites()
 			return
@@ -203,7 +211,7 @@ func (e *Engine) drainWrites() {
 	for {
 		select {
 		case w := <-e.dbWrites:
-			if err := w.exec(e.db); err != nil {
+			if err := w.exec(context.Background(), e.db); err != nil {
 				e.appendLog(fmt.Sprintf("db %s write failed (drain): %v", w.desc(), err))
 			}
 		default:
@@ -212,14 +220,14 @@ func (e *Engine) drainWrites() {
 	}
 }
 // prune runs the store's three prune operations in order: logs, check
 // history, then state changes. A failure in one is recorded via appendLog
 // and does not prevent the remaining operations from running.
-func (e *Engine) prune() {
+func (e *Engine) prune(ctx context.Context) {
-	if err := e.db.PruneLogs(); err != nil {
+	if err := e.db.PruneLogs(ctx); err != nil {
 		e.appendLog(fmt.Sprintf("log prune failed: %v", err))
 	}
-	if err := e.db.PruneCheckHistory(); err != nil {
+	if err := e.db.PruneCheckHistory(ctx); err != nil {
 		e.appendLog(fmt.Sprintf("check-history prune failed: %v", err))
 	}
-	if err := e.db.PruneStateChanges(); err != nil {
+	if err := e.db.PruneStateChanges(ctx); err != nil {
 		e.appendLog(fmt.Sprintf("state-change prune failed: %v", err))
 	}
 }
@@ -231,12 +239,14 @@ func (e *Engine) Stop() {
 		if e.cancel != nil {
 			e.cancel()
 		}
 		e.checkerWG.Wait()
 		e.writerWG.Wait()
 		e.drainWrites()
 	})
 }
 func (e *Engine) InitLogs() {
-	logs, err := e.db.LoadLogs(maxLogEntries)
+	logs, err := e.db.LoadLogs(context.Background(), maxLogEntries)
 	if err != nil {
 		return
 	}
@@ -251,7 +261,7 @@ func (e *Engine) InitLogs() {
 // InitAlertHealth restores persisted alert send health so the dashboard shows real
 // "last sent" / health state on startup instead of resetting every channel to "never".
 func (e *Engine) InitAlertHealth() {
-	records, err := e.db.LoadAlertHealth()
+	records, err := e.db.LoadAlertHealth(context.Background())
 	if err != nil {
 		return
 	}
@@ -328,7 +338,7 @@ func (e *Engine) RecordHeartbeat(token string) bool {
 	}
 	var (
-		prevStatus string
+		prevStatus models.Status
 		name       string
 		alertID    int
 		downSince  time.Time
@@ -340,12 +350,12 @@ func (e *Engine) RecordHeartbeat(token string) bool {
 		downSince = s.StatusChangedAt // captured before mutation = when it went down
 		s.LastCheck = time.Now()
-		s.Status = "UP"
+		s.Status = models.StatusUp
 		s.FailureCount = 0
 		s.Latency = 0
 		s.LastError = ""
 		s.LastSuccessAt = time.Now()
-		if prevStatus != "UP" {
+		if prevStatus != models.StatusUp {
 			s.StatusChangedAt = time.Now()
 		}
 	})
@@ -354,13 +364,13 @@ func (e *Engine) RecordHeartbeat(token string) bool {
 	}
 	switch prevStatus {
-	case "PENDING":
+	case models.StatusPending:
 		e.AddLog(fmt.Sprintf("Push Monitor '%s' received first heartbeat", name))
-	case "LATE":
+	case models.StatusLate:
 		e.AddLog(fmt.Sprintf("Push Monitor '%s' heartbeat arrived (was late)", name))
-	case "STALE":
+	case models.StatusStale:
 		e.AddLog(fmt.Sprintf("Push Monitor '%s' heartbeat arrived (was stale)", name))
-	case "DOWN":
+	case models.StatusDown:
 		downDur := ""
 		if !downSince.IsZero() {
 			downDur = fmt.Sprintf(" (was down %s)", fmtDurationShort(time.Since(downSince)))
@@ -369,8 +379,10 @@ func (e *Engine) RecordHeartbeat(token string) bool {
 		go e.triggerAlert(alertID, "✅ RECOVERY", fmt.Sprintf("Push Monitor '%s' is receiving heartbeats.%s", name, downDur))
 	}
-	if prevStatus != "UP" && prevStatus != "PENDING" {
+	e.recordCheck(targetID, 0, true)
-		e.enqueueWrite(writeStateChange{siteID: targetID, fromStatus: prevStatus, toStatus: "UP"})
+
 	if prevStatus != models.StatusUp && prevStatus != models.StatusPending {
 		e.enqueueWrite(writeStateChange{siteID: targetID, fromStatus: string(prevStatus), toStatus: string(models.StatusUp)})
 	}
 	return true
@@ -400,7 +412,9 @@ func (e *Engine) Start(ctx context.Context) {
 	e.writerWG.Add(1)
 	go e.dbWriter(ctx)
 	e.checkerWG.Add(1)
 	go func() {
 		defer e.checkerWG.Done()
 		for {
 			select {
 			case <-ctx.Done():
@@ -408,7 +422,9 @@ func (e *Engine) Start(ctx context.Context) {
 			default:
 			}
-			sites, err := e.db.GetSites()
+			e.refreshMaintenanceCache(ctx)
 			configs, err := e.db.GetSites(ctx)
 			if err != nil {
 				e.AddLog(fmt.Sprintf("Failed to load sites: %v", err))
 				select {
@@ -418,30 +434,51 @@ func (e *Engine) Start(ctx context.Context) {
 				}
 				continue
 			}
-			for _, s := range sites {
+			dbIDs := make(map[int]bool, len(configs))
 			for _, cfg := range configs {
 				dbIDs[cfg.ID] = true
 				e.mu.RLock()
-				_, exists := e.liveState[s.ID]
+				existing, exists := e.liveState[cfg.ID]
 				e.mu.RUnlock()
 				if !exists {
 					e.mu.Lock()
-					s.Status = "PENDING"
+					site := models.Site{SiteConfig: cfg, SiteState: models.SiteState{Status: models.StatusPending}}
-					if h, ok := e.GetHistory(s.ID); ok && len(h.Statuses) > 0 {
+					if h, ok := e.GetHistory(cfg.ID); ok && len(h.Statuses) > 0 {
 						if h.Statuses[len(h.Statuses)-1] {
-							s.Status = "UP"
+							site.Status = models.StatusUp
 						} else {
-							s.Status = "DOWN"
+							site.Status = models.StatusDown
 						}
 						if len(h.Latencies) > 0 {
-							s.Latency = h.Latencies[len(h.Latencies)-1]
+							site.Latency = h.Latencies[len(h.Latencies)-1]
 						}
 					}
-					e.liveState[s.ID] = s
+					e.liveState[cfg.ID] = site
-					e.addToTokenIndex(s)
+					e.addToTokenIndex(site)
 					e.mu.Unlock()
-					go e.monitorRoutine(ctx, s.ID)
+					e.checkerWG.Add(1)
 					go func(id int) {
 						defer e.checkerWG.Done()
 						e.monitorRoutine(ctx, id)
 					}(cfg.ID)
 				} else if existing.SiteConfig != cfg {
 					e.UpdateSiteConfig(cfg)
 				}
 			}
 			e.mu.RLock()
 			var vanished []int
 			for id := range e.liveState {
 				if !dbIDs[id] {
 					vanished = append(vanished, id)
 				}
 			}
 			e.mu.RUnlock()
 			for _, id := range vanished {
 				e.RemoveSite(id)
 				e.AddLog(fmt.Sprintf("Monitor removed (no longer in DB): ID %d", id))
 			}
 			select {
 			case <-time.After(pollInterval):
 			case <-ctx.Done():
@@ -450,27 +487,31 @@ func (e *Engine) Start(ctx context.Context) {
 		}
 	}()
-	go e.maintenancePruner(ctx)
+	e.checkerWG.Add(1)
 	go func() {
 		defer e.checkerWG.Done()
 		e.maintenancePruner(ctx)
 	}()
 }
 // maintenancePruner prunes maintenance windows once immediately and then
 // again on every maintPruneInterval tick, returning when ctx is cancelled.
 func (e *Engine) maintenancePruner(ctx context.Context) {
 	ticker := time.NewTicker(maintPruneInterval)
 	defer ticker.Stop()
-	e.pruneMaintenanceWindows()
+	e.pruneMaintenanceWindows(ctx)
 	for {
 		select {
 		case <-ticker.C:
-			e.pruneMaintenanceWindows()
+			e.pruneMaintenanceWindows(ctx)
 		case <-ctx.Done():
 			return
 		}
 	}
 }
-func (e *Engine) pruneMaintenanceWindows() {
+func (e *Engine) pruneMaintenanceWindows(ctx context.Context) {
-	pruned, err := e.db.PruneExpiredMaintenanceWindows(e.maintRetention)
+	pruned, err := e.db.PruneExpiredMaintenanceWindows(ctx, e.maintRetention)
 	if err != nil {
 		e.AddLog(fmt.Sprintf("Maintenance prune error: %v", err))
 		return
@@ -480,27 +521,17 @@ func (e *Engine) pruneMaintenanceWindows() {
 	}
 }
 // UpdateSiteConfig replaces the stored configuration of an already-tracked
 // site with cfg while leaving the rest of its live entry untouched, then
 // re-registers the entry in the token index. IDs that are not in liveState
 // are left alone. signalRecheck is called for cfg.ID in either case, after
 // the lock is released.
-func (e *Engine) UpdateSiteConfig(site models.Site) {
+func (e *Engine) UpdateSiteConfig(cfg models.SiteConfig) {
 	e.mu.Lock()
-	if existing, ok := e.liveState[site.ID]; ok {
+	if existing, ok := e.liveState[cfg.ID]; ok {
-		e.removeFromTokenIndex(site.ID)
+		e.removeFromTokenIndex(cfg.ID)
-		site.Status = existing.Status
+		existing.SiteConfig = cfg
-		site.StatusCode = existing.StatusCode
+		e.liveState[cfg.ID] = existing
-		site.Latency = existing.Latency
+		e.addToTokenIndex(existing)
 		// NOTE(review): the site.* lines below carry no '-' marker but still
 		// refer to the old `site` parameter; they look like removed lines of
 		// the previous field-by-field copy — confirm against the real file.
 		site.CertExpiry = existing.CertExpiry
 		site.HasSSL = existing.HasSSL
 		site.LastCheck = existing.LastCheck
 		site.SentSSLWarning = existing.SentSSLWarning
 		site.FailureCount = existing.FailureCount
 		site.LastError = existing.LastError
 		site.StatusChangedAt = existing.StatusChangedAt
 		site.LastSuccessAt = existing.LastSuccessAt
 		e.liveState[site.ID] = site
 		e.addToTokenIndex(site)
 	}
 	e.mu.Unlock()
-	e.signalRecheck(site.ID)
+	e.signalRecheck(cfg.ID)
 }
 func (e *Engine) getRecheckChan(id int) chan struct{} {
@@ -529,6 +560,10 @@ func (e *Engine) RemoveSite(id int) {
 	e.mu.Unlock()
 	e.removeHistory(id)
 	e.probeResultsMu.Lock()
 	delete(e.probeResults, id)
 	e.probeResultsMu.Unlock()
 	e.recheckMu.Lock()
 	delete(e.recheck, id)
 	e.recheckMu.Unlock()
@@ -566,7 +601,7 @@ func (e *Engine) monitorRoutine(ctx context.Context, id int) {
 		return
 	}
-	e.checkByID(id)
+	e.checkByID(ctx, id)
 	for {
 		select {
 		case <-ctx.Done():
@@ -612,7 +647,7 @@ func (e *Engine) monitorRoutine(ctx context.Context, id int) {
 			return
 		case <-recheckCh:
 		}
-		e.checkByID(id)
+		e.checkByID(ctx, id)
 	}
 }
@@ -635,7 +670,7 @@ func (e *Engine) applyState(id int, mutate func(s *models.Site)) (models.Site, b
 	return cur, true
 }
-func (e *Engine) checkByID(id int) {
+func (e *Engine) checkByID(ctx context.Context, id int) {
 	if !e.IsActive() {
 		return
 	}
@@ -649,11 +684,11 @@ func (e *Engine) checkByID(id int) {
 	switch site.Type {
 	case "push":
-		e.checkPush(site)
+		e.checkPush(ctx, site)
 	case "group":
-		e.checkGroup(site)
+		e.checkGroup(ctx, site)
 	default:
-		result := RunCheck(site, e.strictClient, e.insecureClient, e.insecureSkipVerify, e.allowPrivateTargets)
+		result := RunCheck(ctx, site.SiteConfig, e.strictClient, e.insecureClient, e.insecureSkipVerify, e.allowPrivateTargets)
 		updatedSite := site
 		updatedSite.HasSSL = result.HasSSL
 		updatedSite.CertExpiry = result.CertExpiry
@@ -663,8 +698,8 @@ func (e *Engine) checkByID(id int) {
 	}
 }
-func (e *Engine) checkPush(site models.Site) {
+func (e *Engine) checkPush(_ context.Context, site models.Site) {
-	if site.Status == "PENDING" {
+	if site.Status == models.StatusPending {
 		return
 	}
@@ -680,16 +715,16 @@ func (e *Engine) checkPush(site models.Site) {
 	now := time.Now()
 	if now.After(graceEnd) {
-		if site.Status != "DOWN" {
+		if site.Status != models.StatusDown {
-			e.handleStatusChange(site, "DOWN", 0, 0, "heartbeat missed")
+			e.handleStatusChange(site, string(models.StatusDown), 0, 0, "heartbeat missed")
 		}
 	} else if now.After(staleMark) {
-		if site.Status != "STALE" {
+		if site.Status != models.StatusStale {
-			e.handleStatusChange(site, "STALE", 0, 0, "heartbeat stale")
+			e.handleStatusChange(site, string(models.StatusStale), 0, 0, "heartbeat stale")
 		}
 	} else if now.After(overdue) {
-		if site.Status != "LATE" {
+		if site.Status != models.StatusLate {
-			e.handleStatusChange(site, "LATE", 0, 0, "heartbeat overdue")
+			e.handleStatusChange(site, string(models.StatusLate), 0, 0, "heartbeat overdue")
 		}
 	}
 }
@@ -705,9 +740,10 @@ func (e *Engine) handleStatusChange(snap models.Site, rawStatus string, code int
 	}
 	inMaint := e.isInMaintenance(snap.ID)
 	status := models.Status(rawStatus)
 	var (
-		prev, next            string
+		prev, next            models.Status
 		name, typ             string
 		alertID               int
 		failCount, maxRetries int
@@ -723,7 +759,7 @@ func (e *Engine) handleStatusChange(snap models.Site, rawStatus string, code int
 	_, exists := e.applyState(snap.ID, func(s *models.Site) {
 		// A non-UP result computed from a stale snapshot must not override a
 		// heartbeat (or newer check) that landed while we were evaluating.
-		if rawStatus != "UP" && s.LastCheck.After(snap.LastCheck) {
+		if status != models.StatusUp && s.LastCheck.After(snap.LastCheck) {
 			skipped = true
 			return
 		}
@@ -742,41 +778,41 @@ func (e *Engine) handleStatusChange(snap models.Site, rawStatus string, code int
 		s.HasSSL = snap.HasSSL
 		s.CertExpiry = snap.CertExpiry
 		s.LastError = errorReason
-		if rawStatus == "UP" {
+		if status == models.StatusUp {
 			s.LastSuccessAt = time.Now()
 			s.LastError = ""
 		}
 		// Status + failure-count transition, based on the CURRENT live status.
-		switch {
+		if status == models.StatusUp {
-		case prev == "UP" && rawStatus != "UP":
+			s.FailureCount = 0
-			s.FailureCount++
+			s.Status = models.StatusUp
 		} else {
 			if s.FailureCount <= s.MaxRetries {
 				s.FailureCount++
 			}
 			if s.FailureCount > s.MaxRetries {
-				s.Status = rawStatus
+				if s.Status != status {
 					confirmedDown = true
 				}
 				s.Status = status
 				s.FailureCount = s.MaxRetries + 1
 				confirmedDown = true
 			} else {
 				failedCheck = true
 			}
 		case rawStatus == "UP":
 			s.FailureCount = 0
 			s.Status = "UP"
 		default:
 			s.Status = rawStatus
 			s.FailureCount = s.MaxRetries + 1
 		}
 		failCount = s.FailureCount
-		if s.Status != prev && prev != "PENDING" {
+		if s.Status != prev && prev != models.StatusPending {
 			s.StatusChangedAt = time.Now()
-		} else if s.StatusChangedAt.IsZero() && s.Status != "PENDING" {
+		} else if s.StatusChangedAt.IsZero() && s.Status != models.StatusPending {
 			s.StatusChangedAt = time.Now()
 		}
 		// SSL expiry warning (fresh HasSSL/CertExpiry + config threshold).
 		if typ == "http" && s.CheckSSL && s.HasSSL {
 			days := int(time.Until(s.CertExpiry).Hours() / 24)
-			if days <= s.ExpiryThreshold && !s.SentSSLWarning && rawStatus != "SSL EXP" {
+			if days <= s.ExpiryThreshold && !s.SentSSLWarning && status != models.StatusSSLExp {
 				sslWarnFire = true
 				sslDays = days
 				s.SentSSLWarning = true
@@ -793,7 +829,7 @@ func (e *Engine) handleStatusChange(snap models.Site, rawStatus string, code int
 		return
 	}
-	e.recordCheck(snap.ID, latency, rawStatus == "UP")
+	e.recordCheck(snap.ID, latency, status == models.StatusUp)
 	if confirmedDown {
 		if errorReason != "" {
@@ -805,8 +841,8 @@ func (e *Engine) handleStatusChange(snap models.Site, rawStatus string, code int
 		e.AddLog(fmt.Sprintf("Monitor '%s' failed check %d/%d", name, failCount, maxRetries))
 	}
-	if changed && prev != "PENDING" {
+	if changed && prev != models.StatusPending {
-		e.enqueueWrite(writeStateChange{siteID: snap.ID, fromStatus: prev, toStatus: next, reason: errorReason})
+		e.enqueueWrite(writeStateChange{siteID: snap.ID, fromStatus: string(prev), toStatus: string(next), reason: errorReason})
 	}
 	if sslWarnFire {
@@ -817,13 +853,11 @@ func (e *Engine) handleStatusChange(snap models.Site, rawStatus string, code int
 		}
 	}
-	isBroken := func(s string) bool { return s == "DOWN" || s == "SSL EXP" }
+	if prev == models.StatusUp && next == models.StatusLate {
 	if prev == "UP" && next == "LATE" {
 		e.AddLog(fmt.Sprintf("Monitor '%s' heartbeat overdue", name))
 	}
-	if !isBroken(prev) && isBroken(next) && next != "PENDING" {
+	if !prev.IsBroken() && next.IsBroken() && next != models.StatusPending {
 		if inMaint {
 			e.AddLog(fmt.Sprintf("Monitor '%s' is DOWN (alerts suppressed — maintenance)", name))
 		} else {
@@ -837,7 +871,7 @@ func (e *Engine) handleStatusChange(snap models.Site, rawStatus string, code int
 			e.triggerAlert(alertID, "🚨 ALERT", msg)
 		}
 	}
-	if isBroken(prev) && next == "UP" {
+	if prev.IsBroken() && next == models.StatusUp {
 		downDur := ""
 		if !downSince.IsZero() {
 			downDur = fmt.Sprintf(" (was down %s)", fmtDurationShort(time.Since(downSince)))
@@ -847,13 +881,16 @@ func (e *Engine) handleStatusChange(snap models.Site, rawStatus string, code int
 			e.triggerAlert(alertID, "✅ RECOVERY", fmt.Sprintf("Monitor '%s' is UP%s", name, downDur))
 		}
 	}
-	if prev == "LATE" && next == "UP" && !isBroken(prev) {
+	if prev == models.StatusLate && next == models.StatusUp && !prev.IsBroken() {
 		e.AddLog(fmt.Sprintf("Monitor '%s' heartbeat arrived (was late)", name))
 	}
 }
 func (e *Engine) triggerAlert(alertID int, title, message string) {
-	cfg, err := e.db.GetAlert(alertID)
+	if alertID <= 0 {
 		return
 	}
 	cfg, err := e.db.GetAlert(context.Background(), alertID)
 	if err != nil {
 		e.AddLog(fmt.Sprintf("Failed to load alert config %d: %v", alertID, err))
 		return
@@ -906,7 +943,7 @@ func (e *Engine) GetAlertHealth(alertID int) AlertHealth {
 }
 func (e *Engine) TestAlert(alertID int) error {
-	cfg, err := e.db.GetAlert(alertID)
+	cfg, err := e.db.GetAlert(context.Background(), alertID)
 	if err != nil {
 		return fmt.Errorf("failed to load alert: %w", err)
 	}
@@ -927,11 +964,39 @@ func (e *Engine) TestAlert(alertID int) error {
 }
 // isInMaintenance reports whether monitorID is flagged in e.maintCache.
 // With this change the per-call store lookup (the "-" line) is replaced by a
 // map read under maintCacheMu's read lock; an ID that is absent from the map
 // yields false.
 func (e *Engine) isInMaintenance(monitorID int) bool {
-	inMaint, err := e.db.IsMonitorInMaintenance(monitorID)
+	e.maintCacheMu.RLock()
 	defer e.maintCacheMu.RUnlock()
 	return e.maintCache[monitorID]
 }
 // refreshMaintenanceCache rebuilds e.maintCache from the store's currently
 // active maintenance windows. If the store call fails it returns early and
 // the previous cache is left in place.
 //
 // A window with MonitorID == 0 is treated as global and marks every monitor in
 // e.liveState. Otherwise a monitor is marked when it has a window of its own or
 // when its ParentID (if > 0) does; only the immediate parent is consulted.
 // IDs that are not in e.liveState never appear in the rebuilt map.
 //
 // NOTE(review): the "-" lines below appear to be the removed tail of the old
 // isInMaintenance body (it returned a bool) — confirm against the real file.
 func (e *Engine) refreshMaintenanceCache(ctx context.Context) {
 	windows, err := e.db.GetActiveMaintenanceWindows(ctx)
 	if err != nil {
-		return false
+		return
 	}
-	return inMaint
+
 	// Split the windows into per-monitor entries and a single global flag.
 	directMaint := make(map[int]bool)
 	var globalMaint bool
 	for _, w := range windows {
 		if w.MonitorID == 0 {
 			globalMaint = true
 		} else {
 			directMaint[w.MonitorID] = true
 		}
 	}
 	resolved := make(map[int]bool)
 	// liveState is read under e.mu's read lock, which is released before
 	// maintCacheMu is taken for the swap below.
 	e.mu.RLock()
 	for id, site := range e.liveState {
 		if globalMaint || directMaint[id] || (site.ParentID > 0 && directMaint[site.ParentID]) {
 			resolved[id] = true
 		}
 	}
 	e.mu.RUnlock()
 	// Replace the whole map in one assignment rather than mutating it in place.
 	e.maintCacheMu.Lock()
 	e.maintCache = resolved
 	e.maintCacheMu.Unlock()
 }
 func (e *Engine) GetDisplayStatus(site models.Site) string {
@@ -941,54 +1006,67 @@ func (e *Engine) GetDisplayStatus(site models.Site) string {
 	if e.isInMaintenance(site.ID) {
 		return "MAINT"
 	}
-	return site.Status
+	return string(site.Status)
 }
 // checkGroup derives a group's status from its children in e.liveState and
 // stores it via applyState, then records a check with zero latency.
 //
 // Only entries whose ParentID equals site.ID and whose Type is not "group" are
 // considered. Paused children and children in maintenance do not influence the
 // result. The worst child status wins, in the order
 // DOWN (or SSL EXP) > STALE > LATE > PENDING > UP. A group with no children is
 // PENDING. When every child is paused the group is also marked Paused, and its
 // status stays at the initial UP because all children were skipped.
 //
 // The context parameter added by this change is unused.
-func (e *Engine) checkGroup(site models.Site) {
+func (e *Engine) checkGroup(_ context.Context, site models.Site) {
 	e.mu.RLock()
-	status := "UP"
+	status := models.StatusUp
 	hasChildren := false
 	allPaused := true
 	for _, child := range e.liveState {
 		// Direct, non-group children only.
 		if child.ParentID != site.ID || child.Type == "group" {
 			continue
 		}
 		hasChildren = true
 		if !child.Paused {
 			allPaused = false
 		}
 		// isInMaintenance takes maintCacheMu's read lock while e.mu is still
 		// read-locked here.
 		if child.Paused || e.isInMaintenance(child.ID) {
 			continue
 		}
 		// Each branch only raises severity; a lower-severity child never
 		// overwrites a worse status already recorded.
-		if child.Status == "DOWN" || child.Status == "SSL EXP" {
+		if child.Status == models.StatusDown || child.Status == models.StatusSSLExp {
-			status = "DOWN"
+			status = models.StatusDown
-		} else if child.Status == "STALE" && status != "DOWN" {
+		} else if child.Status == models.StatusStale && status != models.StatusDown {
-			status = "STALE"
+			status = models.StatusStale
-		} else if child.Status == "LATE" && status != "DOWN" && status != "STALE" {
+		} else if child.Status == models.StatusLate && status != models.StatusDown && status != models.StatusStale {
-			status = "LATE"
+			status = models.StatusLate
-		} else if child.Status == "PENDING" && status != "DOWN" && status != "STALE" && status != "LATE" {
+		} else if child.Status == models.StatusPending && status != models.StatusDown && status != models.StatusStale && status != models.StatusLate {
-			status = "PENDING"
+			status = models.StatusPending
 		}
 	}
 	e.mu.RUnlock()
 	if !hasChildren {
-		status = "PENDING"
+		status = models.StatusPending
 	}
 	e.applyState(site.ID, func(s *models.Site) {
 		s.Status = status
 		if hasChildren && allPaused {
 			s.Paused = true
 		}
 	})
 	// NOTE(review): IsBroken presumably matches the old isBroken helper
 	// (DOWN or SSL EXP) — confirm in models.
 	e.recordCheck(site.ID, 0, !status.IsBroken())
 }
 // EnqueueProbeCheck wraps one probe node's check result (site ID, node ID,
 // latency in nanoseconds, up flag) in a writeProbeCheck and passes it to
 // enqueueWrite.
 func (e *Engine) EnqueueProbeCheck(siteID int, nodeID string, latencyNs int64, isUp bool) {
 	e.enqueueWrite(writeProbeCheck{siteID: siteID, nodeID: nodeID, latencyNs: latencyNs, isUp: isUp})
 }
 // SetAggStrategy sets the strategy that IngestProbeResult passes to
 // AggregateStatus when combining per-node probe results.
 //
 // SetAggStrategy must be called before Start: the field is read by the probe
 // aggregation path without synchronization.
 func (e *Engine) SetAggStrategy(strategy AggregationStrategy) {
 	e.aggStrategy = strategy
 }
 func (e *Engine) IngestProbeResult(nodeID string, siteID int, latencyNs int64, isUp bool, errorReason string) {
 	e.mu.RLock()
 	site, exists := e.liveState[siteID]
 	e.mu.RUnlock()
 	if !exists {
 		return
 	}
 	staleAfter := time.Duration(site.Interval) * time.Second * 3
 	if staleAfter < time.Minute {
 		staleAfter = time.Minute
 	}
 	now := time.Now()
 	e.probeResultsMu.Lock()
 	if e.probeResults[siteID] == nil {
 		e.probeResults[siteID] = make(map[string]NodeResult)
@@ -997,33 +1075,30 @@ func (e *Engine) IngestProbeResult(nodeID string, siteID int, latencyNs int64, i
 		NodeID:      nodeID,
 		IsUp:        isUp,
 		LatencyNs:   latencyNs,
-		CheckedAt:   time.Now(),
+		CheckedAt:   now,
 		ErrorReason: errorReason,
 	}
 	results := make([]NodeResult, 0, len(e.probeResults[siteID]))
-	for _, r := range e.probeResults[siteID] {
+	for id, r := range e.probeResults[siteID] {
 		if now.Sub(r.CheckedAt) > staleAfter {
 			delete(e.probeResults[siteID], id)
 			continue
 		}
 		results = append(results, r)
 	}
 	e.probeResultsMu.Unlock()
 	aggUp, avgLatency := AggregateStatus(results, e.aggStrategy)
-	e.mu.RLock()
+	probeStatus := models.StatusUp
 	site, exists := e.liveState[siteID]
 	e.mu.RUnlock()
 	if !exists {
 		return
 	}
 	rawStatus := "UP"
 	if !aggUp {
-		rawStatus = "DOWN"
+		probeStatus = models.StatusDown
 	}
 	updatedSite := site
 	updatedSite.Latency = time.Duration(avgLatency)
 	updatedSite.LastCheck = time.Now()
-	e.handleStatusChange(updatedSite, rawStatus, 0, time.Duration(avgLatency), errorReason)
+	e.handleStatusChange(updatedSite, string(probeStatus), 0, time.Duration(avgLatency), errorReason)
 }
 func (e *Engine) GetProbeResults(siteID int) map[string]NodeResult {
@@ -1038,7 +1113,7 @@ func (e *Engine) GetProbeResults(siteID int) map[string]NodeResult {
 }
 func (e *Engine) GetStateChanges(siteID int, limit int) []models.StateChange {
-	changes, err := e.db.GetStateChanges(siteID, limit)
+	changes, err := e.db.GetStateChanges(context.Background(), siteID, limit)
 	if err != nil {
 		return nil
 	}
@@ -1046,7 +1121,7 @@ func (e *Engine) GetStateChanges(siteID int, limit int) []models.StateChange {
 }
 func (e *Engine) GetStateChangesSince(siteID int, since time.Time) []models.StateChange {
-	changes, err := e.db.GetStateChangesSince(siteID, since)
+	changes, err := e.db.GetStateChangesSince(context.Background(), siteID, since)
 	if err != nil {
 		return nil
 	}
@@ -8,6 +8,7 @@ import (
 	"time"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/store/storetest"
 )
 // --- Mock Store ---
@@ -19,8 +20,9 @@ type savedCheck struct {
 }
 type mockStore struct {
 	storetest.BaseMock
 	mu            sync.Mutex
-	sites         []models.Site
+	sites         []models.SiteConfig
 	alerts        map[int]models.AlertConfig
 	maintenance   map[int]bool
 	logs          []string
@@ -38,56 +40,19 @@ func newMockStore() *mockStore {
 	}
 }
 // Store-interface stubs for mockStore. Apart from GetSites, which returns
 // m.sites, every method here ignores its arguments and returns zero values
 // with a nil error.
 //
 // NOTE(review): the unmarked lines look like the old context-free signatures
 // from the removed side of this hunk (the struct now embeds
 // storetest.BaseMock) — confirm against the actual file before relying on them.
-func (m *mockStore) Init() error                                              { return nil }
+func (m *mockStore) GetSites(context.Context) ([]models.SiteConfig, error) { return m.sites, nil }
 func (m *mockStore) GetSites() ([]models.Site, error)                         { return m.sites, nil }
 func (m *mockStore) AddSite(models.Site) error                                { return nil }
 func (m *mockStore) UpdateSite(models.Site) error                             { return nil }
 func (m *mockStore) UpdateSitePaused(int, bool) error                         { return nil }
 func (m *mockStore) DeleteSite(int) error                                     { return nil }
 func (m *mockStore) AddAlert(string, string, map[string]string) error         { return nil }
 func (m *mockStore) UpdateAlert(int, string, string, map[string]string) error { return nil }
 func (m *mockStore) DeleteAlert(int) error                                    { return nil }
 func (m *mockStore) GetAllUsers() ([]models.User, error)                      { return nil, nil }
 func (m *mockStore) AddUser(string, string, string) error                     { return nil }
 func (m *mockStore) UpdateUser(int, string, string, string) error             { return nil }
 func (m *mockStore) DeleteUser(int) error                                     { return nil }
 func (m *mockStore) ExportData() (models.Backup, error)                       { return models.Backup{}, nil }
 func (m *mockStore) ImportData(models.Backup) error                           { return nil }
 func (m *mockStore) GetSiteByName(string) (models.Site, error)                { return models.Site{}, nil }
 func (m *mockStore) AddSiteReturningID(models.Site) (int, error)              { return 0, nil }
 func (m *mockStore) AddAlertReturningID(string, string, map[string]string) (int, error) {
 	return 0, nil
 }
 func (m *mockStore) SaveCheckFromNode(int, string, int64, bool) error { return nil }
 func (m *mockStore) RegisterNode(models.ProbeNode) error              { return nil }
 func (m *mockStore) GetNode(string) (models.ProbeNode, error)         { return models.ProbeNode{}, nil }
 func (m *mockStore) GetAllNodes() ([]models.ProbeNode, error)         { return nil, nil }
 func (m *mockStore) UpdateNodeLastSeen(string) error                  { return nil }
 func (m *mockStore) DeleteNode(string) error                          { return nil }
 func (m *mockStore) LoadAlertHealth() (map[int]models.AlertHealthRecord, error) {
 	return nil, nil
 }
 func (m *mockStore) SaveAlertHealth(models.AlertHealthRecord) error { return nil }
 func (m *mockStore) GetActiveMaintenanceWindows() ([]models.MaintenanceWindow, error) {
 	return nil, nil
 }
 func (m *mockStore) GetAllMaintenanceWindows(int) ([]models.MaintenanceWindow, error) {
 	return nil, nil
 }
 func (m *mockStore) AddMaintenanceWindow(models.MaintenanceWindow) error         { return nil }
 func (m *mockStore) EndMaintenanceWindow(int) error                              { return nil }
 func (m *mockStore) DeleteMaintenanceWindow(int) error                           { return nil }
 func (m *mockStore) PruneExpiredMaintenanceWindows(time.Duration) (int64, error) { return 0, nil }
 func (m *mockStore) GetPreference(string) (string, error)                        { return "", nil }
 func (m *mockStore) SetPreference(string, string) error                          { return nil }
 func (m *mockStore) SaveStateChange(int, string, string, string) error           { return nil }
 func (m *mockStore) GetStateChanges(int, int) ([]models.StateChange, error)      { return nil, nil }
 func (m *mockStore) GetStateChangesSince(int, time.Time) ([]models.StateChange, error) {
 	return nil, nil
 }
 func (m *mockStore) Close() error { return nil }
 // GetActiveMaintenanceWindows returns one MaintenanceWindow per key of
 // m.maintenance, with only MonitorID populated. The map's bool values are not
 // inspected, so a key stored as false still produces a window. The result
 // follows map iteration order and is nil when the map is empty.
 //
 // The "-" line is the old GetAllAlerts signature that the split diff view
 // paired with this added method.
-func (m *mockStore) GetAllAlerts() ([]models.AlertConfig, error) {
+func (m *mockStore) GetActiveMaintenanceWindows(context.Context) ([]models.MaintenanceWindow, error) {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	var windows []models.MaintenanceWindow
 	for id := range m.maintenance {
 		windows = append(windows, models.MaintenanceWindow{MonitorID: id})
 	}
 	return windows, nil
 }
 func (m *mockStore) GetAllAlerts(context.Context) ([]models.AlertConfig, error) {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	var result []models.AlertConfig
@@ -97,7 +62,7 @@ func (m *mockStore) GetAllAlerts() ([]models.AlertConfig, error) {
 	return result, nil
 }
-func (m *mockStore) GetAlert(id int) (models.AlertConfig, error) {
+func (m *mockStore) GetAlert(_ context.Context, id int) (models.AlertConfig, error) {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	m.getAlertCalls = append(m.getAlertCalls, id)
@@ -107,7 +72,7 @@ func (m *mockStore) GetAlert(id int) (models.AlertConfig, error) {
 	return models.AlertConfig{}, fmt.Errorf("alert %d not found", id)
 }
-func (m *mockStore) GetAlertByName(name string) (models.AlertConfig, error) {
+func (m *mockStore) GetAlertByName(_ context.Context, name string) (models.AlertConfig, error) {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	for _, a := range m.alerts {
@@ -118,38 +83,34 @@ func (m *mockStore) GetAlertByName(name string) (models.AlertConfig, error) {
 	return models.AlertConfig{}, fmt.Errorf("alert %q not found", name)
 }
 // IsMonitorInMaintenance returns the value stored for id in m.maintenance
 // (false when the key is absent), read under m.mu. The error is always nil
 // and the context argument is ignored.
-func (m *mockStore) IsMonitorInMaintenance(id int) (bool, error) {
+func (m *mockStore) IsMonitorInMaintenance(_ context.Context, id int) (bool, error) {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	return m.maintenance[id], nil
 }
 // SaveCheck appends the call's arguments to m.savedChecks as a savedCheck
 // while holding m.mu. It always returns nil and ignores the context.
-func (m *mockStore) SaveCheck(siteID int, latencyNs int64, isUp bool) error {
+func (m *mockStore) SaveCheck(_ context.Context, siteID int, latencyNs int64, isUp bool) error {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	m.savedChecks = append(m.savedChecks, savedCheck{siteID, latencyNs, isUp})
 	return nil
 }
 // SaveLog appends msg to m.savedLogs while holding m.mu. It always returns
 // nil and ignores the context.
-func (m *mockStore) SaveLog(msg string) error {
+func (m *mockStore) SaveLog(_ context.Context, msg string) error {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	m.savedLogs = append(m.savedLogs, msg)
 	return nil
 }
 // LoadLogs returns m.logs as-is with a nil error. The limit argument is
 // ignored, and m.mu is not taken for this read.
-func (m *mockStore) LoadLogs(limit int) ([]string, error) {
+func (m *mockStore) LoadLogs(_ context.Context, _ int) ([]string, error) {
 	return m.logs, nil
 }
 // LoadAllHistory returns m.history as-is with a nil error. The limit
 // argument is ignored, and m.mu is not taken for this read.
-func (m *mockStore) LoadAllHistory(limit int) (map[int][]models.CheckRecord, error) {
+func (m *mockStore) LoadAllHistory(_ context.Context, _ int) (map[int][]models.CheckRecord, error) {
 	return m.history, nil
 }
 // Prune stubs: each is a no-op that always returns nil.
 // NOTE(review): these context-free signatures may belong to the removed side
 // of the hunk — confirm against the actual file.
 func (m *mockStore) PruneLogs() error         { return nil }
 func (m *mockStore) PruneCheckHistory() error { return nil }
 func (m *mockStore) PruneStateChanges() error { return nil }
 // --- Helpers ---
 func newTestEngine(ms *mockStore) *Engine {
@@ -187,7 +148,10 @@ func (m *mockStore) getAlertCallsSnapshot() []int {
 func TestHandleStatusChange_PendingToUp(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "PENDING", MaxRetries: 3, AlertID: 1}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", MaxRetries: 3, AlertID: 1},
 		SiteState:  models.SiteState{Status: "PENDING"},
 	}
 	injectSite(e, site)
 	e.handleStatusChange(site, "UP", 200, 10*time.Millisecond, "")
@@ -208,7 +172,10 @@ func TestHandleStatusChange_PendingToUp(t *testing.T) {
 func TestHandleStatusChange_UpIncrementFailure(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "UP", MaxRetries: 3, FailureCount: 0}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", MaxRetries: 3},
 		SiteState:  models.SiteState{Status: "UP", FailureCount: 0},
 	}
 	injectSite(e, site)
 	e.handleStatusChange(site, "DOWN", 500, 0, "test error")
@@ -226,7 +193,10 @@ func TestHandleStatusChange_UpToDown_ExceedsRetries(t *testing.T) {
 	ms := newMockStore()
 	ms.alerts[1] = models.AlertConfig{ID: 1, Name: "discord", Type: "webhook", Settings: map[string]string{"url": "http://example.com"}}
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "UP", MaxRetries: 2, FailureCount: 2, AlertID: 1}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", MaxRetries: 2, AlertID: 1},
 		SiteState:  models.SiteState{Status: "UP", FailureCount: 2},
 	}
 	injectSite(e, site)
 	e.handleStatusChange(site, "DOWN", 500, 0, "test error")
@@ -249,7 +219,10 @@ func TestHandleStatusChange_UpToDown_ZeroRetries(t *testing.T) {
 	ms := newMockStore()
 	ms.alerts[1] = models.AlertConfig{ID: 1, Name: "test", Type: "webhook", Settings: map[string]string{"url": "http://example.com"}}
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "UP", MaxRetries: 0, FailureCount: 0, AlertID: 1}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", MaxRetries: 0, AlertID: 1},
 		SiteState:  models.SiteState{Status: "UP", FailureCount: 0},
 	}
 	injectSite(e, site)
 	e.handleStatusChange(site, "DOWN", 0, 0, "test error")
@@ -268,7 +241,10 @@ func TestHandleStatusChange_DownToUp_Recovery(t *testing.T) {
 	ms := newMockStore()
 	ms.alerts[1] = models.AlertConfig{ID: 1, Name: "test", Type: "webhook", Settings: map[string]string{"url": "http://example.com"}}
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "DOWN", FailureCount: 4, AlertID: 1}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", AlertID: 1},
 		SiteState:  models.SiteState{Status: "DOWN", FailureCount: 4},
 	}
 	injectSite(e, site)
 	e.handleStatusChange(site, "UP", 200, 5*time.Millisecond, "")
@@ -289,7 +265,10 @@ func TestHandleStatusChange_DownToUp_Recovery(t *testing.T) {
 func TestHandleStatusChange_DownStaysDown(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "DOWN", MaxRetries: 2, FailureCount: 3}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", MaxRetries: 2},
 		SiteState:  models.SiteState{Status: "DOWN", FailureCount: 3},
 	}
 	injectSite(e, site)
 	e.handleStatusChange(site, "DOWN", 0, 0, "test error")
@@ -308,7 +287,10 @@ func TestHandleStatusChange_SSLExpired(t *testing.T) {
 	ms := newMockStore()
 	ms.alerts[1] = models.AlertConfig{ID: 1, Name: "test", Type: "webhook", Settings: map[string]string{"url": "http://example.com"}}
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "UP", MaxRetries: 0, AlertID: 1}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", MaxRetries: 0, AlertID: 1},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, site)
 	e.handleStatusChange(site, "SSL EXP", 0, 0, "SSL certificate expired")
@@ -328,8 +310,12 @@ func TestHandleStatusChange_AlertSuppressedMaintenance(t *testing.T) {
 	ms.maintenance[1] = true
 	ms.alerts[1] = models.AlertConfig{ID: 1, Name: "test", Type: "webhook", Settings: map[string]string{"url": "http://example.com"}}
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "UP", MaxRetries: 0, AlertID: 1}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", MaxRetries: 0, AlertID: 1},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, site)
 	e.refreshMaintenanceCache(context.Background())
 	e.handleStatusChange(site, "DOWN", 0, 0, "test error")
@@ -359,8 +345,12 @@ func TestHandleStatusChange_RecoverySuppressedMaintenance(t *testing.T) {
 	ms.maintenance[1] = true
 	ms.alerts[1] = models.AlertConfig{ID: 1, Name: "test", Type: "webhook", Settings: map[string]string{"url": "http://example.com"}}
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "DOWN", AlertID: 1}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", AlertID: 1},
 		SiteState:  models.SiteState{Status: "DOWN"},
 	}
 	injectSite(e, site)
 	e.refreshMaintenanceCache(context.Background())
 	e.handleStatusChange(site, "UP", 200, 0, "")
@@ -379,10 +369,8 @@ func TestHandleStatusChange_SSLWarning(t *testing.T) {
 	ms.alerts[1] = models.AlertConfig{ID: 1, Name: "test", Type: "webhook", Settings: map[string]string{"url": "http://example.com"}}
 	e := newTestEngine(ms)
 	site := models.Site{
-		ID: 1, Name: "test", Status: "UP", Type: "http",
+		SiteConfig: models.SiteConfig{ID: 1, Name: "test", Type: "http", CheckSSL: true, ExpiryThreshold: 30, AlertID: 1},
-		CheckSSL: true, HasSSL: true, ExpiryThreshold: 30,
+		SiteState:  models.SiteState{Status: "UP", HasSSL: true, SentSSLWarning: false, CertExpiry: time.Now().Add(15 * 24 * time.Hour)},
 		SentSSLWarning: false, AlertID: 1,
 		CertExpiry: time.Now().Add(15 * 24 * time.Hour),
 	}
 	injectSite(e, site)
@@ -402,10 +390,8 @@ func TestHandleStatusChange_SSLWarningNotRepeated(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
 	site := models.Site{
-		ID: 1, Name: "test", Status: "UP", Type: "http",
+		SiteConfig: models.SiteConfig{ID: 1, Name: "test", Type: "http", CheckSSL: true, ExpiryThreshold: 30, AlertID: 1},
-		CheckSSL: true, HasSSL: true, ExpiryThreshold: 30,
+		SiteState:  models.SiteState{Status: "UP", HasSSL: true, SentSSLWarning: true, CertExpiry: time.Now().Add(15 * 24 * time.Hour)},
 		SentSSLWarning: true, AlertID: 1,
 		CertExpiry: time.Now().Add(15 * 24 * time.Hour),
 	}
 	injectSite(e, site)
@@ -421,10 +407,8 @@ func TestHandleStatusChange_SSLWarningReset(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
 	site := models.Site{
-		ID: 1, Name: "test", Status: "UP", Type: "http",
+		SiteConfig: models.SiteConfig{ID: 1, Name: "test", Type: "http", CheckSSL: true, ExpiryThreshold: 30},
-		CheckSSL: true, HasSSL: true, ExpiryThreshold: 30,
+		SiteState:  models.SiteState{Status: "UP", HasSSL: true, SentSSLWarning: true, CertExpiry: time.Now().Add(60 * 24 * time.Hour)},
 		SentSSLWarning: true,
 		CertExpiry:     time.Now().Add(60 * 24 * time.Hour),
 	}
 	injectSite(e, site)
@@ -442,12 +426,11 @@ func TestHandleStatusChange_SSLWarningSuppressedMaint(t *testing.T) {
 	ms.alerts[1] = models.AlertConfig{ID: 1, Name: "test", Type: "webhook", Settings: map[string]string{"url": "http://example.com"}}
 	e := newTestEngine(ms)
 	site := models.Site{
-		ID: 1, Name: "test", Status: "UP", Type: "http",
+		SiteConfig: models.SiteConfig{ID: 1, Name: "test", Type: "http", CheckSSL: true, ExpiryThreshold: 30, AlertID: 1},
-		CheckSSL: true, HasSSL: true, ExpiryThreshold: 30,
+		SiteState:  models.SiteState{Status: "UP", HasSSL: true, SentSSLWarning: false, CertExpiry: time.Now().Add(15 * 24 * time.Hour)},
 		SentSSLWarning: false, AlertID: 1,
 		CertExpiry: time.Now().Add(15 * 24 * time.Hour),
 	}
 	injectSite(e, site)
 	e.refreshMaintenanceCache(context.Background())
 	e.handleStatusChange(site, "UP", 200, 0, "")
@@ -464,7 +447,10 @@ func TestHandleStatusChange_SSLWarningSuppressedMaint(t *testing.T) {
 func TestHandleStatusChange_InactiveEngine(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "UP", MaxRetries: 0}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", MaxRetries: 0},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, site)
 	e.SetActive(false)
@@ -481,7 +467,10 @@ func TestHandleStatusChange_InactiveEngine(t *testing.T) {
 func TestRecordHeartbeat_ValidToken(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "push-test", Type: "push", Token: "abc123", Status: "UP"}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "push-test", Type: "push", Token: "abc123"},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, site)
 	if !e.RecordHeartbeat("abc123") {
@@ -501,7 +490,10 @@ func TestRecordHeartbeat_RecoveryFromDown(t *testing.T) {
 	ms := newMockStore()
 	ms.alerts[1] = models.AlertConfig{ID: 1, Name: "test", Type: "webhook", Settings: map[string]string{"url": "http://example.com"}}
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "push-test", Type: "push", Token: "abc123", Status: "DOWN", AlertID: 1, FailureCount: 3}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "push-test", Type: "push", Token: "abc123", AlertID: 1},
 		SiteState:  models.SiteState{Status: "DOWN", FailureCount: 3},
 	}
 	injectSite(e, site)
 	if !e.RecordHeartbeat("abc123") {
@@ -533,7 +525,10 @@ func TestRecordHeartbeat_UnknownToken(t *testing.T) {
 func TestRecordHeartbeat_InactiveEngine(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Type: "push", Token: "abc123", Status: "UP"}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Type: "push", Token: "abc123"},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, site)
 	e.SetActive(false)
@@ -548,13 +543,12 @@ func TestCheckPush_DeadlineMissed(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
 	site := models.Site{
-		ID: 1, Name: "push", Type: "push", Status: "UP",
+		SiteConfig: models.SiteConfig{ID: 1, Name: "push", Type: "push", Interval: 10, MaxRetries: 0},
-		Interval: 10, MaxRetries: 0,
+		SiteState:  models.SiteState{Status: "UP", LastCheck: time.Now().Add(-120 * time.Second)},
 		LastCheck: time.Now().Add(-120 * time.Second),
 	}
 	injectSite(e, site)
-	e.checkPush(site)
+	e.checkPush(context.Background(), site)
 	s, _ := getSite(e, 1)
 	if s.Status != "DOWN" {
@@ -566,13 +560,12 @@ func TestCheckPush_OverdueBecomesLate(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
 	site := models.Site{
-		ID: 1, Name: "push", Type: "push", Status: "UP",
+		SiteConfig: models.SiteConfig{ID: 1, Name: "push", Type: "push", Interval: 300},
-		Interval:  300,
+		SiteState:  models.SiteState{Status: "UP", LastCheck: time.Now().Add(-310 * time.Second)},
 		LastCheck: time.Now().Add(-310 * time.Second),
 	}
 	injectSite(e, site)
-	e.checkPush(site)
+	e.checkPush(context.Background(), site)
 	s, _ := getSite(e, 1)
 	if s.Status != "LATE" {
@@ -586,13 +579,12 @@ func TestCheckPush_OverdueBecomesStale(t *testing.T) {
 	// interval=300, grace=150 (300/2), staleMark=overdue+75
 	// at 380s: past staleMark(375) but before graceEnd(450)
 	site := models.Site{
-		ID: 1, Name: "push", Type: "push", Status: "UP",
+		SiteConfig: models.SiteConfig{ID: 1, Name: "push", Type: "push", Interval: 300},
-		Interval:  300,
+		SiteState:  models.SiteState{Status: "UP", LastCheck: time.Now().Add(-380 * time.Second)},
 		LastCheck: time.Now().Add(-380 * time.Second),
 	}
 	injectSite(e, site)
-	e.checkPush(site)
+	e.checkPush(context.Background(), site)
 	s, _ := getSite(e, 1)
 	if s.Status != "STALE" {
@@ -604,12 +596,12 @@ func TestCheckPush_WithinDeadline(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
 	site := models.Site{
-		ID: 1, Name: "push", Type: "push", Status: "UP",
+		SiteConfig: models.SiteConfig{ID: 1, Name: "push", Type: "push", Interval: 60},
-		Interval: 60, LastCheck: time.Now(),
+		SiteState:  models.SiteState{Status: "UP", LastCheck: time.Now()},
 	}
 	injectSite(e, site)
-	e.checkPush(site)
+	e.checkPush(context.Background(), site)
 	s, _ := getSite(e, 1)
 	if s.Status != "UP" {
@@ -621,12 +613,12 @@ func TestCheckPush_PendingStaysPending(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
 	site := models.Site{
-		ID: 1, Name: "push", Type: "push", Status: "PENDING",
+		SiteConfig: models.SiteConfig{ID: 1, Name: "push", Type: "push", Interval: 60},
-		Interval: 60,
+		SiteState:  models.SiteState{Status: "PENDING"},
 	}
 	injectSite(e, site)
-	e.checkPush(site)
+	e.checkPush(context.Background(), site)
 	s, _ := getSite(e, 1)
 	if s.Status != "PENDING" {
@@ -639,14 +631,23 @@ func TestCheckPush_PendingStaysPending(t *testing.T) {
 func TestCheckGroup_AllChildrenUp(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	group := models.Site{ID: 1, Name: "group", Type: "group", Status: "PENDING"}
+	group := models.Site{
-	child1 := models.Site{ID: 2, Name: "child1", Type: "http", ParentID: 1, Status: "UP"}
+		SiteConfig: models.SiteConfig{ID: 1, Name: "group", Type: "group"},
-	child2 := models.Site{ID: 3, Name: "child2", Type: "http", ParentID: 1, Status: "UP"}
+		SiteState:  models.SiteState{Status: "PENDING"},
 	}
 	child1 := models.Site{
 		SiteConfig: models.SiteConfig{ID: 2, Name: "child1", Type: "http", ParentID: 1},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	child2 := models.Site{
 		SiteConfig: models.SiteConfig{ID: 3, Name: "child2", Type: "http", ParentID: 1},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, group)
 	injectSite(e, child1)
 	injectSite(e, child2)
-	e.checkGroup(group)
+	e.checkGroup(context.Background(), group)
 	s, _ := getSite(e, 1)
 	if s.Status != "UP" {
@@ -657,14 +658,23 @@ func TestCheckGroup_AllChildrenUp(t *testing.T) {
 func TestCheckGroup_OneChildDown(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	group := models.Site{ID: 1, Name: "group", Type: "group", Status: "UP"}
+	group := models.Site{
-	child1 := models.Site{ID: 2, Name: "child1", Type: "http", ParentID: 1, Status: "UP"}
+		SiteConfig: models.SiteConfig{ID: 1, Name: "group", Type: "group"},
-	child2 := models.Site{ID: 3, Name: "child2", Type: "http", ParentID: 1, Status: "DOWN"}
+		SiteState:  models.SiteState{Status: "UP"},
 	}
 	child1 := models.Site{
 		SiteConfig: models.SiteConfig{ID: 2, Name: "child1", Type: "http", ParentID: 1},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	child2 := models.Site{
 		SiteConfig: models.SiteConfig{ID: 3, Name: "child2", Type: "http", ParentID: 1},
 		SiteState:  models.SiteState{Status: "DOWN"},
 	}
 	injectSite(e, group)
 	injectSite(e, child1)
 	injectSite(e, child2)
-	e.checkGroup(group)
+	e.checkGroup(context.Background(), group)
 	s, _ := getSite(e, 1)
 	if s.Status != "DOWN" {
@@ -675,14 +685,22 @@ func TestCheckGroup_OneChildDown(t *testing.T) {
 func TestCheckGroup_PausedChildIgnored(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	group := models.Site{ID: 1, Name: "group", Type: "group"}
+	group := models.Site{
-	child1 := models.Site{ID: 2, Name: "child1", Type: "http", ParentID: 1, Status: "UP"}
+		SiteConfig: models.SiteConfig{ID: 1, Name: "group", Type: "group"},
-	child2 := models.Site{ID: 3, Name: "child2", Type: "http", ParentID: 1, Status: "DOWN", Paused: true}
+	}
 	child1 := models.Site{
 		SiteConfig: models.SiteConfig{ID: 2, Name: "child1", Type: "http", ParentID: 1},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	child2 := models.Site{
 		SiteConfig: models.SiteConfig{ID: 3, Name: "child2", Type: "http", ParentID: 1, Paused: true},
 		SiteState:  models.SiteState{Status: "DOWN"},
 	}
 	injectSite(e, group)
 	injectSite(e, child1)
 	injectSite(e, child2)
-	e.checkGroup(group)
+	e.checkGroup(context.Background(), group)
 	s, _ := getSite(e, 1)
 	if s.Status != "UP" {
@@ -694,14 +712,23 @@ func TestCheckGroup_MaintenanceChildIgnored(t *testing.T) {
 	ms := newMockStore()
 	ms.maintenance[3] = true
 	e := newTestEngine(ms)
-	group := models.Site{ID: 1, Name: "group", Type: "group"}
+	group := models.Site{
-	child1 := models.Site{ID: 2, Name: "child1", Type: "http", ParentID: 1, Status: "UP"}
+		SiteConfig: models.SiteConfig{ID: 1, Name: "group", Type: "group"},
-	child2 := models.Site{ID: 3, Name: "child2", Type: "http", ParentID: 1, Status: "DOWN"}
+	}
 	child1 := models.Site{
 		SiteConfig: models.SiteConfig{ID: 2, Name: "child1", Type: "http", ParentID: 1},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	child2 := models.Site{
 		SiteConfig: models.SiteConfig{ID: 3, Name: "child2", Type: "http", ParentID: 1},
 		SiteState:  models.SiteState{Status: "DOWN"},
 	}
 	injectSite(e, group)
 	injectSite(e, child1)
 	injectSite(e, child2)
 	e.refreshMaintenanceCache(context.Background())
-	e.checkGroup(group)
+	e.checkGroup(context.Background(), group)
 	s, _ := getSite(e, 1)
 	if s.Status != "UP" {
@@ -712,10 +739,13 @@ func TestCheckGroup_MaintenanceChildIgnored(t *testing.T) {
 func TestCheckGroup_NoChildren(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	group := models.Site{ID: 1, Name: "group", Type: "group", Status: "UP"}
+	group := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "group", Type: "group"},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, group)
-	e.checkGroup(group)
+	e.checkGroup(context.Background(), group)
 	s, _ := getSite(e, 1)
 	if s.Status != "PENDING" {
@@ -807,10 +837,13 @@ func TestInitHistory_LoadsFromDB(t *testing.T) {
 func TestUpdateSiteConfig_PreservesRuntime(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", URL: "http://old.com", Status: "DOWN", FailureCount: 3, Latency: 100 * time.Millisecond}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", URL: "http://old.com"},
 		SiteState:  models.SiteState{Status: "DOWN", FailureCount: 3, Latency: 100 * time.Millisecond},
 	}
 	injectSite(e, site)
-	updated := models.Site{ID: 1, Name: "test", URL: "http://new.com", Interval: 60}
+	updated := models.SiteConfig{ID: 1, Name: "test", URL: "http://new.com", Interval: 60}
 	e.UpdateSiteConfig(updated)
 	s, _ := getSite(e, 1)
@@ -831,7 +864,10 @@ func TestUpdateSiteConfig_PreservesRuntime(t *testing.T) {
 func TestRemoveSite_CleansUp(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Type: "push", Token: "tok1", Status: "UP"}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", Type: "push", Token: "tok1"},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, site)
 	e.recordCheck(1, 5*time.Millisecond, true)
@@ -851,7 +887,10 @@ func TestRemoveSite_CleansUp(t *testing.T) {
 func TestToggleSitePause(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "UP"}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test"},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, site)
 	paused := e.ToggleSitePause(1)
@@ -880,8 +919,14 @@ func TestToggleSitePause_NonexistentSite(t *testing.T) {
 func TestGetAllSites_ReturnsCopy(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	injectSite(e, models.Site{ID: 1, Name: "s1", Status: "UP"})
+	injectSite(e, models.Site{
-	injectSite(e, models.Site{ID: 2, Name: "s2", Status: "DOWN"})
+		SiteConfig: models.SiteConfig{ID: 1, Name: "s1"},
 		SiteState:  models.SiteState{Status: "UP"},
 	})
 	injectSite(e, models.Site{
 		SiteConfig: models.SiteConfig{ID: 2, Name: "s2"},
 		SiteState:  models.SiteState{Status: "DOWN"},
 	})
 	sites := e.GetAllSites()
 	if len(sites) != 2 {
@@ -900,10 +945,13 @@ func TestGetAllSites_ReturnsCopy(t *testing.T) {
 func TestGetLiveState_ReturnsCopy(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	injectSite(e, models.Site{ID: 1, Name: "s1", Status: "UP"})
+	injectSite(e, models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "s1"},
 		SiteState:  models.SiteState{Status: "UP"},
 	})
 	state := e.GetLiveState()
-	state[1] = models.Site{Name: "mutated"}
+	state[1] = models.Site{SiteConfig: models.SiteConfig{Name: "mutated"}}
 	fresh := e.GetLiveState()
 	if fresh[1].Name == "mutated" {
@@ -1019,7 +1067,8 @@ func TestConcurrent_RecordHeartbeat(t *testing.T) {
 	e := newTestEngine(ms)
 	for i := 0; i < 10; i++ {
 		injectSite(e, models.Site{
-			ID: i + 1, Type: "push", Token: fmt.Sprintf("tok-%d", i+1), Status: "UP",
+			SiteConfig: models.SiteConfig{ID: i + 1, Type: "push", Token: fmt.Sprintf("tok-%d", i+1)},
 			SiteState:  models.SiteState{Status: "UP"},
 		})
 	}
@@ -1037,7 +1086,10 @@ func TestConcurrent_RecordHeartbeat(t *testing.T) {
 func TestConcurrent_HandleStatusChangeAndGetState(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "UP", MaxRetries: 100}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", MaxRetries: 100},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, site)
 	var wg sync.WaitGroup
@@ -1090,7 +1142,10 @@ func TestConcurrent_RecordCheckAndGetHistory(t *testing.T) {
 func TestHandleStatusChange_PauseDuringCheckSurvives(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "UP", MaxRetries: 0}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", MaxRetries: 0},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, site)
 	// `site` is the stale snapshot the check ran against (Paused=false).
@@ -1114,11 +1169,14 @@ func TestHandleStatusChange_PauseDuringCheckSurvives(t *testing.T) {
 func TestHandleStatusChange_ConfigEditDuringCheckSurvives(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", URL: "http://old.com", Type: "http", Status: "UP", MaxRetries: 0, Interval: 30}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", URL: "http://old.com", Type: "http", MaxRetries: 0, Interval: 30},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, site)
 	// Config changes mid-check.
-	e.UpdateSiteConfig(models.Site{ID: 1, Name: "test", URL: "http://new.com", Type: "http", Interval: 60})
+	e.UpdateSiteConfig(models.SiteConfig{ID: 1, Name: "test", URL: "http://new.com", Type: "http", Interval: 60})
 	// Stale check (ran against http://old.com) folds its result in.
 	e.handleStatusChange(site, "UP", 200, 5*time.Millisecond, "")
@@ -1140,7 +1198,10 @@ func TestHandleStatusChange_HeartbeatNotOverwrittenByStaleDown(t *testing.T) {
 	e := newTestEngine(ms)
 	// Snapshot the engine would have taken before evaluating staleness:
 	// LastCheck is old, so checkPush decided "DOWN".
-	snap := models.Site{ID: 1, Name: "push", Type: "push", Token: "tok", Status: "UP", Interval: 10, LastCheck: time.Now().Add(-120 * time.Second)}
+	snap := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "push", Type: "push", Token: "tok", Interval: 10},
 		SiteState:  models.SiteState{Status: "UP", LastCheck: time.Now().Add(-120 * time.Second)},
 	}
 	injectSite(e, snap)
 	// A heartbeat lands first, advancing LastCheck and confirming UP.
@@ -1161,7 +1222,10 @@ func TestHandleStatusChange_HeartbeatNotOverwrittenByStaleDown(t *testing.T) {
 func TestHandleStatusChange_RemovedSiteDropped(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
-	site := models.Site{ID: 1, Name: "test", Status: "UP", MaxRetries: 0}
+	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", MaxRetries: 0},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, site)
 	e.RemoveSite(1)
@@ -1217,6 +1281,197 @@ func TestEngineStop_Idempotent(t *testing.T) {
 	e.Stop() // must not panic or block
 }
 // --- Group 12: Phase 3 engine correctness ---
 // Groups must not auto-pause when all children are paused — that creates a
 // one-way trap because monitorRoutine skips paused sites.
 func TestCheckGroup_AllPausedNoAutoFreeze(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
 	group := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "group", Type: "group"},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	child1 := models.Site{
 		SiteConfig: models.SiteConfig{ID: 2, Name: "child1", Type: "http", ParentID: 1, Paused: true},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	child2 := models.Site{
 		SiteConfig: models.SiteConfig{ID: 3, Name: "child2", Type: "http", ParentID: 1, Paused: true},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, group)
 	injectSite(e, child1)
 	injectSite(e, child2)
 	e.checkGroup(context.Background(), group)
 	s, _ := getSite(e, 1)
 	if s.Paused {
 		t.Error("group must not auto-pause when all children are paused")
 	}
 }
 // PENDING→DOWN must honor MaxRetries instead of alerting on first failure.
 func TestHandleStatusChange_PendingRetriesBeforeDown(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
 	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "new-monitor", MaxRetries: 2},
 		SiteState:  models.SiteState{Status: "PENDING"},
 	}
 	injectSite(e, site)
 	e.handleStatusChange(site, "DOWN", 0, 0, "timeout")
 	s, _ := getSite(e, 1)
 	if s.Status != "PENDING" {
 		t.Errorf("expected PENDING during retry, got %s", s.Status)
 	}
 	if s.FailureCount != 1 {
 		t.Errorf("expected FailureCount 1, got %d", s.FailureCount)
 	}
 	e.handleStatusChange(s, "DOWN", 0, 0, "timeout")
 	s, _ = getSite(e, 1)
 	if s.Status != "PENDING" {
 		t.Errorf("expected PENDING during retry 2, got %s", s.Status)
 	}
 	e.handleStatusChange(s, "DOWN", 0, 0, "timeout")
 	s, _ = getSite(e, 1)
 	if s.Status != "DOWN" {
 		t.Errorf("expected DOWN after retries exhausted, got %s", s.Status)
 	}
 }
 // LATE→DOWN must also honor MaxRetries.
 func TestHandleStatusChange_LateRetriesBeforeDown(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
 	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "push-mon", MaxRetries: 1},
 		SiteState:  models.SiteState{Status: "LATE"},
 	}
 	injectSite(e, site)
 	e.handleStatusChange(site, "DOWN", 0, 0, "missed heartbeat")
 	s, _ := getSite(e, 1)
 	if s.Status != "LATE" {
 		t.Errorf("expected LATE during retry, got %s", s.Status)
 	}
 	e.handleStatusChange(s, "DOWN", 0, 0, "missed heartbeat")
 	s, _ = getSite(e, 1)
 	if s.Status != "DOWN" {
 		t.Errorf("expected DOWN after retries exhausted, got %s", s.Status)
 	}
 }
 // Dead probe results must be expired so they don't poison aggregation.
 func TestIngestProbeResult_ExpiresStaleProbes(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
 	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", Type: "http", Interval: 30},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, site)
 	e.probeResultsMu.Lock()
 	e.probeResults[1] = map[string]NodeResult{
 		"dead-probe": {
 			NodeID:    "dead-probe",
 			IsUp:      false,
 			CheckedAt: time.Now().Add(-10 * time.Minute),
 		},
 	}
 	e.probeResultsMu.Unlock()
 	e.IngestProbeResult("live-probe", 1, 5000, true, "")
 	e.probeResultsMu.RLock()
 	_, deadExists := e.probeResults[1]["dead-probe"]
 	_, liveExists := e.probeResults[1]["live-probe"]
 	e.probeResultsMu.RUnlock()
 	if deadExists {
 		t.Error("stale probe result should have been expired")
 	}
 	if !liveExists {
 		t.Error("live probe result should still exist")
 	}
 }
 // RemoveSite must clean up probeResults.
 func TestRemoveSite_CleansProbeResults(t *testing.T) {
 	ms := newMockStore()
 	e := newTestEngine(ms)
 	site := models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", Type: "http"},
 		SiteState:  models.SiteState{Status: "UP"},
 	}
 	injectSite(e, site)
 	e.probeResultsMu.Lock()
 	e.probeResults[1] = map[string]NodeResult{
 		"node-a": {NodeID: "node-a", IsUp: true, CheckedAt: time.Now()},
 	}
 	e.probeResultsMu.Unlock()
 	e.RemoveSite(1)
 	e.probeResultsMu.RLock()
 	defer e.probeResultsMu.RUnlock()
 	if _, exists := e.probeResults[1]; exists {
 		t.Error("probe results should be cleaned up after RemoveSite")
 	}
 }
 // After a cache refresh, a maintenance window on a group must cover the group
 // itself and its children, while unknown monitor IDs stay unaffected.
 func TestIsInMaintenance_UsesCache(t *testing.T) {
 	ms := newMockStore()
 	// Maintenance is declared directly on the group only.
 	ms.maintenance[10] = true
 	e := newTestEngine(ms)
 	injectSite(e, models.Site{
 		SiteConfig: models.SiteConfig{ID: 10, Name: "group", Type: "group"},
 		SiteState:  models.SiteState{Status: "UP"},
 	})
 	injectSite(e, models.Site{
 		SiteConfig: models.SiteConfig{ID: 20, Name: "child", Type: "http", ParentID: 10},
 		SiteState:  models.SiteState{Status: "UP"},
 	})
 	e.refreshMaintenanceCache(context.Background())
 	groupCovered := e.isInMaintenance(10)
 	if !groupCovered {
 		t.Error("group should be in maintenance (direct)")
 	}
 	childCovered := e.isInMaintenance(20)
 	if !childCovered {
 		t.Error("child should be in maintenance (parent)")
 	}
 	unknownCovered := e.isInMaintenance(99)
 	if unknownCovered {
 		t.Error("unknown monitor should not be in maintenance")
 	}
 }
 // A maintenance window registered under monitor ID 0 is global and must put
 // every monitor into maintenance.
 func TestIsInMaintenance_GlobalMaintenance(t *testing.T) {
 	ms := newMockStore()
 	ms.maintenance[0] = true
 	e := newTestEngine(ms)
 	injectSite(e, models.Site{
 		SiteConfig: models.SiteConfig{ID: 1, Name: "test", Type: "http"},
 		SiteState:  models.SiteState{Status: "UP"},
 	})
 	e.refreshMaintenanceCache(context.Background())
 	if covered := e.isInMaintenance(1); !covered {
 		t.Error("all monitors should be in maintenance during global window")
 	}
 }
 // --- Utilities ---
 func containsStr(s, substr string) bool {
@@ -11,9 +11,11 @@ var privateRanges []*net.IPNet
 func init() {
 	cidrs := []string{
 		"0.0.0.0/8",
 		"127.0.0.0/8",
 		"::1/128",
 		"10.0.0.0/8",
 		"100.64.0.0/10",
 		"172.16.0.0/12",
 		"192.168.0.0/16",
 		"169.254.0.0/16",
@@ -27,6 +29,9 @@ func init() {
 }
 func isPrivateIP(ip net.IP) bool {
 	if ip.IsUnspecified() || ip.IsMulticast() || ip.IsLoopback() {
 		return true
 	}
 	for _, network := range privateRanges {
 		if network.Contains(ip) {
 			return true
@@ -16,14 +16,14 @@ type SLAReport struct {
 	MTBF        time.Duration
 }
-func ComputeSLA(changes []models.StateChange, currentStatus string, window time.Duration) SLAReport {
+func ComputeSLA(changes []models.StateChange, currentStatus models.Status, window time.Duration) SLAReport {
 	now := time.Now()
 	windowStart := now.Add(-window)
 	report := SLAReport{Window: window}
 	if len(changes) == 0 {
-		if isDown(currentStatus) {
+		if models.Status(currentStatus).IsBroken() {
 			report.UptimePct = 0
 			report.Downtime = window
 		} else {
@@ -40,7 +40,7 @@ func ComputeSLA(changes []models.StateChange, currentStatus string, window time.
 	}
 	// Determine status at window start: last transition before or at windowStart.
-	statusAtStart := "UP"
+	statusAtStart := string(models.StatusUp)
 	for i := len(sorted) - 1; i >= 0; i-- {
 		if !sorted[i].ChangedAt.After(windowStart) {
 			statusAtStart = sorted[i].ToStatus
@@ -51,7 +51,7 @@ func ComputeSLA(changes []models.StateChange, currentStatus string, window time.
 	var upTime, downTime time.Duration
 	var outages []time.Duration
 	cursor := windowStart
-	wasDown := isDown(statusAtStart)
+	wasDown := models.Status(statusAtStart).IsBroken()
 	if wasDown {
 		report.OutageCount = 1
@@ -77,7 +77,7 @@ func ComputeSLA(changes []models.StateChange, currentStatus string, window time.
 			upTime += seg
 		}
-		newDown := isDown(sc.ToStatus)
+		newDown := models.Status(sc.ToStatus).IsBroken()
 		if !wasDown && newDown {
 			report.OutageCount++
 			outageStart = sc.ChangedAt
@@ -127,18 +127,15 @@ func ComputeSLA(changes []models.StateChange, currentStatus string, window time.
 	return report
 }
-func ComputeDailyBreakdown(changes []models.StateChange, currentStatus string, days int, now time.Time) []DayReport {
+func ComputeDailyBreakdown(changes []models.StateChange, currentStatus models.Status, days int, now time.Time) []DayReport {
 	reports := make([]DayReport, days)
 	for i := 0; i < days; i++ {
-		dayEnd := time.Date(now.Year(), now.Month(), now.Day(), 0, 0, 0, 0, now.Location()).Add(-time.Duration(i) * 24 * time.Hour)
+		dayStart := time.Date(now.Year(), now.Month(), now.Day()-i, 0, 0, 0, 0, now.Location())
 		dayEnd := time.Date(now.Year(), now.Month(), now.Day()-i+1, 0, 0, 0, 0, now.Location())
 		if i == 0 {
 			dayEnd = now
 		}
 		dayStart := time.Date(now.Year(), now.Month(), now.Day(), 0, 0, 0, 0, now.Location()).Add(-time.Duration(i) * 24 * time.Hour)
 		if i > 0 {
 			dayEnd = dayStart.Add(24 * time.Hour)
 		}
 		windowChanges := filterChangesForWindow(changes, dayStart, dayEnd)
@@ -159,10 +156,6 @@ type DayReport struct {
 	UptimePct float64
 }
 // isDown reports whether status counts as an outage: exactly "DOWN" or
 // "SSL EXP". Every other value, including the empty string, is not down.
 func isDown(status string) bool {
 	switch status {
 	case "DOWN", "SSL EXP":
 		return true
 	default:
 		return false
 	}
 }
 func filterChangesForWindow(changes []models.StateChange, start, end time.Time) []models.StateChange {
 	var filtered []models.StateChange
 	for _, sc := range changes {
@@ -180,7 +173,7 @@ func inferStatusAt(changes []models.StateChange, at time.Time) string {
 			return sc.ToStatus
 		}
 	}
-	return "UP"
+	return string(models.StatusUp)
 }
 func computeSLAForWindow(changes []models.StateChange, statusAtStart string, start, end time.Time) float64 {
@@ -193,7 +186,7 @@ func computeSLAForWindow(changes []models.StateChange, statusAtStart string, sta
 	var upTime, downTime time.Duration
 	cursor := start
-	wasDown := isDown(statusAtStart)
+	wasDown := models.Status(statusAtStart).IsBroken()
 	for _, sc := range sorted {
 		if sc.ChangedAt.Before(start) || !sc.ChangedAt.Before(end) {
@@ -205,7 +198,7 @@ func computeSLAForWindow(changes []models.StateChange, statusAtStart string, sta
 		} else {
 			upTime += seg
 		}
-		wasDown = isDown(sc.ToStatus)
+		wasDown = models.Status(sc.ToStatus).IsBroken()
 		cursor = sc.ChangedAt
 	}
@@ -137,24 +137,24 @@ func TestComputeDailyBreakdown(t *testing.T) {
 	}
 }
-func TestIsDown(t *testing.T) {
+func TestIsBroken(t *testing.T) {
-	if !isDown("DOWN") {
+	if !models.StatusDown.IsBroken() {
-		t.Error("DOWN should be down")
+		t.Error("DOWN should be broken")
 	}
-	if !isDown("SSL EXP") {
+	if !models.StatusSSLExp.IsBroken() {
-		t.Error("SSL EXP should be down")
+		t.Error("SSL EXP should be broken")
 	}
-	if isDown("UP") {
+	if models.StatusUp.IsBroken() {
-		t.Error("UP should not be down")
+		t.Error("UP should not be broken")
 	}
-	if isDown("LATE") {
+	if models.StatusLate.IsBroken() {
-		t.Error("LATE should not be down")
+		t.Error("LATE should not be broken")
 	}
-	if isDown("STALE") {
+	if models.StatusStale.IsBroken() {
-		t.Error("STALE should not be down")
+		t.Error("STALE should not be broken")
 	}
-	if isDown("PENDING") {
+	if models.StatusPending.IsBroken() {
-		t.Error("PENDING should not be down")
+		t.Error("PENDING should not be broken")
 	}
 }
@@ -25,6 +25,7 @@ type RateLimiter struct {
 	rate     float64
 	burst    float64
 	trusted  []*net.IPNet
 	stop     chan struct{}
 }
 func NewRateLimiter(requestsPerMinute int, trusted []*net.IPNet) *RateLimiter {
@@ -33,11 +34,16 @@ func NewRateLimiter(requestsPerMinute int, trusted []*net.IPNet) *RateLimiter {
 		rate:     float64(requestsPerMinute) / 60.0,
 		burst:    float64(requestsPerMinute),
 		trusted:  trusted,
 		stop:     make(chan struct{}),
 	}
 	go rl.cleanup()
 	return rl
 }
 // Stop signals the background cleanup goroutine to exit by closing the stop
 // channel. It is safe to call more than once: closing an already-closed
 // channel panics, so the close is guarded and serialized under rl.mu.
 func (rl *RateLimiter) Stop() {
 	rl.mu.Lock()
 	defer rl.mu.Unlock()
 	select {
 	case <-rl.stop:
 		// Already closed by an earlier Stop call; nothing left to do.
 	default:
 		close(rl.stop)
 	}
 }
 func (rl *RateLimiter) Allow(ip string) bool {
 	rl.mu.Lock()
 	defer rl.mu.Unlock()
@@ -84,16 +90,22 @@ func (rl *RateLimiter) evictOldest() {
 }
 func (rl *RateLimiter) cleanup() {
 	ticker := time.NewTicker(5 * time.Minute)
 	defer ticker.Stop()
 	for {
-		time.Sleep(5 * time.Minute)
+		select {
-		rl.mu.Lock()
+		case <-ticker.C:
-		cutoff := time.Now().Add(-10 * time.Minute)
+			rl.mu.Lock()
-		for ip, v := range rl.visitors {
+			cutoff := time.Now().Add(-10 * time.Minute)
-			if v.lastSeen.Before(cutoff) {
+			for ip, v := range rl.visitors {
-				delete(rl.visitors, ip)
+				if v.lastSeen.Before(cutoff) {
 					delete(rl.visitors, ip)
 				}
 			}
 			rl.mu.Unlock()
 		case <-rl.stop:
 			return
 		}
 		rl.mu.Unlock()
 	}
 }
@@ -5,7 +5,7 @@ import (
 	"encoding/json"
 	"fmt"
 	"html/template"
-	"log"
+	"log/slog"
 	"net"
 	"net/http"
 	"sort"
@@ -21,6 +21,395 @@ import (
 const maxRequestBody = 1 << 20
 // ServerConfig holds the settings the HTTP server reads when building its
 // routes, middleware chain and listener.
 type ServerConfig struct {
 	// Port is the TCP port the listener binds to (address ":<Port>").
 	Port           int
 	// EnableStatus registers the /status and /status/json routes when true.
 	EnableStatus   bool
 	// Title is passed to the status page renderer.
 	Title          string
 	// ClusterKey is the shared secret compared against the X-Uptop-Secret
 	// request header. When empty, endpoints guarded by requireAuth reject
 	// every request.
 	ClusterKey     string
 	// TLSCert and TLSKey are handed to ListenAndServeTLS when both are set.
 	// A non-empty TLSCert alone also enables the HSTS middleware.
 	TLSCert        string
 	TLSKey         string
 	// ClusterMode is only inspected at startup here: any value other than ""
 	// or "leader" without TLSCert triggers a cleartext-secrets warning.
 	ClusterMode    string
 	// MetricsPublic lets /metrics be served without the cluster secret.
 	MetricsPublic  bool
 	// CORSOrigin, when non-empty, is sent as Access-Control-Allow-Origin on
 	// /status/json responses.
 	CORSOrigin     string
 	// TrustedProxies is forwarded to every rate limiter and to the logging
 	// middleware. NOTE(review): presumably used to decide when forwarded
 	// client-IP headers are honored; confirm against those implementations.
 	TrustedProxies []*net.IPNet
 	// QuietHTTPLog disables the per-request logging middleware when true.
 	QuietHTTPLog   bool
 }
 // Server bundles the dependencies shared by all HTTP handlers: configuration,
 // the persistent store, the monitoring engine and one rate limiter per
 // endpoint family.
 type Server struct {
 	cfg      ServerConfig
 	store    store.Store
 	eng      *monitor.Engine
 	// pushRL guards /api/push.
 	pushRL   *RateLimiter
 	// probeRL guards the /api/probe/* endpoints.
 	probeRL  *RateLimiter
 	// backupRL guards /api/backup/* and /api/import/kuma.
 	backupRL *RateLimiter
 	// statusRL guards /status and /status/json.
 	statusRL *RateLimiter
 }
 // NewServer wires a Server from its configuration, store and engine, and
 // creates the per-endpoint rate limiters: 60 requests per minute for push,
 // 30 for probe, 10 for backup and 120 for status. All limiters share
 // cfg.TrustedProxies.
 func NewServer(cfg ServerConfig, s store.Store, eng *monitor.Engine) *Server {
 	proxies := cfg.TrustedProxies
 	srv := &Server{cfg: cfg, store: s, eng: eng}
 	srv.pushRL = NewRateLimiter(60, proxies)
 	srv.probeRL = NewRateLimiter(30, proxies)
 	srv.backupRL = NewRateLimiter(10, proxies)
 	srv.statusRL = NewRateLimiter(120, proxies)
 	return srv
 }
 // Start is a convenience wrapper that builds a Server with NewServer and
 // immediately starts it, returning the underlying *http.Server.
 func Start(cfg ServerConfig, s store.Store, eng *monitor.Engine) *http.Server {
 	return NewServer(cfg, s, eng).Start()
 }
 // Start logs configuration warnings, builds the http.Server and begins
 // serving in a background goroutine. It returns immediately with the
 // *http.Server. HTTPS is used when both TLSCert and TLSKey are set, plain HTTP
 // otherwise. Listener errors other than http.ErrServerClosed are logged.
 func (s *Server) Start() *http.Server {
 	if s.cfg.ClusterKey == "" {
 		slog.Warn("no UPTOP_CLUSTER_SECRET set, cluster API endpoints will reject all requests")
 	}
 	mode := s.cfg.ClusterMode
 	nonLeaderNode := mode != "" && mode != "leader"
 	if nonLeaderNode && s.cfg.TLSCert == "" {
 		slog.Warn("cluster mode active without TLS, secrets transmitted in cleartext")
 	}
 	addr := fmt.Sprintf(":%d", s.cfg.Port)
 	httpSrv := &http.Server{
 		Addr:              addr,
 		Handler:           s.routes(),
 		ReadHeaderTimeout: 10 * time.Second,
 		ReadTimeout:       30 * time.Second,
 		WriteTimeout:      60 * time.Second,
 		IdleTimeout:       120 * time.Second,
 	}
 	go func() {
 		var (
 			serveErr   error
 			failureMsg string
 		)
 		switch {
 		case s.cfg.TLSCert != "" && s.cfg.TLSKey != "":
 			slog.Info("HTTPS server listening", "addr", addr)
 			failureMsg = "HTTPS server failed"
 			serveErr = httpSrv.ListenAndServeTLS(s.cfg.TLSCert, s.cfg.TLSKey)
 		default:
 			slog.Info("HTTP server listening", "addr", addr)
 			failureMsg = "HTTP server failed"
 			serveErr = httpSrv.ListenAndServe()
 		}
 		// ErrServerClosed is the normal result of a shutdown, not a failure.
 		if serveErr != nil && serveErr != http.ErrServerClosed {
 			slog.Error(failureMsg, "err", serveErr)
 		}
 	}()
 	return httpSrv
 }
 // routes builds the request multiplexer and wraps it in the middleware chain.
 // The status endpoints are registered only when EnableStatus is set. Security
 // headers are always applied, request logging unless QuietHTTPLog is set, and
 // HSTS only when a TLS certificate is configured.
 func (s *Server) routes() http.Handler {
 	type route struct {
 		pattern string
 		handle  func(http.ResponseWriter, *http.Request)
 	}
 	table := []route{
 		{"/api/push", RateLimit(s.pushRL, s.handlePush)},
 		{"/api/health", s.handleHealth},
 		{"/api/backup/export", RateLimit(s.backupRL, s.handleExport)},
 		{"/api/backup/import", RateLimit(s.backupRL, s.handleImport)},
 		{"/api/import/kuma", RateLimit(s.backupRL, s.handleKumaImport)},
 		{"/api/probe/register", RateLimit(s.probeRL, s.handleProbeRegister)},
 		{"/api/probe/assignments", RateLimit(s.probeRL, s.handleProbeAssignments)},
 		{"/api/probe/results", RateLimit(s.probeRL, s.handleProbeResults)},
 		{"/metrics", s.handleMetrics},
 	}
 	if s.cfg.EnableStatus {
 		table = append(table,
 			route{"/status", RateLimit(s.statusRL, s.handleStatus)},
 			route{"/status/json", RateLimit(s.statusRL, s.handleStatusJSON)},
 		)
 	}
 	mux := http.NewServeMux()
 	for _, rt := range table {
 		mux.HandleFunc(rt.pattern, rt.handle)
 	}
 	// Each wrapper added below sits outside the ones added before it.
 	handler := securityHeadersMiddleware(mux)
 	if !s.cfg.QuietHTTPLog {
 		handler = loggingMiddleware(s.cfg.TrustedProxies, handler)
 	}
 	if s.cfg.TLSCert != "" {
 		handler = hstsMiddleware(handler)
 	}
 	return handler
 }
 // requireAuth reports whether the request carries the cluster secret in its
 // X-Uptop-Secret header. With no secret configured it always returns false,
 // so protected endpoints fail closed.
 func (s *Server) requireAuth(r *http.Request) bool {
 	expected := s.cfg.ClusterKey
 	if expected == "" {
 		return false
 	}
 	return checkSecret(r.Header.Get("X-Uptop-Secret"), expected)
 }
 // handlePush records a heartbeat for a push monitor. It accepts GET and POST.
 // The token is taken from the Authorization bearer header first, with the
 // deprecated "token" query parameter as a fallback. It responds 400 when no
 // token is supplied, 404 when the engine does not accept the token, and
 // 200 "OK" otherwise.
 func (s *Server) handlePush(w http.ResponseWriter, r *http.Request) {
 	switch r.Method {
 	case http.MethodGet, http.MethodPost:
 		// Accepted methods.
 	default:
 		http.Error(w, "Method not allowed", http.StatusMethodNotAllowed)
 		return
 	}
 	token := extractBearerToken(r)
 	if token == "" {
 		token = r.URL.Query().Get("token")
 		if token != "" {
 			slog.Warn("push token in query string is deprecated, use Authorization: Bearer header")
 		}
 	}
 	if token == "" {
 		http.Error(w, "Missing token", http.StatusBadRequest)
 		return
 	}
 	if !s.eng.RecordHeartbeat(token) {
 		http.Error(w, "Invalid Token", http.StatusNotFound)
 		return
 	}
 	w.WriteHeader(http.StatusOK)
 	_, _ = w.Write([]byte("OK"))
 }
 // handleHealth answers GET requests with 200 "OK". When a cluster secret is
 // configured the X-Uptop-Secret header must match it. Unlike requireAuth, an
 // empty cluster key leaves this endpoint open.
 func (s *Server) handleHealth(w http.ResponseWriter, r *http.Request) {
 	if r.Method != http.MethodGet {
 		http.Error(w, "Method not allowed", http.StatusMethodNotAllowed)
 		return
 	}
 	if key := s.cfg.ClusterKey; key != "" {
 		if !checkSecret(r.Header.Get("X-Uptop-Secret"), key) {
 			http.Error(w, "Unauthorized", http.StatusUnauthorized)
 			return
 		}
 	}
 	w.WriteHeader(http.StatusOK)
 	_, _ = w.Write([]byte("OK"))
 }
 // handleExport streams the store's full export as JSON. It accepts GET only
 // and requires the cluster secret. Alert settings are passed through
 // models.RedactAlertSettings unless the caller sends redact_secrets=false.
 // It responds 405 on a wrong method, 401 without a valid secret and 500 when
 // the store export fails.
 func (s *Server) handleExport(w http.ResponseWriter, r *http.Request) {
 	if r.Method != http.MethodGet {
 		http.Error(w, "Method not allowed", http.StatusMethodNotAllowed)
 		return
 	}
 	if !s.requireAuth(r) {
 		http.Error(w, "Unauthorized: UPTOP_CLUSTER_SECRET required", http.StatusUnauthorized)
 		return
 	}
 	data, err := s.store.ExportData(r.Context())
 	if err != nil {
 		slog.Error("export failed", "err", err)
 		http.Error(w, "Export failed", http.StatusInternalServerError)
 		return
 	}
 	// Redaction is the default; only the literal value "false" disables it.
 	if r.URL.Query().Get("redact_secrets") != "false" {
 		for i := range data.Alerts {
 			data.Alerts[i].Settings = models.RedactAlertSettings(data.Alerts[i].Type, data.Alerts[i].Settings)
 		}
 	}
 	// Declare the payload type explicitly, matching the other JSON endpoints.
 	// Without it net/http sniffs the body and labels it text/plain.
 	w.Header().Set("Content-Type", "application/json")
 	_ = json.NewEncoder(w).Encode(data) //nolint:errcheck
 }
 // handleImport restores a JSON backup posted by an authenticated caller. The
 // body is capped at maxRequestBody bytes. User records in the payload are
 // always discarded before the data reaches the store.
 func (s *Server) handleImport(w http.ResponseWriter, r *http.Request) {
 	if r.Method != http.MethodPost {
 		http.Error(w, "POST required", http.StatusMethodNotAllowed)
 		return
 	}
 	if !s.requireAuth(r) {
 		http.Error(w, "Unauthorized", http.StatusUnauthorized)
 		return
 	}
 	r.Body = http.MaxBytesReader(w, r.Body, maxRequestBody)
 	var payload models.Backup
 	decodeErr := json.NewDecoder(r.Body).Decode(&payload)
 	if decodeErr != nil {
 		http.Error(w, "Invalid JSON", http.StatusBadRequest)
 		return
 	}
 	// The API path must never touch users: whoever holds the cluster secret
 	// should not be able to swap out admin accounts. A full restore, users
 	// included, stays available through the CLI.
 	payload.Users = nil
 	importErr := s.store.ImportData(r.Context(), payload)
 	if importErr != nil {
 		slog.Error("import failed", "err", importErr)
 		http.Error(w, "Import failed", http.StatusInternalServerError)
 		return
 	}
 	_, _ = w.Write([]byte("Import Successful (users excluded — manage via CLI or UPTOP_KEYS)"))
 }
 // handleKumaImport accepts a Kuma backup as JSON from an authenticated
 // caller, converts it with importer.ConvertKuma and imports the result into
 // the store. The body is capped at maxRequestBody bytes. On success it
 // replies with a one-line summary of how many monitors and alerts came in.
 func (s *Server) handleKumaImport(w http.ResponseWriter, r *http.Request) {
 	if r.Method != http.MethodPost {
 		http.Error(w, "POST required", http.StatusMethodNotAllowed)
 		return
 	}
 	if !s.requireAuth(r) {
 		http.Error(w, "Unauthorized", http.StatusUnauthorized)
 		return
 	}
 	r.Body = http.MaxBytesReader(w, r.Body, maxRequestBody)
 	var kuma importer.KumaBackup
 	decodeErr := json.NewDecoder(r.Body).Decode(&kuma)
 	if decodeErr != nil {
 		slog.Error("invalid Kuma JSON", "err", decodeErr)
 		http.Error(w, "Invalid Kuma JSON", http.StatusBadRequest)
 		return
 	}
 	converted := importer.ConvertKuma(&kuma)
 	importErr := s.store.ImportData(r.Context(), converted)
 	if importErr != nil {
 		slog.Error("Kuma import failed", "err", importErr)
 		http.Error(w, "Import failed", http.StatusInternalServerError)
 		return
 	}
 	monitorCount, alertCount := len(converted.Sites), len(converted.Alerts)
 	fmt.Fprintf(w, "Imported %d monitors, %d alerts from Kuma v%s", monitorCount, alertCount, kuma.Version)
 }
 // handleProbeRegister registers a probe node with the store. It accepts an
 // authenticated POST whose JSON body carries id, name, region and version.
 // Only id is required. The body is capped at maxRequestBody bytes. It
 // responds 400 on malformed JSON or a missing id, 500 when the store rejects
 // the registration, and {"ok":true} on success.
 func (s *Server) handleProbeRegister(w http.ResponseWriter, r *http.Request) {
 	if r.Method != http.MethodPost {
 		http.Error(w, "POST required", http.StatusMethodNotAllowed)
 		return
 	}
 	if !s.requireAuth(r) {
 		http.Error(w, "Unauthorized", http.StatusUnauthorized)
 		return
 	}
 	r.Body = http.MaxBytesReader(w, r.Body, maxRequestBody)
 	var req struct {
 		ID      string `json:"id"`
 		Name    string `json:"name"`
 		Region  string `json:"region"`
 		Version string `json:"version"`
 	}
 	if err := json.NewDecoder(r.Body).Decode(&req); err != nil {
 		http.Error(w, "Invalid JSON", http.StatusBadRequest)
 		return
 	}
 	if req.ID == "" {
 		http.Error(w, "id is required", http.StatusBadRequest)
 		return
 	}
 	if err := s.store.RegisterNode(r.Context(), models.ProbeNode{
 		ID: req.ID, Name: req.Name, Region: req.Region, Version: req.Version,
 	}); err != nil {
 		slog.Error("probe registration failed", "err", err)
 		http.Error(w, "Registration failed", http.StatusInternalServerError)
 		return
 	}
 	// Declare the payload type explicitly, matching the other JSON endpoints.
 	// Without it net/http sniffs the body and labels it text/plain.
 	w.Header().Set("Content-Type", "application/json")
 	_ = json.NewEncoder(w).Encode(map[string]bool{"ok": true}) //nolint:errcheck
 }
 // handleProbeAssignments returns the monitors a probe node should check, as
 // {"sites":[...]}. It accepts an authenticated GET with an optional node_id
 // query parameter. Paused, push and group monitors are never assigned.
 // Region filtering applies only when the monitor lists regions and the
 // node's region is known. If node_id is absent or the node lookup fails, the
 // node region stays empty and no region filter is applied.
 func (s *Server) handleProbeAssignments(w http.ResponseWriter, r *http.Request) {
 	if r.Method != http.MethodGet {
 		http.Error(w, "Method not allowed", http.StatusMethodNotAllowed)
 		return
 	}
 	if !s.requireAuth(r) {
 		http.Error(w, "Unauthorized", http.StatusUnauthorized)
 		return
 	}
 	nodeID := r.URL.Query().Get("node_id")
 	var nodeRegion string
 	if nodeID != "" {
 		if node, err := s.store.GetNode(r.Context(), nodeID); err == nil {
 			nodeRegion = node.Region
 		}
 	}
 	sites := s.eng.GetAllSites()
 	// Start from an empty, non-nil slice so that "nothing assigned" encodes as
 	// {"sites":[]} rather than {"sites":null}.
 	assigned := make([]models.Site, 0, len(sites))
 	for _, site := range sites {
 		if site.Paused || site.Type == "push" || site.Type == "group" {
 			continue
 		}
 		if site.Regions != "" && nodeRegion != "" {
 			// Regions is a comma-separated list; entries may carry spaces.
 			matched := false
 			for _, reg := range strings.Split(site.Regions, ",") {
 				if strings.TrimSpace(reg) == nodeRegion {
 					matched = true
 					break
 				}
 			}
 			if !matched {
 				continue
 			}
 		}
 		assigned = append(assigned, site)
 	}
 	w.Header().Set("Content-Type", "application/json")
 	_ = json.NewEncoder(w).Encode(map[string][]models.Site{"sites": assigned}) //nolint:errcheck
 }
 // handleProbeResults ingests a batch of check results reported by a probe
 // node. It accepts an authenticated POST whose JSON body carries node_id and
 // a results array. The body is capped at maxRequestBody bytes. Every result
 // is handed to the engine through both EnqueueProbeCheck and
 // IngestProbeResult, then the node's last-seen time is updated. A failure of
 // that update is logged but does not fail the request. It responds 400 on
 // malformed JSON or a missing node_id, and {"ok":true} otherwise.
 func (s *Server) handleProbeResults(w http.ResponseWriter, r *http.Request) {
 	if r.Method != http.MethodPost {
 		http.Error(w, "POST required", http.StatusMethodNotAllowed)
 		return
 	}
 	if !s.requireAuth(r) {
 		http.Error(w, "Unauthorized", http.StatusUnauthorized)
 		return
 	}
 	r.Body = http.MaxBytesReader(w, r.Body, maxRequestBody)
 	var req struct {
 		NodeID  string `json:"node_id"`
 		Results []struct {
 			SiteID      int    `json:"site_id"`
 			LatencyNs   int64  `json:"latency_ns"`
 			IsUp        bool   `json:"is_up"`
 			ErrorReason string `json:"error_reason"`
 		} `json:"results"`
 	}
 	if err := json.NewDecoder(r.Body).Decode(&req); err != nil {
 		http.Error(w, "Invalid JSON", http.StatusBadRequest)
 		return
 	}
 	if req.NodeID == "" {
 		http.Error(w, "node_id is required", http.StatusBadRequest)
 		return
 	}
 	for _, result := range req.Results {
 		s.eng.EnqueueProbeCheck(result.SiteID, req.NodeID, result.LatencyNs, result.IsUp)
 		s.eng.IngestProbeResult(req.NodeID, result.SiteID, result.LatencyNs, result.IsUp, result.ErrorReason)
 	}
 	if err := s.store.UpdateNodeLastSeen(r.Context(), req.NodeID); err != nil {
 		slog.Error("node last-seen update failed", "err", err)
 	}
 	// Declare the payload type explicitly, matching the other JSON endpoints.
 	// Without it net/http sniffs the body and labels it text/plain.
 	w.Header().Set("Content-Type", "application/json")
 	_ = json.NewEncoder(w).Encode(map[string]bool{"ok": true}) //nolint:errcheck
 }
 // handleMetrics serves the metrics endpoint for GET requests. The cluster
 // secret is required unless MetricsPublic is enabled. The response itself is
 // produced by the handler that metrics.Handler returns for the engine.
 func (s *Server) handleMetrics(w http.ResponseWriter, r *http.Request) {
 	if r.Method != http.MethodGet {
 		http.Error(w, "Method not allowed", http.StatusMethodNotAllowed)
 		return
 	}
 	// Auth is consulted only when the endpoint is not public.
 	if !s.cfg.MetricsPublic && !s.requireAuth(r) {
 		http.Error(w, "Unauthorized", http.StatusUnauthorized)
 		return
 	}
 	serve := metrics.Handler(s.eng)
 	serve(w, r)
 }
 // handleStatus renders the status page with the configured title and the
 // engine. The incoming request is not inspected.
 func (s *Server) handleStatus(w http.ResponseWriter, _ *http.Request) {
 	pageTitle := s.cfg.Title
 	renderStatusPage(w, pageTitle, s.eng)
 }
 // handleStatusJSON serves the public JSON view of every monitor, keyed by the
 // engine's live-state key. A monitor is shown as "MAINT" when an active
 // window of type "maintenance" targets it, targets its parent, or is global
 // (MonitorID 0). Only the fields of statusSite are exposed. The
 // Access-Control-Allow-Origin header is set when CORSOrigin is configured.
 func (s *Server) handleStatusJSON(w http.ResponseWriter, r *http.Request) {
 	state := s.eng.GetLiveState()
 	activeWindows, err := s.store.GetActiveMaintenanceWindows(r.Context())
 	if err != nil {
 		// Best effort: keep serving live statuses, but surface the failure
 		// instead of silently reporting monitors without their MAINT overlay.
 		slog.Warn("maintenance window lookup failed", "err", err)
 	}
 	maintSet := make(map[int]bool)
 	allInMaint := false
 	for _, mw := range activeWindows {
 		if mw.Type != "maintenance" {
 			continue
 		}
 		if mw.MonitorID == 0 {
 			allInMaint = true
 		} else {
 			maintSet[mw.MonitorID] = true
 		}
 	}
 	public := make(map[int]statusSite, len(state))
 	for id, site := range state {
 		displayStatus := string(site.Status)
 		if allInMaint || maintSet[site.ID] || (site.ParentID > 0 && maintSet[site.ParentID]) {
 			displayStatus = "MAINT"
 		}
 		public[id] = statusSite{
 			Name:      site.Name,
 			Type:      site.Type,
 			URL:       site.URL,
 			Status:    displayStatus,
 			Paused:    site.Paused,
 			LastCheck: site.LastCheck,
 			Latency:   site.Latency,
 		}
 	}
 	if s.cfg.CORSOrigin != "" {
 		w.Header().Set("Access-Control-Allow-Origin", s.cfg.CORSOrigin)
 	}
 	w.Header().Set("Content-Type", "application/json")
 	_ = json.NewEncoder(w).Encode(public) //nolint:errcheck
 }
 // --- Helpers ---
 // checkSecret reports whether got equals want, comparing the two with
 // subtle.ConstantTimeCompare rather than the == operator.
 func checkSecret(got, want string) bool {
 	supplied, expected := []byte(got), []byte(want)
 	verdict := subtle.ConstantTimeCompare(supplied, expected)
 	return verdict == 1
 }
@@ -33,39 +422,78 @@ func extractBearerToken(r *http.Request) string {
 	return ""
 }
-// safeSettingKeys lists, per provider type, the settings that are NOT secret
+// statusSite is the public DTO for /status/json.
-// and may be exported in the clear. Everything else is redacted. Providers
+type statusSite struct {
-// absent from this map (discord, slack, webhook, pushover) carry their secret
+	Name      string
-// in a field a denylist would miss — the webhook URL, the pushover token/user —
+	Type      string
-// so all of their settings are redacted.
+	URL       string
-var safeSettingKeys = map[string]map[string]bool{
+	Status    string
-	"email":     {"host": true, "port": true, "to": true, "from": true},
+	Paused    bool
-	"ntfy":      {"topic": true, "priority": true},
+	LastCheck time.Time
-	"telegram":  {"chat_id": true},
+	Latency   time.Duration
 	"pagerduty": {"severity": true},
 	"gotify":    {"priority": true},
 	"opsgenie":  {"priority": true, "eu": true},
 }
-// redactByProvider keeps only the known-safe keys for the alert type and
+// --- Middleware ---
-// redacts everything else. An allowlist fails safe: an unknown or newly added
+
-// setting is redacted by default instead of leaking. This closes the denylist
+type statusWriter struct {
-// gap where url (discord/slack/webhook/ntfy/gotify) and api_key (opsgenie) —
+	http.ResponseWriter
-// the actual credentials — were exported in the clear.
+	code int
-func redactByProvider(alertType string, settings map[string]string) map[string]string {
+}
-	safe := safeSettingKeys[alertType]
+
-	redacted := make(map[string]string, len(settings))
+func (w *statusWriter) WriteHeader(code int) {
-	for k, v := range settings {
+	w.code = code
-		switch {
+	w.ResponseWriter.WriteHeader(code)
-		case v == "":
+}
-			redacted[k] = ""
+
-		case safe[k]:
+func loggingMiddleware(trusted []*net.IPNet, next http.Handler) http.Handler {
-			redacted[k] = v
+	return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
-		default:
+		start := time.Now()
-			redacted[k] = "***REDACTED***"
+		sw := &statusWriter{ResponseWriter: w, code: 200}
 		next.ServeHTTP(sw, r)
 		path := strings.ReplaceAll(strings.ReplaceAll(r.URL.Path, "\n", ""), "\r", "")
 		slog.Info("http request", "method", r.Method, "path", path, "status", sw.code, "duration", time.Since(start).Round(time.Millisecond), "ip", clientIP(r, trusted)) //nolint:gosec // structured slog, not format string
 	})
 }
 // securityHeadersMiddleware returns a handler that sets a fixed group of
 // security-related response headers and then hands the request to next.
 func securityHeadersMiddleware(next http.Handler) http.Handler {
 	fixed := [...][2]string{
 		{"X-Content-Type-Options", "nosniff"},
 		{"X-Frame-Options", "DENY"},
 		{"Referrer-Policy", "no-referrer"},
 		{"Content-Security-Policy", "default-src 'self'; script-src 'unsafe-inline'; style-src 'unsafe-inline'"},
 	}
 	return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
 		hdr := w.Header()
 		for _, kv := range fixed {
 			hdr.Set(kv[0], kv[1])
 		}
 		next.ServeHTTP(w, r)
 	})
 }
 // hstsMiddleware returns a handler that adds a Strict-Transport-Security
 // header (max-age 63072000 seconds, subdomains included) to every response
 // before handing the request to next.
 func hstsMiddleware(next http.Handler) http.Handler {
 	const policy = "max-age=63072000; includeSubDomains"
 	addHSTS := func(w http.ResponseWriter, r *http.Request) {
 		w.Header().Set("Strict-Transport-Security", policy)
 		next.ServeHTTP(w, r)
 	}
 	return http.HandlerFunc(addHSTS)
 }
 // renderStatusPage executes statusTpl into w using title and every site the
 // engine reports.
 //
 // Ordering: when two sites have different statuses and one of them is
 // models.StatusDown, the down site sorts first; in every other case sites
 // are ordered by name. A template execution failure is logged, not returned.
 func renderStatusPage(w http.ResponseWriter, title string, eng *monitor.Engine) {
 	sites := eng.GetAllSites()
 	sort.Slice(sites, func(i, j int) bool {
 		if sites[i].Status != sites[j].Status {
 			if sites[i].Status == models.StatusDown {
 				return true
 			}
 			if sites[j].Status == models.StatusDown {
 				return false
 			}
 		}
 		return sites[i].Name < sites[j].Name
 	})
 	data := struct {
 		Title string
 		Sites []models.Site
 	}{Title: title, Sites: sites}
 	if err := statusTpl.Execute(w, data); err != nil {
 		slog.Error("status page render failed", "err", err)
 	}
 }
 var statusTpl = template.Must(template.New("status").Parse(`
@@ -199,396 +627,3 @@ var statusTpl = template.Must(template.New("status").Parse(`
 	</script>
 </body>
 </html>`))
 // ServerConfig carries the settings Start reads when it builds the HTTP
 // server.
 type ServerConfig struct {
 	// Port is the TCP port of the listen address (":<Port>").
 	Port           int
 	// EnableStatus registers the /status and /status/json routes.
 	EnableStatus   bool
 	// Title is passed to the status page renderer.
 	Title          string
 	// ClusterKey is the shared secret API callers must present. When empty,
 	// the backup, import and probe endpoints reject every request, while
 	// /api/health and /metrics skip the check.
 	ClusterKey     string
 	// TLSCert and TLSKey are handed to ListenAndServeTLS when both are set;
 	// a non-empty TLSCert also enables the HSTS middleware.
 	TLSCert        string
 	TLSKey         string
 	// ClusterMode is only used for a startup warning: non-empty, not
 	// "leader", and no TLSCert.
 	ClusterMode    string
 	// MetricsPublic disables the secret check on /metrics.
 	MetricsPublic  bool
 	// CORSOrigin, when non-empty, is sent as Access-Control-Allow-Origin on
 	// /status/json.
 	CORSOrigin     string
 	// TrustedProxies is passed to the rate limiters and to the logging
 	// middleware's client-IP lookup.
 	TrustedProxies []*net.IPNet
 }
 // Start registers every HTTP endpoint on a fresh mux, wraps the mux in the
 // logging and security-header middleware (plus HSTS when cfg.TLSCert is set),
 // and begins serving in a background goroutine. It returns the *http.Server
 // without waiting for the listener; listener errors are logged, not returned.
 //
 // Authentication: the backup, import and probe endpoints always require
 // cfg.ClusterKey in the X-Upkeep-Secret header and reject every request when
 // the key is empty. /api/health and /metrics only check the header when a key
 // is configured (and, for /metrics, when cfg.MetricsPublic is false).
 func Start(cfg ServerConfig, s store.Store, eng *monitor.Engine) *http.Server {
 	if cfg.ClusterKey == "" {
 		fmt.Println("WARNING: No UPTOP_CLUSTER_SECRET set. Cluster API endpoints are unauthenticated.")
 	}
 	// One limiter per endpoint family.
 	// NOTE(review): the unit of the first argument is not visible here —
 	// presumably requests per minute; confirm against NewRateLimiter.
 	pushRL := NewRateLimiter(60, cfg.TrustedProxies)
 	probeRL := NewRateLimiter(30, cfg.TrustedProxies)
 	backupRL := NewRateLimiter(10, cfg.TrustedProxies)
 	statusRL := NewRateLimiter(120, cfg.TrustedProxies)
 	mux := http.NewServeMux()
 	// 1. Push Heartbeat
 	mux.HandleFunc("/api/push", RateLimit(pushRL, func(w http.ResponseWriter, r *http.Request) {
 		if r.Method != http.MethodGet && r.Method != http.MethodPost {
 			http.Error(w, "Method not allowed", http.StatusMethodNotAllowed)
 			return
 		}
 		// The bearer header wins; the query-string token is a fallback that is
 		// still accepted but logged as deprecated.
 		token := extractBearerToken(r)
 		if token == "" {
 			if qt := r.URL.Query().Get("token"); qt != "" {
 				token = qt
 				log.Printf("DEPRECATED: push token in query string — use Authorization: Bearer header instead")
 			}
 		}
 		if token == "" {
 			http.Error(w, "Missing token", http.StatusBadRequest)
 			return
 		}
 		if eng.RecordHeartbeat(token) {
 			w.WriteHeader(http.StatusOK)
 			_, _ = w.Write([]byte("OK"))
 		} else {
 			http.Error(w, "Invalid Token", http.StatusNotFound)
 		}
 	}))
 	// 2. Health Check (For Cluster Follower)
 	mux.HandleFunc("/api/health", func(w http.ResponseWriter, r *http.Request) {
 		if r.Method != http.MethodGet {
 			http.Error(w, "Method not allowed", http.StatusMethodNotAllowed)
 			return
 		}
 		// Unlike the endpoints below, an empty ClusterKey leaves this open.
 		if cfg.ClusterKey != "" && !checkSecret(r.Header.Get("X-Upkeep-Secret"), cfg.ClusterKey) {
 			http.Error(w, "Unauthorized", http.StatusUnauthorized)
 			return
 		}
 		w.WriteHeader(http.StatusOK)
 		_, _ = w.Write([]byte("OK"))
 	})
 	// 3. Config Export
 	mux.HandleFunc("/api/backup/export", RateLimit(backupRL, func(w http.ResponseWriter, r *http.Request) {
 		if cfg.ClusterKey == "" || !checkSecret(r.Header.Get("X-Upkeep-Secret"), cfg.ClusterKey) {
 			http.Error(w, "Unauthorized: UPTOP_CLUSTER_SECRET required", http.StatusUnauthorized)
 			return
 		}
 		data, err := s.ExportData()
 		if err != nil {
 			log.Printf("Export failed: %v", err)
 			http.Error(w, "Export failed", http.StatusInternalServerError)
 			return
 		}
 		// Redaction is the default; only an explicit redact_secrets=false
 		// exports alert settings unmodified.
 		if r.URL.Query().Get("redact_secrets") != "false" {
 			for i := range data.Alerts {
 				data.Alerts[i].Settings = redactByProvider(data.Alerts[i].Type, data.Alerts[i].Settings)
 			}
 		}
 		_ = json.NewEncoder(w).Encode(data) //nolint:errcheck
 	}))
 	// 4. Config Import
 	mux.HandleFunc("/api/backup/import", RateLimit(backupRL, func(w http.ResponseWriter, r *http.Request) {
 		if r.Method != "POST" {
 			http.Error(w, "POST required", http.StatusMethodNotAllowed)
 			return
 		}
 		if cfg.ClusterKey == "" || !checkSecret(r.Header.Get("X-Upkeep-Secret"), cfg.ClusterKey) {
 			http.Error(w, "Unauthorized", http.StatusUnauthorized)
 			return
 		}
 		// Cap the body before decoding.
 		r.Body = http.MaxBytesReader(w, r.Body, maxRequestBody)
 		var data models.Backup
 		if err := json.NewDecoder(r.Body).Decode(&data); err != nil {
 			http.Error(w, "Invalid JSON", http.StatusBadRequest)
 			return
 		}
 		if err := s.ImportData(data); err != nil {
 			log.Printf("Import failed: %v", err)
 			http.Error(w, "Import failed", http.StatusInternalServerError)
 			return
 		}
 		_, _ = w.Write([]byte("Import Successful"))
 	}))
 	// 5. Kuma Import
 	mux.HandleFunc("/api/import/kuma", RateLimit(backupRL, func(w http.ResponseWriter, r *http.Request) {
 		if r.Method != "POST" {
 			http.Error(w, "POST required", http.StatusMethodNotAllowed)
 			return
 		}
 		if cfg.ClusterKey == "" || !checkSecret(r.Header.Get("X-Upkeep-Secret"), cfg.ClusterKey) {
 			http.Error(w, "Unauthorized", http.StatusUnauthorized)
 			return
 		}
 		r.Body = http.MaxBytesReader(w, r.Body, maxRequestBody)
 		var kb importer.KumaBackup
 		if err := json.NewDecoder(r.Body).Decode(&kb); err != nil {
 			log.Printf("Invalid Kuma JSON: %v", err)
 			http.Error(w, "Invalid Kuma JSON", http.StatusBadRequest)
 			return
 		}
 		// Convert to the native backup shape, then reuse the regular import.
 		backup := importer.ConvertKuma(&kb)
 		if err := s.ImportData(backup); err != nil {
 			log.Printf("Kuma import failed: %v", err)
 			http.Error(w, "Import failed", http.StatusInternalServerError)
 			return
 		}
 		fmt.Fprintf(w, "Imported %d monitors, %d alerts from Kuma v%s", len(backup.Sites), len(backup.Alerts), kb.Version)
 	}))
 	// 6. Probe Registration
 	mux.HandleFunc("/api/probe/register", RateLimit(probeRL, func(w http.ResponseWriter, r *http.Request) {
 		if r.Method != "POST" {
 			http.Error(w, "POST required", http.StatusMethodNotAllowed)
 			return
 		}
 		if cfg.ClusterKey == "" || !checkSecret(r.Header.Get("X-Upkeep-Secret"), cfg.ClusterKey) {
 			http.Error(w, "Unauthorized", http.StatusUnauthorized)
 			return
 		}
 		r.Body = http.MaxBytesReader(w, r.Body, maxRequestBody)
 		var req struct {
 			ID      string `json:"id"`
 			Name    string `json:"name"`
 			Region  string `json:"region"`
 			Version string `json:"version"`
 		}
 		if err := json.NewDecoder(r.Body).Decode(&req); err != nil {
 			http.Error(w, "Invalid JSON", http.StatusBadRequest)
 			return
 		}
 		if req.ID == "" {
 			http.Error(w, "id is required", http.StatusBadRequest)
 			return
 		}
 		if err := s.RegisterNode(models.ProbeNode{
 			ID: req.ID, Name: req.Name, Region: req.Region, Version: req.Version,
 		}); err != nil {
 			log.Printf("Probe register failed: %v", err)
 			http.Error(w, "Registration failed", http.StatusInternalServerError)
 			return
 		}
 		_ = json.NewEncoder(w).Encode(map[string]bool{"ok": true}) //nolint:errcheck
 	}))
 	// 7. Probe Assignment Fetch
 	mux.HandleFunc("/api/probe/assignments", RateLimit(probeRL, func(w http.ResponseWriter, r *http.Request) {
 		if r.Method != http.MethodGet {
 			http.Error(w, "Method not allowed", http.StatusMethodNotAllowed)
 			return
 		}
 		if cfg.ClusterKey == "" || !checkSecret(r.Header.Get("X-Upkeep-Secret"), cfg.ClusterKey) {
 			http.Error(w, "Unauthorized", http.StatusUnauthorized)
 			return
 		}
 		// A missing node_id or a failed node lookup leaves nodeRegion empty,
 		// which disables the region filter below.
 		nodeID := r.URL.Query().Get("node_id")
 		var nodeRegion string
 		if nodeID != "" {
 			if node, err := s.GetNode(nodeID); err == nil {
 				nodeRegion = node.Region
 			}
 		}
 		sites := eng.GetAllSites()
 		var assigned []models.Site
 		for _, site := range sites {
 			// Paused sites and the push/group types are never handed to probes.
 			if site.Paused || site.Type == "push" || site.Type == "group" {
 				continue
 			}
 			// Region filter: applies only when both the site lists regions and
 			// the node's region is known. site.Regions is comma-separated.
 			if site.Regions != "" && nodeRegion != "" {
 				matched := false
 				// Note: this r shadows the request inside the loop.
 				for _, r := range strings.Split(site.Regions, ",") {
 					if strings.TrimSpace(r) == nodeRegion {
 						matched = true
 						break
 					}
 				}
 				if !matched {
 					continue
 				}
 			}
 			assigned = append(assigned, site)
 		}
 		w.Header().Set("Content-Type", "application/json")
 		_ = json.NewEncoder(w).Encode(map[string][]models.Site{"sites": assigned}) //nolint:errcheck
 	}))
 	// 8. Probe Result Submission
 	mux.HandleFunc("/api/probe/results", RateLimit(probeRL, func(w http.ResponseWriter, r *http.Request) {
 		if r.Method != "POST" {
 			http.Error(w, "POST required", http.StatusMethodNotAllowed)
 			return
 		}
 		if cfg.ClusterKey == "" || !checkSecret(r.Header.Get("X-Upkeep-Secret"), cfg.ClusterKey) {
 			http.Error(w, "Unauthorized", http.StatusUnauthorized)
 			return
 		}
 		r.Body = http.MaxBytesReader(w, r.Body, maxRequestBody)
 		var req struct {
 			NodeID  string `json:"node_id"`
 			Results []struct {
 				SiteID      int    `json:"site_id"`
 				LatencyNs   int64  `json:"latency_ns"`
 				IsUp        bool   `json:"is_up"`
 				ErrorReason string `json:"error_reason"`
 			} `json:"results"`
 		}
 		if err := json.NewDecoder(r.Body).Decode(&req); err != nil {
 			http.Error(w, "Invalid JSON", http.StatusBadRequest)
 			return
 		}
 		if req.NodeID == "" {
 			http.Error(w, "node_id is required", http.StatusBadRequest)
 			return
 		}
 		// A failed save is logged but does not stop the result from being fed
 		// to the engine, and the request still answers {"ok": true}.
 		for _, result := range req.Results {
 			if err := s.SaveCheckFromNode(result.SiteID, req.NodeID, result.LatencyNs, result.IsUp); err != nil {
 				log.Printf("Failed to save probe result: %v", err)
 			}
 			eng.IngestProbeResult(req.NodeID, result.SiteID, result.LatencyNs, result.IsUp, result.ErrorReason)
 		}
 		if err := s.UpdateNodeLastSeen(req.NodeID); err != nil {
 			log.Printf("Failed to update node last seen: %v", err)
 		}
 		_ = json.NewEncoder(w).Encode(map[string]bool{"ok": true}) //nolint:errcheck
 	}))
 	// 9. Prometheus Metrics
 	mux.HandleFunc("/metrics", func(w http.ResponseWriter, r *http.Request) {
 		if r.Method != http.MethodGet {
 			http.Error(w, "Method not allowed", http.StatusMethodNotAllowed)
 			return
 		}
 		// The secret is only enforced when metrics are private AND a key is
 		// configured; with no key the endpoint is open.
 		if !cfg.MetricsPublic && cfg.ClusterKey != "" {
 			if !checkSecret(r.Header.Get("X-Upkeep-Secret"), cfg.ClusterKey) {
 				http.Error(w, "Unauthorized", http.StatusUnauthorized)
 				return
 			}
 		}
 		metrics.Handler(eng)(w, r)
 	})
 	// 10. Status Page
 	if cfg.EnableStatus {
 		mux.HandleFunc("/status", RateLimit(statusRL, func(w http.ResponseWriter, r *http.Request) { renderStatusPage(w, cfg.Title, eng) }))
 		mux.HandleFunc("/status/json", RateLimit(statusRL, func(w http.ResponseWriter, r *http.Request) {
 			state := eng.GetLiveState()
 			// The lookup error is discarded: on failure no site is shown as MAINT.
 			activeWindows, _ := s.GetActiveMaintenanceWindows()
 			maintSet := make(map[int]bool)
 			allInMaint := false
 			for _, mw := range activeWindows {
 				if mw.Type != "maintenance" {
 					continue
 				}
 				// MonitorID 0 marks a window that covers every monitor.
 				if mw.MonitorID == 0 {
 					allInMaint = true
 				} else {
 					maintSet[mw.MonitorID] = true
 				}
 			}
 			for id, site := range state {
 				// Blank the token before the site is serialized.
 				site.Token = ""
 				if allInMaint || maintSet[site.ID] || (site.ParentID > 0 && maintSet[site.ParentID]) {
 					site.Status = "MAINT"
 				}
 				state[id] = site
 			}
 			if cfg.CORSOrigin != "" {
 				w.Header().Set("Access-Control-Allow-Origin", cfg.CORSOrigin)
 			}
 			w.Header().Set("Content-Type", "application/json")
 			_ = json.NewEncoder(w).Encode(state) //nolint:errcheck
 		}))
 	}
 	if cfg.ClusterMode != "" && cfg.ClusterMode != "leader" && cfg.TLSCert == "" {
 		fmt.Println("WARNING: Cluster mode active without TLS. Secrets transmitted in cleartext.")
 	}
 	// Middleware order, outermost first: [HSTS] -> logging -> security headers -> mux.
 	handler := loggingMiddleware(cfg.TrustedProxies, securityHeadersMiddleware(mux))
 	if cfg.TLSCert != "" {
 		handler = hstsMiddleware(handler)
 	}
 	addr := fmt.Sprintf(":%d", cfg.Port)
 	srv := &http.Server{
 		Addr:              addr,
 		Handler:           handler,
 		ReadHeaderTimeout: 10 * time.Second,
 		ReadTimeout:       30 * time.Second,
 		WriteTimeout:      60 * time.Second,
 		IdleTimeout:       120 * time.Second,
 	}
 	// Serve in the background. http.ErrServerClosed is filtered out so that
 	// only other listener errors are logged.
 	go func() {
 		if cfg.TLSCert != "" && cfg.TLSKey != "" {
 			fmt.Printf("HTTPS Server listening on %s\n", addr)
 			if err := srv.ListenAndServeTLS(cfg.TLSCert, cfg.TLSKey); err != nil && err != http.ErrServerClosed {
 				log.Printf("HTTPS server error: %v", err)
 			}
 		} else {
 			fmt.Printf("HTTP Server listening on %s\n", addr)
 			if err := srv.ListenAndServe(); err != nil && err != http.ErrServerClosed {
 				log.Printf("HTTP server error: %v", err)
 			}
 		}
 	}()
 	return srv
 }
 // statusWriter wraps an http.ResponseWriter and remembers the status code
 // passed to WriteHeader so it can be read back after the handler returns.
 type statusWriter struct {
 	http.ResponseWriter
 	code int
 }
 // WriteHeader records code and then forwards it to the wrapped writer.
 func (sw *statusWriter) WriteHeader(code int) {
 	sw.code = code
 	sw.ResponseWriter.WriteHeader(code)
 }
 // loggingMiddleware returns a handler that runs next and then logs one line
 // per request: method, path, response status, elapsed time rounded to the
 // millisecond, and the client IP resolved via clientIP with the trusted
 // proxy list. Line breaks are removed from the path before it is logged.
 func loggingMiddleware(trusted []*net.IPNet, next http.Handler) http.Handler {
 	stripBreaks := strings.NewReplacer("\n", "", "\r", "")
 	return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
 		began := time.Now()
 		// Defaults to 200 for handlers that never call WriteHeader.
 		rec := &statusWriter{ResponseWriter: w, code: 200}
 		next.ServeHTTP(rec, r)
 		path := stripBreaks.Replace(r.URL.Path)
 		elapsed := time.Since(began).Round(time.Millisecond)
 		log.Printf("%s %s %d %s %s", r.Method, path, rec.code, elapsed, clientIP(r, trusted)) //nolint:gosec // path sanitized above
 	})
 }
 // securityHeadersMiddleware returns a handler that sets a fixed group of
 // security-related response headers and then hands the request to next.
 func securityHeadersMiddleware(next http.Handler) http.Handler {
 	fixed := [...][2]string{
 		{"X-Content-Type-Options", "nosniff"},
 		{"X-Frame-Options", "DENY"},
 		{"Referrer-Policy", "no-referrer"},
 		{"Content-Security-Policy", "default-src 'self'; script-src 'unsafe-inline'; style-src 'unsafe-inline'"},
 	}
 	return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
 		hdr := w.Header()
 		for _, kv := range fixed {
 			hdr.Set(kv[0], kv[1])
 		}
 		next.ServeHTTP(w, r)
 	})
 }
 // hstsMiddleware returns a handler that adds a Strict-Transport-Security
 // header (max-age 63072000 seconds, subdomains included) to every response
 // before handing the request to next.
 func hstsMiddleware(next http.Handler) http.Handler {
 	const policy = "max-age=63072000; includeSubDomains"
 	addHSTS := func(w http.ResponseWriter, r *http.Request) {
 		w.Header().Set("Strict-Transport-Security", policy)
 		next.ServeHTTP(w, r)
 	}
 	return http.HandlerFunc(addHSTS)
 }
 // renderStatusPage executes statusTpl into w using title and every site the
 // engine reports. When two sites differ in status and one of them is "DOWN",
 // the down site sorts first; otherwise sites are ordered by name. A template
 // failure is logged, not returned.
 func renderStatusPage(w http.ResponseWriter, title string, eng *monitor.Engine) {
 	sites := eng.GetAllSites()
 	sort.Slice(sites, func(i, j int) bool {
 		a, b := &sites[i], &sites[j]
 		// Exactly one of the pair being DOWN decides the order outright.
 		if a.Status != b.Status && (a.Status == "DOWN" || b.Status == "DOWN") {
 			return a.Status == "DOWN"
 		}
 		return a.Name < b.Name
 	})
 	var page struct {
 		Title string
 		Sites []models.Site
 	}
 	page.Title = title
 	page.Sites = sites
 	err := statusTpl.Execute(w, page)
 	if err != nil {
 		log.Printf("Failed to render status page: %v", err)
 	}
 }
@@ -2,6 +2,7 @@ package server
 import (
 	"bytes"
 	"context"
 	"encoding/json"
 	"fmt"
 	"net"
@@ -12,13 +13,15 @@ import (
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/monitor"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/store/storetest"
 )
 // --- Mock Store ---
 type mockStore struct {
 	storetest.BaseMock
 	mu              sync.Mutex
-	sites           []models.Site
+	sites           []models.SiteConfig
 	alerts          []models.AlertConfig
 	nodes           map[string]models.ProbeNode
 	importedData    *models.Backup
@@ -32,80 +35,26 @@ func newMockStore() *mockStore {
 	}
 }
-func (m *mockStore) Init() error                                              { return nil }
+func (m *mockStore) GetSites(_ context.Context) ([]models.SiteConfig, error) { return m.sites, nil }
-func (m *mockStore) GetSites() ([]models.Site, error)                         { return m.sites, nil }
+func (m *mockStore) GetAllAlerts(_ context.Context) ([]models.AlertConfig, error) {
-func (m *mockStore) AddSite(models.Site) error                                { return nil }
+	return m.alerts, nil
 // The methods below are inert stubs: apart from GetAllAlerts, which returns
 // the seeded m.alerts, each one ignores its arguments and returns zero
 // values with a nil error.
 func (m *mockStore) UpdateSite(models.Site) error                             { return nil }
 func (m *mockStore) UpdateSitePaused(int, bool) error                         { return nil }
 func (m *mockStore) DeleteSite(int) error                                     { return nil }
 func (m *mockStore) GetAllAlerts() ([]models.AlertConfig, error)              { return m.alerts, nil }
 func (m *mockStore) GetAlert(int) (models.AlertConfig, error)                 { return models.AlertConfig{}, nil }
 func (m *mockStore) AddAlert(string, string, map[string]string) error         { return nil }
 func (m *mockStore) UpdateAlert(int, string, string, map[string]string) error { return nil }
 func (m *mockStore) DeleteAlert(int) error                                    { return nil }
 func (m *mockStore) GetAllUsers() ([]models.User, error)                      { return nil, nil }
 func (m *mockStore) AddUser(string, string, string) error                     { return nil }
 func (m *mockStore) UpdateUser(int, string, string, string) error             { return nil }
 func (m *mockStore) DeleteUser(int) error                                     { return nil }
 func (m *mockStore) SaveCheck(int, int64, bool) error                         { return nil }
 func (m *mockStore) SaveCheckFromNode(siteID int, nodeID string, latencyNs int64, isUp bool) error {
 	return nil
 }
 func (m *mockStore) LoadAllHistory(int) (map[int][]models.CheckRecord, error) {
 	return nil, nil
 }
 func (m *mockStore) GetSiteByName(string) (models.Site, error) { return models.Site{}, nil }
 func (m *mockStore) GetAlertByName(string) (models.AlertConfig, error) {
 	return models.AlertConfig{}, nil
 }
 func (m *mockStore) AddSiteReturningID(models.Site) (int, error) { return 0, nil }
 func (m *mockStore) AddAlertReturningID(string, string, map[string]string) (int, error) {
 	return 0, nil
 }
 func (m *mockStore) GetAllNodes() ([]models.ProbeNode, error) { return nil, nil }
 func (m *mockStore) UpdateNodeLastSeen(string) error          { return nil }
 func (m *mockStore) DeleteNode(string) error                  { return nil }
 func (m *mockStore) LoadAlertHealth() (map[int]models.AlertHealthRecord, error) {
 	return nil, nil
 }
 func (m *mockStore) SaveAlertHealth(models.AlertHealthRecord) error { return nil }
 func (m *mockStore) SaveLog(string) error                           { return nil }
 func (m *mockStore) PruneLogs() error                               { return nil }
 func (m *mockStore) PruneCheckHistory() error                       { return nil }
 func (m *mockStore) PruneStateChanges() error                       { return nil }
 func (m *mockStore) LoadLogs(int) ([]string, error)                 { return nil, nil }
 func (m *mockStore) GetAllMaintenanceWindows(int) ([]models.MaintenanceWindow, error) {
 	return nil, nil
 }
 func (m *mockStore) AddMaintenanceWindow(models.MaintenanceWindow) error         { return nil }
 func (m *mockStore) EndMaintenanceWindow(int) error                              { return nil }
 func (m *mockStore) DeleteMaintenanceWindow(int) error                           { return nil }
 func (m *mockStore) PruneExpiredMaintenanceWindows(time.Duration) (int64, error) { return 0, nil }
 func (m *mockStore) IsMonitorInMaintenance(int) (bool, error)                    { return false, nil }
 func (m *mockStore) GetPreference(string) (string, error)                        { return "", nil }
 func (m *mockStore) SetPreference(string, string) error                          { return nil }
 func (m *mockStore) SaveStateChange(int, string, string, string) error           { return nil }
 func (m *mockStore) GetStateChanges(int, int) ([]models.StateChange, error)      { return nil, nil }
 func (m *mockStore) GetStateChangesSince(int, time.Time) ([]models.StateChange, error) {
 	return nil, nil
 }
 func (m *mockStore) Close() error { return nil }
-func (m *mockStore) ExportData() (models.Backup, error) {
+func (m *mockStore) ExportData(_ context.Context) (models.Backup, error) {
 	return models.Backup{
 		Sites:  m.sites,
 		Alerts: m.alerts,
 	}, nil
 }
-func (m *mockStore) ImportData(data models.Backup) error {
+func (m *mockStore) ImportData(_ context.Context, data models.Backup) error {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	m.importedData = &data
 	return nil
 }
-func (m *mockStore) RegisterNode(node models.ProbeNode) error {
+func (m *mockStore) RegisterNode(_ context.Context, node models.ProbeNode) error {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	m.registeredNodes = append(m.registeredNodes, node)
@@ -113,7 +62,7 @@ func (m *mockStore) RegisterNode(node models.ProbeNode) error {
 	return nil
 }
-func (m *mockStore) GetNode(id string) (models.ProbeNode, error) {
+func (m *mockStore) GetNode(_ context.Context, id string) (models.ProbeNode, error) {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	if n, ok := m.nodes[id]; ok {
@@ -122,7 +71,7 @@ func (m *mockStore) GetNode(id string) (models.ProbeNode, error) {
 	return models.ProbeNode{}, fmt.Errorf("not found")
 }
-func (m *mockStore) GetActiveMaintenanceWindows() ([]models.MaintenanceWindow, error) {
+func (m *mockStore) GetActiveMaintenanceWindows(_ context.Context) ([]models.MaintenanceWindow, error) {
 	return m.maintWindows, nil
 }
@@ -192,7 +141,7 @@ func authReq(method, url, secret string, body []byte) (*http.Response, error) {
 		return nil, err
 	}
 	if secret != "" {
-		req.Header.Set("X-Upkeep-Secret", secret)
+		req.Header.Set("X-Uptop-Secret", secret)
 	}
 	return http.DefaultClient.Do(req)
 }
@@ -303,7 +252,7 @@ func TestExport_Unauthorized_WrongKey(t *testing.T) {
 func TestExport_Success(t *testing.T) {
 	ts := newTestServer(t, "secret", false)
-	ts.store.sites = []models.Site{{ID: 1, Name: "example", URL: "http://example.com"}}
+	ts.store.sites = []models.SiteConfig{{ID: 1, Name: "example", URL: "http://example.com"}}
 	resp, err := authReq("GET", ts.baseURL+"/api/backup/export", "secret", nil)
 	if err != nil {
@@ -350,7 +299,7 @@ func TestImport_Unauthorized(t *testing.T) {
 func TestImport_Success(t *testing.T) {
 	ts := newTestServer(t, "secret", false)
 	backup := models.Backup{
-		Sites: []models.Site{{Name: "imported", URL: "http://example.com"}},
+		Sites: []models.SiteConfig{{Name: "imported", URL: "http://example.com"}},
 	}
 	body, _ := json.Marshal(backup)
 	resp, err := authReq("POST", ts.baseURL+"/api/backup/import", "secret", body)
@@ -480,15 +429,32 @@ func TestStatusPage_Enabled(t *testing.T) {
 	}
 }
-func TestStatusJSON_TokensStripped(t *testing.T) {
+func TestStatusJSON_PublicDTOOnly(t *testing.T) {
 	ts := newTestServer(t, "secret", true)
-	// Inject a site with a token into engine state
+	// Seed a push monitor (no network IO) through the store and start the
-	ts.engine.UpdateSiteConfig(models.Site{ID: 1, Name: "test", Type: "push", Token: "secret-token", Status: "UP"})
+	// engine so its poll loop loads it into live state — the path real sites
-	// Need to inject directly since UpdateSiteConfig only updates existing
+	// take. The old version of this test injected via UpdateSiteConfig, which
-	func() {
+	// no-ops for unknown IDs, so it asserted over zero sites and passed
-		ts.engine.RecordHeartbeat("unused") // just to exercise, won't match
+	// against a server that leaked tokens.
-	}()
+	ts.store.sites = []models.SiteConfig{{
 		ID: 1, Name: "test", Type: "push", Token: "secret-token",
 		Hostname: "internal-host", AlertID: 3,
 	}}
 	ctx, cancel := context.WithCancel(context.Background())
 	ts.engine.Start(ctx)
 	t.Cleanup(func() {
 		cancel()
 		ts.engine.Stop()
 	})
 	deadline := time.Now().Add(2 * time.Second)
 	for time.Now().Before(deadline) && len(ts.engine.GetLiveState()) == 0 {
 		time.Sleep(10 * time.Millisecond)
 	}
 	if len(ts.engine.GetLiveState()) == 0 {
 		t.Fatal("engine never loaded the seeded site")
 	}
 	resp, err := http.Get(ts.baseURL + "/status/json")
 	if err != nil {
@@ -498,11 +464,23 @@ func TestStatusJSON_TokensStripped(t *testing.T) {
 	if resp.StatusCode != 200 {
 		t.Errorf("expected 200, got %d", resp.StatusCode)
 	}
-	var state map[string]models.Site
+
-	json.NewDecoder(resp.Body).Decode(&state)
+	// Decode raw so absent struct fields can't mask leaked JSON keys.
 	var state map[string]map[string]any
 	if err := json.NewDecoder(resp.Body).Decode(&state); err != nil {
 		t.Fatal(err)
 	}
 	if len(state) != 1 {
 		t.Fatalf("expected 1 site in status JSON, got %d", len(state))
 	}
 	for _, site := range state {
-		if site.Token != "" {
+		if site["Name"] != "test" {
-			t.Error("expected token stripped from status JSON response")
+			t.Errorf("expected Name to be public, got %v", site["Name"])
 		}
 		for _, leaked := range []string{"Token", "LastError", "Hostname", "Port", "DNSServer", "AlertID", "AcceptedCodes", "Interval"} {
 			if _, ok := site[leaked]; ok {
 				t.Errorf("status JSON leaks internal field %q", leaked)
 			}
 		}
 	}
 }
@@ -656,7 +634,7 @@ func TestRedactByProvider(t *testing.T) {
 	}
 	for _, tt := range tests {
 		t.Run(tt.name, func(t *testing.T) {
-			out := redactByProvider(tt.typ, tt.in)
+			out := models.RedactAlertSettings(tt.typ, tt.in)
 			for _, k := range tt.redacted {
 				if out[k] != "***REDACTED***" {
 					t.Errorf("key %q: expected redacted, got %q", k, out[k])
@@ -5,13 +5,20 @@ import (
 	"strconv"
 )
 // Migration pairs a version number with one SQL statement. Dialects return
 // these from Migrations().
 // NOTE(review): presumably applied in ascending Version order and skipped
 // once recorded — confirm against the migration runner.
 type Migration struct {
 	Version int
 	SQL     string
 }
 type Dialect interface {
 	DriverName() string
 	CreateTablesSQL() []string
-	MigrationsSQL() []string
+	Migrations() []Migration
 	BaselineVersion() int
 	BoolFalse() string
 	ResetSequenceOnEmpty(db *sql.DB, table string)
 	ImportWipe(tx *sql.Tx)
 	ImportWipeUsers(tx *sql.Tx)
 	ImportResetSequences(tx *sql.Tx)
 	UpsertNodeSQL() string
 	UpsertAlertHealthSQL() string
@@ -2,7 +2,7 @@ package store
 import (
 	"database/sql"
-	"log"
+	"log/slog"
 	_ "github.com/lib/pq"
 )
@@ -13,8 +13,9 @@ func NewPostgresStore(connStr string) (*SQLStore, error) {
 	return NewSQLStore("postgres", connStr, &PostgresDialect{})
 }
-func (d *PostgresDialect) DriverName() string { return "postgres" }
+func (d *PostgresDialect) DriverName() string   { return "postgres" }
-func (d *PostgresDialect) BoolFalse() string  { return "FALSE" }
+func (d *PostgresDialect) BoolFalse() string    { return "FALSE" }
 func (d *PostgresDialect) BaselineVersion() int { return 21 }
 func (d *PostgresDialect) CreateTablesSQL() []string {
 	return []string{
@@ -32,7 +33,8 @@ func (d *PostgresDialect) CreateTablesSQL() []string {
 			method TEXT DEFAULT 'GET', description TEXT DEFAULT '',
 			parent_id INTEGER DEFAULT 0, accepted_codes TEXT DEFAULT '200-299',
 			dns_resolve_type TEXT DEFAULT '', dns_server TEXT DEFAULT '',
-			ignore_tls BOOLEAN DEFAULT FALSE, paused BOOLEAN DEFAULT FALSE
+			ignore_tls BOOLEAN DEFAULT FALSE, paused BOOLEAN DEFAULT FALSE,
 			regions TEXT DEFAULT ''
 		)`,
 		`CREATE TABLE IF NOT EXISTS users (
 			id SERIAL PRIMARY KEY,
@@ -42,20 +44,21 @@ func (d *PostgresDialect) CreateTablesSQL() []string {
 		`CREATE TABLE IF NOT EXISTS check_history (
 			id SERIAL PRIMARY KEY,
 			site_id INTEGER NOT NULL, latency_ns BIGINT,
-			is_up BOOLEAN, checked_at TIMESTAMP DEFAULT NOW()
+			is_up BOOLEAN, checked_at TIMESTAMPTZ DEFAULT NOW(),
 			node_id TEXT DEFAULT ''
 		)`,
 		`CREATE INDEX IF NOT EXISTS idx_check_history_site ON check_history(site_id, checked_at DESC)`,
 		`CREATE TABLE IF NOT EXISTS nodes (
 			id TEXT PRIMARY KEY,
 			name TEXT NOT NULL,
 			region TEXT DEFAULT '',
-			last_seen TIMESTAMP DEFAULT NOW(),
+			last_seen TIMESTAMPTZ DEFAULT NOW(),
 			version TEXT DEFAULT ''
 		)`,
 		`CREATE TABLE IF NOT EXISTS logs (
 			id SERIAL PRIMARY KEY,
 			message TEXT NOT NULL,
-			created_at TIMESTAMP DEFAULT NOW()
+			created_at TIMESTAMPTZ DEFAULT NOW()
 		)`,
 		`CREATE TABLE IF NOT EXISTS maintenance_windows (
 			id SERIAL PRIMARY KEY,
@@ -63,10 +66,10 @@ func (d *PostgresDialect) CreateTablesSQL() []string {
 			title TEXT NOT NULL,
 			description TEXT DEFAULT '',
 			type TEXT DEFAULT 'maintenance',
-			start_time TIMESTAMP NOT NULL,
+			start_time TIMESTAMPTZ NOT NULL,
-			end_time TIMESTAMP,
+			end_time TIMESTAMPTZ,
 			created_by TEXT DEFAULT '',
-			created_at TIMESTAMP DEFAULT NOW()
+			created_at TIMESTAMPTZ DEFAULT NOW()
 		)`,
 		`CREATE TABLE IF NOT EXISTS preferences (
 			key TEXT PRIMARY KEY,
@@ -78,12 +81,12 @@ func (d *PostgresDialect) CreateTablesSQL() []string {
 			from_status TEXT NOT NULL,
 			to_status TEXT NOT NULL,
 			error_reason TEXT DEFAULT '',
-			changed_at TIMESTAMP DEFAULT NOW()
+			changed_at TIMESTAMPTZ DEFAULT NOW()
 		)`,
 		`CREATE INDEX IF NOT EXISTS idx_state_changes_site ON state_changes(site_id, changed_at DESC)`,
 		`CREATE TABLE IF NOT EXISTS alert_health (
 			alert_id INTEGER PRIMARY KEY,
-			last_send_at TIMESTAMP,
+			last_send_at TIMESTAMPTZ,
 			last_send_ok BOOLEAN DEFAULT FALSE,
 			last_error TEXT DEFAULT '',
 			send_count INTEGER DEFAULT 0,
@@ -92,21 +95,29 @@ func (d *PostgresDialect) CreateTablesSQL() []string {
 	}
 }
-func (d *PostgresDialect) MigrationsSQL() []string {
+func (d *PostgresDialect) Migrations() []Migration {
-	return []string{
+	return []Migration{
-		"ALTER TABLE sites ADD COLUMN IF NOT EXISTS hostname TEXT DEFAULT ''",
+		{1, "ALTER TABLE sites ADD COLUMN IF NOT EXISTS hostname TEXT DEFAULT ''"},
-		"ALTER TABLE sites ADD COLUMN IF NOT EXISTS port INTEGER DEFAULT 0",
+		{2, "ALTER TABLE sites ADD COLUMN IF NOT EXISTS port INTEGER DEFAULT 0"},
-		"ALTER TABLE sites ADD COLUMN IF NOT EXISTS timeout INTEGER DEFAULT 0",
+		{3, "ALTER TABLE sites ADD COLUMN IF NOT EXISTS timeout INTEGER DEFAULT 0"},
-		"ALTER TABLE sites ADD COLUMN IF NOT EXISTS method TEXT DEFAULT 'GET'",
+		{4, "ALTER TABLE sites ADD COLUMN IF NOT EXISTS method TEXT DEFAULT 'GET'"},
-		"ALTER TABLE sites ADD COLUMN IF NOT EXISTS description TEXT DEFAULT ''",
+		{5, "ALTER TABLE sites ADD COLUMN IF NOT EXISTS description TEXT DEFAULT ''"},
-		"ALTER TABLE sites ADD COLUMN IF NOT EXISTS parent_id INTEGER DEFAULT 0",
+		{6, "ALTER TABLE sites ADD COLUMN IF NOT EXISTS parent_id INTEGER DEFAULT 0"},
-		"ALTER TABLE sites ADD COLUMN IF NOT EXISTS accepted_codes TEXT DEFAULT '200-299'",
+		{7, "ALTER TABLE sites ADD COLUMN IF NOT EXISTS accepted_codes TEXT DEFAULT '200-299'"},
-		"ALTER TABLE sites ADD COLUMN IF NOT EXISTS dns_resolve_type TEXT DEFAULT ''",
+		{8, "ALTER TABLE sites ADD COLUMN IF NOT EXISTS dns_resolve_type TEXT DEFAULT ''"},
-		"ALTER TABLE sites ADD COLUMN IF NOT EXISTS dns_server TEXT DEFAULT ''",
+		{9, "ALTER TABLE sites ADD COLUMN IF NOT EXISTS dns_server TEXT DEFAULT ''"},
-		"ALTER TABLE sites ADD COLUMN IF NOT EXISTS ignore_tls BOOLEAN DEFAULT FALSE",
+		{10, "ALTER TABLE sites ADD COLUMN IF NOT EXISTS ignore_tls BOOLEAN DEFAULT FALSE"},
-		"ALTER TABLE sites ADD COLUMN IF NOT EXISTS paused BOOLEAN DEFAULT FALSE",
+		{11, "ALTER TABLE sites ADD COLUMN IF NOT EXISTS paused BOOLEAN DEFAULT FALSE"},
-		"ALTER TABLE check_history ADD COLUMN IF NOT EXISTS node_id TEXT DEFAULT ''",
+		{12, "ALTER TABLE check_history ADD COLUMN IF NOT EXISTS node_id TEXT DEFAULT ''"},
-		"ALTER TABLE sites ADD COLUMN IF NOT EXISTS regions TEXT DEFAULT ''",
+		{13, "ALTER TABLE sites ADD COLUMN IF NOT EXISTS regions TEXT DEFAULT ''"},
+		{14, "ALTER TABLE check_history ALTER COLUMN checked_at TYPE TIMESTAMPTZ USING checked_at AT TIME ZONE 'UTC'"},
+		{15, "ALTER TABLE nodes ALTER COLUMN last_seen TYPE TIMESTAMPTZ USING last_seen AT TIME ZONE 'UTC'"},
+		{16, "ALTER TABLE logs ALTER COLUMN created_at TYPE TIMESTAMPTZ USING created_at AT TIME ZONE 'UTC'"},
+		{17, "ALTER TABLE maintenance_windows ALTER COLUMN start_time TYPE TIMESTAMPTZ USING start_time AT TIME ZONE 'UTC'"},
+		{18, "ALTER TABLE maintenance_windows ALTER COLUMN end_time TYPE TIMESTAMPTZ USING end_time AT TIME ZONE 'UTC'"},
+		{19, "ALTER TABLE maintenance_windows ALTER COLUMN created_at TYPE TIMESTAMPTZ USING created_at AT TIME ZONE 'UTC'"},
+		{20, "ALTER TABLE state_changes ALTER COLUMN changed_at TYPE TIMESTAMPTZ USING changed_at AT TIME ZONE 'UTC'"},
+		{21, "ALTER TABLE alert_health ALTER COLUMN last_send_at TYPE TIMESTAMPTZ USING last_send_at AT TIME ZONE 'UTC'"},
 	}
 }
@@ -122,30 +133,42 @@ func (d *PostgresDialect) ResetSequenceOnEmpty(db *sql.DB, table string) {}
 func (d *PostgresDialect) ImportWipe(tx *sql.Tx) {
 	if _, err := tx.Exec("TRUNCATE TABLE sites RESTART IDENTITY CASCADE"); err != nil {
-		log.Printf("import wipe error: %v", err)
+		slog.Debug("import wipe failed", "table", "sites", "err", err)
 	}
 	if _, err := tx.Exec("TRUNCATE TABLE alerts RESTART IDENTITY CASCADE"); err != nil {
-		log.Printf("import wipe error: %v", err)
+		slog.Debug("import wipe failed", "table", "alerts", "err", err)
 	}
-	if _, err := tx.Exec("TRUNCATE TABLE users RESTART IDENTITY CASCADE"); err != nil {
-		log.Printf("import wipe error: %v", err)
-	}
 	if _, err := tx.Exec("TRUNCATE TABLE maintenance_windows RESTART IDENTITY CASCADE"); err != nil {
-		log.Printf("import wipe error: %v", err)
+		slog.Debug("import wipe failed", "table", "maintenance_windows", "err", err)
 	}
+	if _, err := tx.Exec("TRUNCATE TABLE check_history RESTART IDENTITY CASCADE"); err != nil {
+		slog.Debug("import wipe failed", "table", "check_history", "err", err)
+	}
+	if _, err := tx.Exec("TRUNCATE TABLE state_changes RESTART IDENTITY CASCADE"); err != nil {
+		slog.Debug("import wipe failed", "table", "state_changes", "err", err)
+	}
+	if _, err := tx.Exec("TRUNCATE TABLE alert_health RESTART IDENTITY CASCADE"); err != nil {
+		slog.Debug("import wipe failed", "table", "alert_health", "err", err)
+	}
 }
+func (d *PostgresDialect) ImportWipeUsers(tx *sql.Tx) {
+	if _, err := tx.Exec("TRUNCATE TABLE users RESTART IDENTITY CASCADE"); err != nil {
+		slog.Debug("import wipe failed", "table", "users", "err", err)
+	}
+}
 func (d *PostgresDialect) ImportResetSequences(tx *sql.Tx) {
 	if _, err := tx.Exec("SELECT setval('sites_id_seq', (SELECT COALESCE(MAX(id), 1) FROM sites))"); err != nil {
-		log.Printf("sequence reset error: %v", err)
+		slog.Debug("sequence reset failed", "table", "sites", "err", err)
 	}
 	if _, err := tx.Exec("SELECT setval('alerts_id_seq', (SELECT COALESCE(MAX(id), 1) FROM alerts))"); err != nil {
-		log.Printf("sequence reset error: %v", err)
+		slog.Debug("sequence reset failed", "table", "alerts", "err", err)
 	}
 	if _, err := tx.Exec("SELECT setval('users_id_seq', (SELECT COALESCE(MAX(id), 1) FROM users))"); err != nil {
-		log.Printf("sequence reset error: %v", err)
+		slog.Debug("sequence reset failed", "table", "users", "err", err)
 	}
 	if _, err := tx.Exec("SELECT setval('maintenance_windows_id_seq', (SELECT COALESCE(MAX(id), 1) FROM maintenance_windows))"); err != nil {
-		log.Printf("sequence reset error: %v", err)
+		slog.Debug("sequence reset failed", "table", "maintenance_windows", "err", err)
 	}
 }
@@ -3,9 +3,10 @@ package store
 import (
 	"database/sql"
 	"fmt"
-	"log"
+	"log/slog"
 	"os"
-	_ "github.com/mattn/go-sqlite3"
+	_ "modernc.org/sqlite"
 )
 type SQLiteDialect struct{}
@@ -19,17 +20,25 @@ func NewSQLiteStore(path string) (*SQLStore, error) {
 	// these pragmas are no-ops or harmful for the in-memory test DB.)
 	dsn := path
 	if path != ":memory:" {
-		dsn = fmt.Sprintf("file:%s?_journal_mode=WAL&_busy_timeout=5000&_synchronous=NORMAL", path)
+		dsn = fmt.Sprintf("file:%s?_pragma=journal_mode(wal)&_pragma=busy_timeout(5000)&_pragma=synchronous(normal)", path)
 	}
-	s, err := NewSQLStore("sqlite3", dsn, &SQLiteDialect{})
+	s, err := NewSQLStore("sqlite", dsn, &SQLiteDialect{})
 	if err != nil {
 		return nil, err
 	}
+	if path != ":memory:" {
+		for _, suffix := range []string{"", "-wal", "-shm"} {
+			if err := os.Chmod(path+suffix, 0600); err != nil && !os.IsNotExist(err) {
+				slog.Warn("failed to chmod database file", "path", path+suffix, "err", err)
+			}
+		}
+	}
 	return s, nil
 }
-func (d *SQLiteDialect) DriverName() string { return "sqlite3" }
+func (d *SQLiteDialect) DriverName() string   { return "sqlite" }
-func (d *SQLiteDialect) BoolFalse() string  { return "0" }
+func (d *SQLiteDialect) BoolFalse() string    { return "0" }
+func (d *SQLiteDialect) BaselineVersion() int { return 13 }
 func (d *SQLiteDialect) CreateTablesSQL() []string {
 	return []string{
@@ -47,7 +56,8 @@ func (d *SQLiteDialect) CreateTablesSQL() []string {
 			method TEXT DEFAULT 'GET', description TEXT DEFAULT '',
 			parent_id INTEGER DEFAULT 0, accepted_codes TEXT DEFAULT '200-299',
 			dns_resolve_type TEXT DEFAULT '', dns_server TEXT DEFAULT '',
-			ignore_tls BOOLEAN DEFAULT 0, paused BOOLEAN DEFAULT 0
+			ignore_tls BOOLEAN DEFAULT 0, paused BOOLEAN DEFAULT 0,
+			regions TEXT DEFAULT ''
 		)`,
 		`CREATE TABLE IF NOT EXISTS users (
 			id INTEGER PRIMARY KEY AUTOINCREMENT,
@@ -57,7 +67,8 @@ func (d *SQLiteDialect) CreateTablesSQL() []string {
 		`CREATE TABLE IF NOT EXISTS check_history (
 			id INTEGER PRIMARY KEY AUTOINCREMENT,
 			site_id INTEGER NOT NULL, latency_ns INTEGER,
-			is_up BOOLEAN, checked_at DATETIME DEFAULT CURRENT_TIMESTAMP
+			is_up BOOLEAN, checked_at DATETIME DEFAULT CURRENT_TIMESTAMP,
+			node_id TEXT DEFAULT ''
 		)`,
 		`CREATE INDEX IF NOT EXISTS idx_check_history_site ON check_history(site_id, checked_at DESC)`,
 		`CREATE TABLE IF NOT EXISTS nodes (
@@ -107,21 +118,21 @@ func (d *SQLiteDialect) CreateTablesSQL() []string {
 	}
 }
-func (d *SQLiteDialect) MigrationsSQL() []string {
+func (d *SQLiteDialect) Migrations() []Migration {
-	return []string{
+	return []Migration{
-		"ALTER TABLE sites ADD COLUMN hostname TEXT DEFAULT ''",
+		{1, "ALTER TABLE sites ADD COLUMN hostname TEXT DEFAULT ''"},
-		"ALTER TABLE sites ADD COLUMN port INTEGER DEFAULT 0",
+		{2, "ALTER TABLE sites ADD COLUMN port INTEGER DEFAULT 0"},
-		"ALTER TABLE sites ADD COLUMN timeout INTEGER DEFAULT 0",
+		{3, "ALTER TABLE sites ADD COLUMN timeout INTEGER DEFAULT 0"},
-		"ALTER TABLE sites ADD COLUMN method TEXT DEFAULT 'GET'",
+		{4, "ALTER TABLE sites ADD COLUMN method TEXT DEFAULT 'GET'"},
-		"ALTER TABLE sites ADD COLUMN description TEXT DEFAULT ''",
+		{5, "ALTER TABLE sites ADD COLUMN description TEXT DEFAULT ''"},
-		"ALTER TABLE sites ADD COLUMN parent_id INTEGER DEFAULT 0",
+		{6, "ALTER TABLE sites ADD COLUMN parent_id INTEGER DEFAULT 0"},
-		"ALTER TABLE sites ADD COLUMN accepted_codes TEXT DEFAULT '200-299'",
+		{7, "ALTER TABLE sites ADD COLUMN accepted_codes TEXT DEFAULT '200-299'"},
-		"ALTER TABLE sites ADD COLUMN dns_resolve_type TEXT DEFAULT ''",
+		{8, "ALTER TABLE sites ADD COLUMN dns_resolve_type TEXT DEFAULT ''"},
-		"ALTER TABLE sites ADD COLUMN dns_server TEXT DEFAULT ''",
+		{9, "ALTER TABLE sites ADD COLUMN dns_server TEXT DEFAULT ''"},
-		"ALTER TABLE sites ADD COLUMN ignore_tls BOOLEAN DEFAULT 0",
+		{10, "ALTER TABLE sites ADD COLUMN ignore_tls BOOLEAN DEFAULT 0"},
-		"ALTER TABLE sites ADD COLUMN paused BOOLEAN DEFAULT 0",
+		{11, "ALTER TABLE sites ADD COLUMN paused BOOLEAN DEFAULT 0"},
-		"ALTER TABLE check_history ADD COLUMN node_id TEXT DEFAULT ''",
+		{12, "ALTER TABLE check_history ADD COLUMN node_id TEXT DEFAULT ''"},
-		"ALTER TABLE sites ADD COLUMN regions TEXT DEFAULT ''",
+		{13, "ALTER TABLE sites ADD COLUMN regions TEXT DEFAULT ''"},
 	}
 }
@@ -138,35 +149,47 @@ func (d *SQLiteDialect) ResetSequenceOnEmpty(db *sql.DB, table string) {
 	_ = db.QueryRow("SELECT COUNT(*) FROM " + table).Scan(&count) //nolint:errcheck
 	if count == 0 {
 		if _, err := db.Exec("DELETE FROM sqlite_sequence WHERE name=?", table); err != nil {
-			log.Printf("sequence cleanup error: %v", err)
+			slog.Debug("sequence cleanup failed", "table", table, "err", err)
 		}
 	}
 }
 func (d *SQLiteDialect) ImportWipe(tx *sql.Tx) {
 	if _, err := tx.Exec("DELETE FROM sites"); err != nil {
-		log.Printf("import wipe error: %v", err)
+		slog.Debug("import wipe failed", "table", "sites", "err", err)
 	}
 	if _, err := tx.Exec("DELETE FROM sqlite_sequence WHERE name='sites'"); err != nil {
-		log.Printf("import wipe error: %v", err)
+		slog.Debug("import wipe failed", "table", "sqlite_sequence(sites)", "err", err)
 	}
 	if _, err := tx.Exec("DELETE FROM alerts"); err != nil {
-		log.Printf("import wipe error: %v", err)
+		slog.Debug("import wipe failed", "table", "alerts", "err", err)
 	}
 	if _, err := tx.Exec("DELETE FROM sqlite_sequence WHERE name='alerts'"); err != nil {
-		log.Printf("import wipe error: %v", err)
+		slog.Debug("import wipe failed", "table", "sqlite_sequence(alerts)", "err", err)
 	}
-	if _, err := tx.Exec("DELETE FROM users"); err != nil {
-		log.Printf("import wipe error: %v", err)
-	}
-	if _, err := tx.Exec("DELETE FROM sqlite_sequence WHERE name='users'"); err != nil {
-		log.Printf("import wipe error: %v", err)
-	}
 	if _, err := tx.Exec("DELETE FROM maintenance_windows"); err != nil {
-		log.Printf("import wipe error: %v", err)
+		slog.Debug("import wipe failed", "table", "maintenance_windows", "err", err)
 	}
 	if _, err := tx.Exec("DELETE FROM sqlite_sequence WHERE name='maintenance_windows'"); err != nil {
-		log.Printf("import wipe error: %v", err)
+		slog.Debug("import wipe failed", "table", "sqlite_sequence(maintenance_windows)", "err", err)
 	}
+	if _, err := tx.Exec("DELETE FROM check_history"); err != nil {
+		slog.Debug("import wipe failed", "table", "check_history", "err", err)
+	}
+	if _, err := tx.Exec("DELETE FROM state_changes"); err != nil {
+		slog.Debug("import wipe failed", "table", "state_changes", "err", err)
+	}
+	if _, err := tx.Exec("DELETE FROM alert_health"); err != nil {
+		slog.Debug("import wipe failed", "table", "alert_health", "err", err)
+	}
 }
+func (d *SQLiteDialect) ImportWipeUsers(tx *sql.Tx) {
+	if _, err := tx.Exec("DELETE FROM users"); err != nil {
+		slog.Debug("import wipe failed", "table", "users", "err", err)
+	}
+	if _, err := tx.Exec("DELETE FROM sqlite_sequence WHERE name='users'"); err != nil {
+		slog.Debug("import wipe failed", "table", "sqlite_sequence(users)", "err", err)
+	}
+}
@@ -1,12 +1,12 @@
 package store
 import (
+	"context"
 	"crypto/rand"
 	"database/sql"
 	"encoding/hex"
 	"encoding/json"
 	"fmt"
-	"strings"
 	"time"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
@@ -17,7 +17,6 @@ const (
 	maxLogRows             = 200
 	maxStateChangesPerSite = 5000
 	maxMaintenanceExport   = 1000
-	maxRequestBody         = 1 << 20
 )
 type SQLStore struct {
@@ -73,38 +72,59 @@ func (s *SQLStore) Close() error {
 	return s.db.Close()
 }
-func (s *SQLStore) Init() error {
+func (s *SQLStore) Init(ctx context.Context) error {
 	for _, stmt := range s.dialect.CreateTablesSQL() {
-		if _, err := s.db.Exec(stmt); err != nil {
+		if _, err := s.db.ExecContext(ctx, stmt); err != nil {
 			return err
 		}
 	}
-	for _, m := range s.dialect.MigrationsSQL() {
+
-		if _, err := s.db.Exec(m); err != nil {
+	if _, err := s.db.ExecContext(ctx, `CREATE TABLE IF NOT EXISTS schema_version (
-			errMsg := err.Error()
+		version INTEGER PRIMARY KEY,
-			if strings.Contains(errMsg, "already exists") || strings.Contains(errMsg, "duplicate column") {
+		applied_at DATETIME DEFAULT CURRENT_TIMESTAMP
-				continue
+	)`); err != nil {
-			}
+		return fmt.Errorf("create schema_version: %w", err)
-			return fmt.Errorf("migration failed: %w", err)
+	}
+	var current int
+	_ = s.db.QueryRowContext(ctx, "SELECT COALESCE(MAX(version), 0) FROM schema_version").Scan(&current) //nolint:errcheck
+	if current == 0 {
+		baseline := s.dialect.BaselineVersion()
+		if _, err := s.db.ExecContext(ctx, s.q("INSERT INTO schema_version (version) VALUES (?)"), baseline); err != nil {
+			return fmt.Errorf("seed baseline version: %w", err)
+		}
+		current = baseline
+	}
+	for _, m := range s.dialect.Migrations() {
+		if m.Version <= current {
+			continue
+		}
+		if _, err := s.db.ExecContext(ctx, m.SQL); err != nil {
+			return fmt.Errorf("migration %d failed: %w", m.Version, err)
+		}
+		if _, err := s.db.ExecContext(ctx, s.q("INSERT INTO schema_version (version) VALUES (?)"), m.Version); err != nil {
+			return fmt.Errorf("record migration %d: %w", m.Version, err)
 		}
 	}
 	return nil
 }
-func (s *SQLStore) GetSites() ([]models.Site, error) {
+func (s *SQLStore) GetSites(ctx context.Context) ([]models.SiteConfig, error) {
 	bf := s.dialect.BoolFalse()
 	query := fmt.Sprintf( //nolint:gosec // bf is a dialect boolean literal, not user input
 		"SELECT id, COALESCE(name, url), url, COALESCE(type, 'http'), COALESCE(token, ''), interval, alert_id, check_ssl, threshold, max_retries, COALESCE(hostname, ''), COALESCE(port, 0), COALESCE(timeout, 0), COALESCE(method, 'GET'), COALESCE(description, ''), COALESCE(parent_id, 0), COALESCE(accepted_codes, '200-299'), COALESCE(dns_resolve_type, ''), COALESCE(dns_server, ''), COALESCE(ignore_tls, %s), COALESCE(paused, %s), COALESCE(regions, '') FROM sites",
 		bf, bf,
 	)
-	rows, err := s.db.Query(query)
+	rows, err := s.db.QueryContext(ctx, query)
 	if err != nil {
 		return nil, err
 	}
 	defer rows.Close()
-	var sites []models.Site
+	var sites []models.SiteConfig
 	for rows.Next() {
-		var st models.Site
+		var st models.SiteConfig
 		if err := rows.Scan(&st.ID, &st.Name, &st.URL, &st.Type, &st.Token, &st.Interval, &st.AlertID,
 			&st.CheckSSL, &st.ExpiryThreshold, &st.MaxRetries, &st.Hostname, &st.Port, &st.Timeout,
 			&st.Method, &st.Description, &st.ParentID, &st.AcceptedCodes, &st.DNSResolveType,
@@ -116,7 +136,7 @@ func (s *SQLStore) GetSites() ([]models.Site, error) {
 	return sites, rows.Err()
 }
-func (s *SQLStore) AddSite(site models.Site) error {
+func (s *SQLStore) AddSite(ctx context.Context, site models.SiteConfig) error {
 	token := ""
 	if site.Type == "push" {
 		var err error
@@ -125,15 +145,17 @@ func (s *SQLStore) AddSite(site models.Site) error {
 			return fmt.Errorf("generate push token: %w", err)
 		}
 	}
-	_, err := s.db.Exec(s.q("INSERT INTO sites (name, url, type, token, interval, alert_id, check_ssl, threshold, max_retries, hostname, port, timeout, method, description, parent_id, accepted_codes, dns_resolve_type, dns_server, ignore_tls, paused, regions) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)"),
+	_, err := s.db.ExecContext(ctx, s.q("INSERT INTO sites (name, url, type, token, interval, alert_id, check_ssl, threshold, max_retries, hostname, port, timeout, method, description, parent_id, accepted_codes, dns_resolve_type, dns_server, ignore_tls, paused, regions) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)"),
 		site.Name, site.URL, site.Type, token, site.Interval, site.AlertID, site.CheckSSL, site.ExpiryThreshold, site.MaxRetries,
 		site.Hostname, site.Port, site.Timeout, site.Method, site.Description, site.ParentID, site.AcceptedCodes, site.DNSResolveType, site.DNSServer, site.IgnoreTLS, site.Paused, site.Regions)
 	return err
 }
-func (s *SQLStore) UpdateSite(site models.Site) error {
+func (s *SQLStore) UpdateSite(ctx context.Context, site models.SiteConfig) error {
 	var existingToken string
-	_ = s.db.QueryRow(s.q("SELECT token FROM sites WHERE id=?"), site.ID).Scan(&existingToken) //nolint:errcheck
+	if err := s.db.QueryRowContext(ctx, s.q("SELECT token FROM sites WHERE id=?"), site.ID).Scan(&existingToken); err != nil && err != sql.ErrNoRows {
+		return fmt.Errorf("read existing token: %w", err)
+	}
 	if site.Type == "push" && existingToken == "" {
 		var err error
 		existingToken, err = generateToken()
@@ -141,19 +163,19 @@ func (s *SQLStore) UpdateSite(site models.Site) error {
 			return fmt.Errorf("generate push token: %w", err)
 		}
 	}
-	_, err := s.db.Exec(s.q("UPDATE sites SET name=?, url=?, type=?, token=?, interval=?, alert_id=?, check_ssl=?, threshold=?, max_retries=?, hostname=?, port=?, timeout=?, method=?, description=?, parent_id=?, accepted_codes=?, dns_resolve_type=?, dns_server=?, ignore_tls=?, paused=?, regions=? WHERE id=?"),
+	_, err := s.db.ExecContext(ctx, s.q("UPDATE sites SET name=?, url=?, type=?, token=?, interval=?, alert_id=?, check_ssl=?, threshold=?, max_retries=?, hostname=?, port=?, timeout=?, method=?, description=?, parent_id=?, accepted_codes=?, dns_resolve_type=?, dns_server=?, ignore_tls=?, paused=?, regions=? WHERE id=?"),
 		site.Name, site.URL, site.Type, existingToken, site.Interval, site.AlertID, site.CheckSSL, site.ExpiryThreshold, site.MaxRetries,
 		site.Hostname, site.Port, site.Timeout, site.Method, site.Description, site.ParentID, site.AcceptedCodes, site.DNSResolveType, site.DNSServer, site.IgnoreTLS, site.Paused, site.Regions, site.ID)
 	return err
 }
-func (s *SQLStore) UpdateSitePaused(id int, paused bool) error {
+func (s *SQLStore) UpdateSitePaused(ctx context.Context, id int, paused bool) error {
-	_, err := s.db.Exec(s.q("UPDATE sites SET paused=? WHERE id=?"), paused, id)
+	_, err := s.db.ExecContext(ctx, s.q("UPDATE sites SET paused=? WHERE id=?"), paused, id)
 	return err
 }
-func (s *SQLStore) DeleteSite(id int) error {
+func (s *SQLStore) DeleteSite(ctx context.Context, id int) error {
-	tx, err := s.db.Begin()
+	tx, err := s.db.BeginTx(ctx, nil)
 	if err != nil {
 		return err
 	}
@@ -165,7 +187,7 @@ func (s *SQLStore) DeleteSite(id int) error {
 		"DELETE FROM state_changes WHERE site_id = ?",
 		"DELETE FROM sites WHERE id = ?",
 	} {
-		if _, err := tx.Exec(s.q(q), id); err != nil {
+		if _, err := tx.ExecContext(ctx, s.q(q), id); err != nil {
 			return err
 		}
 	}
@@ -177,14 +199,14 @@ func (s *SQLStore) DeleteSite(id int) error {
 	return nil
 }
-func (s *SQLStore) GetSiteByName(name string) (models.Site, error) {
+func (s *SQLStore) GetSiteByName(ctx context.Context, name string) (models.SiteConfig, error) {
 	bf := s.dialect.BoolFalse()
 	query := fmt.Sprintf( //nolint:gosec // bf is a dialect boolean literal, not user input
 		"SELECT id, COALESCE(name, url), url, COALESCE(type, 'http'), COALESCE(token, ''), interval, alert_id, check_ssl, threshold, max_retries, COALESCE(hostname, ''), COALESCE(port, 0), COALESCE(timeout, 0), COALESCE(method, 'GET'), COALESCE(description, ''), COALESCE(parent_id, 0), COALESCE(accepted_codes, '200-299'), COALESCE(dns_resolve_type, ''), COALESCE(dns_server, ''), COALESCE(ignore_tls, %s), COALESCE(paused, %s), COALESCE(regions, '') FROM sites WHERE name = %s",
 		bf, bf, s.q("?"),
 	)
-	var st models.Site
+	var st models.SiteConfig
-	err := s.db.QueryRow(query, name).Scan(&st.ID, &st.Name, &st.URL, &st.Type, &st.Token, &st.Interval, &st.AlertID,
+	err := s.db.QueryRowContext(ctx, query, name).Scan(&st.ID, &st.Name, &st.URL, &st.Type, &st.Token, &st.Interval, &st.AlertID,
 		&st.CheckSSL, &st.ExpiryThreshold, &st.MaxRetries, &st.Hostname, &st.Port, &st.Timeout,
 		&st.Method, &st.Description, &st.ParentID, &st.AcceptedCodes, &st.DNSResolveType,
 		&st.DNSServer, &st.IgnoreTLS, &st.Paused, &st.Regions)
@@ -211,10 +233,10 @@ func (s *SQLStore) marshalSettings(settings map[string]string) (string, error) {
 	return s.encryptSettings(string(jsonBytes))
 }
-func (s *SQLStore) GetAlertByName(name string) (models.AlertConfig, error) {
+func (s *SQLStore) GetAlertByName(ctx context.Context, name string) (models.AlertConfig, error) {
 	var a models.AlertConfig
 	var settingsRaw string
-	err := s.db.QueryRow(s.q("SELECT id, name, type, settings FROM alerts WHERE name = ?"), name).Scan(&a.ID, &a.Name, &a.Type, &settingsRaw)
+	err := s.db.QueryRowContext(ctx, s.q("SELECT id, name, type, settings FROM alerts WHERE name = ?"), name).Scan(&a.ID, &a.Name, &a.Type, &settingsRaw)
 	if err != nil {
 		return a, err
 	}
@@ -225,7 +247,7 @@ func (s *SQLStore) GetAlertByName(name string) (models.AlertConfig, error) {
 	return a, nil
 }
-func (s *SQLStore) AddSiteReturningID(site models.Site) (int, error) {
+func (s *SQLStore) AddSiteReturningID(ctx context.Context, site models.SiteConfig) (int, error) {
 	token := ""
 	if site.Type == "push" {
 		var err error
@@ -236,12 +258,12 @@ func (s *SQLStore) AddSiteReturningID(site models.Site) (int, error) {
 	}
 	if s.dollar {
 		var id int
-		err := s.db.QueryRow(s.q("INSERT INTO sites (name, url, type, token, interval, alert_id, check_ssl, threshold, max_retries, hostname, port, timeout, method, description, parent_id, accepted_codes, dns_resolve_type, dns_server, ignore_tls, paused, regions) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?) RETURNING id"),
+		err := s.db.QueryRowContext(ctx, s.q("INSERT INTO sites (name, url, type, token, interval, alert_id, check_ssl, threshold, max_retries, hostname, port, timeout, method, description, parent_id, accepted_codes, dns_resolve_type, dns_server, ignore_tls, paused, regions) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?) RETURNING id"),
 			site.Name, site.URL, site.Type, token, site.Interval, site.AlertID, site.CheckSSL, site.ExpiryThreshold, site.MaxRetries,
 			site.Hostname, site.Port, site.Timeout, site.Method, site.Description, site.ParentID, site.AcceptedCodes, site.DNSResolveType, site.DNSServer, site.IgnoreTLS, site.Paused, site.Regions).Scan(&id)
 		return id, err
 	}
-	result, err := s.db.Exec(s.q("INSERT INTO sites (name, url, type, token, interval, alert_id, check_ssl, threshold, max_retries, hostname, port, timeout, method, description, parent_id, accepted_codes, dns_resolve_type, dns_server, ignore_tls, paused, regions) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)"),
+	result, err := s.db.ExecContext(ctx, s.q("INSERT INTO sites (name, url, type, token, interval, alert_id, check_ssl, threshold, max_retries, hostname, port, timeout, method, description, parent_id, accepted_codes, dns_resolve_type, dns_server, ignore_tls, paused, regions) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)"),
 		site.Name, site.URL, site.Type, token, site.Interval, site.AlertID, site.CheckSSL, site.ExpiryThreshold, site.MaxRetries,
 		site.Hostname, site.Port, site.Timeout, site.Method, site.Description, site.ParentID, site.AcceptedCodes, site.DNSResolveType, site.DNSServer, site.IgnoreTLS, site.Paused, site.Regions)
 	if err != nil {
@@ -251,17 +273,17 @@ func (s *SQLStore) AddSiteReturningID(site models.Site) (int, error) {
 	return int(id), err
 }
-func (s *SQLStore) AddAlertReturningID(name, aType string, settings map[string]string) (int, error) {
+func (s *SQLStore) AddAlertReturningID(ctx context.Context, name, aType string, settings map[string]string) (int, error) {
 	stored, err := s.marshalSettings(settings)
 	if err != nil {
 		return 0, err
 	}
 	if s.dollar {
 		var id int
-		err := s.db.QueryRow(s.q("INSERT INTO alerts (name, type, settings) VALUES (?, ?, ?) RETURNING id"), name, aType, stored).Scan(&id)
+		err := s.db.QueryRowContext(ctx, s.q("INSERT INTO alerts (name, type, settings) VALUES (?, ?, ?) RETURNING id"), name, aType, stored).Scan(&id)
 		return id, err
 	}
-	result, err := s.db.Exec(s.q("INSERT INTO alerts (name, type, settings) VALUES (?, ?, ?)"), name, aType, stored)
+	result, err := s.db.ExecContext(ctx, s.q("INSERT INTO alerts (name, type, settings) VALUES (?, ?, ?)"), name, aType, stored)
 	if err != nil {
 		return 0, err
 	}
@@ -269,8 +291,8 @@ func (s *SQLStore) AddAlertReturningID(name, aType string, settings map[string]s
 	return int(id), err
 }
-func (s *SQLStore) GetAllAlerts() ([]models.AlertConfig, error) {
+func (s *SQLStore) GetAllAlerts(ctx context.Context) ([]models.AlertConfig, error) {
-	rows, err := s.db.Query("SELECT id, name, type, settings FROM alerts")
+	rows, err := s.db.QueryContext(ctx, "SELECT id, name, type, settings FROM alerts")
 	if err != nil {
 		return nil, err
 	}
@@ -291,10 +313,10 @@ func (s *SQLStore) GetAllAlerts() ([]models.AlertConfig, error) {
 	return alerts, rows.Err()
 }
-func (s *SQLStore) GetAlert(id int) (models.AlertConfig, error) {
+func (s *SQLStore) GetAlert(ctx context.Context, id int) (models.AlertConfig, error) {
 	var a models.AlertConfig
 	var settingsRaw string
-	err := s.db.QueryRow(s.q("SELECT id, name, type, settings FROM alerts WHERE id = ?"), id).Scan(&a.ID, &a.Name, &a.Type, &settingsRaw)
+	err := s.db.QueryRowContext(ctx, s.q("SELECT id, name, type, settings FROM alerts WHERE id = ?"), id).Scan(&a.ID, &a.Name, &a.Type, &settingsRaw)
 	if err != nil {
 		return a, err
 	}
@@ -305,35 +327,37 @@ func (s *SQLStore) GetAlert(id int) (models.AlertConfig, error) {
 	return a, nil
 }
-func (s *SQLStore) AddAlert(name, aType string, settings map[string]string) error {
+func (s *SQLStore) AddAlert(ctx context.Context, name, aType string, settings map[string]string) error {
 	stored, err := s.marshalSettings(settings)
 	if err != nil {
 		return err
 	}
-	_, err = s.db.Exec(s.q("INSERT INTO alerts (name, type, settings) VALUES (?, ?, ?)"), name, aType, stored)
+	_, err = s.db.ExecContext(ctx, s.q("INSERT INTO alerts (name, type, settings) VALUES (?, ?, ?)"), name, aType, stored)
 	return err
 }
-func (s *SQLStore) UpdateAlert(id int, name, aType string, settings map[string]string) error {
+func (s *SQLStore) UpdateAlert(ctx context.Context, id int, name, aType string, settings map[string]string) error {
 	stored, err := s.marshalSettings(settings)
 	if err != nil {
 		return err
 	}
-	_, err = s.db.Exec(s.q("UPDATE alerts SET name=?, type=?, settings=? WHERE id=?"), name, aType, stored, id)
+	_, err = s.db.ExecContext(ctx, s.q("UPDATE alerts SET name=?, type=?, settings=? WHERE id=?"), name, aType, stored, id)
 	return err
 }
-func (s *SQLStore) DeleteAlert(id int) error {
+func (s *SQLStore) DeleteAlert(ctx context.Context, id int) error {
-	_, err := s.db.Exec(s.q("DELETE FROM alerts WHERE id=?"), id)
+	if _, err := s.db.ExecContext(ctx, s.q("UPDATE sites SET alert_id = 0 WHERE alert_id = ?"), id); err != nil {
-	if err != nil {
+		return err
+	}
+	if _, err := s.db.ExecContext(ctx, s.q("DELETE FROM alerts WHERE id=?"), id); err != nil {
 		return err
 	}
 	s.dialect.ResetSequenceOnEmpty(s.db, "alerts")
 	return nil
 }
-func (s *SQLStore) GetAllUsers() ([]models.User, error) {
+func (s *SQLStore) GetAllUsers(ctx context.Context) ([]models.User, error) {
-	rows, err := s.db.Query("SELECT id, username, public_key, role FROM users")
+	rows, err := s.db.QueryContext(ctx, "SELECT id, username, public_key, role FROM users")
 	if err != nil {
 		return nil, err
 	}
@@ -349,29 +373,29 @@ func (s *SQLStore) GetAllUsers() ([]models.User, error) {
 	return users, rows.Err()
 }
-func (s *SQLStore) AddUser(username, publicKey, role string) error {
+func (s *SQLStore) AddUser(ctx context.Context, username, publicKey, role string) error {
-	_, err := s.db.Exec(s.q("INSERT INTO users (username, public_key, role) VALUES (?, ?, ?)"), username, publicKey, role)
+	_, err := s.db.ExecContext(ctx, s.q("INSERT INTO users (username, public_key, role) VALUES (?, ?, ?)"), username, publicKey, role)
 	return err
 }
-func (s *SQLStore) UpdateUser(id int, username, publicKey, role string) error {
+func (s *SQLStore) UpdateUser(ctx context.Context, id int, username, publicKey, role string) error {
-	_, err := s.db.Exec(s.q("UPDATE users SET username=?, public_key=?, role=? WHERE id=?"), username, publicKey, role, id)
+	_, err := s.db.ExecContext(ctx, s.q("UPDATE users SET username=?, public_key=?, role=? WHERE id=?"), username, publicKey, role, id)
 	return err
 }
-func (s *SQLStore) DeleteUser(id int) error {
+func (s *SQLStore) DeleteUser(ctx context.Context, id int) error {
-	_, err := s.db.Exec(s.q("DELETE FROM users WHERE id=?"), id)
+	_, err := s.db.ExecContext(ctx, s.q("DELETE FROM users WHERE id=?"), id)
 	return err
 }
-func (s *SQLStore) SaveStateChange(siteID int, fromStatus, toStatus, errorReason string) error {
+func (s *SQLStore) SaveStateChange(ctx context.Context, siteID int, fromStatus, toStatus, errorReason string) error {
-	_, err := s.db.Exec(s.q("INSERT INTO state_changes (site_id, from_status, to_status, error_reason) VALUES (?, ?, ?, ?)"),
+	_, err := s.db.ExecContext(ctx, s.q("INSERT INTO state_changes (site_id, from_status, to_status, error_reason) VALUES (?, ?, ?, ?)"),
 		siteID, fromStatus, toStatus, errorReason)
 	return err
 }
-func (s *SQLStore) GetStateChanges(siteID int, limit int) ([]models.StateChange, error) {
+func (s *SQLStore) GetStateChanges(ctx context.Context, siteID int, limit int) ([]models.StateChange, error) {
-	rows, err := s.db.Query(s.q("SELECT id, site_id, from_status, to_status, error_reason, changed_at FROM state_changes WHERE site_id = ? ORDER BY changed_at DESC LIMIT ?"), siteID, limit)
+	rows, err := s.db.QueryContext(ctx, s.q("SELECT id, site_id, from_status, to_status, error_reason, changed_at FROM state_changes WHERE site_id = ? ORDER BY changed_at DESC LIMIT ?"), siteID, limit)
 	if err != nil {
 		return nil, err
 	}
@@ -387,8 +411,8 @@ func (s *SQLStore) GetStateChanges(siteID int, limit int) ([]models.StateChange,
 	return changes, rows.Err()
 }
-func (s *SQLStore) GetStateChangesSince(siteID int, since time.Time) ([]models.StateChange, error) {
+func (s *SQLStore) GetStateChangesSince(ctx context.Context, siteID int, since time.Time) ([]models.StateChange, error) {
-	rows, err := s.db.Query(s.q("SELECT id, site_id, from_status, to_status, error_reason, changed_at FROM state_changes WHERE site_id = ? AND changed_at >= ? ORDER BY changed_at DESC"), siteID, since)
+	rows, err := s.db.QueryContext(ctx, s.q("SELECT id, site_id, from_status, to_status, error_reason, changed_at FROM state_changes WHERE site_id = ? AND changed_at >= ? ORDER BY changed_at DESC"), siteID, since)
 	if err != nil {
 		return nil, err
 	}
@@ -404,59 +428,59 @@ func (s *SQLStore) GetStateChangesSince(siteID int, since time.Time) ([]models.S
 	return changes, rows.Err()
 }
 // SaveCheck records one check result for siteID by delegating to
 // SaveCheckFromNode with an empty node ID.
-func (s *SQLStore) SaveCheck(siteID int, latencyNs int64, isUp bool) error {
+func (s *SQLStore) SaveCheck(ctx context.Context, siteID int, latencyNs int64, isUp bool) error {
-	return s.SaveCheckFromNode(siteID, "", latencyNs, isUp)
+	return s.SaveCheckFromNode(ctx, siteID, "", latencyNs, isUp)
 }
 // SaveCheckFromNode inserts a single check row. Retention is handled out of
 // band by PruneCheckHistory on a timer, not per-insert, to keep the write hot
 // path a plain INSERT.
 //
 // The INSERT names only site_id, node_id, latency_ns and is_up, filled from
 // the arguments of the same name. It returns the ExecContext error.
-func (s *SQLStore) SaveCheckFromNode(siteID int, nodeID string, latencyNs int64, isUp bool) error {
+func (s *SQLStore) SaveCheckFromNode(ctx context.Context, siteID int, nodeID string, latencyNs int64, isUp bool) error {
-	_, err := s.db.Exec(s.q("INSERT INTO check_history (site_id, node_id, latency_ns, is_up) VALUES (?, ?, ?, ?)"), siteID, nodeID, latencyNs, isUp)
+	_, err := s.db.ExecContext(ctx, s.q("INSERT INTO check_history (site_id, node_id, latency_ns, is_up) VALUES (?, ?, ?, ?)"), siteID, nodeID, latencyNs, isUp)
 	return err
 }
 // PruneCheckHistory trims check_history to the newest maxCheckHistory rows per
 // site, across all sites, in one pass. Intended to run periodically.
 //
 // It returns the error from the single DELETE statement; the number of rows
 // removed is not reported.
-func (s *SQLStore) PruneCheckHistory() error {
+func (s *SQLStore) PruneCheckHistory(ctx context.Context) error {
 	// ROW_NUMBER ranks each site's rows newest-first (checked_at, then id as a
 	// tiebreak); every row ranked beyond maxCheckHistory is deleted. The limit
 	// is formatted into the SQL text with %d rather than bound as a parameter.
 	q := fmt.Sprintf(`DELETE FROM check_history WHERE id IN (
 		SELECT id FROM (
 			SELECT id, ROW_NUMBER() OVER (PARTITION BY site_id ORDER BY checked_at DESC, id DESC) AS rn
 			FROM check_history
 		) ranked WHERE rn > %d
 	)`, maxCheckHistory)
-	_, err := s.db.Exec(s.q(q))
+	_, err := s.db.ExecContext(ctx, s.q(q))
 	return err
 }
 // PruneStateChanges trims state_changes to the newest maxStateChangesPerSite
 // rows per site. The cap is meant to be generous so that realistic SLA
 // windows are unaffected, while still bounding the otherwise unbounded growth
 // of a flapping monitor's history.
 //
 // It returns the error from the single DELETE statement; the number of rows
 // removed is not reported.
-func (s *SQLStore) PruneStateChanges() error {
+func (s *SQLStore) PruneStateChanges(ctx context.Context) error {
 	// ROW_NUMBER ranks each site's rows newest-first (changed_at, then id as a
 	// tiebreak); every row ranked beyond maxStateChangesPerSite is deleted.
 	q := fmt.Sprintf(`DELETE FROM state_changes WHERE id IN (
 		SELECT id FROM (
 			SELECT id, ROW_NUMBER() OVER (PARTITION BY site_id ORDER BY changed_at DESC, id DESC) AS rn
 			FROM state_changes
 		) ranked WHERE rn > %d
 	)`, maxStateChangesPerSite)
-	_, err := s.db.Exec(s.q(q))
+	_, err := s.db.ExecContext(ctx, s.q(q))
 	return err
 }
 // RegisterNode executes the dialect's UpsertNodeSQL statement with node's ID,
 // Name, Region and Version, in that order, and returns the ExecContext error.
 // NOTE(review): the statement text lives in the dialect; presumably it inserts
 // the node or refreshes an existing row with the same ID — confirm there.
-func (s *SQLStore) RegisterNode(node models.ProbeNode) error {
+func (s *SQLStore) RegisterNode(ctx context.Context, node models.ProbeNode) error {
-	_, err := s.db.Exec(s.dialect.UpsertNodeSQL(), node.ID, node.Name, node.Region, node.Version)
+	_, err := s.db.ExecContext(ctx, s.dialect.UpsertNodeSQL(), node.ID, node.Name, node.Region, node.Version)
 	return err
 }
 // GetNode looks up the nodes row whose id equals id and scans its id, name,
 // region, last_seen and version columns into a models.ProbeNode. The Scan
 // error is returned unchanged (database/sql reports sql.ErrNoRows when no row
 // matches); callers should ignore the returned node when err is non-nil.
-func (s *SQLStore) GetNode(id string) (models.ProbeNode, error) {
+func (s *SQLStore) GetNode(ctx context.Context, id string) (models.ProbeNode, error) {
 	var n models.ProbeNode
-	err := s.db.QueryRow(s.q("SELECT id, name, region, last_seen, version FROM nodes WHERE id = ?"), id).
+	err := s.db.QueryRowContext(ctx, s.q("SELECT id, name, region, last_seen, version FROM nodes WHERE id = ?"), id).
 		Scan(&n.ID, &n.Name, &n.Region, &n.LastSeen, &n.Version)
 	return n, err
 }
-func (s *SQLStore) GetAllNodes() ([]models.ProbeNode, error) {
+func (s *SQLStore) GetAllNodes(ctx context.Context) ([]models.ProbeNode, error) {
-	rows, err := s.db.Query("SELECT id, name, region, last_seen, version FROM nodes ORDER BY region, name")
+	rows, err := s.db.QueryContext(ctx, "SELECT id, name, region, last_seen, version FROM nodes ORDER BY region, name")
 	if err != nil {
 		return nil, err
 	}
@@ -472,18 +496,18 @@ func (s *SQLStore) GetAllNodes() ([]models.ProbeNode, error) {
 	return nodes, rows.Err()
 }
 // UpdateNodeLastSeen sets last_seen to the database's CURRENT_TIMESTAMP on the
 // nodes row whose id equals id. The statement result is discarded, so an
 // unknown id is not reported as an error here.
-func (s *SQLStore) UpdateNodeLastSeen(id string) error {
+func (s *SQLStore) UpdateNodeLastSeen(ctx context.Context, id string) error {
-	_, err := s.db.Exec(s.q("UPDATE nodes SET last_seen = CURRENT_TIMESTAMP WHERE id = ?"), id)
+	_, err := s.db.ExecContext(ctx, s.q("UPDATE nodes SET last_seen = CURRENT_TIMESTAMP WHERE id = ?"), id)
 	return err
 }
 // DeleteNode removes the nodes row whose id equals id and returns the
 // ExecContext error. Only the nodes table is touched by this statement.
-func (s *SQLStore) DeleteNode(id string) error {
+func (s *SQLStore) DeleteNode(ctx context.Context, id string) error {
-	_, err := s.db.Exec(s.q("DELETE FROM nodes WHERE id = ?"), id)
+	_, err := s.db.ExecContext(ctx, s.q("DELETE FROM nodes WHERE id = ?"), id)
 	return err
 }
-func (s *SQLStore) LoadAlertHealth() (map[int]models.AlertHealthRecord, error) {
+func (s *SQLStore) LoadAlertHealth(ctx context.Context) (map[int]models.AlertHealthRecord, error) {
-	rows, err := s.db.Query("SELECT alert_id, last_send_at, last_send_ok, last_error, send_count, fail_count FROM alert_health")
+	rows, err := s.db.QueryContext(ctx, "SELECT alert_id, last_send_at, last_send_ok, last_error, send_count, fail_count FROM alert_health")
 	if err != nil {
 		return nil, err
 	}
@@ -503,35 +527,35 @@ func (s *SQLStore) LoadAlertHealth() (map[int]models.AlertHealthRecord, error) {
 	return out, rows.Err()
 }
 // SaveAlertHealth executes the dialect's UpsertAlertHealthSQL statement with
 // the fields of h (AlertID, last send time, LastSendOK, LastError, SendCount,
 // FailCount, in that order) and returns the ExecContext error.
-func (s *SQLStore) SaveAlertHealth(h models.AlertHealthRecord) error {
+func (s *SQLStore) SaveAlertHealth(ctx context.Context, h models.AlertHealthRecord) error {
 	// A zero LastSendAt leaves lastSend as a nil interface, which database/sql
 	// sends as SQL NULL instead of a zero-valued timestamp.
 	var lastSend interface{}
 	if !h.LastSendAt.IsZero() {
 		lastSend = h.LastSendAt
 	}
-	_, err := s.db.Exec(s.dialect.UpsertAlertHealthSQL(),
+	_, err := s.db.ExecContext(ctx, s.dialect.UpsertAlertHealthSQL(),
 		h.AlertID, lastSend, h.LastSendOK, h.LastError, h.SendCount, h.FailCount)
 	return err
 }
 // SaveLog inserts a single log row. Retention is handled by PruneLogs on a
 // timer, not per-insert.
 //
 // Only the message column is named in the INSERT. It returns the ExecContext
 // error.
-func (s *SQLStore) SaveLog(message string) error {
+func (s *SQLStore) SaveLog(ctx context.Context, message string) error {
-	_, err := s.db.Exec(s.q("INSERT INTO logs (message) VALUES (?)"), message)
+	_, err := s.db.ExecContext(ctx, s.q("INSERT INTO logs (message) VALUES (?)"), message)
 	return err
 }
 // PruneLogs trims the logs table to the newest maxLogRows rows. The id DESC
 // tiebreak keeps ordering deterministic when rows share a created_at second.
 //
 // It returns the error from the single DELETE statement; the number of rows
 // removed is not reported.
-func (s *SQLStore) PruneLogs() error {
+func (s *SQLStore) PruneLogs(ctx context.Context) error {
 	// The inner SELECT picks the ids to keep; everything else is deleted. The
 	// limit is formatted into the SQL text with %d rather than bound.
 	q := fmt.Sprintf(`DELETE FROM logs WHERE id NOT IN (
 		SELECT id FROM logs ORDER BY created_at DESC, id DESC LIMIT %d
 	)`, maxLogRows)
-	_, err := s.db.Exec(s.q(q))
+	_, err := s.db.ExecContext(ctx, s.q(q))
 	return err
 }
-func (s *SQLStore) LoadLogs(limit int) ([]string, error) {
+func (s *SQLStore) LoadLogs(ctx context.Context, limit int) ([]string, error) {
-	rows, err := s.db.Query(s.q("SELECT message FROM logs ORDER BY created_at DESC LIMIT ?"), limit)
+	rows, err := s.db.QueryContext(ctx, s.q("SELECT message FROM logs ORDER BY created_at DESC LIMIT ?"), limit)
 	if err != nil {
 		return nil, err
 	}
@@ -547,9 +571,9 @@ func (s *SQLStore) LoadLogs(limit int) ([]string, error) {
 	return logs, rows.Err()
 }
-func (s *SQLStore) LoadAllHistory(limit int) (map[int][]models.CheckRecord, error) {
+func (s *SQLStore) LoadAllHistory(ctx context.Context, limit int) (map[int][]models.CheckRecord, error) {
 	result := make(map[int][]models.CheckRecord)
-	rows, err := s.db.Query(s.q(`
+	rows, err := s.db.QueryContext(ctx, s.q(`
 		SELECT site_id, latency_ns, is_up FROM (
 			SELECT site_id, latency_ns, is_up,
 				ROW_NUMBER() OVER (PARTITION BY site_id ORDER BY checked_at DESC) AS rn
@@ -587,8 +611,8 @@ func (s *SQLStore) scanMaintenanceWindow(rows *sql.Rows) (models.MaintenanceWind
 	return mw, nil
 }
-func (s *SQLStore) GetActiveMaintenanceWindows() ([]models.MaintenanceWindow, error) {
+func (s *SQLStore) GetActiveMaintenanceWindows(ctx context.Context) ([]models.MaintenanceWindow, error) {
-	rows, err := s.db.Query(s.q("SELECT id, monitor_id, title, description, type, start_time, end_time, created_by, created_at FROM maintenance_windows WHERE start_time <= CURRENT_TIMESTAMP AND (end_time IS NULL OR end_time > CURRENT_TIMESTAMP) ORDER BY start_time DESC"))
+	rows, err := s.db.QueryContext(ctx, s.q("SELECT id, monitor_id, title, description, type, start_time, end_time, created_by, created_at FROM maintenance_windows WHERE start_time <= CURRENT_TIMESTAMP AND (end_time IS NULL OR end_time > CURRENT_TIMESTAMP) ORDER BY start_time DESC"))
 	if err != nil {
 		return nil, err
 	}
@@ -604,8 +628,8 @@ func (s *SQLStore) GetActiveMaintenanceWindows() ([]models.MaintenanceWindow, er
 	return windows, rows.Err()
 }
-func (s *SQLStore) GetAllMaintenanceWindows(limit int) ([]models.MaintenanceWindow, error) {
+func (s *SQLStore) GetAllMaintenanceWindows(ctx context.Context, limit int) ([]models.MaintenanceWindow, error) {
-	rows, err := s.db.Query(s.q("SELECT id, monitor_id, title, description, type, start_time, end_time, created_by, created_at FROM maintenance_windows ORDER BY created_at DESC LIMIT ?"), limit)
+	rows, err := s.db.QueryContext(ctx, s.q("SELECT id, monitor_id, title, description, type, start_time, end_time, created_by, created_at FROM maintenance_windows ORDER BY created_at DESC LIMIT ?"), limit)
 	if err != nil {
 		return nil, err
 	}
@@ -621,22 +645,22 @@ func (s *SQLStore) GetAllMaintenanceWindows(limit int) ([]models.MaintenanceWind
 	return windows, rows.Err()
 }
 // AddMaintenanceWindow inserts mw into maintenance_windows and returns the
 // ExecContext error. mw is received by value, so the defaulting below does not
 // modify the caller's struct. mw.ID is not part of the INSERT.
-func (s *SQLStore) AddMaintenanceWindow(mw models.MaintenanceWindow) error {
+func (s *SQLStore) AddMaintenanceWindow(ctx context.Context, mw models.MaintenanceWindow) error {
 	// A window without an explicit start begins now.
 	if mw.StartTime.IsZero() {
 		mw.StartTime = time.Now()
 	}
 	// A zero EndTime is written as SQL NULL (sql.NullTime with Valid=false).
-	_, err := s.db.Exec(s.q("INSERT INTO maintenance_windows (monitor_id, title, description, type, start_time, end_time, created_by) VALUES (?, ?, ?, ?, ?, ?, ?)"),
+	_, err := s.db.ExecContext(ctx, s.q("INSERT INTO maintenance_windows (monitor_id, title, description, type, start_time, end_time, created_by) VALUES (?, ?, ?, ?, ?, ?, ?)"),
 		mw.MonitorID, mw.Title, mw.Description, mw.Type, mw.StartTime, sql.NullTime{Time: mw.EndTime, Valid: !mw.EndTime.IsZero()}, mw.CreatedBy)
 	return err
 }
 // EndMaintenanceWindow sets end_time to the database's CURRENT_TIMESTAMP on the
 // maintenance_windows row whose id equals id. Any existing end_time is
 // overwritten, and an unknown id is not reported as an error because the
 // statement result is discarded.
-func (s *SQLStore) EndMaintenanceWindow(id int) error {
+func (s *SQLStore) EndMaintenanceWindow(ctx context.Context, id int) error {
-	_, err := s.db.Exec(s.q("UPDATE maintenance_windows SET end_time = CURRENT_TIMESTAMP WHERE id = ?"), id)
+	_, err := s.db.ExecContext(ctx, s.q("UPDATE maintenance_windows SET end_time = CURRENT_TIMESTAMP WHERE id = ?"), id)
 	return err
 }
-func (s *SQLStore) DeleteMaintenanceWindow(id int) error {
+func (s *SQLStore) DeleteMaintenanceWindow(ctx context.Context, id int) error {
-	_, err := s.db.Exec(s.q("DELETE FROM maintenance_windows WHERE id = ?"), id)
+	_, err := s.db.ExecContext(ctx, s.q("DELETE FROM maintenance_windows WHERE id = ?"), id)
 	if err != nil {
 		return err
 	}
@@ -644,9 +668,9 @@ func (s *SQLStore) DeleteMaintenanceWindow(id int) error {
 	return nil
 }
-func (s *SQLStore) PruneExpiredMaintenanceWindows(retention time.Duration) (int64, error) {
+func (s *SQLStore) PruneExpiredMaintenanceWindows(ctx context.Context, retention time.Duration) (int64, error) {
 	cutoff := time.Now().Add(-retention)
-	result, err := s.db.Exec(
+	result, err := s.db.ExecContext(ctx,
 		s.q("DELETE FROM maintenance_windows WHERE end_time IS NOT NULL AND end_time < ?"),
 		cutoff,
 	)
@@ -656,9 +680,9 @@ func (s *SQLStore) PruneExpiredMaintenanceWindows(retention time.Duration) (int6
 	return result.RowsAffected()
 }
-func (s *SQLStore) IsMonitorInMaintenance(monitorID int) (bool, error) {
+func (s *SQLStore) IsMonitorInMaintenance(ctx context.Context, monitorID int) (bool, error) {
 	var count int
-	err := s.db.QueryRow(s.q(`SELECT COUNT(*) FROM maintenance_windows
+	err := s.db.QueryRowContext(ctx, s.q(`SELECT COUNT(*) FROM maintenance_windows
 		WHERE type = 'maintenance'
 		AND start_time <= CURRENT_TIMESTAMP
 		AND (end_time IS NULL OR end_time > CURRENT_TIMESTAMP)
@@ -671,46 +695,46 @@ func (s *SQLStore) IsMonitorInMaintenance(monitorID int) (bool, error) {
 	return count > 0, nil
 }
 // GetPreference returns the value stored under key in the preferences table.
 // On any error it returns the empty string together with the Scan error
 // (database/sql reports sql.ErrNoRows when the key is absent).
-func (s *SQLStore) GetPreference(key string) (string, error) {
+func (s *SQLStore) GetPreference(ctx context.Context, key string) (string, error) {
 	var value string
-	err := s.db.QueryRow(s.q("SELECT value FROM preferences WHERE key = ?"), key).Scan(&value)
+	err := s.db.QueryRowContext(ctx, s.q("SELECT value FROM preferences WHERE key = ?"), key).Scan(&value)
 	if err != nil {
 		return "", err
 	}
 	return value, nil
 }
 // SetPreference stores value under key in the preferences table, replacing
 // any value already stored for that key, and returns the ExecContext error.
-func (s *SQLStore) SetPreference(key, value string) error {
+func (s *SQLStore) SetPreference(ctx context.Context, key, value string) error {
 	// NOTE(review): s.dollar presumably marks a backend using $n placeholders
 	// (e.g. PostgreSQL) — confirm. That branch uses ON CONFLICT ... DO UPDATE
 	// and therefore binds value twice.
 	if s.dollar {
-		_, err := s.db.Exec(s.q("INSERT INTO preferences (key, value) VALUES (?, ?) ON CONFLICT (key) DO UPDATE SET value = ?"), key, value, value)
+		_, err := s.db.ExecContext(ctx, s.q("INSERT INTO preferences (key, value) VALUES (?, ?) ON CONFLICT (key) DO UPDATE SET value = ?"), key, value, value)
 		return err
 	}
 	// Otherwise use INSERT OR REPLACE; this statement is not passed through s.q.
-	_, err := s.db.Exec("INSERT OR REPLACE INTO preferences (key, value) VALUES (?, ?)", key, value)
+	_, err := s.db.ExecContext(ctx, "INSERT OR REPLACE INTO preferences (key, value) VALUES (?, ?)", key, value)
 	return err
 }
 // ExportData gathers sites, alerts, users and maintenance windows into a
 // models.Backup. Maintenance windows are fetched with a limit of
 // maxMaintenanceExport. The four reads are issued one after another and this
 // method opens no transaction around them; the first read that fails aborts
 // the export and an empty Backup is returned with that error.
-func (s *SQLStore) ExportData() (models.Backup, error) {
+func (s *SQLStore) ExportData(ctx context.Context) (models.Backup, error) {
-	sites, err := s.GetSites()
+	sites, err := s.GetSites(ctx)
 	if err != nil {
 		return models.Backup{}, err
 	}
-	alerts, err := s.GetAllAlerts()
+	alerts, err := s.GetAllAlerts(ctx)
 	if err != nil {
 		return models.Backup{}, err
 	}
-	users, err := s.GetAllUsers()
+	users, err := s.GetAllUsers(ctx)
 	if err != nil {
 		return models.Backup{}, err
 	}
-	windows, err := s.GetAllMaintenanceWindows(maxMaintenanceExport)
+	windows, err := s.GetAllMaintenanceWindows(ctx, maxMaintenanceExport)
 	if err != nil {
 		return models.Backup{}, err
 	}
 	return models.Backup{Sites: sites, Alerts: alerts, Users: users, MaintenanceWindows: windows}, nil
 }
-func (s *SQLStore) ImportData(data models.Backup) error {
+func (s *SQLStore) ImportData(ctx context.Context, data models.Backup) error {
-	tx, err := s.db.Begin()
+	tx, err := s.db.BeginTx(ctx, nil)
 	if err != nil {
 		return err
 	}
@@ -718,9 +742,14 @@ func (s *SQLStore) ImportData(data models.Backup) error {
 	s.dialect.ImportWipe(tx)
-	for _, u := range data.Users {
+	// Only wipe+replace users when callers explicitly provide them (CLI
-		if _, err := tx.Exec(s.q("INSERT INTO users (username, public_key, role) VALUES (?, ?, ?)"), u.Username, u.PublicKey, u.Role); err != nil {
+	// full restore). API/Kuma imports pass nil — existing users preserved.
-			return err
+	if data.Users != nil {
 		s.dialect.ImportWipeUsers(tx)
 		for _, u := range data.Users {
 			if _, err := tx.ExecContext(ctx, s.q("INSERT INTO users (username, public_key, role) VALUES (?, ?, ?)"), u.Username, u.PublicKey, u.Role); err != nil {
 				return err
 			}
 		}
 	}
 	for _, a := range data.Alerts {
@@ -730,12 +759,12 @@ func (s *SQLStore) ImportData(data models.Backup) error {
 		if err != nil {
 			return err
 		}
-		if _, err := tx.Exec(s.q("INSERT INTO alerts (id, name, type, settings) VALUES (?, ?, ?, ?)"), a.ID, a.Name, a.Type, settingsStr); err != nil {
+		if _, err := tx.ExecContext(ctx, s.q("INSERT INTO alerts (id, name, type, settings) VALUES (?, ?, ?, ?)"), a.ID, a.Name, a.Type, settingsStr); err != nil {
 			return err
 		}
 	}
 	for _, st := range data.Sites {
-		if _, err := tx.Exec(s.q("INSERT INTO sites (id, name, url, type, token, interval, alert_id, check_ssl, threshold, max_retries, hostname, port, timeout, method, description, parent_id, accepted_codes, dns_resolve_type, dns_server, ignore_tls, paused, regions) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)"),
+		if _, err := tx.ExecContext(ctx, s.q("INSERT INTO sites (id, name, url, type, token, interval, alert_id, check_ssl, threshold, max_retries, hostname, port, timeout, method, description, parent_id, accepted_codes, dns_resolve_type, dns_server, ignore_tls, paused, regions) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)"),
 			st.ID, st.Name, st.URL, st.Type, st.Token, st.Interval, st.AlertID, st.CheckSSL, st.ExpiryThreshold, st.MaxRetries,
 			st.Hostname, st.Port, st.Timeout, st.Method, st.Description, st.ParentID, st.AcceptedCodes, st.DNSResolveType, st.DNSServer, st.IgnoreTLS, st.Paused, st.Regions); err != nil {
 			return err
@@ -743,7 +772,7 @@ func (s *SQLStore) ImportData(data models.Backup) error {
 	}
 	for _, mw := range data.MaintenanceWindows {
-		if _, err := tx.Exec(s.q("INSERT INTO maintenance_windows (id, monitor_id, title, description, type, start_time, end_time, created_by) VALUES (?, ?, ?, ?, ?, ?, ?, ?)"),
+		if _, err := tx.ExecContext(ctx, s.q("INSERT INTO maintenance_windows (id, monitor_id, title, description, type, start_time, end_time, created_by) VALUES (?, ?, ?, ?, ?, ?, ?, ?)"),
 			mw.ID, mw.MonitorID, mw.Title, mw.Description, mw.Type, mw.StartTime, sql.NullTime{Time: mw.EndTime, Valid: !mw.EndTime.IsZero()}, mw.CreatedBy); err != nil {
 			return err
 		}
@@ -1,6 +1,7 @@
 package store
 import (
 	"context"
 	"fmt"
 	"strings"
 	"testing"
@@ -15,7 +16,7 @@ func newTestStore(t *testing.T) *SQLStore {
 	if err != nil {
 		t.Fatalf("NewSQLiteStore: %v", err)
 	}
-	if err := s.Init(); err != nil {
+	if err := s.Init(context.Background()); err != nil {
 		t.Fatalf("Init: %v", err)
 	}
 	return s
@@ -24,7 +25,7 @@ func newTestStore(t *testing.T) *SQLStore {
 func TestSiteCRUD(t *testing.T) {
 	s := newTestStore(t)
-	sites, err := s.GetSites()
+	sites, err := s.GetSites(context.Background())
 	if err != nil {
 		t.Fatalf("GetSites: %v", err)
 	}
@@ -32,11 +33,11 @@ func TestSiteCRUD(t *testing.T) {
 		t.Fatalf("expected 0 sites, got %d", len(sites))
 	}
-	if err := s.AddSite(models.Site{Name: "Test", URL: "https://example.com", Type: "http", Interval: 30}); err != nil {
+	if err := s.AddSite(context.Background(), models.SiteConfig{Name: "Test", URL: "https://example.com", Type: "http", Interval: 30}); err != nil {
 		t.Fatalf("AddSite: %v", err)
 	}
-	sites, err = s.GetSites()
+	sites, err = s.GetSites(context.Background())
 	if err != nil {
 		t.Fatalf("GetSites: %v", err)
 	}
@@ -48,11 +49,11 @@ func TestSiteCRUD(t *testing.T) {
 	}
 	sites[0].Name = "Updated"
-	if err := s.UpdateSite(sites[0]); err != nil {
+	if err := s.UpdateSite(context.Background(), sites[0]); err != nil {
 		t.Fatalf("UpdateSite: %v", err)
 	}
-	sites, err = s.GetSites()
+	sites, err = s.GetSites(context.Background())
 	if err != nil {
 		t.Fatalf("GetSites: %v", err)
 	}
@@ -60,11 +61,11 @@ func TestSiteCRUD(t *testing.T) {
 		t.Errorf("expected name 'Updated', got '%s'", sites[0].Name)
 	}
-	if err := s.DeleteSite(sites[0].ID); err != nil {
+	if err := s.DeleteSite(context.Background(), sites[0].ID); err != nil {
 		t.Fatalf("DeleteSite: %v", err)
 	}
-	sites, err = s.GetSites()
+	sites, err = s.GetSites(context.Background())
 	if err != nil {
 		t.Fatalf("GetSites: %v", err)
 	}
@@ -76,11 +77,11 @@ func TestSiteCRUD(t *testing.T) {
 func TestAlertCRUD(t *testing.T) {
 	s := newTestStore(t)
-	if err := s.AddAlert("Discord", "discord", map[string]string{"url": "https://example.com/hook"}); err != nil {
+	if err := s.AddAlert(context.Background(), "Discord", "discord", map[string]string{"url": "https://example.com/hook"}); err != nil {
 		t.Fatalf("AddAlert: %v", err)
 	}
-	alerts, err := s.GetAllAlerts()
+	alerts, err := s.GetAllAlerts(context.Background())
 	if err != nil {
 		t.Fatalf("GetAllAlerts: %v", err)
 	}
@@ -94,7 +95,7 @@ func TestAlertCRUD(t *testing.T) {
 		t.Errorf("settings url mismatch")
 	}
-	a, err := s.GetAlert(alerts[0].ID)
+	a, err := s.GetAlert(context.Background(), alerts[0].ID)
 	if err != nil {
 		t.Fatalf("GetAlert: %v", err)
 	}
@@ -102,11 +103,11 @@ func TestAlertCRUD(t *testing.T) {
 		t.Errorf("expected name 'Discord', got '%s'", a.Name)
 	}
-	if err := s.UpdateAlert(a.ID, "Slack", "slack", map[string]string{"url": "https://slack.com/hook"}); err != nil {
+	if err := s.UpdateAlert(context.Background(), a.ID, "Slack", "slack", map[string]string{"url": "https://slack.com/hook"}); err != nil {
 		t.Fatalf("UpdateAlert: %v", err)
 	}
-	a, err = s.GetAlert(a.ID)
+	a, err = s.GetAlert(context.Background(), a.ID)
 	if err != nil {
 		t.Fatalf("GetAlert: %v", err)
 	}
@@ -114,11 +115,11 @@ func TestAlertCRUD(t *testing.T) {
 		t.Errorf("expected type 'slack', got '%s'", a.Type)
 	}
-	if err := s.DeleteAlert(a.ID); err != nil {
+	if err := s.DeleteAlert(context.Background(), a.ID); err != nil {
 		t.Fatalf("DeleteAlert: %v", err)
 	}
-	alerts, err = s.GetAllAlerts()
+	alerts, err = s.GetAllAlerts(context.Background())
 	if err != nil {
 		t.Fatalf("GetAllAlerts: %v", err)
 	}
@@ -130,11 +131,11 @@ func TestAlertCRUD(t *testing.T) {
 func TestUserCRUD(t *testing.T) {
 	s := newTestStore(t)
-	if err := s.AddUser("admin", "ssh-ed25519 AAAA...", "admin"); err != nil {
+	if err := s.AddUser(context.Background(), "admin", "ssh-ed25519 AAAA...", "admin"); err != nil {
 		t.Fatalf("AddUser: %v", err)
 	}
-	users, err := s.GetAllUsers()
+	users, err := s.GetAllUsers(context.Background())
 	if err != nil {
 		t.Fatalf("GetAllUsers: %v", err)
 	}
@@ -145,11 +146,11 @@ func TestUserCRUD(t *testing.T) {
 		t.Errorf("expected username 'admin', got '%s'", users[0].Username)
 	}
-	if err := s.UpdateUser(users[0].ID, "root", "ssh-ed25519 BBBB...", "admin"); err != nil {
+	if err := s.UpdateUser(context.Background(), users[0].ID, "root", "ssh-ed25519 BBBB...", "admin"); err != nil {
 		t.Fatalf("UpdateUser: %v", err)
 	}
-	users, err = s.GetAllUsers()
+	users, err = s.GetAllUsers(context.Background())
 	if err != nil {
 		t.Fatalf("GetAllUsers: %v", err)
 	}
@@ -157,11 +158,11 @@ func TestUserCRUD(t *testing.T) {
 		t.Errorf("expected username 'root', got '%s'", users[0].Username)
 	}
-	if err := s.DeleteUser(users[0].ID); err != nil {
+	if err := s.DeleteUser(context.Background(), users[0].ID); err != nil {
 		t.Fatalf("DeleteUser: %v", err)
 	}
-	users, err = s.GetAllUsers()
+	users, err = s.GetAllUsers(context.Background())
 	if err != nil {
 		t.Fatalf("GetAllUsers: %v", err)
 	}
@@ -173,11 +174,11 @@ func TestUserCRUD(t *testing.T) {
 func TestPushTokenGeneration(t *testing.T) {
 	s := newTestStore(t)
-	if err := s.AddSite(models.Site{Name: "Push Monitor", Type: "push", Interval: 60}); err != nil {
+	if err := s.AddSite(context.Background(), models.SiteConfig{Name: "Push Monitor", Type: "push", Interval: 60}); err != nil {
 		t.Fatalf("AddSite: %v", err)
 	}
-	sites, err := s.GetSites()
+	sites, err := s.GetSites(context.Background())
 	if err != nil {
 		t.Fatalf("GetSites: %v", err)
 	}
@@ -195,17 +196,17 @@ func TestPushTokenGeneration(t *testing.T) {
 func TestImportExport(t *testing.T) {
 	s := newTestStore(t)
-	if err := s.AddAlert("Test Alert", "webhook", map[string]string{"url": "https://example.com"}); err != nil {
+	if err := s.AddAlert(context.Background(), "Test Alert", "webhook", map[string]string{"url": "https://example.com"}); err != nil {
 		t.Fatalf("AddAlert: %v", err)
 	}
-	if err := s.AddSite(models.Site{Name: "Site1", URL: "https://example.com", Type: "http", Interval: 30}); err != nil {
+	if err := s.AddSite(context.Background(), models.SiteConfig{Name: "Site1", URL: "https://example.com", Type: "http", Interval: 30}); err != nil {
 		t.Fatalf("AddSite: %v", err)
 	}
-	if err := s.AddUser("user1", "ssh-ed25519 KEY", "user"); err != nil {
+	if err := s.AddUser(context.Background(), "user1", "ssh-ed25519 KEY", "user"); err != nil {
 		t.Fatalf("AddUser: %v", err)
 	}
-	backup, err := s.ExportData()
+	backup, err := s.ExportData(context.Background())
 	if err != nil {
 		t.Fatalf("ExportData: %v", err)
 	}
@@ -214,19 +215,19 @@ func TestImportExport(t *testing.T) {
 	}
 	s2 := newTestStore(t)
-	if err := s2.ImportData(backup); err != nil {
+	if err := s2.ImportData(context.Background(), backup); err != nil {
 		t.Fatalf("ImportData: %v", err)
 	}
-	sites, err := s2.GetSites()
+	sites, err := s2.GetSites(context.Background())
 	if err != nil {
 		t.Fatalf("GetSites: %v", err)
 	}
-	alerts, err := s2.GetAllAlerts()
+	alerts, err := s2.GetAllAlerts(context.Background())
 	if err != nil {
 		t.Fatalf("GetAllAlerts: %v", err)
 	}
-	users, err := s2.GetAllUsers()
+	users, err := s2.GetAllUsers(context.Background())
 	if err != nil {
 		t.Fatalf("GetAllUsers: %v", err)
 	}
@@ -235,20 +236,85 @@ func TestImportExport(t *testing.T) {
 	}
 }
 // TestImportData_WipesHistory checks that ImportData clears previously
 // recorded check history and state changes: it seeds a site with one check,
 // one state change and one alert-health row, imports a backup holding only a
 // replacement site, and then expects both history queries to come back empty.
 func TestImportData_WipesHistory(t *testing.T) {
 	s := newTestStore(t)
 	if err := s.AddSite(context.Background(), models.SiteConfig{Name: "OldSite", URL: "https://old.com", Type: "http", Interval: 30}); err != nil {
 		t.Fatalf("AddSite: %v", err)
 	}
 	// The literal ID 1 below presumably matches the ID given to the first
 	// site in a fresh store — confirm against AddSite.
 	if err := s.SaveCheck(context.Background(), 1, 5000, true); err != nil {
 		t.Fatalf("SaveCheck: %v", err)
 	}
 	if err := s.SaveStateChange(context.Background(), 1, "UP", "DOWN", "timeout"); err != nil {
 		t.Fatalf("SaveStateChange: %v", err)
 	}
 	// NOTE(review): an alert_health row is seeded here, but nothing below
 	// asserts on it after the import.
 	if err := s.SaveAlertHealth(context.Background(), models.AlertHealthRecord{AlertID: 1, LastSendOK: true, SendCount: 1}); err != nil {
 		t.Fatalf("SaveAlertHealth: %v", err)
 	}
 	backup := models.Backup{
 		Sites: []models.SiteConfig{{ID: 1, Name: "NewSite", URL: "https://new.com", Type: "http", Interval: 60}},
 	}
 	if err := s.ImportData(context.Background(), backup); err != nil {
 		t.Fatalf("ImportData: %v", err)
 	}
 	history, err := s.LoadAllHistory(context.Background(), 100)
 	if err != nil {
 		t.Fatalf("LoadAllHistory: %v", err)
 	}
 	if len(history) != 0 {
 		t.Errorf("expected empty check_history after import, got %d sites with history", len(history))
 	}
 	changes, err := s.GetStateChanges(context.Background(), 1, 100)
 	if err != nil {
 		t.Fatalf("GetStateChanges: %v", err)
 	}
 	if len(changes) != 0 {
 		t.Errorf("expected empty state_changes after import, got %d", len(changes))
 	}
 }
 // TestImportData_NilUsersPreservesExisting checks that importing a backup
 // whose Users field is nil leaves the users table alone: the admin user added
 // before the import must be the only user afterwards.
 func TestImportData_NilUsersPreservesExisting(t *testing.T) {
 	s := newTestStore(t)
 	if err := s.AddUser(context.Background(), "admin", "ssh-ed25519 ADMINKEY", "admin"); err != nil {
 		t.Fatalf("AddUser: %v", err)
 	}
 	// Users is set to nil explicitly to make the case under test obvious.
 	backup := models.Backup{
 		Sites:  []models.SiteConfig{{ID: 1, Name: "New", URL: "https://new.com", Type: "http", Interval: 30}},
 		Alerts: []models.AlertConfig{{ID: 1, Name: "a", Type: "webhook", Settings: map[string]string{"url": "https://h.com"}}},
 		Users:  nil,
 	}
 	if err := s.ImportData(context.Background(), backup); err != nil {
 		t.Fatalf("ImportData: %v", err)
 	}
 	users, err := s.GetAllUsers(context.Background())
 	if err != nil {
 		t.Fatalf("GetAllUsers: %v", err)
 	}
 	if len(users) != 1 || users[0].Username != "admin" {
 		t.Errorf("expected existing admin user preserved, got %d users", len(users))
 	}
 }
 func TestCheckHistory(t *testing.T) {
 	s := newTestStore(t)
-	if err := s.SaveCheck(1, 5000000, true); err != nil {
+	if err := s.SaveCheck(context.Background(), 1, 5000000, true); err != nil {
 		t.Fatalf("SaveCheck: %v", err)
 	}
-	if err := s.SaveCheck(1, 10000000, false); err != nil {
+	if err := s.SaveCheck(context.Background(), 1, 10000000, false); err != nil {
 		t.Fatalf("SaveCheck: %v", err)
 	}
-	if err := s.SaveCheck(2, 3000000, true); err != nil {
+	if err := s.SaveCheck(context.Background(), 2, 3000000, true); err != nil {
 		t.Fatalf("SaveCheck site 2: %v", err)
 	}
-	history, err := s.LoadAllHistory(10)
+	history, err := s.LoadAllHistory(context.Background(), 10)
 	if err != nil {
 		t.Fatalf("LoadAllHistory: %v", err)
 	}
@@ -273,17 +339,17 @@ func TestCheckHistory(t *testing.T) {
 func TestDeleteSiteCascade(t *testing.T) {
 	s := newTestStore(t)
-	site := models.Site{Name: "Cascade Test", URL: "https://example.com", Interval: 30}
+	site := models.SiteConfig{Name: "Cascade Test", URL: "https://example.com", Interval: 30}
-	if err := s.AddSite(site); err != nil {
+	if err := s.AddSite(context.Background(), site); err != nil {
 		t.Fatalf("AddSite: %v", err)
 	}
-	sites, _ := s.GetSites()
+	sites, _ := s.GetSites(context.Background())
 	siteID := sites[0].ID
-	if err := s.SaveCheck(siteID, 1000, true); err != nil {
+	if err := s.SaveCheck(context.Background(), siteID, 1000, true); err != nil {
 		t.Fatalf("SaveCheck: %v", err)
 	}
-	if err := s.SaveStateChange(siteID, "UP", "DOWN", "timeout"); err != nil {
+	if err := s.SaveStateChange(context.Background(), siteID, "UP", "DOWN", "timeout"); err != nil {
 		t.Fatalf("SaveStateChange: %v", err)
 	}
 	mw := models.MaintenanceWindow{
@@ -292,25 +358,25 @@ func TestDeleteSiteCascade(t *testing.T) {
 		Type:      "maintenance",
 		StartTime: time.Now(),
 	}
-	if err := s.AddMaintenanceWindow(mw); err != nil {
+	if err := s.AddMaintenanceWindow(context.Background(), mw); err != nil {
 		t.Fatalf("AddMaintenanceWindow: %v", err)
 	}
-	if err := s.DeleteSite(siteID); err != nil {
+	if err := s.DeleteSite(context.Background(), siteID); err != nil {
 		t.Fatalf("DeleteSite: %v", err)
 	}
-	history, _ := s.LoadAllHistory(100)
+	history, _ := s.LoadAllHistory(context.Background(), 100)
 	if len(history[siteID]) != 0 {
 		t.Errorf("expected 0 check_history rows, got %d", len(history[siteID]))
 	}
-	changes, _ := s.GetStateChanges(siteID, 100)
+	changes, _ := s.GetStateChanges(context.Background(), siteID, 100)
 	if len(changes) != 0 {
 		t.Errorf("expected 0 state_changes rows, got %d", len(changes))
 	}
-	windows, _ := s.GetActiveMaintenanceWindows()
+	windows, _ := s.GetActiveMaintenanceWindows(context.Background())
 	for _, w := range windows {
 		if w.MonitorID == siteID {
 			t.Errorf("orphaned maintenance window found: id=%d", w.ID)
@@ -322,15 +388,15 @@ func TestPruneLogs(t *testing.T) {
 	s := newTestStore(t)
 	for i := 0; i < maxLogRows+50; i++ {
-		if err := s.SaveLog(fmt.Sprintf("log %d", i)); err != nil {
+		if err := s.SaveLog(context.Background(), fmt.Sprintf("log %d", i)); err != nil {
 			t.Fatalf("SaveLog: %v", err)
 		}
 	}
-	if err := s.PruneLogs(); err != nil {
+	if err := s.PruneLogs(context.Background()); err != nil {
 		t.Fatalf("PruneLogs: %v", err)
 	}
-	logs, err := s.LoadLogs(maxLogRows * 2)
+	logs, err := s.LoadLogs(context.Background(), maxLogRows*2)
 	if err != nil {
 		t.Fatalf("LoadLogs: %v", err)
 	}
@@ -355,21 +421,21 @@ func TestPruneCheckHistory(t *testing.T) {
 	s := newTestStore(t)
 	for i := 0; i < maxCheckHistory+5; i++ {
-		if err := s.SaveCheck(1, int64(i), true); err != nil {
+		if err := s.SaveCheck(context.Background(), 1, int64(i), true); err != nil {
 			t.Fatalf("SaveCheck site 1: %v", err)
 		}
 	}
 	for i := 0; i < 3; i++ {
-		if err := s.SaveCheck(2, int64(i), true); err != nil {
+		if err := s.SaveCheck(context.Background(), 2, int64(i), true); err != nil {
 			t.Fatalf("SaveCheck site 2: %v", err)
 		}
 	}
-	if err := s.PruneCheckHistory(); err != nil {
+	if err := s.PruneCheckHistory(context.Background()); err != nil {
 		t.Fatalf("PruneCheckHistory: %v", err)
 	}
-	history, err := s.LoadAllHistory(maxCheckHistory * 2)
+	history, err := s.LoadAllHistory(context.Background(), maxCheckHistory*2)
 	if err != nil {
 		t.Fatalf("LoadAllHistory: %v", err)
 	}
@@ -394,7 +460,7 @@ func TestPruneExpiredMaintenanceWindows(t *testing.T) {
 		StartTime: now.Add(-11 * 24 * time.Hour),
 		EndTime:   now.Add(-10 * 24 * time.Hour),
 	}
-	if err := s.AddMaintenanceWindow(old); err != nil {
+	if err := s.AddMaintenanceWindow(context.Background(), old); err != nil {
 		t.Fatalf("AddMaintenanceWindow (old): %v", err)
 	}
@@ -406,7 +472,7 @@ func TestPruneExpiredMaintenanceWindows(t *testing.T) {
 		StartTime: now.Add(-2 * 24 * time.Hour),
 		EndTime:   now.Add(-1 * 24 * time.Hour),
 	}
-	if err := s.AddMaintenanceWindow(recent); err != nil {
+	if err := s.AddMaintenanceWindow(context.Background(), recent); err != nil {
 		t.Fatalf("AddMaintenanceWindow (recent): %v", err)
 	}
@@ -417,11 +483,11 @@ func TestPruneExpiredMaintenanceWindows(t *testing.T) {
 		Type:      "maintenance",
 		StartTime: now.Add(-1 * time.Hour),
 	}
-	if err := s.AddMaintenanceWindow(ongoing); err != nil {
+	if err := s.AddMaintenanceWindow(context.Background(), ongoing); err != nil {
 		t.Fatalf("AddMaintenanceWindow (ongoing): %v", err)
 	}
-	pruned, err := s.PruneExpiredMaintenanceWindows(7 * 24 * time.Hour)
+	pruned, err := s.PruneExpiredMaintenanceWindows(context.Background(), 7*24*time.Hour)
 	if err != nil {
 		t.Fatalf("PruneExpiredMaintenanceWindows: %v", err)
 	}
@@ -429,7 +495,7 @@ func TestPruneExpiredMaintenanceWindows(t *testing.T) {
 		t.Errorf("expected 1 pruned, got %d", pruned)
 	}
-	all, err := s.GetAllMaintenanceWindows(100)
+	all, err := s.GetAllMaintenanceWindows(context.Background(), 100)
 	if err != nil {
 		t.Fatalf("GetAllMaintenanceWindows: %v", err)
 	}
@@ -458,7 +524,7 @@ func TestImportData_EncryptsAlertSettings(t *testing.T) {
 			{ID: 1, Name: "tg", Type: "telegram", Settings: map[string]string{"token": "123:SECRET", "chat_id": "42"}},
 		},
 	}
-	if err := s.ImportData(backup); err != nil {
+	if err := s.ImportData(context.Background(), backup); err != nil {
 		t.Fatalf("ImportData: %v", err)
 	}
@@ -473,7 +539,7 @@ func TestImportData_EncryptsAlertSettings(t *testing.T) {
 		t.Errorf("plaintext secret found in stored column: %q", raw)
 	}
-	alerts, err := s.GetAllAlerts()
+	alerts, err := s.GetAllAlerts(context.Background())
 	if err != nil {
 		t.Fatalf("GetAllAlerts: %v", err)
 	}
@@ -1,84 +1,85 @@
 package store
 import (
 	"context"
 	"time"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 )
 type Store interface {
-	Init() error
+	Init(ctx context.Context) error
 	// Sites
-	GetSites() ([]models.Site, error)
+	GetSites(ctx context.Context) ([]models.SiteConfig, error)
-	AddSite(site models.Site) error
+	AddSite(ctx context.Context, site models.SiteConfig) error
-	UpdateSite(site models.Site) error
+	UpdateSite(ctx context.Context, site models.SiteConfig) error
-	UpdateSitePaused(id int, paused bool) error
+	UpdateSitePaused(ctx context.Context, id int, paused bool) error
-	DeleteSite(id int) error
+	DeleteSite(ctx context.Context, id int) error
 	// Alerts
-	GetAllAlerts() ([]models.AlertConfig, error)
+	GetAllAlerts(ctx context.Context) ([]models.AlertConfig, error)
-	GetAlert(id int) (models.AlertConfig, error)
+	GetAlert(ctx context.Context, id int) (models.AlertConfig, error)
-	AddAlert(name, aType string, settings map[string]string) error
+	AddAlert(ctx context.Context, name, aType string, settings map[string]string) error
-	UpdateAlert(id int, name, aType string, settings map[string]string) error
+	UpdateAlert(ctx context.Context, id int, name, aType string, settings map[string]string) error
-	DeleteAlert(id int) error
+	DeleteAlert(ctx context.Context, id int) error
 	// Declarative config support
-	GetSiteByName(name string) (models.Site, error)
+	GetSiteByName(ctx context.Context, name string) (models.SiteConfig, error)
-	GetAlertByName(name string) (models.AlertConfig, error)
+	GetAlertByName(ctx context.Context, name string) (models.AlertConfig, error)
-	AddSiteReturningID(site models.Site) (int, error)
+	AddSiteReturningID(ctx context.Context, site models.SiteConfig) (int, error)
-	AddAlertReturningID(name, aType string, settings map[string]string) (int, error)
+	AddAlertReturningID(ctx context.Context, name, aType string, settings map[string]string) (int, error)
 	// Users
-	GetAllUsers() ([]models.User, error)
+	GetAllUsers(ctx context.Context) ([]models.User, error)
-	AddUser(username, publicKey, role string) error
+	AddUser(ctx context.Context, username, publicKey, role string) error
-	UpdateUser(id int, username, publicKey, role string) error
+	UpdateUser(ctx context.Context, id int, username, publicKey, role string) error
-	DeleteUser(id int) error
+	DeleteUser(ctx context.Context, id int) error
 	// History
-	SaveCheck(siteID int, latencyNs int64, isUp bool) error
+	SaveCheck(ctx context.Context, siteID int, latencyNs int64, isUp bool) error
-	SaveCheckFromNode(siteID int, nodeID string, latencyNs int64, isUp bool) error
+	SaveCheckFromNode(ctx context.Context, siteID int, nodeID string, latencyNs int64, isUp bool) error
-	LoadAllHistory(limit int) (map[int][]models.CheckRecord, error)
+	LoadAllHistory(ctx context.Context, limit int) (map[int][]models.CheckRecord, error)
-	PruneCheckHistory() error
+	PruneCheckHistory(ctx context.Context) error
 	// State Changes
-	SaveStateChange(siteID int, fromStatus, toStatus, errorReason string) error
+	SaveStateChange(ctx context.Context, siteID int, fromStatus, toStatus, errorReason string) error
-	GetStateChanges(siteID int, limit int) ([]models.StateChange, error)
+	GetStateChanges(ctx context.Context, siteID int, limit int) ([]models.StateChange, error)
-	GetStateChangesSince(siteID int, since time.Time) ([]models.StateChange, error)
+	GetStateChangesSince(ctx context.Context, siteID int, since time.Time) ([]models.StateChange, error)
-	PruneStateChanges() error
+	PruneStateChanges(ctx context.Context) error
 	// Nodes
-	RegisterNode(node models.ProbeNode) error
+	RegisterNode(ctx context.Context, node models.ProbeNode) error
-	GetNode(id string) (models.ProbeNode, error)
+	GetNode(ctx context.Context, id string) (models.ProbeNode, error)
-	GetAllNodes() ([]models.ProbeNode, error)
+	GetAllNodes(ctx context.Context) ([]models.ProbeNode, error)
-	UpdateNodeLastSeen(id string) error
+	UpdateNodeLastSeen(ctx context.Context, id string) error
-	DeleteNode(id string) error
+	DeleteNode(ctx context.Context, id string) error
 	// Alert Health
-	LoadAlertHealth() (map[int]models.AlertHealthRecord, error)
+	LoadAlertHealth(ctx context.Context) (map[int]models.AlertHealthRecord, error)
-	SaveAlertHealth(h models.AlertHealthRecord) error
+	SaveAlertHealth(ctx context.Context, h models.AlertHealthRecord) error
 	// Logs
-	SaveLog(message string) error
+	SaveLog(ctx context.Context, message string) error
-	LoadLogs(limit int) ([]string, error)
+	LoadLogs(ctx context.Context, limit int) ([]string, error)
-	PruneLogs() error
+	PruneLogs(ctx context.Context) error
 	// Maintenance Windows
-	GetActiveMaintenanceWindows() ([]models.MaintenanceWindow, error)
+	GetActiveMaintenanceWindows(ctx context.Context) ([]models.MaintenanceWindow, error)
-	GetAllMaintenanceWindows(limit int) ([]models.MaintenanceWindow, error)
+	GetAllMaintenanceWindows(ctx context.Context, limit int) ([]models.MaintenanceWindow, error)
-	AddMaintenanceWindow(mw models.MaintenanceWindow) error
+	AddMaintenanceWindow(ctx context.Context, mw models.MaintenanceWindow) error
-	EndMaintenanceWindow(id int) error
+	EndMaintenanceWindow(ctx context.Context, id int) error
-	DeleteMaintenanceWindow(id int) error
+	DeleteMaintenanceWindow(ctx context.Context, id int) error
-	PruneExpiredMaintenanceWindows(retention time.Duration) (int64, error)
+	PruneExpiredMaintenanceWindows(ctx context.Context, retention time.Duration) (int64, error)
-	IsMonitorInMaintenance(monitorID int) (bool, error)
+	IsMonitorInMaintenance(ctx context.Context, monitorID int) (bool, error)
 	// Preferences
-	GetPreference(key string) (string, error)
+	GetPreference(ctx context.Context, key string) (string, error)
-	SetPreference(key, value string) error
+	SetPreference(ctx context.Context, key, value string) error
 	// Backup & Restore
-	ExportData() (models.Backup, error)
+	ExportData(ctx context.Context) (models.Backup, error)
-	ImportData(data models.Backup) error
+	ImportData(ctx context.Context, data models.Backup) error
 	// Lifecycle
 	Close() error
@@ -0,0 +1,276 @@
 package storetest
 import (
 	"context"
 	"time"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 )
 // BaseMock implements store.Store with no-op defaults. Embed it in test-specific
 // mocks and override only the methods you need via the exported Func fields or
 // by shadowing the method on the embedding struct.
 //
 // Each XxxFunc field is an optional hook: when it is non-nil the matching Xxx
 // method forwards its arguments to it and returns its results; when it is nil
 // the method returns zero values and a nil error. Methods without a hook field
 // always return zero values.
 type BaseMock struct {
 	GetSitesFunc                    func(ctx context.Context) ([]models.SiteConfig, error)
 	AddSiteFunc                     func(ctx context.Context, site models.SiteConfig) error
 	UpdateSiteFunc                  func(ctx context.Context, site models.SiteConfig) error
 	GetAllAlertsFunc                func(ctx context.Context) ([]models.AlertConfig, error)
 	GetAlertFunc                    func(ctx context.Context, id int) (models.AlertConfig, error)
 	GetAllUsersFunc                 func(ctx context.Context) ([]models.User, error)
 	GetAllNodesFunc                 func(ctx context.Context) ([]models.ProbeNode, error)
 	GetActiveMaintenanceWindowsFunc func(ctx context.Context) ([]models.MaintenanceWindow, error)
 	GetAllMaintenanceWindowsFunc    func(ctx context.Context, limit int) ([]models.MaintenanceWindow, error)
 	IsMonitorInMaintenanceFunc      func(ctx context.Context, id int) (bool, error)
 	LoadAlertHealthFunc             func(ctx context.Context) (map[int]models.AlertHealthRecord, error)
 	LoadAllHistoryFunc              func(ctx context.Context, limit int) (map[int][]models.CheckRecord, error)
 	SaveCheckFunc                   func(ctx context.Context, siteID int, latencyNs int64, isUp bool) error
 	SaveCheckFromNodeFunc           func(ctx context.Context, siteID int, nodeID string, latencyNs int64, isUp bool) error
 	SaveLogFunc                     func(ctx context.Context, message string) error
 	SaveStateChangeFunc             func(ctx context.Context, siteID int, from, to, reason string) error
 	SaveAlertHealthFunc             func(ctx context.Context, h models.AlertHealthRecord) error
 	GetStateChangesFunc             func(ctx context.Context, siteID, limit int) ([]models.StateChange, error)
 	GetStateChangesSinceFunc        func(ctx context.Context, siteID int, since time.Time) ([]models.StateChange, error)
 	ExportDataFunc                  func(ctx context.Context) (models.Backup, error)
 	ImportDataFunc                  func(ctx context.Context, data models.Backup) error
 	RegisterNodeFunc                func(ctx context.Context, node models.ProbeNode) error
 	GetNodeFunc                     func(ctx context.Context, id string) (models.ProbeNode, error)
 	GetPreferenceFunc               func(ctx context.Context, key string) (string, error)
 	SetPreferenceFunc               func(ctx context.Context, key, value string) error
 }
 // Init is a no-op that always returns nil.
 func (m *BaseMock) Init(_ context.Context) error { return nil }
 // Close is a no-op that always returns nil.
 func (m *BaseMock) Close() error { return nil }
 // GetSites forwards to GetSitesFunc when set; otherwise it returns (nil, nil).
 func (m *BaseMock) GetSites(ctx context.Context) ([]models.SiteConfig, error) {
 	if m.GetSitesFunc == nil {
 		return nil, nil
 	}
 	return m.GetSitesFunc(ctx)
 }
 // AddSite forwards to AddSiteFunc when set; otherwise it returns nil.
 func (m *BaseMock) AddSite(ctx context.Context, site models.SiteConfig) error {
 	if m.AddSiteFunc == nil {
 		return nil
 	}
 	return m.AddSiteFunc(ctx, site)
 }
 // UpdateSite forwards to UpdateSiteFunc when set; otherwise it returns nil.
 func (m *BaseMock) UpdateSite(ctx context.Context, site models.SiteConfig) error {
 	if m.UpdateSiteFunc == nil {
 		return nil
 	}
 	return m.UpdateSiteFunc(ctx, site)
 }
 // UpdateSitePaused is a no-op that always returns nil.
 func (m *BaseMock) UpdateSitePaused(_ context.Context, _ int, _ bool) error { return nil }
 // DeleteSite is a no-op that always returns nil.
 func (m *BaseMock) DeleteSite(_ context.Context, _ int) error { return nil }
 // GetAllAlerts forwards to GetAllAlertsFunc when set; otherwise it returns
 // (nil, nil).
 func (m *BaseMock) GetAllAlerts(ctx context.Context) ([]models.AlertConfig, error) {
 	if m.GetAllAlertsFunc == nil {
 		return nil, nil
 	}
 	return m.GetAllAlertsFunc(ctx)
 }
 // GetAlert forwards to GetAlertFunc when set; otherwise it returns a zero
 // AlertConfig and a nil error.
 func (m *BaseMock) GetAlert(ctx context.Context, id int) (models.AlertConfig, error) {
 	if m.GetAlertFunc == nil {
 		return models.AlertConfig{}, nil
 	}
 	return m.GetAlertFunc(ctx, id)
 }
 // AddAlert is a no-op that always returns nil.
 func (m *BaseMock) AddAlert(_ context.Context, _, _ string, _ map[string]string) error {
 	return nil
 }
 // UpdateAlert is a no-op that always returns nil.
 func (m *BaseMock) UpdateAlert(_ context.Context, _ int, _, _ string, _ map[string]string) error {
 	return nil
 }
 // DeleteAlert is a no-op that always returns nil.
 func (m *BaseMock) DeleteAlert(_ context.Context, _ int) error { return nil }
 // GetSiteByName always returns a zero SiteConfig and a nil error.
 func (m *BaseMock) GetSiteByName(_ context.Context, _ string) (models.SiteConfig, error) {
 	return models.SiteConfig{}, nil
 }
 // GetAlertByName always returns a zero AlertConfig and a nil error.
 func (m *BaseMock) GetAlertByName(_ context.Context, _ string) (models.AlertConfig, error) {
 	return models.AlertConfig{}, nil
 }
 // AddSiteReturningID always returns ID 0 and a nil error.
 func (m *BaseMock) AddSiteReturningID(_ context.Context, _ models.SiteConfig) (int, error) {
 	return 0, nil
 }
 // AddAlertReturningID always returns ID 0 and a nil error.
 func (m *BaseMock) AddAlertReturningID(_ context.Context, _, _ string, _ map[string]string) (int, error) {
 	return 0, nil
 }
 // GetAllUsers forwards to GetAllUsersFunc when set; otherwise it returns
 // (nil, nil).
 func (m *BaseMock) GetAllUsers(ctx context.Context) ([]models.User, error) {
 	if m.GetAllUsersFunc == nil {
 		return nil, nil
 	}
 	return m.GetAllUsersFunc(ctx)
 }
 // AddUser is a no-op that always returns nil.
 func (m *BaseMock) AddUser(_ context.Context, _, _, _ string) error { return nil }
 // UpdateUser is a no-op that always returns nil.
 func (m *BaseMock) UpdateUser(_ context.Context, _ int, _, _, _ string) error {
 	return nil
 }
 // DeleteUser is a no-op that always returns nil.
 func (m *BaseMock) DeleteUser(_ context.Context, _ int) error { return nil }
 // SaveCheck forwards to SaveCheckFunc when set; otherwise it returns nil.
 func (m *BaseMock) SaveCheck(ctx context.Context, siteID int, latencyNs int64, isUp bool) error {
 	if m.SaveCheckFunc == nil {
 		return nil
 	}
 	return m.SaveCheckFunc(ctx, siteID, latencyNs, isUp)
 }
 // SaveCheckFromNode forwards to SaveCheckFromNodeFunc when set; otherwise it
 // returns nil.
 func (m *BaseMock) SaveCheckFromNode(ctx context.Context, siteID int, nodeID string, latencyNs int64, isUp bool) error {
 	if m.SaveCheckFromNodeFunc == nil {
 		return nil
 	}
 	return m.SaveCheckFromNodeFunc(ctx, siteID, nodeID, latencyNs, isUp)
 }
 // LoadAllHistory forwards to LoadAllHistoryFunc when set; otherwise it returns
 // (nil, nil).
 func (m *BaseMock) LoadAllHistory(ctx context.Context, limit int) (map[int][]models.CheckRecord, error) {
 	if m.LoadAllHistoryFunc == nil {
 		return nil, nil
 	}
 	return m.LoadAllHistoryFunc(ctx, limit)
 }
 // PruneCheckHistory is a no-op that always returns nil.
 func (m *BaseMock) PruneCheckHistory(_ context.Context) error { return nil }
 // SaveStateChange forwards to SaveStateChangeFunc when set; otherwise it
 // returns nil.
 func (m *BaseMock) SaveStateChange(ctx context.Context, siteID int, from, to, reason string) error {
 	if m.SaveStateChangeFunc == nil {
 		return nil
 	}
 	return m.SaveStateChangeFunc(ctx, siteID, from, to, reason)
 }
 // GetStateChanges forwards to GetStateChangesFunc when set; otherwise it
 // returns (nil, nil).
 func (m *BaseMock) GetStateChanges(ctx context.Context, siteID, limit int) ([]models.StateChange, error) {
 	if m.GetStateChangesFunc == nil {
 		return nil, nil
 	}
 	return m.GetStateChangesFunc(ctx, siteID, limit)
 }
 // GetStateChangesSince forwards to GetStateChangesSinceFunc when set;
 // otherwise it returns (nil, nil).
 func (m *BaseMock) GetStateChangesSince(ctx context.Context, siteID int, since time.Time) ([]models.StateChange, error) {
 	if m.GetStateChangesSinceFunc == nil {
 		return nil, nil
 	}
 	return m.GetStateChangesSinceFunc(ctx, siteID, since)
 }
 // PruneStateChanges is a no-op that always returns nil.
 func (m *BaseMock) PruneStateChanges(_ context.Context) error { return nil }
 // RegisterNode forwards to RegisterNodeFunc when set; otherwise it returns nil.
 func (m *BaseMock) RegisterNode(ctx context.Context, node models.ProbeNode) error {
 	if m.RegisterNodeFunc == nil {
 		return nil
 	}
 	return m.RegisterNodeFunc(ctx, node)
 }
 // GetNode forwards to GetNodeFunc when set; otherwise it returns a zero
 // ProbeNode and a nil error.
 func (m *BaseMock) GetNode(ctx context.Context, id string) (models.ProbeNode, error) {
 	if m.GetNodeFunc == nil {
 		return models.ProbeNode{}, nil
 	}
 	return m.GetNodeFunc(ctx, id)
 }
 // GetAllNodes forwards to GetAllNodesFunc when set; otherwise it returns
 // (nil, nil).
 func (m *BaseMock) GetAllNodes(ctx context.Context) ([]models.ProbeNode, error) {
 	if m.GetAllNodesFunc == nil {
 		return nil, nil
 	}
 	return m.GetAllNodesFunc(ctx)
 }
 // UpdateNodeLastSeen is a no-op that always returns nil.
 func (m *BaseMock) UpdateNodeLastSeen(_ context.Context, _ string) error { return nil }
 // DeleteNode is a no-op that always returns nil.
 func (m *BaseMock) DeleteNode(_ context.Context, _ string) error { return nil }
 // LoadAlertHealth forwards to LoadAlertHealthFunc when set; otherwise it
 // returns (nil, nil).
 func (m *BaseMock) LoadAlertHealth(ctx context.Context) (map[int]models.AlertHealthRecord, error) {
 	if m.LoadAlertHealthFunc == nil {
 		return nil, nil
 	}
 	return m.LoadAlertHealthFunc(ctx)
 }
 // SaveAlertHealth forwards to SaveAlertHealthFunc when set; otherwise it
 // returns nil.
 func (m *BaseMock) SaveAlertHealth(ctx context.Context, h models.AlertHealthRecord) error {
 	if m.SaveAlertHealthFunc == nil {
 		return nil
 	}
 	return m.SaveAlertHealthFunc(ctx, h)
 }
 // SaveLog forwards to SaveLogFunc when set; otherwise it returns nil.
 func (m *BaseMock) SaveLog(ctx context.Context, message string) error {
 	if m.SaveLogFunc == nil {
 		return nil
 	}
 	return m.SaveLogFunc(ctx, message)
 }
 // LoadLogs always returns (nil, nil).
 func (m *BaseMock) LoadLogs(_ context.Context, _ int) ([]string, error) { return nil, nil }
 // PruneLogs is a no-op that always returns nil.
 func (m *BaseMock) PruneLogs(_ context.Context) error { return nil }
 // GetActiveMaintenanceWindows forwards to GetActiveMaintenanceWindowsFunc when
 // set; otherwise it returns (nil, nil).
 func (m *BaseMock) GetActiveMaintenanceWindows(ctx context.Context) ([]models.MaintenanceWindow, error) {
 	if m.GetActiveMaintenanceWindowsFunc == nil {
 		return nil, nil
 	}
 	return m.GetActiveMaintenanceWindowsFunc(ctx)
 }
 // GetAllMaintenanceWindows forwards to GetAllMaintenanceWindowsFunc when set;
 // otherwise it returns (nil, nil).
 func (m *BaseMock) GetAllMaintenanceWindows(ctx context.Context, limit int) ([]models.MaintenanceWindow, error) {
 	if m.GetAllMaintenanceWindowsFunc == nil {
 		return nil, nil
 	}
 	return m.GetAllMaintenanceWindowsFunc(ctx, limit)
 }
 // AddMaintenanceWindow is a no-op that always returns nil.
 func (m *BaseMock) AddMaintenanceWindow(_ context.Context, _ models.MaintenanceWindow) error {
 	return nil
 }
 // EndMaintenanceWindow is a no-op that always returns nil.
 func (m *BaseMock) EndMaintenanceWindow(_ context.Context, _ int) error { return nil }
 // DeleteMaintenanceWindow is a no-op that always returns nil.
 func (m *BaseMock) DeleteMaintenanceWindow(_ context.Context, _ int) error { return nil }
 // PruneExpiredMaintenanceWindows always reports 0 pruned rows and a nil error.
 func (m *BaseMock) PruneExpiredMaintenanceWindows(_ context.Context, _ time.Duration) (int64, error) {
 	return 0, nil
 }
 // IsMonitorInMaintenance forwards to IsMonitorInMaintenanceFunc when set;
 // otherwise it returns (false, nil).
 func (m *BaseMock) IsMonitorInMaintenance(ctx context.Context, id int) (bool, error) {
 	if m.IsMonitorInMaintenanceFunc == nil {
 		return false, nil
 	}
 	return m.IsMonitorInMaintenanceFunc(ctx, id)
 }
 // GetPreference forwards to GetPreferenceFunc when set; otherwise it returns
 // an empty string and a nil error.
 func (m *BaseMock) GetPreference(ctx context.Context, key string) (string, error) {
 	if m.GetPreferenceFunc == nil {
 		return "", nil
 	}
 	return m.GetPreferenceFunc(ctx, key)
 }
 // SetPreference forwards to SetPreferenceFunc when set; otherwise it returns
 // nil.
 func (m *BaseMock) SetPreference(ctx context.Context, key, value string) error {
 	if m.SetPreferenceFunc == nil {
 		return nil
 	}
 	return m.SetPreferenceFunc(ctx, key, value)
 }
 // ExportData forwards to ExportDataFunc when set; otherwise it returns a zero
 // Backup and a nil error.
 func (m *BaseMock) ExportData(ctx context.Context) (models.Backup, error) {
 	if m.ExportDataFunc == nil {
 		return models.Backup{}, nil
 	}
 	return m.ExportDataFunc(ctx)
 }
 // ImportData forwards to ImportDataFunc when set; otherwise it returns nil.
 func (m *BaseMock) ImportData(ctx context.Context, data models.Backup) error {
 	if m.ImportDataFunc == nil {
 		return nil
 	}
 	return m.ImportDataFunc(ctx, data)
 }
@@ -1,103 +0,0 @@
 package tui
 // braillePlane is a subpixel canvas where each terminal cell maps to a 2×4
 // dot grid, rendered via Unicode braille (U+2800..U+28FF).
 //
 // Dots are stored row-major: the dot at (x, y) is dots[y*wDots+x].
 type braillePlane struct {
 	wCells, hCells int    // size in terminal cells
 	wDots, hDots   int    // size in dots: wCells*2 by hCells*4
 	dots           []bool // true where a dot is lit
 }
 // newBraillePlane allocates a blank plane of wCells by hCells terminal cells.
 //
 // Negative dimensions are clamped to zero. The result is then an empty plane
 // on which set, line and fillBelow do nothing and cellMask returns 0.
 func newBraillePlane(wCells, hCells int) *braillePlane {
 	// Without the clamp a single negative dimension gives a negative dot
 	// count and make panics; two negative dimensions give negative
 	// wDots/hDots that no longer match len(dots).
 	if wCells < 0 {
 		wCells = 0
 	}
 	if hCells < 0 {
 		hCells = 0
 	}
 	wd, hd := wCells*2, hCells*4
 	return &braillePlane{
 		wCells: wCells, hCells: hCells,
 		wDots: wd, hDots: hd,
 		dots: make([]bool, wd*hd),
 	}
 }
 // set lights the dot at (dx, dy). Coordinates outside the plane are ignored.
 func (p *braillePlane) set(dx, dy int) {
 	if dx < 0 || dy < 0 || dx >= p.wDots || dy >= p.hDots {
 		return
 	}
 	p.dots[dy*p.wDots+dx] = true
 }
 // line draws a Bresenham line between two dot coordinates, both endpoints
 // included. Points that fall outside the plane are skipped by set.
 func (p *braillePlane) line(x0, y0, x1, y1 int) {
 	dx := intAbs(x1 - x0)
 	sx := 1
 	if x0 >= x1 {
 		sx = -1
 	}
 	// dy is kept negative so the error term can be compared against both
 	// deltas without extra sign handling.
 	dy := -intAbs(y1 - y0)
 	sy := 1
 	if y0 >= y1 {
 		sy = -1
 	}
 	errTerm := dx + dy
 	for {
 		p.set(x0, y0)
 		if x0 == x1 && y0 == y1 {
 			return
 		}
 		e2 := 2 * errTerm
 		if e2 >= dy {
 			errTerm += dy
 			x0 += sx
 		}
 		if e2 <= dx {
 			errTerm += dx
 			y0 += sy
 		}
 	}
 }
 // fillBelow fills all dots below the topmost lit dot in each column,
 // producing an area-chart effect. Columns with no lit dot are left untouched.
 func (p *braillePlane) fillBelow() {
 	for x := 0; x < p.wDots; x++ {
 		// y grows downwards, so everything visited after the first lit dot
 		// in this column lies below it.
 		seen := false
 		for y := 0; y < p.hDots; y++ {
 			i := y*p.wDots + x
 			if seen {
 				p.dots[i] = true
 			} else if p.dots[i] {
 				seen = true
 			}
 		}
 	}
 }
 // cellMask builds the U+2800-relative bitmask for one terminal cell.
 // Dots that would lie outside the plane contribute no bits.
 func (p *braillePlane) cellMask(cx, cy int) byte {
 	type bit struct {
 		dx, dy int
 		m      byte
 	}
 	// Offset of each dot inside the 2×4 cell and the mask bit it sets. The
 	// bottom row uses the two highest bits, hence the non-monotonic order.
 	bits := [...]bit{
 		{0, 0, 0x01}, {0, 1, 0x02}, {0, 2, 0x04},
 		{1, 0, 0x08}, {1, 1, 0x10}, {1, 2, 0x20},
 		{0, 3, 0x40}, {1, 3, 0x80},
 	}
 	var mask byte
 	for _, b := range bits {
 		dx := cx*2 + b.dx
 		dy := cy*4 + b.dy
 		if dx >= 0 && dx < p.wDots && dy >= 0 && dy < p.hDots && p.dots[dy*p.wDots+dx] {
 			mask |= b.m
 		}
 	}
 	return mask
 }
 // intAbs returns the absolute value of n.
 func intAbs(n int) int {
 	if n < 0 {
 		return -n
 	}
 	return n
 }
@@ -1,64 +0,0 @@
 package tui
 import "testing"
 // TestBraillePlane_Set checks that a 2×1-cell plane exposes a 4×4 dot grid,
 // that set lights the addressed dot, and that out-of-range coordinates are
 // tolerated without panicking.
 func TestBraillePlane_Set(t *testing.T) {
 	plane := newBraillePlane(2, 1)
 	if w, h := plane.wDots, plane.hDots; !(w == 4 && h == 4) {
 		t.Fatalf("expected 4x4 dots, got %dx%d", w, h)
 	}
 	plane.set(0, 0)
 	if lit := plane.dots[0]; !lit {
 		t.Error("dot at (0,0) should be set")
 	}
 	// Neither call may panic: one is left of the plane, one is below it.
 	plane.set(-1, 0)
 	plane.set(0, 99)
 }
 // TestBraillePlane_CellMask checks the mask of a single cell with only the
 // bottom-left dot lit (0x40) and with all eight dots lit (0xFF).
 func TestBraillePlane_CellMask(t *testing.T) {
 	plane := newBraillePlane(1, 1)
 	// Only the bottom-left dot is lit.
 	plane.set(0, 3)
 	if got := plane.cellMask(0, 0); got != 0x40 {
 		t.Errorf("bottom-left dot should be 0x40, got 0x%02x", got)
 	}
 	// Light every dot of the 2×4 cell.
 	for col := 0; col < 2; col++ {
 		for row := 0; row < 4; row++ {
 			plane.set(col, row)
 		}
 	}
 	if got := plane.cellMask(0, 0); got != 0xFF {
 		t.Errorf("all dots should be 0xFF, got 0x%02x", got)
 	}
 }
 // TestBraillePlane_Line draws a horizontal line across dot row 2 of a 3×1-cell
 // plane and checks that each of the six dots on that row is lit.
 func TestBraillePlane_Line(t *testing.T) {
 	plane := newBraillePlane(3, 1)
 	const row = 2
 	plane.line(0, row, 5, row) // horizontal line
 	start := row * plane.wDots
 	for x, lit := range plane.dots[start : start+6] {
 		if !lit {
 			t.Errorf("dot at (%d, 2) should be set", x)
 		}
 	}
 }
 // TestBraillePlane_FillBelow lights one dot in row 1 of column 0, runs
 // fillBelow, and checks that rows 1 to 3 are lit while row 0 stays dark.
 func TestBraillePlane_FillBelow(t *testing.T) {
 	plane := newBraillePlane(1, 1)
 	plane.set(0, 1) // set dot at row 1
 	plane.fillBelow()
 	checks := []struct {
 		row     int
 		wantLit bool
 		msg     string
 	}{
 		{1, true, "original dot should still be set"},
 		{2, true, "row 2 should be filled"},
 		{3, true, "row 3 should be filled"},
 		{0, false, "row 0 above the dot should not be filled"},
 	}
 	for _, c := range checks {
 		if plane.dots[c.row*plane.wDots+0] != c.wantLit {
 			t.Error(c.msg)
 		}
 	}
 }
@@ -1,6 +1,7 @@
 package tui
 import (
 	"context"
 	"encoding/json"
 	"sort"
 	"strings"
@@ -13,7 +14,7 @@ import (
 func loadCollapsed(s store.Store) map[int]bool {
 	m := make(map[int]bool)
-	raw, err := s.GetPreference("collapsed_groups")
+	raw, err := s.GetPreference(context.Background(), "collapsed_groups")
 	if err != nil || raw == "" {
 		return m
 	}
@@ -103,10 +104,25 @@ func (m *Model) refreshLive() {
 		ordered = filterSites(ordered, m.filterText)
 	}
 	m.sites = ordered
-	m.logViewport.SetContent(strings.Join(m.engine.GetLogs(), "\n"))
+	m.refreshLogContent()
 	if m.currentTab == 0 && m.selectedID != 0 {
 		for i, s := range m.sites {
 			if s.ID == m.selectedID {
 				m.cursor = i
 				break
 			}
 		}
 	}
 	m.clampCursor()
 }
 // syncSelectedID stores the ID of the site under the cursor in selectedID.
 // It does nothing unless currentTab is 0 and cursor is below len(sites).
 func (m *Model) syncSelectedID() {
 	if m.currentTab != 0 || m.cursor >= len(m.sites) {
 		return
 	}
 	m.selectedID = m.sites[m.cursor].ID
 }
 // clampCursor keeps the cursor and scroll offset within the current tab's list.
 func (m *Model) clampCursor() {
 	listLen := m.currentListLen()
@@ -130,21 +146,22 @@ func (m *Model) loadTabDataCmd() tea.Cmd {
 	st := m.store
 	isAdmin := m.isAdmin
 	return func() tea.Msg {
-		alerts, err := st.GetAllAlerts()
+		ctx := context.Background()
 		alerts, err := st.GetAllAlerts(ctx)
 		if err != nil {
 			return tabDataMsg{seq: seq, err: err}
 		}
 		var users []models.User
 		if isAdmin {
-			if users, err = st.GetAllUsers(); err != nil {
+			if users, err = st.GetAllUsers(ctx); err != nil {
 				return tabDataMsg{seq: seq, err: err}
 			}
 		}
-		nodes, err := st.GetAllNodes()
+		nodes, err := st.GetAllNodes(ctx)
 		if err != nil {
 			return tabDataMsg{seq: seq, err: err}
 		}
-		maint, err := st.GetAllMaintenanceWindows(100)
+		maint, err := st.GetAllMaintenanceWindows(ctx, 100)
 		if err != nil {
 			return tabDataMsg{seq: seq, err: err}
 		}
@@ -8,9 +8,9 @@ import (
 func TestSortSitesForDisplay_GroupsFirst(t *testing.T) {
 	sites := []models.Site{
-		{ID: 3, Name: "ungrouped", Type: "http", Status: "UP"},
+		{SiteConfig: models.SiteConfig{ID: 3, Name: "ungrouped", Type: "http"}, SiteState: models.SiteState{Status: "UP"}},
-		{ID: 1, Name: "group-a", Type: "group", Status: "UP"},
+		{SiteConfig: models.SiteConfig{ID: 1, Name: "group-a", Type: "group"}, SiteState: models.SiteState{Status: "UP"}},
-		{ID: 2, Name: "child", Type: "http", Status: "UP", ParentID: 1},
+		{SiteConfig: models.SiteConfig{ID: 2, Name: "child", Type: "http", ParentID: 1}, SiteState: models.SiteState{Status: "UP"}},
 	}
 	result := sortSitesForDisplay(sites, nil)
 	if len(result) != 3 {
@@ -29,9 +29,9 @@ func TestSortSitesForDisplay_GroupsFirst(t *testing.T) {
 func TestSortSitesForDisplay_CollapsedHidesChildren(t *testing.T) {
 	sites := []models.Site{
-		{ID: 1, Name: "group-a", Type: "group", Status: "UP"},
+		{SiteConfig: models.SiteConfig{ID: 1, Name: "group-a", Type: "group"}, SiteState: models.SiteState{Status: "UP"}},
-		{ID: 2, Name: "child-1", Type: "http", Status: "UP", ParentID: 1},
+		{SiteConfig: models.SiteConfig{ID: 2, Name: "child-1", Type: "http", ParentID: 1}, SiteState: models.SiteState{Status: "UP"}},
-		{ID: 3, Name: "child-2", Type: "http", Status: "UP", ParentID: 1},
+		{SiteConfig: models.SiteConfig{ID: 3, Name: "child-2", Type: "http", ParentID: 1}, SiteState: models.SiteState{Status: "UP"}},
 	}
 	collapsed := map[int]bool{1: true}
 	result := sortSitesForDisplay(sites, collapsed)
@@ -45,9 +45,9 @@ func TestSortSitesForDisplay_CollapsedHidesChildren(t *testing.T) {
 func TestSortSitesForDisplay_StatusOrdering(t *testing.T) {
 	sites := []models.Site{
-		{ID: 1, Name: "up-site", Type: "http", Status: "UP"},
+		{SiteConfig: models.SiteConfig{ID: 1, Name: "up-site", Type: "http"}, SiteState: models.SiteState{Status: "UP"}},
-		{ID: 2, Name: "down-site", Type: "http", Status: "DOWN"},
+		{SiteConfig: models.SiteConfig{ID: 2, Name: "down-site", Type: "http"}, SiteState: models.SiteState{Status: "DOWN"}},
-		{ID: 3, Name: "late-site", Type: "http", Status: "LATE"},
+		{SiteConfig: models.SiteConfig{ID: 3, Name: "late-site", Type: "http"}, SiteState: models.SiteState{Status: "LATE"}},
 	}
 	result := sortSitesForDisplay(sites, nil)
 	if result[0].Status != "DOWN" {
@@ -63,9 +63,9 @@ func TestSortSitesForDisplay_StatusOrdering(t *testing.T) {
 func TestFilterSites(t *testing.T) {
 	sites := []models.Site{
-		{Name: "Production API"},
+		{SiteConfig: models.SiteConfig{Name: "Production API"}},
-		{Name: "Staging API"},
+		{SiteConfig: models.SiteConfig{Name: "Staging API"}},
-		{Name: "Database"},
+		{SiteConfig: models.SiteConfig{Name: "Database"}},
 	}
 	tests := []struct {
@@ -87,7 +87,7 @@ func TestFilterSites(t *testing.T) {
 }
 func TestFilterSites_EmptyNeedle(t *testing.T) {
-	sites := []models.Site{{Name: "a"}, {Name: "b"}}
+	sites := []models.Site{{SiteConfig: models.SiteConfig{Name: "a"}}, {SiteConfig: models.SiteConfig{Name: "b"}}}
 	got := filterSites(sites, "")
 	if len(got) != 2 {
 		t.Errorf("empty needle should return all, got %d", len(got))
@@ -34,6 +34,9 @@ func (m Model) emptyState(message, hint string) string {
 }
 func limitStr(text string, max int) string {
 	if max < 3 {
 		return text
 	}
 	runes := []rune(text)
 	if len(runes) > max {
 		return string(runes[:max-3]) + "..."
@@ -143,16 +146,16 @@ func (m Model) fmtRetries(site models.Site) string {
 		dispCount = site.MaxRetries
 	}
 	s := fmt.Sprintf("%d/%d", dispCount, site.MaxRetries)
-	if site.Status == "DOWN" {
+	if site.Status == models.StatusDown {
 		return m.st.dangerStyle.Render(s)
 	}
-	if site.Status == "UP" && site.FailureCount > 0 {
+	if site.Status == models.StatusUp && site.FailureCount > 0 {
 		return m.st.warnStyle.Render(s)
 	}
 	return s
 }
-func (m Model) fmtStatus(status string, paused bool, inMaint bool) string {
+func (m Model) fmtStatus(status models.Status, paused bool, inMaint bool) string {
 	if paused {
 		return m.st.warnStyle.Render("◇ PAUSED")
 	}
@@ -160,18 +163,18 @@ func (m Model) fmtStatus(status string, paused bool, inMaint bool) string {
 		return m.st.maintStyle.Render("◼ MAINT")
 	}
 	switch status {
-	case "DOWN":
+	case models.StatusDown:
 		return m.st.dangerStyle.Render("▼ DOWN")
-	case "SSL EXP":
+	case models.StatusSSLExp:
 		return m.st.dangerStyle.Render("▼ SSL EXP")
-	case "LATE":
+	case models.StatusLate:
 		return m.st.warnStyle.Render("◆ LATE")
-	case "STALE":
+	case models.StatusStale:
 		return m.st.staleStyle.Render("◆ STALE")
-	case "PENDING":
+	case models.StatusPending:
 		return m.st.subtleStyle.Render("○ PENDING")
 	default:
-		return m.st.specialStyle.Render("▲ " + status)
+		return m.st.specialStyle.Render("▲ " + string(status))
 	}
 }
@@ -38,13 +38,13 @@ func TestSiteOrder(t *testing.T) {
 		site models.Site
 		want int
 	}{
-		{"down", models.Site{Status: "DOWN"}, 0},
+		{"down", models.Site{SiteState: models.SiteState{Status: "DOWN"}}, 0},
-		{"ssl exp", models.Site{Status: "SSL EXP"}, 0},
+		{"ssl exp", models.Site{SiteState: models.SiteState{Status: "SSL EXP"}}, 0},
-		{"late", models.Site{Status: "LATE"}, 1},
+		{"late", models.Site{SiteState: models.SiteState{Status: "LATE"}}, 1},
-		{"up", models.Site{Status: "UP"}, 2},
+		{"up", models.Site{SiteState: models.SiteState{Status: "UP"}}, 2},
-		{"pending", models.Site{Status: "PENDING"}, 3},
+		{"pending", models.Site{SiteState: models.SiteState{Status: "PENDING"}}, 3},
-		{"paused up", models.Site{Status: "UP", Paused: true}, 3},
+		{"paused up", models.Site{SiteConfig: models.SiteConfig{Paused: true}, SiteState: models.SiteState{Status: "UP"}}, 3},
-		{"paused down", models.Site{Status: "DOWN", Paused: true}, 3},
+		{"paused down", models.Site{SiteConfig: models.SiteConfig{Paused: true}, SiteState: models.SiteState{Status: "DOWN"}}, 3},
 	}
 	for _, tt := range tests {
 		got := siteOrder(tt.site)
@@ -56,19 +56,19 @@ func TestSiteOrder(t *testing.T) {
 func TestFmtStatus(t *testing.T) {
 	tests := []struct {
-		status  string
+		status  models.Status
 		paused  bool
 		inMaint bool
 		wantSub string
 	}{
-		{"DOWN", false, false, "▼ DOWN"},
+		{models.StatusDown, false, false, "▼ DOWN"},
-		{"UP", false, false, "▲ UP"},
+		{models.StatusUp, false, false, "▲ UP"},
-		{"SSL EXP", false, false, "▼ SSL EXP"},
+		{models.StatusSSLExp, false, false, "▼ SSL EXP"},
-		{"LATE", false, false, "◆ LATE"},
+		{models.StatusLate, false, false, "◆ LATE"},
-		{"STALE", false, false, "◆ STALE"},
+		{models.StatusStale, false, false, "◆ STALE"},
-		{"PENDING", false, false, "○ PENDING"},
+		{models.StatusPending, false, false, "○ PENDING"},
-		{"DOWN", true, false, "◇ PAUSED"},
+		{models.StatusDown, true, false, "◇ PAUSED"},
-		{"DOWN", false, true, "◼ MAINT"},
+		{models.StatusDown, false, true, "◼ MAINT"},
 	}
 	for _, tt := range tests {
 		got := styledModel.fmtStatus(tt.status, tt.paused, tt.inMaint)
@@ -17,6 +17,17 @@ func parseHex(hex string) (r, g, b uint8) {
 	return
 }
 // trueColorHex extracts a colour string from a lipgloss colour value: the
 // TrueColor field of a CompleteColor, or the raw string of a Color. Any other
 // value, including nil, yields "".
 //
 // NOTE(review): a lipgloss.Color is returned verbatim, so a value that holds
 // an ANSI index rather than a hex string is passed through unchanged —
 // confirm callers only feed hex-valued colours.
 func trueColorHex(c lipgloss.TerminalColor) string {
 	if complete, ok := c.(lipgloss.CompleteColor); ok {
 		return complete.TrueColor
 	}
 	if plain, ok := c.(lipgloss.Color); ok {
 		return string(plain)
 	}
 	return ""
 }
 func dimColor(hex string, brightness float64) lipgloss.Color {
 	r, g, b := parseHex(hex)
 	f := 0.3 + brightness*0.7
@@ -27,35 +38,36 @@ func dimColor(hex string, brightness float64) lipgloss.Color {
 	))
 }
-func withBg(s lipgloss.Style, bg lipgloss.Color) lipgloss.Style {
+func withBg(s lipgloss.Style, bg lipgloss.TerminalColor) lipgloss.Style {
-	if bg != "" {
+	if bg != nil {
 		return s.Background(bg)
 	}
 	return s
 }
-func (m Model) latencyStyle(ms int64, bg lipgloss.Color) lipgloss.Style {
+func (m Model) latencyStyle(ms int64, bg lipgloss.TerminalColor) lipgloss.Style {
-	var hex string
+	var base lipgloss.TerminalColor
 	var t float64
 	switch {
 	case ms < 200:
-		hex = m.st.sparkSuccess
+		base = m.st.sparkSuccess
 		t = float64(ms) / 200
 	case ms < 500:
-		hex = m.st.sparkWarning
+		base = m.st.sparkWarning
 		t = float64(ms-200) / 300
 	default:
-		hex = m.st.sparkDanger
+		base = m.st.sparkDanger
 		t = float64(ms-500) / 1500
 		if t > 1 {
 			t = 1
 		}
 	}
 	hex := trueColorHex(base)
 	s := lipgloss.NewStyle().Foreground(dimColor(hex, t))
 	return withBg(s, bg)
 }
-func (m Model) latencySparkline(latencies []time.Duration, statuses []bool, width int, bg lipgloss.Color) string {
+func (m Model) latencySparkline(latencies []time.Duration, statuses []bool, width int, bg lipgloss.TerminalColor) string {
 	if len(latencies) == 0 {
 		return withBg(m.st.subtleStyle, bg).Render(strings.Repeat("·", width))
 	}
@@ -103,7 +115,7 @@ func (m Model) latencySparkline(latencies []time.Duration, statuses []bool, widt
 	return sb.String()
 }
-func (m Model) heartbeatSparkline(statuses []bool, width int, bg lipgloss.Color) string {
+func (m Model) heartbeatSparkline(statuses []bool, width int, bg lipgloss.TerminalColor) string {
 	if len(statuses) == 0 {
 		return withBg(m.st.subtleStyle, bg).Render(strings.Repeat("·", width))
 	}
@@ -143,7 +155,7 @@ func resolveSparklineIndex(x, sparkWidth, dataLen int) int {
 	return offset + (x - padding)
 }
-func (m Model) groupSparkline(groupID int, width int, bg lipgloss.Color) string {
+func (m Model) groupSparkline(groupID int, width int, bg lipgloss.TerminalColor) string {
 	allSites := m.engine.GetAllSites()
 	var childStatuses [][]bool
 	for _, s := range allSites {
@@ -5,10 +5,12 @@ import (
 	"testing"
 	"time"
 	"unicode/utf8"
 	"github.com/charmbracelet/lipgloss"
 )
 func TestLatencySparkline_Empty(t *testing.T) {
-	got := styledModel.latencySparkline(nil, nil, 10, "")
+	got := styledModel.latencySparkline(nil, nil, 10, nil)
 	if !strings.Contains(got, "··········") {
 		t.Errorf("empty sparkline should be dots, got %q", got)
 	}
@@ -17,7 +19,7 @@ func TestLatencySparkline_Empty(t *testing.T) {
 func TestLatencySparkline_SingleValue(t *testing.T) {
 	latencies := []time.Duration{100 * time.Millisecond}
 	statuses := []bool{true}
-	got := styledModel.latencySparkline(latencies, statuses, 5, "")
+	got := styledModel.latencySparkline(latencies, statuses, 5, nil)
 	if len(got) == 0 {
 		t.Error("sparkline should not be empty")
 	}
@@ -33,7 +35,7 @@ func TestLatencySparkline_WidthTruncation(t *testing.T) {
 		latencies[i] = time.Duration(i*50) * time.Millisecond
 		statuses[i] = true
 	}
-	got := styledModel.latencySparkline(latencies, statuses, 5, "")
+	got := styledModel.latencySparkline(latencies, statuses, 5, nil)
 	if len(got) == 0 {
 		t.Error("sparkline should not be empty")
 	}
@@ -45,7 +47,7 @@ func TestLatencySparkline_WidthTruncation(t *testing.T) {
 func TestLatencySparkline_RelativeHeight(t *testing.T) {
 	latencies := []time.Duration{10 * time.Millisecond, 50 * time.Millisecond, 10 * time.Millisecond}
 	statuses := []bool{true, true, true}
-	out := stripANSI(styledModel.latencySparkline(latencies, statuses, 3, ""))
+	out := stripANSI(styledModel.latencySparkline(latencies, statuses, 3, nil))
 	runes := []rune(out)
 	if len(runes) < 3 {
 		t.Fatalf("expected 3 runes, got %d", len(runes))
@@ -57,14 +59,14 @@ func TestLatencySparkline_RelativeHeight(t *testing.T) {
 func TestLatencyStyle_BandsProduceDifferentColors(t *testing.T) {
 	st := newStyles(themeFlexokiDark)
-	st.sparkSuccess = "#00ff00"
+	st.sparkSuccess = lipgloss.Color("#00ff00")
-	st.sparkWarning = "#ffff00"
+	st.sparkWarning = lipgloss.Color("#ffff00")
-	st.sparkDanger = "#ff0000"
+	st.sparkDanger = lipgloss.Color("#ff0000")
 	m := Model{st: st}
-	green := m.latencyStyle(50, "")
+	green := m.latencyStyle(50, nil)
-	yellow := m.latencyStyle(300, "")
+	yellow := m.latencyStyle(300, nil)
-	red := m.latencyStyle(800, "")
+	red := m.latencyStyle(800, nil)
 	gfg := green.GetForeground()
 	yfg := yellow.GetForeground()
@@ -77,11 +79,11 @@ func TestLatencyStyle_BandsProduceDifferentColors(t *testing.T) {
 func TestLatencyStyle_BrightnessVariesWithinBand(t *testing.T) {
 	st := newStyles(themeFlexokiDark)
-	st.sparkSuccess = "#00ff00"
+	st.sparkSuccess = lipgloss.Color("#00ff00")
 	m := Model{st: st}
-	dim := m.latencyStyle(10, "")
+	dim := m.latencyStyle(10, nil)
-	bright := m.latencyStyle(190, "")
+	bright := m.latencyStyle(190, nil)
 	if dim.GetForeground() == bright.GetForeground() {
 		t.Error("10ms and 190ms should have different brightness within green band")
@@ -91,7 +93,7 @@ func TestLatencyStyle_BrightnessVariesWithinBand(t *testing.T) {
 func TestLatencySparkline_OutputWidth(t *testing.T) {
 	latencies := []time.Duration{100 * time.Millisecond, 200 * time.Millisecond, 300 * time.Millisecond}
 	statuses := []bool{true, true, true}
-	got := styledModel.latencySparkline(latencies, statuses, 5, "")
+	got := styledModel.latencySparkline(latencies, statuses, 5, nil)
 	count := utf8.RuneCountInString(stripANSI(got))
 	if count != 5 {
 		t.Errorf("expected 5 rune-width output, got %d from %q", count, got)
@@ -116,7 +118,7 @@ func stripANSI(s string) string {
 }
 func TestHeartbeatSparkline_Empty(t *testing.T) {
-	got := styledModel.heartbeatSparkline(nil, 10, "")
+	got := styledModel.heartbeatSparkline(nil, 10, nil)
 	if !strings.Contains(got, "··········") {
 		t.Errorf("empty heartbeat should be dots, got %q", got)
 	}
@@ -124,7 +126,7 @@ func TestHeartbeatSparkline_Empty(t *testing.T) {
 func TestHeartbeatSparkline_Mixed(t *testing.T) {
 	statuses := []bool{true, false, true, true, false}
-	got := styledModel.heartbeatSparkline(statuses, 5, "")
+	got := styledModel.heartbeatSparkline(statuses, 5, nil)
 	if len(got) == 0 {
 		t.Error("heartbeat sparkline should not be empty")
 	}
@@ -132,7 +134,7 @@ func TestHeartbeatSparkline_Mixed(t *testing.T) {
 func TestHeartbeatSparkline_PaddedWidth(t *testing.T) {
 	statuses := []bool{true, true}
-	got := styledModel.heartbeatSparkline(statuses, 5, "")
+	got := styledModel.heartbeatSparkline(statuses, 5, nil)
 	if !strings.Contains(got, "···") {
 		t.Errorf("should have dot padding for width > data, got %q", got)
 	}
@@ -1,9 +1,13 @@
 package tui
 import (
 	"context"
 	"fmt"
 	neturl "net/url"
 	"sort"
 	"strings"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/monitor"
 	tea "github.com/charmbracelet/bubbletea"
 	"github.com/charmbracelet/huh"
@@ -71,10 +75,7 @@ func fmtAlertType(t string) string {
 	}
 }
-func (m Model) fmtAlertConfig(alert struct {
+func (m Model) fmtAlertConfig(alert models.AlertConfig) string {
 	Type     string
 	Settings map[string]string
 }) string {
 	switch alert.Type {
 	case "email":
 		host := alert.Settings["host"]
@@ -100,15 +101,17 @@ func (m Model) fmtAlertConfig(alert struct {
 		return m.st.subtleStyle.Render("—")
 	case "pagerduty":
 		if key := alert.Settings["routing_key"]; key != "" {
-			return limitStr(key, 34)
+			return limitStr(maskSecret(key), 34)
 		}
 		return m.st.subtleStyle.Render("—")
 	case "pushover":
 		if user := alert.Settings["user"]; user != "" {
-			return limitStr(fmt.Sprintf("user:%s", user), 34)
+			return limitStr(fmt.Sprintf("user:%s", maskSecret(user)), 34)
 		}
 		return m.st.subtleStyle.Render("—")
 	case "gotify":
 		// The gotify server URL identifies the target; the token is the
 		// secret and is never shown here.
 		if url := alert.Settings["url"]; url != "" {
 			return limitStr(url, 34)
 		}
@@ -116,10 +119,7 @@ func (m Model) fmtAlertConfig(alert struct {
 	case "opsgenie":
 		key := alert.Settings["api_key"]
 		if key != "" {
-			masked := key
+			masked := maskSecret(key)
 			if len(masked) > 8 {
 				masked = masked[:4] + "…" + masked[len(masked)-4:]
 			}
 			if alert.Settings["eu"] == "true" {
 				return limitStr(fmt.Sprintf("EU %s", masked), 34)
 			}
@@ -127,13 +127,33 @@ func (m Model) fmtAlertConfig(alert struct {
 		}
 		return m.st.subtleStyle.Render("—")
 	default:
-		if val, ok := alert.Settings["url"]; ok {
+		// discord/slack/webhook: the URL path IS the credential — show only
-			return limitStr(val, 34)
+		// enough to identify the target.
 		if val, ok := alert.Settings["url"]; ok && val != "" {
 			return limitStr(maskWebhookURL(val), 34)
 		}
 		return m.st.subtleStyle.Render("—")
 	}
 }
 // maskSecret abbreviates a credential for display, keeping just enough of it
 // to tell one key from another.
 //
 // A secret longer than eight characters is rendered as its first four and
 // last four characters joined by an ellipsis. Anything shorter is replaced
 // entirely by a fixed row of bullets, so short secrets are never partially
 // revealed. Length and slicing are measured in runes rather than bytes: a
 // byte-based cut could land in the middle of a multi-byte UTF-8 character
 // and emit invalid text to the terminal.
 func maskSecret(s string) string {
 	const (
 		edge      = 4        // characters kept at each end
 		threshold = 2 * edge // at or below this nothing is revealed
 	)
 	runes := []rune(s)
 	if len(runes) <= threshold {
 		return "●●●●●●●●"
 	}
 	return string(runes[:edge]) + "…" + string(runes[len(runes)-edge:])
 }
 // maskWebhookURL reduces a webhook URL to "scheme://host/…". Discord, Slack
 // and generic webhook URLs carry their token in the path, so nothing after
 // the host is ever rendered. Input that fails to parse, or that has no host
 // component, is replaced wholesale by a row of bullets.
 func maskWebhookURL(raw string) string {
 	const hidden = "●●●●●●●●"
 	parsed, err := neturl.Parse(raw)
 	if err == nil && parsed.Host != "" {
 		return parsed.Scheme + "://" + parsed.Host + "/…"
 	}
 	return hidden
 }
 func (m Model) fmtAlertHealth(h monitor.AlertHealth) string {
 	if h.LastSendAt.IsZero() {
 		return m.st.subtleStyle.Render("●")
@@ -178,10 +198,7 @@ func (m Model) viewAlertsTab() string {
 					m.fmtAlertHealth(h),
 					m.zones.Mark(fmt.Sprintf("alert-%d", i), limitStr(a.Name, nameW-2)),
 					fmtAlertType(a.Type),
-					limitStr(m.fmtAlertConfig(struct {
+					limitStr(m.fmtAlertConfig(a), cfgW-2),
 						Type     string
 						Settings map[string]string
 					}{a.Type, a.Settings}), cfgW-2),
 					m.fmtAlertLastSent(h),
 				})
 			}
@@ -229,12 +246,26 @@ func (m Model) viewAlertDetailPanel() string {
 	b.WriteString(m.divider() + "\n")
 	b.WriteString(m.st.subtleStyle.Render("  CONFIGURATION") + "\n")
-	for k, v := range a.Settings {
+	// Render through the same allowlist the backup export uses — this panel
 	// ends up in screen shares and asciinema recordings. Keys are sorted so
 	// rows don't reshuffle every render.
 	redacted := models.RedactAlertSettings(a.Type, a.Settings)
 	keys := make([]string, 0, len(redacted))
 	for k := range redacted {
 		keys = append(keys, k)
 	}
 	sort.Strings(keys)
 	for _, k := range keys {
 		v := redacted[k]
 		if v == "***REDACTED***" {
 			row(k, m.st.subtleStyle.Render("●●●●●●●●"))
 			continue
 		}
 		row(k, v)
 	}
 	b.WriteString(m.divider() + "\n")
-	b.WriteString(m.st.subtleStyle.Render("  [i/Esc] Back  [e] Edit  [t] Test  [q] Quit"))
+	b.WriteString(m.st.subtleStyle.Render("  [q/Esc] Back  [e] Edit  [t] Test"))
 	return lipgloss.NewStyle().Padding(1, 2).Render(b.String())
 }
@@ -492,10 +523,10 @@ func (m *Model) submitAlertForm() tea.Cmd {
 	m.state = stateDashboard
 	if id > 0 {
 		return writeCmd("Update alert", func() error {
-			return st.UpdateAlert(id, name, aType, settings)
+			return st.UpdateAlert(context.Background(), id, name, aType, settings)
 		})
 	}
 	return writeCmd("Add alert", func() error {
-		return st.AddAlert(name, aType, settings)
+		return st.AddAlert(context.Background(), name, aType, settings)
 	})
 }
@@ -0,0 +1,62 @@
 package tui
 import (
 	"strings"
 	"testing"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 )
 // TestAlertDetailPanel_MasksSecretsStableOrder renders the detail panel for an
 // email alert and checks that the SMTP password and user never appear, that
 // the host does, and that repeated renders produce identical output.
 func TestAlertDetailPanel_MasksSecretsStableOrder(t *testing.T) {
 	emailSettings := map[string]string{
 		"host": "smtp.example.com",
 		"port": "587",
 		"user": "oncall@example.com",
 		"pass": "hunter2-secret",
 		"to":   "team@example.com",
 	}
 	m := newTestModel(&tuiMockStore{})
 	m.termWidth = 120
 	m.termHeight = 40
 	m.alerts = []models.AlertConfig{
 		{ID: 1, Name: "ops", Type: "email", Settings: emailSettings},
 	}
 	m.cursor = 0
 	out := m.viewAlertDetailPanel()
 	// Values that must never reach the rendered panel.
 	leaks := []struct{ needle, msg string }{
 		{"hunter2-secret", "SMTP password rendered in alert detail panel"},
 		{"oncall@example.com", "SMTP user (not on the allowlist) rendered in alert detail panel"},
 	}
 	for _, leak := range leaks {
 		if strings.Contains(out, leak.needle) {
 			t.Error(leak.msg)
 		}
 	}
 	if !strings.Contains(out, "smtp.example.com") {
 		t.Error("allowlisted setting (host) missing from panel")
 	}
 	// Map iteration must not reshuffle rows between renders.
 	for attempt := 1; attempt <= 5; attempt++ {
 		if again := m.viewAlertDetailPanel(); again != out {
 			t.Fatal("panel output unstable across renders — settings keys not sorted")
 		}
 	}
 }
 // TestFmtAlertConfig_MasksSecrets checks the table-cell summary produced by
 // fmtAlertConfig: a discord webhook must show its host but nothing from the
 // URL path, and a pagerduty routing key must be abbreviated to its ends.
 func TestFmtAlertConfig_MasksSecrets(t *testing.T) {
 	m := newTestModel(&tuiMockStore{})

 	discord := models.AlertConfig{
 		Type:     "discord",
 		Settings: map[string]string{"url": "https://discord.com/api/webhooks/123456/SeCrEtToKeN"},
 	}
 	webhook := m.fmtAlertConfig(discord)
 	leaksToken := strings.Contains(webhook, "SeCrEtToKeN")
 	leaksID := strings.Contains(webhook, "123456")
 	if leaksToken || leaksID {
 		t.Errorf("webhook URL path (the credential) rendered in table: %q", webhook)
 	}
 	if !strings.Contains(webhook, "discord.com") {
 		t.Errorf("webhook host missing from table config: %q", webhook)
 	}

 	pagerduty := models.AlertConfig{
 		Type:     "pagerduty",
 		Settings: map[string]string{"routing_key": "R0123456789ABCDEFGHIJ"},
 	}
 	pd := m.fmtAlertConfig(pagerduty)
 	if strings.Contains(pd, "R0123456789ABCDEFGHIJ") {
 		t.Errorf("pagerduty routing key rendered raw in table: %q", pd)
 	}
 	keepsBothEnds := strings.Contains(pd, "R012") && strings.Contains(pd, "GHIJ")
 	if !keepsBothEnds {
 		t.Errorf("masked routing key should keep identifying ends: %q", pd)
 	}
 }
@@ -82,18 +82,15 @@ func (m Model) renderLogLine(line string) string {
 	return fmt.Sprintf("  %s  %s", tag, msg)
 }
-func (m Model) viewLogsTab() string {
+// refreshLogContent rebuilds the log viewport from the full engine log list,
-	content := m.logViewport.View()
+// filtering before windowing so the entry count and "(n hidden)" reflect all
-	if strings.TrimSpace(content) == "" || content == "Waiting for logs..." {
+// logs, not just the visible viewport slice.
-		return m.emptyState("No log entries yet.", "Logs appear as monitors run checks")
+func (m *Model) refreshLogContent() {
 	}
 	lines := strings.Split(content, "\n")
 	var rendered []string
 	total := 0
 	shown := 0
-	for _, line := range lines {
+	for _, line := range m.engine.GetLogs() {
 		if strings.TrimSpace(line) == "" {
 			continue
 		}
@@ -106,18 +103,27 @@ func (m Model) viewLogsTab() string {
 		rendered = append(rendered, m.renderLogLine(line))
 	}
 	m.logTotal = total
 	m.logShown = shown
 	m.logViewport.SetContent(strings.Join(rendered, "\n"))
 }
 func (m Model) viewLogsTab() string {
 	if m.logTotal == 0 {
 		return m.emptyState("No log entries yet.", "Logs appear as monitors run checks")
 	}
 	filterLabel := "All"
 	if m.logFilterImportant {
 		filterLabel = "Important"
 	}
 	header := m.st.subtleStyle.Render(fmt.Sprintf(
-		"  %d entries  Filter: %s", shown, filterLabel))
+		"  %d entries  Filter: %s", m.logShown, filterLabel))
-	if m.logFilterImportant && shown < total {
+	if m.logFilterImportant && m.logShown < m.logTotal {
-		header += m.st.subtleStyle.Render(fmt.Sprintf("  (%d hidden)", total-shown))
+		header += m.st.subtleStyle.Render(fmt.Sprintf("  (%d hidden)", m.logTotal-m.logShown))
 	}
 	m.logViewport.SetContent(strings.Join(rendered, "\n"))
 	return "\n" + header + "\n\n" + m.logViewport.View()
 }
@@ -1,6 +1,7 @@
 package tui
 import (
 	"context"
 	"fmt"
 	"strconv"
 	"time"
@@ -240,6 +241,6 @@ func (m *Model) submitMaintForm() tea.Cmd {
 	st := m.store
 	m.state = stateDashboard
 	return writeCmd("Add maintenance window", func() error {
-		return st.AddMaintenanceWindow(mw)
+		return st.AddMaintenanceWindow(context.Background(), mw)
 	})
 }
@@ -1,6 +1,7 @@
 package tui
 import (
 	"context"
 	"fmt"
 	"net/url"
 	"strconv"
@@ -203,7 +204,7 @@ func (m Model) viewSitesTab() string {
 			for i := start; i < end; i++ {
 				site := m.sites[i]
 				rowIdx := i - start
-				var rowBg lipgloss.Color
+				var rowBg lipgloss.TerminalColor
 				if i == m.cursor {
 					rowBg = m.theme.SelectedBg
 				} else if rowIdx%2 == 1 {
@@ -239,7 +240,7 @@ func (m Model) viewSitesTab() string {
 					name = limitStr(name, nameW-2)
 				}
-				if (site.Status == "DOWN" || site.Status == "SSL EXP" || site.Status == "LATE" || site.Status == "STALE") && site.LastError != "" {
+				if (site.Status == models.StatusDown || site.Status == models.StatusSSLExp || site.Status == models.StatusLate || site.Status == models.StatusStale) && site.LastError != "" {
 					nameLen := len([]rune(name))
 					errSpace := nameW - nameLen - 3
 					if errSpace > 10 {
@@ -325,101 +326,104 @@ func (m *Model) initSiteHuhForm() tea.Cmd {
 		}
 	}
-	// m.alerts is the tab-data cache (≤5s stale) — no store IO in Update.
+	return m.rebuildSiteForm()
-	alertOpts := []huh.Option[string]{huh.NewOption("None", "0")}
+}
 // rebuildSiteForm replaces m.huhForm with a fresh form built from
 // buildSiteFormGroups and styled with the current theme. The form is given
 // the terminal width when one is known and a height of termHeight-7, never
 // less than 5. The site type the form was built for is recorded in
 // m.lastSiteType, and the new form's Init command is returned.
 func (m *Model) rebuildSiteForm() tea.Cmd {
 	const (
 		reservedRows  = 7 // NOTE(review): presumably rows used by surrounding chrome — confirm
 		minFormHeight = 5
 	)
 	m.huhForm = huh.NewForm(m.buildSiteFormGroups()...).WithTheme(m.theme.HuhTheme())
 	if m.termWidth > 0 {
 		m.huhForm.WithWidth(m.termWidth)
 	}
 	height := m.termHeight - reservedRows
 	if height < minFormHeight {
 		height = minFormHeight
 	}
 	m.huhForm.WithHeight(height)
 	m.lastSiteType = m.siteFormData.SiteType
 	return m.huhForm.Init()
 }
 func (m *Model) siteFormOptions() (alertOpts, groupOpts []huh.Option[string]) {
 	alertOpts = []huh.Option[string]{huh.NewOption("None", "0")}
 	for _, a := range m.alerts {
 		alertOpts = append(alertOpts, huh.NewOption(
 			fmt.Sprintf("%s (%s)", a.Name, a.Type),
 			strconv.Itoa(a.ID),
 		))
 	}
-
+	groupOpts = []huh.Option[string]{huh.NewOption("None", "0")}
 	groupOpts := []huh.Option[string]{huh.NewOption("None", "0")}
 	for _, s := range m.sites {
 		if s.Type == "group" && s.ID != m.editID {
 			groupOpts = append(groupOpts, huh.NewOption(s.Name, strconv.Itoa(s.ID)))
 		}
 	}
 	return
 }
-	m.huhForm = huh.NewForm(
+func (m *Model) buildSiteFormGroups() []*huh.Group {
-		huh.NewGroup(
+	d := m.siteFormData
-			huh.NewInput().Title("Monitor Name").
+	alertOpts, groupOpts := m.siteFormOptions()
-				Placeholder("My Service").
+
-				Value(&m.siteFormData.Name).
+	// Page 1 — Monitor Setup: core fields + type-specific target
-				Validate(func(s string) error {
+	setup := []huh.Field{
-					if s == "" {
+		huh.NewInput().Title("Monitor Name").
-						return fmt.Errorf("name is required")
+			Placeholder("My Service").
-					}
+			Value(&d.Name).
-					return nil
+			Validate(func(s string) error {
-				}),
+				if s == "" {
-			huh.NewSelect[string]().Title("Monitor Type").
+					return fmt.Errorf("name is required")
-				Options(
+				}
-					huh.NewOption("HTTP/HTTPS", "http"),
+				return nil
-					huh.NewOption("Push / Heartbeat", "push"),
+			}),
-					huh.NewOption("Ping (ICMP)", "ping"),
+		huh.NewSelect[string]().Title("Monitor Type").
-					huh.NewOption("TCP Port", "port"),
+			Options(
-					huh.NewOption("DNS", "dns"),
+				huh.NewOption("HTTP/HTTPS", "http"),
-					huh.NewOption("Group", "group"),
+				huh.NewOption("Push / Heartbeat", "push"),
-				).Value(&m.siteFormData.SiteType),
+				huh.NewOption("Ping (ICMP)", "ping"),
-			huh.NewSelect[string]().Title("Alert Channel").
+				huh.NewOption("TCP Port", "port"),
-				Options(alertOpts...).
+				huh.NewOption("DNS", "dns"),
-				Value(&m.siteFormData.AlertID),
+				huh.NewOption("Group", "group"),
-		).Title("Monitor Settings"),
+			).Value(&d.SiteType),
-		huh.NewGroup(
+		huh.NewSelect[string]().Title("Alert Channel").
-			huh.NewInput().Title("URL").
+			Options(alertOpts...).
-				Placeholder("https://example.com").
+			Value(&d.AlertID),
-				Description("Required for HTTP monitors").
+	}
-				Value(&m.siteFormData.URL).
+
-				Validate(func(s string) error {
+	switch d.SiteType {
-					if m.siteFormData.SiteType != "http" {
+	case "http":
-						return nil
+		setup = append(setup, huh.NewInput().Title("URL").
-					}
+			Placeholder("https://example.com").
-					if s == "" {
+			Value(&d.URL).
-						return fmt.Errorf("URL is required for HTTP monitors")
+			Validate(func(s string) error {
-					}
+				if s == "" {
-					u, err := url.Parse(s)
+					return fmt.Errorf("URL is required")
-					if err != nil {
+				}
-						return fmt.Errorf("invalid URL")
+				u, err := url.Parse(s)
-					}
+				if err != nil {
-					if u.Scheme != "http" && u.Scheme != "https" {
+					return fmt.Errorf("invalid URL")
-						return fmt.Errorf("URL must start with http:// or https://")
+				}
-					}
+				if u.Scheme != "http" && u.Scheme != "https" {
-					if u.Host == "" {
+					return fmt.Errorf("URL must start with http:// or https://")
-						return fmt.Errorf("URL must include a host")
+				}
-					}
+				if u.Host == "" {
-					return nil
+					return fmt.Errorf("URL must include a host")
-				}),
+				}
-			huh.NewInput().Title("Check Interval (seconds)").
+				return nil
-				Placeholder("60").
+			}))
-				Value(&m.siteFormData.Interval).
+	case "ping", "dns":
-				Validate(func(s string) error {
+		setup = append(setup, huh.NewInput().Title("Hostname / IP").
-					if m.siteFormData.SiteType == "group" {
+			Placeholder("10.0.0.1").
-						return nil
+			Value(&d.Hostname))
-					}
+	case "port":
-					v, err := strconv.Atoi(s)
+		setup = append(setup,
 					if err != nil {
 						return fmt.Errorf("must be a number")
 					}
 					if v < 5 {
 						return fmt.Errorf("minimum interval is 5 seconds")
 					}
 					return nil
 				}),
 			huh.NewSelect[string]().Title("Parent Group").
 				Options(groupOpts...).
 				Value(&m.siteFormData.GroupID),
 			huh.NewInput().Title("Hostname / IP").
 				Placeholder("10.0.0.1").
-				Description("Target for ping/port/DNS monitors").
+				Value(&d.Hostname),
 				Value(&m.siteFormData.Hostname),
 			huh.NewInput().Title("Port").
-				Placeholder("0").
+				Placeholder("443").
-				Description("Target port for TCP port monitors").
+				Value(&d.Port).
 				Value(&m.siteFormData.Port).
 				Validate(func(s string) error {
 					if m.siteFormData.SiteType != "port" {
 						return nil
 					}
 					v, err := strconv.Atoi(s)
 					if err != nil {
 						return fmt.Errorf("must be a number")
@@ -428,34 +432,20 @@ func (m *Model) initSiteHuhForm() tea.Cmd {
 						return fmt.Errorf("port must be 1-65535")
 					}
 					return nil
-				}),
+				}))
-			huh.NewInput().Title("Timeout (seconds)").
+	}
-				Placeholder("5").
+
-				Value(&m.siteFormData.Timeout).
+	groups := []*huh.Group{huh.NewGroup(setup...).Title("Monitor Setup")}
-				Validate(func(s string) error {
+
-					if m.siteFormData.SiteType == "group" {
+	if d.SiteType == "group" {
-						return nil
+		return groups
-					}
+	}
-					v, err := strconv.Atoi(s)
+
-					if err != nil {
+	// Page 2 — Configuration: type-specific options + shared defaults
-						return fmt.Errorf("must be a number")
+	var config []huh.Field
-					}
+
-					if v < 1 || v > 300 {
+	if d.SiteType == "http" {
-						return fmt.Errorf("timeout must be 1-300 seconds")
+		config = append(config,
 					}
 					return nil
 				}),
 			huh.NewInput().Title("Description").
 				Placeholder("Optional description").
 				Value(&m.siteFormData.Description),
 			huh.NewInput().Title("Probe Regions").
 				Placeholder("us-east, eu-west (empty = all)").
 				Description("Comma-separated regions for distributed probing").
 				Value(&m.siteFormData.Regions),
 		).Title("Connection").WithHideFunc(func() bool {
 			return m.siteFormData.SiteType == "group"
 		}),
 		huh.NewGroup(
 			huh.NewSelect[string]().Title("HTTP Method").
 				Options(
 					huh.NewOption("GET", "GET"),
@@ -465,22 +455,75 @@ func (m *Model) initSiteHuhForm() tea.Cmd {
 					huh.NewOption("DELETE", "DELETE"),
 					huh.NewOption("HEAD", "HEAD"),
 					huh.NewOption("OPTIONS", "OPTIONS"),
-				).Value(&m.siteFormData.Method),
+				).Value(&d.Method),
 			huh.NewInput().Title("Accepted Status Codes").
 				Placeholder("200-299").
 				Description("Ranges (200-299) and singles (301) separated by commas").
-				Value(&m.siteFormData.AcceptedCodes),
+				Value(&d.AcceptedCodes),
-		).Title("HTTP Settings").WithHideFunc(func() bool {
+		)
-			return m.siteFormData.SiteType != "http"
+	}
-		}),
+
-		huh.NewGroup(
+	config = append(config,
 		huh.NewInput().Title("Check Interval (seconds)").
 			Placeholder("60").
 			Value(&d.Interval).
 			Validate(func(s string) error {
 				v, err := strconv.Atoi(s)
 				if err != nil {
 					return fmt.Errorf("must be a number")
 				}
 				if v < 5 {
 					return fmt.Errorf("minimum interval is 5 seconds")
 				}
 				return nil
 			}),
 		huh.NewInput().Title("Timeout (seconds)").
 			Placeholder("5").
 			Value(&d.Timeout).
 			Validate(func(s string) error {
 				v, err := strconv.Atoi(s)
 				if err != nil {
 					return fmt.Errorf("must be a number")
 				}
 				if v < 1 || v > 300 {
 					return fmt.Errorf("timeout must be 1-300 seconds")
 				}
 				return nil
 			}),
 		huh.NewInput().Title("Max Retries Before Alert").
 			Placeholder("0").
 			Value(&d.Retries).
 			Validate(func(s string) error {
 				v, err := strconv.Atoi(s)
 				if err != nil {
 					return fmt.Errorf("must be a number")
 				}
 				if v < 0 {
 					return fmt.Errorf("retries cannot be negative")
 				}
 				return nil
 			}),
 		huh.NewSelect[string]().Title("Parent Group").
 			Options(groupOpts...).
 			Value(&d.GroupID),
 		huh.NewInput().Title("Description").
 			Placeholder("Optional description").
 			Value(&d.Description),
 		huh.NewInput().Title("Probe Regions").
 			Placeholder("us-east, eu-west (empty = all)").
 			Description("Comma-separated regions for distributed probing").
 			Value(&d.Regions),
 	)
 	if d.SiteType == "http" {
 		config = append(config,
 			huh.NewConfirm().Title("Monitor SSL Certificate?").
-				Value(&m.siteFormData.CheckSSL),
+				Value(&d.CheckSSL),
 			huh.NewInput().Title("SSL Warning Threshold (days)").
 				Placeholder("7").
-				Value(&m.siteFormData.Threshold).
+				Value(&d.Threshold).
 				Validate(func(s string) error {
-					if !m.siteFormData.CheckSSL {
+					if !d.CheckSSL {
 						return nil
 					}
 					v, err := strconv.Atoi(s)
@@ -492,30 +535,13 @@ func (m *Model) initSiteHuhForm() tea.Cmd {
 					}
 					return nil
 				}),
 			huh.NewInput().Title("Max Retries Before Alert").
 				Placeholder("0").
 				Value(&m.siteFormData.Retries).
 				Validate(func(s string) error {
 					if m.siteFormData.SiteType == "group" {
 						return nil
 					}
 					v, err := strconv.Atoi(s)
 					if err != nil {
 						return fmt.Errorf("must be a number")
 					}
 					if v < 0 {
 						return fmt.Errorf("retries cannot be negative")
 					}
 					return nil
 				}),
 			huh.NewConfirm().Title("Ignore TLS Errors?").
-				Value(&m.siteFormData.IgnoreTLS),
+				Value(&d.IgnoreTLS),
-		).Title("Advanced").WithHideFunc(func() bool {
+		)
-			return m.siteFormData.SiteType == "group"
+	}
 		}),
 	).WithTheme(m.theme.HuhTheme())
-	return m.huhForm.Init()
+	groups = append(groups, huh.NewGroup(config...).Title("Configuration"))
 	return groups
 }
 func (m *Model) submitSiteForm() tea.Cmd {
@@ -534,7 +560,7 @@ func (m *Model) submitSiteForm() tea.Cmd {
 		threshold = 7
 	}
-	site := models.Site{
+	cfg := models.SiteConfig{
 		ID:              m.editID,
 		Name:            d.Name,
 		URL:             d.URL,
@@ -558,11 +584,8 @@ func (m *Model) submitSiteForm() tea.Cmd {
 	st := m.store
 	m.state = stateDashboard
 	if m.editID > 0 {
-		// The engine's in-memory config updates immediately; the DB write
+		m.engine.UpdateSiteConfig(cfg)
-		// follows in the Cmd. New sites enter the engine via its poll loop
+		return writeCmd("Update site", func() error { return st.UpdateSite(context.Background(), cfg) })
 		// once the insert lands.
 		m.engine.UpdateSiteConfig(site)
 		return writeCmd("Update site", func() error { return st.UpdateSite(site) })
 	}
-	return writeCmd("Add site", func() error { return st.AddSite(site) })
+	return writeCmd("Add site", func() error { return st.AddSite(context.Background(), cfg) })
 }
@@ -1,6 +1,7 @@
 package tui
 import (
 	"context"
 	"fmt"
 	tea "github.com/charmbracelet/bubbletea"
@@ -118,10 +119,10 @@ func (m *Model) submitUserForm() tea.Cmd {
 	m.state = stateUsers
 	if id > 0 {
 		return writeCmd("Update user", func() error {
-			return st.UpdateUser(id, username, key, role)
+			return st.UpdateUser(context.Background(), id, username, key, role)
 		})
 	}
 	return writeCmd("Add user", func() error {
-		return st.AddUser(username, key, role)
+		return st.AddUser(context.Background(), username, key, role)
 	})
 }
@@ -5,35 +5,43 @@ import (
 	"github.com/charmbracelet/lipgloss"
 )
 // cc builds a lipgloss.CompleteColor from a hex colour and an ANSI fallback.
 // The hex value fills both the TrueColor and ANSI256 fields; ansi fills the
 // ANSI field.
 func cc(hex, ansi string) lipgloss.CompleteColor {
 	var c lipgloss.CompleteColor
 	c.TrueColor = hex
 	c.ANSI256 = hex
 	c.ANSI = ansi
 	return c
 }
 type Theme struct {
 	Name string
 	// Base layers
-	Bg      lipgloss.Color
+	Bg      lipgloss.TerminalColor
-	Surface lipgloss.Color
+	Surface lipgloss.TerminalColor
-	Panel   lipgloss.Color
+	Panel   lipgloss.TerminalColor
-	Border  lipgloss.Color
+	Border  lipgloss.TerminalColor
 	// Text
-	Fg     lipgloss.Color
+	Fg     lipgloss.TerminalColor
-	Muted  lipgloss.Color
+	Muted  lipgloss.TerminalColor
-	Subtle lipgloss.Color
+	Subtle lipgloss.TerminalColor
 	// Semantic
-	Success lipgloss.Color
+	Success lipgloss.TerminalColor
-	Warning lipgloss.Color
+	Warning lipgloss.TerminalColor
-	Stale   lipgloss.Color
+	Stale   lipgloss.TerminalColor
-	Danger  lipgloss.Color
+	Danger  lipgloss.TerminalColor
-	Info    lipgloss.Color
+	Info    lipgloss.TerminalColor
-	Accent  lipgloss.Color
+	Accent  lipgloss.TerminalColor
-	Purple  lipgloss.Color
+	Purple  lipgloss.TerminalColor
 	// Table
-	ZebraBg lipgloss.Color
+	ZebraBg lipgloss.TerminalColor
 	// Selection
-	SelectedFg lipgloss.Color
+	SelectedFg lipgloss.TerminalColor
-	SelectedBg lipgloss.Color
+	SelectedBg lipgloss.TerminalColor
 }
 var themes = []Theme{
@@ -46,107 +54,107 @@ var themes = []Theme{
 var themeFlexokiDark = Theme{
 	Name:       "Flexoki Dark",
-	Bg:         "#1C1B1A",
+	Bg:         cc("#1C1B1A", ""),
-	Surface:    "#282726",
+	Surface:    cc("#282726", ""),
-	Panel:      "#343331",
+	Panel:      cc("#343331", ""),
-	Border:     "#575653",
+	Border:     cc("#575653", "8"),
-	Fg:         "#CECDC3",
+	Fg:         cc("#CECDC3", "15"),
-	Muted:      "#878580",
+	Muted:      cc("#878580", "7"),
-	Subtle:     "#6F6E69",
+	Subtle:     cc("#6F6E69", "7"),
-	Success:    "#879A39",
+	Success:    cc("#879A39", "10"),
-	Warning:    "#D0A215",
+	Warning:    cc("#D0A215", "11"),
-	Stale:      "#DA702C",
+	Stale:      cc("#DA702C", "3"),
-	Danger:     "#D14D41",
+	Danger:     cc("#D14D41", "9"),
-	Info:       "#4385BE",
+	Info:       cc("#4385BE", "12"),
-	Accent:     "#3AA99F",
+	Accent:     cc("#3AA99F", "14"),
-	Purple:     "#8B7EC8",
+	Purple:     cc("#8B7EC8", "13"),
-	ZebraBg:    "#222120",
+	ZebraBg:    cc("#222120", ""),
-	SelectedFg: "#FFFCF0",
+	SelectedFg: cc("#FFFCF0", "15"),
-	SelectedBg: "#403E3C",
+	SelectedBg: cc("#403E3C", "4"),
 }
 var themeTokyoNight = Theme{
 	Name:       "Tokyo Night",
-	Bg:         "#1a1b26",
+	Bg:         cc("#1a1b26", ""),
-	Surface:    "#24283b",
+	Surface:    cc("#24283b", ""),
-	Panel:      "#292e42",
+	Panel:      cc("#292e42", ""),
-	Border:     "#3b4261",
+	Border:     cc("#3b4261", "8"),
-	Fg:         "#c0caf5",
+	Fg:         cc("#c0caf5", "15"),
-	Muted:      "#a9b1d6",
+	Muted:      cc("#a9b1d6", "7"),
-	Subtle:     "#565f89",
+	Subtle:     cc("#565f89", "7"),
-	Success:    "#9ece6a",
+	Success:    cc("#9ece6a", "10"),
-	Warning:    "#e0af68",
+	Warning:    cc("#e0af68", "11"),
-	Stale:      "#ff9e64",
+	Stale:      cc("#ff9e64", "3"),
-	Danger:     "#f7768e",
+	Danger:     cc("#f7768e", "9"),
-	Info:       "#7aa2f7",
+	Info:       cc("#7aa2f7", "12"),
-	Accent:     "#7dcfff",
+	Accent:     cc("#7dcfff", "14"),
-	Purple:     "#bb9af7",
+	Purple:     cc("#bb9af7", "13"),
-	ZebraBg:    "#1c1d28",
+	ZebraBg:    cc("#1c1d28", ""),
-	SelectedFg: "#c0caf5",
+	SelectedFg: cc("#c0caf5", "15"),
-	SelectedBg: "#292e42",
+	SelectedBg: cc("#292e42", "4"),
 }
 var themeGruvbox = Theme{
 	Name:       "Gruvbox",
-	Bg:         "#282828",
+	Bg:         cc("#282828", ""),
-	Surface:    "#3c3836",
+	Surface:    cc("#3c3836", ""),
-	Panel:      "#504945",
+	Panel:      cc("#504945", ""),
-	Border:     "#665c54",
+	Border:     cc("#665c54", "8"),
-	Fg:         "#ebdbb2",
+	Fg:         cc("#ebdbb2", "15"),
-	Muted:      "#bdae93",
+	Muted:      cc("#bdae93", "7"),
-	Subtle:     "#7c6f64",
+	Subtle:     cc("#7c6f64", "7"),
-	Success:    "#b8bb26",
+	Success:    cc("#b8bb26", "10"),
-	Warning:    "#fabd2f",
+	Warning:    cc("#fabd2f", "11"),
-	Stale:      "#fe8019",
+	Stale:      cc("#fe8019", "3"),
-	Danger:     "#fb4934",
+	Danger:     cc("#fb4934", "9"),
-	Info:       "#83a598",
+	Info:       cc("#83a598", "12"),
-	Accent:     "#8ec07c",
+	Accent:     cc("#8ec07c", "14"),
-	Purple:     "#d3869b",
+	Purple:     cc("#d3869b", "13"),
-	ZebraBg:    "#2a2a2a",
+	ZebraBg:    cc("#2a2a2a", ""),
-	SelectedFg: "#fbf1c7",
+	SelectedFg: cc("#fbf1c7", "15"),
-	SelectedBg: "#504945",
+	SelectedBg: cc("#504945", "4"),
 }
 var themeCatppuccinMocha = Theme{
 	Name:       "Catppuccin Mocha",
-	Bg:         "#1e1e2e",
+	Bg:         cc("#1e1e2e", ""),
-	Surface:    "#313244",
+	Surface:    cc("#313244", ""),
-	Panel:      "#45475a",
+	Panel:      cc("#45475a", ""),
-	Border:     "#585b70",
+	Border:     cc("#585b70", "8"),
-	Fg:         "#cdd6f4",
+	Fg:         cc("#cdd6f4", "15"),
-	Muted:      "#a6adc8",
+	Muted:      cc("#a6adc8", "7"),
-	Subtle:     "#6c7086",
+	Subtle:     cc("#6c7086", "7"),
-	Success:    "#a6e3a1",
+	Success:    cc("#a6e3a1", "10"),
-	Warning:    "#f9e2af",
+	Warning:    cc("#f9e2af", "11"),
-	Stale:      "#fab387",
+	Stale:      cc("#fab387", "3"),
-	Danger:     "#f38ba8",
+	Danger:     cc("#f38ba8", "9"),
-	Info:       "#89b4fa",
+	Info:       cc("#89b4fa", "12"),
-	Accent:     "#94e2d5",
+	Accent:     cc("#94e2d5", "14"),
-	Purple:     "#cba6f7",
+	Purple:     cc("#cba6f7", "13"),
-	ZebraBg:    "#232334",
+	ZebraBg:    cc("#232334", ""),
-	SelectedFg: "#cdd6f4",
+	SelectedFg: cc("#cdd6f4", "15"),
-	SelectedBg: "#45475a",
+	SelectedBg: cc("#45475a", "4"),
 }
 var themeNord = Theme{
 	Name:       "Nord",
-	Bg:         "#2e3440",
+	Bg:         cc("#2e3440", ""),
-	Surface:    "#3b4252",
+	Surface:    cc("#3b4252", ""),
-	Panel:      "#434c5e",
+	Panel:      cc("#434c5e", ""),
-	Border:     "#4c566a",
+	Border:     cc("#4c566a", "8"),
-	Fg:         "#d8dee9",
+	Fg:         cc("#d8dee9", "15"),
-	Muted:      "#d8dee9",
+	Muted:      cc("#d8dee9", "7"),
-	Subtle:     "#4c566a",
+	Subtle:     cc("#4c566a", "7"),
-	Success:    "#a3be8c",
+	Success:    cc("#a3be8c", "10"),
-	Warning:    "#ebcb8b",
+	Warning:    cc("#ebcb8b", "11"),
-	Stale:      "#d08770",
+	Stale:      cc("#d08770", "3"),
-	Danger:     "#bf616a",
+	Danger:     cc("#bf616a", "9"),
-	Info:       "#81a1c1",
+	Info:       cc("#81a1c1", "12"),
-	Accent:     "#88c0d0",
+	Accent:     cc("#88c0d0", "14"),
-	Purple:     "#b48ead",
+	Purple:     cc("#b48ead", "13"),
-	ZebraBg:    "#323845",
+	ZebraBg:    cc("#323845", ""),
-	SelectedFg: "#eceff4",
+	SelectedFg: cc("#eceff4", "15"),
-	SelectedBg: "#434c5e",
+	SelectedBg: cc("#434c5e", "4"),
 }
 func (t Theme) HuhTheme() *huh.Theme {
@@ -1,6 +1,7 @@
 package tui
 import (
 	"context"
 	"os"
 	"time"
@@ -29,9 +30,9 @@ type styles struct {
 	activeTab    lipgloss.Style
 	inactiveTab  lipgloss.Style
-	sparkSuccess string
+	sparkSuccess lipgloss.TerminalColor
-	sparkWarning string
+	sparkWarning lipgloss.TerminalColor
-	sparkDanger  string
+	sparkDanger  lipgloss.TerminalColor
 	tableHeaderStyle   lipgloss.Style
 	tableCellStyle     lipgloss.Style
@@ -45,23 +46,23 @@ type styles struct {
 func newStyles(t Theme) *styles {
 	return &styles{
-		subtleStyle:  lipgloss.NewStyle().Foreground(t.Subtle),
+		subtleStyle:  lipgloss.NewStyle().Foreground(t.Subtle).Faint(true),
 		specialStyle: lipgloss.NewStyle().Foreground(t.Success),
-		warnStyle:    lipgloss.NewStyle().Foreground(t.Warning),
+		warnStyle:    lipgloss.NewStyle().Foreground(t.Warning).Bold(true),
-		staleStyle:   lipgloss.NewStyle().Foreground(t.Stale),
+		staleStyle:   lipgloss.NewStyle().Foreground(t.Stale).Faint(true),
-		dangerStyle:  lipgloss.NewStyle().Foreground(t.Danger),
+		dangerStyle:  lipgloss.NewStyle().Foreground(t.Danger).Bold(true),
 		titleStyle:   lipgloss.NewStyle().Foreground(t.Accent).Bold(true),
 		activeTab:    lipgloss.NewStyle().Background(t.Surface).Foreground(t.Accent).Bold(true).Padding(0, 1),
-		inactiveTab:  lipgloss.NewStyle().Padding(0, 1).Foreground(t.Muted),
+		inactiveTab:  lipgloss.NewStyle().Padding(0, 1).Foreground(t.Muted).Faint(true),
-		sparkSuccess: string(t.Success),
+		sparkSuccess: t.Success,
-		sparkWarning: string(t.Warning),
+		sparkWarning: t.Warning,
-		sparkDanger:  string(t.Danger),
+		sparkDanger:  t.Danger,
 		tableHeaderStyle:   lipgloss.NewStyle().Foreground(t.Accent).Bold(true).Padding(0, 1),
 		tableCellStyle:     lipgloss.NewStyle().Padding(0, 1),
 		tableSelectedStyle: lipgloss.NewStyle().Padding(0, 1).Bold(true).Foreground(t.SelectedFg).Background(t.SelectedBg),
-		tableBorderStyle:   lipgloss.NewStyle().Foreground(t.Border),
+		tableBorderStyle:   lipgloss.NewStyle().Foreground(t.Border).Faint(true),
 		tableZebraStyle:    lipgloss.NewStyle().Padding(0, 1).Background(t.ZebraBg),
 		siteGroupStyle: lipgloss.NewStyle().Padding(0, 1).Bold(true).Foreground(t.Accent),
@@ -79,6 +80,8 @@ const (
 	chromeFooter = 2 // footer: "\n" prefix + text line
 	chromeTable  = 3 // renderTable "\n" prefix + top border + header + bottom border (lipgloss collapses two into three rendered lines)
 	chromeBase   = chromePadV + chromeHeader + chromeGaps + chromeFooter + chromeTable
 	detailSparkWidth = 40
 )
 type sessionState int
@@ -102,6 +105,7 @@ type Model struct {
 	state        sessionState
 	currentTab   int
 	cursor       int
 	selectedID   int
 	tableOffset  int
 	maxTableRows int
 	termWidth    int
@@ -111,12 +115,15 @@ type Model struct {
 	huhForm       *huh.Form
 	siteFormData  *siteFormData
 	lastSiteType  string
 	alertFormData *alertFormData
 	userFormData  *userFormData
 	maintFormData *maintFormData
 	logViewport        viewport.Model
 	logFilterImportant bool
 	logTotal           int
 	logShown           int
 	historyViewport viewport.Model
 	historyChanges  []models.StateChange
@@ -180,7 +187,7 @@ func InitialModel(isAdmin bool, s store.Store, eng *monitor.Engine, version stri
 	spring := harmonica.NewSpring(harmonica.FPS(10), 6.0, 0.4)
 	collapsed := loadCollapsed(s)
-	themeName, _ := s.GetPreference("theme")
+	themeName, _ := s.GetPreference(context.Background(), "theme")
 	theme := themeByName(themeName)
 	themeIdx := 0
 	for i, t := range themes {
@@ -1,6 +1,7 @@
 package tui
 import (
 	"context"
 	"fmt"
 	"time"
@@ -78,17 +79,17 @@ func (m *Model) handleConfirmDelete(msg tea.Msg) (tea.Model, tea.Cmd) {
 		var cmd tea.Cmd
 		switch m.deleteTab {
 		case 0:
-			cmd = writeCmd("Delete site", func() error { return st.DeleteSite(id) })
+			cmd = writeCmd("Delete site", func() error { return st.DeleteSite(context.Background(), id) })
 			m.engine.RemoveSite(id)
 			m.adjustCursor(len(m.sites) - 1)
 		case 1:
-			cmd = writeCmd("Delete alert", func() error { return st.DeleteAlert(id) })
+			cmd = writeCmd("Delete alert", func() error { return st.DeleteAlert(context.Background(), id) })
 			m.adjustCursor(len(m.alerts) - 1)
 		case 4:
-			cmd = writeCmd("Delete maintenance window", func() error { return st.DeleteMaintenanceWindow(id) })
+			cmd = writeCmd("Delete maintenance window", func() error { return st.DeleteMaintenanceWindow(context.Background(), id) })
 			m.adjustCursor(len(m.maintenanceWindows) - 1)
 		case 5:
-			cmd = writeCmd("Delete user", func() error { return st.DeleteUser(id) })
+			cmd = writeCmd("Delete user", func() error { return st.DeleteUser(context.Background(), id) })
 			m.adjustCursor(len(m.users) - 1)
 		}
 		m.refreshLive()
@@ -109,10 +110,6 @@ func (m *Model) handleConfirmDelete(msg tea.Msg) (tea.Model, tea.Cmd) {
 }
 func (m *Model) handleFormMsg(msg tea.Msg) (tea.Model, tea.Cmd) {
 	if wsm, ok := msg.(tea.WindowSizeMsg); ok {
 		m.termWidth = wsm.Width
 		m.termHeight = wsm.Height
 	}
 	if keyMsg, ok := msg.(tea.KeyMsg); ok {
 		if keyMsg.String() == "ctrl+c" {
 			return m, tea.Quit
@@ -131,6 +128,13 @@ func (m *Model) handleFormMsg(msg tea.Msg) (tea.Model, tea.Cmd) {
 		if f, ok := form.(*huh.Form); ok {
 			m.huhForm = f
 		}
 		if m.state == stateFormSite && m.siteFormData != nil &&
 			m.siteFormData.SiteType != m.lastSiteType {
 			rebuildCmd := m.rebuildSiteForm()
 			// Advance to Type select — user just changed it.
 			skipName := m.huhForm.NextField()
 			return m, tea.Batch(rebuildCmd, skipName)
 		}
 		if m.huhForm.State == huh.StateCompleted {
 			// The store write runs in the returned Cmd; its writeDoneMsg
 			// triggers the tab-data reload once the row actually exists.
@@ -144,24 +148,35 @@ func (m *Model) handleFormMsg(msg tea.Msg) (tea.Model, tea.Cmd) {
 	return m, nil
 }
-func (m *Model) handleResize(msg tea.WindowSizeMsg) (tea.Model, tea.Cmd) {
+func (m *Model) recalcLayout() {
 	m.termWidth = msg.Width
 	m.termHeight = msg.Height
 	chrome := chromeBase
 	if m.filterMode || m.filterText != "" {
 		chrome++
 	}
-	m.maxTableRows = msg.Height - chrome
+	m.maxTableRows = m.termHeight - chrome
 	if m.maxTableRows < 1 {
 		m.maxTableRows = 1
 	}
 }
 func (m *Model) handleResize(msg tea.WindowSizeMsg) (tea.Model, tea.Cmd) {
 	m.termWidth = msg.Width
 	m.termHeight = msg.Height
 	m.recalcLayout()
 	m.logViewport.Width = msg.Width - chromePadH
 	m.logViewport.Height = msg.Height - (chromePadV + chromeHeader + chromeFooter + 2)
 	m.historyViewport.Width = msg.Width - chromePadH
 	m.historyViewport.Height = msg.Height - 10
 	m.slaViewport.Width = msg.Width - chromePadH
 	m.slaViewport.Height = msg.Height - 16
-	return m, tea.ClearScreen
+	if m.huhForm != nil {
 		formHeight := msg.Height - 7
 		if formHeight < 5 {
 			formHeight = 5
 		}
 		m.huhForm.WithHeight(formHeight)
 	}
 	return m, nil
 }
 func (m *Model) handleTick(t time.Time) (tea.Model, tea.Cmd) {
@@ -285,6 +300,7 @@ func (m *Model) handleMouse(msg tea.MouseMsg) (tea.Model, tea.Cmd) {
 			}
 		}
 	}
 	m.syncSelectedID()
 	return m, nil
 }
@@ -322,9 +338,11 @@ func (m *Model) handleFilterKey(msg tea.KeyMsg) (tea.Model, tea.Cmd) {
 		m.filterText = ""
 		m.cursor = 0
 		m.tableOffset = 0
 		m.recalcLayout()
 		m.refreshLive()
 	case "enter":
 		m.filterMode = false
 		m.recalcLayout()
 	case "backspace":
 		if len(m.filterText) > 0 {
 			m.filterText = m.filterText[:len(m.filterText)-1]
@@ -335,8 +353,8 @@ func (m *Model) handleFilterKey(msg tea.KeyMsg) (tea.Model, tea.Cmd) {
 	case "ctrl+c":
 		return m, tea.Quit
 	default:
-		if len(msg.String()) == 1 {
+		if len(msg.Runes) == 1 {
-			m.filterText += msg.String()
+			m.filterText += string(msg.Runes)
 			m.cursor = 0
 			m.tableOffset = 0
 			m.refreshLive()
@@ -378,7 +396,7 @@ func (m *Model) handleDetailKey(msg tea.KeyMsg) (tea.Model, tea.Cmd) {
 			return m, m.openSLAView(m.sites[m.cursor])
 		}
 	case "q":
-		return m, tea.Quit
+		m.state = stateDashboard
 	}
 	return m, nil
 }
@@ -390,16 +408,14 @@ func (m *Model) handleSparklineClick(msg tea.MouseMsg) (tea.Model, tea.Cmd) {
 	site := m.sites[m.cursor]
 	hist, _ := m.engine.GetHistory(site.ID)
 	const sparkWidth = 40
 	if zi := m.zones.Get("spark-latency"); zi != nil && !zi.IsZero() && zi.InBounds(msg) {
 		x, _ := zi.Pos(msg)
-		m.sparkTooltipIdx = resolveSparklineIndex(x, sparkWidth, len(hist.Latencies))
+		m.sparkTooltipIdx = resolveSparklineIndex(x, detailSparkWidth, len(hist.Latencies))
 		return m, nil
 	}
 	if zi := m.zones.Get("spark-heartbeat"); zi != nil && !zi.IsZero() && zi.InBounds(msg) {
 		x, _ := zi.Pos(msg)
-		m.sparkTooltipIdx = resolveSparklineIndex(x, sparkWidth, len(hist.Statuses))
+		m.sparkTooltipIdx = resolveSparklineIndex(x, detailSparkWidth, len(hist.Statuses))
 		return m, nil
 	}
@@ -454,7 +470,7 @@ func (m *Model) handleSLAData(msg slaDataMsg) (tea.Model, tea.Cmd) {
 	}
 	period := slaPeriods[msg.periodIdx]
-	var currentStatus string
+	var currentStatus models.Status
 	for _, s := range m.sites {
 		if s.ID == msg.siteID {
 			currentStatus = s.Status
@@ -498,10 +514,8 @@ func (m *Model) handleHistoryKey(msg tea.KeyMsg) (tea.Model, tea.Cmd) {
 func (m *Model) handleAlertDetailKey(msg tea.KeyMsg) (tea.Model, tea.Cmd) {
 	switch msg.String() {
-	case "i", "esc":
+	case "q", "i", "esc":
 		m.state = stateDashboard
 	case "q":
 		return m, tea.Quit
 	}
 	return m, nil
 }
@@ -514,11 +528,13 @@ func (m *Model) handleDashboardKey(msg tea.KeyMsg) (tea.Model, tea.Cmd) {
 	case "/":
 		if m.currentTab == 0 {
 			m.filterMode = true
 			m.recalcLayout()
 			return m, nil
 		}
 	case "f":
 		if m.state == stateLogs {
 			m.logFilterImportant = !m.logFilterImportant
 			m.refreshLogContent()
 			return m, nil
 		}
 	case "tab":
@@ -536,6 +552,7 @@ func (m *Model) handleDashboardKey(msg tea.KeyMsg) (tea.Model, tea.Cmd) {
 			if m.cursor < m.tableOffset {
 				m.tableOffset = m.cursor
 			}
 			m.syncSelectedID()
 		}
 	case "down", "j":
 		if m.state == stateLogs {
@@ -547,6 +564,7 @@ func (m *Model) handleDashboardKey(msg tea.KeyMsg) (tea.Model, tea.Cmd) {
 				if m.cursor >= m.tableOffset+m.maxTableRows {
 					m.tableOffset++
 				}
 				m.syncSelectedID()
 			}
 		}
 	case "n":
@@ -566,7 +584,7 @@ func (m *Model) handleDashboardKey(msg tea.KeyMsg) (tea.Model, tea.Cmd) {
 			st := m.store
 			m.refreshLive()
 			return m, writeCmd("Save collapsed groups", func() error {
-				return st.SetPreference("collapsed_groups", payload)
+				return st.SetPreference(context.Background(), "collapsed_groups", payload)
 			})
 		}
 	case "p":
@@ -576,7 +594,7 @@ func (m *Model) handleDashboardKey(msg tea.KeyMsg) (tea.Model, tea.Cmd) {
 			st := m.store
 			m.refreshLive()
 			return m, writeCmd("Update pause state", func() error {
-				return st.UpdateSitePaused(id, paused)
+				return st.UpdateSitePaused(context.Background(), id, paused)
 			})
 		}
 	case "i":
@@ -596,7 +614,7 @@ func (m *Model) handleDashboardKey(msg tea.KeyMsg) (tea.Model, tea.Cmd) {
 				id := mw.ID
 				m.refreshLive()
 				return m, writeCmd("End maintenance", func() error {
-					return st.EndMaintenanceWindow(id)
+					return st.EndMaintenanceWindow(context.Background(), id)
 				})
 			}
 		}
@@ -607,9 +625,9 @@ func (m *Model) handleDashboardKey(msg tea.KeyMsg) (tea.Model, tea.Cmd) {
 		st := m.store
 		name := m.theme.Name
 		return m, writeCmd("Save theme", func() error {
-			return st.SetPreference("theme", name)
+			return st.SetPreference(context.Background(), "theme", name)
 		})
-	case "d", "backspace":
+	case "d":
 		return m.handleDeleteItem()
 	}
 	return m, nil
@@ -716,6 +734,7 @@ func (m *Model) handleClick(msg tea.MouseMsg) (tea.Model, tea.Cmd) {
 	for i := m.tableOffset; i < end; i++ {
 		if m.zones.Get(fmt.Sprintf("%s-%d", prefix, i)).InBounds(msg) {
 			m.cursor = i
 			m.syncSelectedID()
 			return m, nil
 		}
 	}
@@ -744,16 +763,8 @@ func (m *Model) switchTab(idx int) {
 	}
 }
-func (m *Model) adjustCursor(newLen int) {
+func (m *Model) adjustCursor(_ int) {
-	if m.cursor >= newLen && m.cursor > 0 {
+	m.clampCursor()
 		m.cursor--
 	}
 	if m.cursor < m.tableOffset {
 		m.tableOffset = m.cursor
 		if m.tableOffset < 0 {
 			m.tableOffset = 0
 		}
 	}
 }
 func (m *Model) submitForm() tea.Cmd {
@@ -1,12 +1,14 @@
 package tui
 import (
 	"context"
 	"strings"
 	"testing"
 	"time"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/monitor"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/store/storetest"
 	tea "github.com/charmbracelet/bubbletea"
 	zone "github.com/lrstanley/bubblezone"
 )
@@ -14,89 +16,34 @@ import (
 // --- minimal Store mock for TUI data-flow tests ---
 type tuiMockStore struct {
 	storetest.BaseMock
 	alerts           []models.AlertConfig
 	users            []models.User
 	nodes            []models.ProbeNode
 	maint            []models.MaintenanceWindow
 	stateChanges     []models.StateChange
-	stateChangeCalls int // counts GetStateChanges hits (to prove View does no IO)
+	stateChangeCalls int
-	deleteSiteCalls  int // counts DeleteSite hits (to prove writes run in Cmds)
+	deleteSiteCalls  int
 }
-func (m *tuiMockStore) GetAllAlerts() ([]models.AlertConfig, error) { return m.alerts, nil }
+func (m *tuiMockStore) GetAllAlerts(_ context.Context) ([]models.AlertConfig, error) {
-func (m *tuiMockStore) GetAllUsers() ([]models.User, error)         { return m.users, nil }
+	return m.alerts, nil
-func (m *tuiMockStore) GetAllNodes() ([]models.ProbeNode, error)    { return m.nodes, nil }
+}
-func (m *tuiMockStore) GetStateChanges(int, int) ([]models.StateChange, error) {
+func (m *tuiMockStore) GetAllUsers(_ context.Context) ([]models.User, error) { return m.users, nil }
 func (m *tuiMockStore) GetAllNodes(_ context.Context) ([]models.ProbeNode, error) {
 	return m.nodes, nil
 }
 func (m *tuiMockStore) GetStateChanges(_ context.Context, _ int, _ int) ([]models.StateChange, error) {
 	m.stateChangeCalls++
 	return m.stateChanges, nil
 }
-func (m *tuiMockStore) GetAllMaintenanceWindows(int) ([]models.MaintenanceWindow, error) {
+func (m *tuiMockStore) GetAllMaintenanceWindows(_ context.Context, _ int) ([]models.MaintenanceWindow, error) {
 	return m.maint, nil
 }
-
+func (m *tuiMockStore) DeleteSite(_ context.Context, _ int) error {
 func (m *tuiMockStore) Init() error                      { return nil }
 func (m *tuiMockStore) GetSites() ([]models.Site, error) { return nil, nil }
 func (m *tuiMockStore) AddSite(models.Site) error        { return nil }
 func (m *tuiMockStore) UpdateSite(models.Site) error     { return nil }
 func (m *tuiMockStore) UpdateSitePaused(int, bool) error { return nil }
 func (m *tuiMockStore) DeleteSite(int) error {
 	m.deleteSiteCalls++
 	return nil
 }
 func (m *tuiMockStore) GetAlert(int) (models.AlertConfig, error)                 { return models.AlertConfig{}, nil }
 func (m *tuiMockStore) AddAlert(string, string, map[string]string) error         { return nil }
 func (m *tuiMockStore) UpdateAlert(int, string, string, map[string]string) error { return nil }
 func (m *tuiMockStore) DeleteAlert(int) error                                    { return nil }
 func (m *tuiMockStore) GetSiteByName(string) (models.Site, error)                { return models.Site{}, nil }
 func (m *tuiMockStore) GetAlertByName(string) (models.AlertConfig, error) {
 	return models.AlertConfig{}, nil
 }
 func (m *tuiMockStore) AddSiteReturningID(models.Site) (int, error) { return 0, nil }
 func (m *tuiMockStore) AddAlertReturningID(string, string, map[string]string) (int, error) {
 	return 0, nil
 }
 func (m *tuiMockStore) AddUser(string, string, string) error         { return nil }
 func (m *tuiMockStore) UpdateUser(int, string, string, string) error { return nil }
 func (m *tuiMockStore) DeleteUser(int) error                         { return nil }
 func (m *tuiMockStore) SaveCheck(int, int64, bool) error             { return nil }
 func (m *tuiMockStore) SaveCheckFromNode(int, string, int64, bool) error {
 	return nil
 }
 func (m *tuiMockStore) LoadAllHistory(int) (map[int][]models.CheckRecord, error) {
 	return nil, nil
 }
 func (m *tuiMockStore) PruneCheckHistory() error                          { return nil }
 func (m *tuiMockStore) SaveStateChange(int, string, string, string) error { return nil }
 func (m *tuiMockStore) GetStateChangesSince(int, time.Time) ([]models.StateChange, error) {
 	return nil, nil
 }
 func (m *tuiMockStore) PruneStateChanges() error                 { return nil }
 func (m *tuiMockStore) RegisterNode(models.ProbeNode) error      { return nil }
 func (m *tuiMockStore) GetNode(string) (models.ProbeNode, error) { return models.ProbeNode{}, nil }
 func (m *tuiMockStore) UpdateNodeLastSeen(string) error          { return nil }
 func (m *tuiMockStore) DeleteNode(string) error                  { return nil }
 func (m *tuiMockStore) LoadAlertHealth() (map[int]models.AlertHealthRecord, error) {
 	return nil, nil
 }
 func (m *tuiMockStore) SaveAlertHealth(models.AlertHealthRecord) error { return nil }
 func (m *tuiMockStore) SaveLog(string) error                           { return nil }
 func (m *tuiMockStore) LoadLogs(int) ([]string, error)                 { return nil, nil }
 func (m *tuiMockStore) PruneLogs() error                               { return nil }
 func (m *tuiMockStore) GetActiveMaintenanceWindows() ([]models.MaintenanceWindow, error) {
 	return nil, nil
 }
 func (m *tuiMockStore) AddMaintenanceWindow(models.MaintenanceWindow) error { return nil }
 func (m *tuiMockStore) EndMaintenanceWindow(int) error                      { return nil }
 func (m *tuiMockStore) DeleteMaintenanceWindow(int) error                   { return nil }
 func (m *tuiMockStore) PruneExpiredMaintenanceWindows(time.Duration) (int64, error) {
 	return 0, nil
 }
 func (m *tuiMockStore) IsMonitorInMaintenance(int) (bool, error) { return false, nil }
 func (m *tuiMockStore) GetPreference(string) (string, error)     { return "", nil }
 func (m *tuiMockStore) SetPreference(string, string) error       { return nil }
 func (m *tuiMockStore) ExportData() (models.Backup, error)       { return models.Backup{}, nil }
 func (m *tuiMockStore) ImportData(models.Backup) error           { return nil }
 func (m *tuiMockStore) Close() error                             { return nil }
 func newTestModel(ms *tuiMockStore) Model {
 	return Model{
@@ -169,7 +116,7 @@ func (*stubErr) Error() string { return "boom" }
 func TestDetailLoad_CachesAndViewDoesNoIO(t *testing.T) {
 	ms := &tuiMockStore{stateChanges: []models.StateChange{{FromStatus: "UP", ToStatus: "DOWN"}}}
 	m := newTestModel(ms)
-	m.sites = []models.Site{{ID: 1, Name: "site", Status: "DOWN"}}
+	m.sites = []models.Site{{SiteConfig: models.SiteConfig{ID: 1, Name: "site"}, SiteState: models.SiteState{Status: "DOWN"}}}
 	m.cursor = 0
 	m.state = stateDetail
 	m.termWidth = 120
@@ -254,7 +201,7 @@ func TestHandleTabData_DropsStaleSeq(t *testing.T) {
 func TestHistoryKey_LoadsOffUIGoroutine(t *testing.T) {
 	ms := &tuiMockStore{stateChanges: []models.StateChange{{FromStatus: "UP", ToStatus: "DOWN"}}}
 	m := newTestModel(ms)
-	m.sites = []models.Site{{ID: 7, Name: "site"}}
+	m.sites = []models.Site{{SiteConfig: models.SiteConfig{ID: 7, Name: "site"}}}
 	m.state = stateDetail
 	m.termWidth, m.termHeight = 120, 40
@@ -293,7 +240,7 @@ func TestHistoryKey_LoadsOffUIGoroutine(t *testing.T) {
 func TestSLAData_DropsStaleReply(t *testing.T) {
 	m := newTestModel(&tuiMockStore{})
 	m.termWidth, m.termHeight = 120, 40
-	m.sites = []models.Site{{ID: 3, Status: "UP"}}
+	m.sites = []models.Site{{SiteConfig: models.SiteConfig{ID: 3}, SiteState: models.SiteState{Status: "UP"}}}
 	if cmd := (&m).openSLAView(m.sites[0]); cmd == nil {
 		t.Fatal("openSLAView should return a load Cmd")
@@ -317,7 +264,7 @@ func TestSLAData_DropsStaleReply(t *testing.T) {
 func TestConfirmDelete_WritesOffUIGoroutine(t *testing.T) {
 	ms := &tuiMockStore{}
 	m := newTestModel(ms)
-	m.sites = []models.Site{{ID: 4, Name: "s"}}
+	m.sites = []models.Site{{SiteConfig: models.SiteConfig{ID: 4, Name: "s"}}}
 	m.state = stateConfirmDelete
 	m.deleteTab = 0
 	m.deleteID = 4
@@ -365,7 +312,7 @@ func TestWriteDoneMsg_LogsErrorAndReloads(t *testing.T) {
 func TestDetailRefreshCmd_OnlyWhileDetailOpen(t *testing.T) {
 	ms := &tuiMockStore{stateChanges: []models.StateChange{{FromStatus: "UP", ToStatus: "DOWN"}}}
 	m := newTestModel(ms)
-	m.sites = []models.Site{{ID: 5, Name: "site"}}
+	m.sites = []models.Site{{SiteConfig: models.SiteConfig{ID: 5, Name: "site"}}}
 	m.state = stateDashboard
 	if (&m).detailRefreshCmd() != nil {
@@ -6,6 +6,7 @@ import (
 	"strings"
 	"time"
 	"gitea.lerkolabs.com/lerkolabs/uptop/internal/models"
 	"github.com/charmbracelet/lipgloss"
 )
@@ -16,7 +17,7 @@ func sinApprox(x float64) float64 {
 func (m Model) pulseIndicator() string {
 	hasDown := false
 	for _, s := range m.sites {
-		if !s.Paused && !m.isMonitorInMaintenance(s.ID) && (s.Status == "DOWN" || s.Status == "SSL EXP") {
+		if !s.Paused && !m.isMonitorInMaintenance(s.ID) && (s.Status == models.StatusDown || s.Status == models.StatusSSLExp) {
 			hasDown = true
 			break
 		}
@@ -84,11 +85,6 @@ func (m Model) View() string {
 			case stateFormMaint:
 				title = "New Maintenance Window"
 			}
 			formHeight := m.termHeight - 7
 			if formHeight < 5 {
 				formHeight = 5
 			}
 			m.huhForm.WithHeight(formHeight)
 			header := m.st.titleStyle.Render(title)
 			footer := m.st.subtleStyle.Render("\n[Esc] Cancel")
 			return lipgloss.NewStyle().Padding(1, 2).Render(header + "\n\n" + m.huhForm.View() + "\n" + footer)
@@ -127,9 +123,9 @@ func (m Model) computeStats() dashboardStats {
 			continue
 		}
 		switch site.Status {
-		case "DOWN", "SSL EXP":
+		case models.StatusDown, models.StatusSSLExp:
 			s.downCount++
-		case "LATE":
+		case models.StatusLate:
 			s.lateCount++
 		}
 	}
@@ -269,7 +265,7 @@ func (m Model) renderFooter(stats dashboardStats) string {
 	var keys string
 	switch m.currentTab {
 	case 0:
-		keys = "[/]Filter [n]New [e]Edit [i]Info [d]Del [p]Pause [T]Theme [Tab]Switch [q]Quit"
+		keys = "[/]Filter [n]New [e]Edit [i]Info [d]Del [p]Pause [Space]Collapse [T]Theme [Tab]Switch [q]Quit"
 	case 1:
 		keys = "[n]New [e]Edit [i]Info [d]Del [t]Test [T]Theme [Tab]Switch [q]Quit"
 	case 2:
@@ -2,6 +2,7 @@ package tui
 import (
 	"fmt"
 	"sort"
 	"strconv"
 	"strings"
 	"time"
@@ -45,7 +46,7 @@ func (m Model) viewDetailPanel() string {
 	row("Status", m.fmtStatus(site.Status, site.Paused, m.isMonitorInMaintenance(site.ID)))
-	if (site.Status == "DOWN" || site.Status == "SSL EXP" || site.Status == "LATE" || site.Status == "STALE") && site.LastError != "" {
+	if (site.Status == models.StatusDown || site.Status == models.StatusSSLExp || site.Status == models.StatusLate || site.Status == models.StatusStale) && site.LastError != "" {
 		errWidth := m.termWidth - chromePadH - 19
 		if errWidth < 30 {
 			errWidth = 30
@@ -58,7 +59,7 @@ func (m Model) viewDetailPanel() string {
 		row("HTTP Code", strconv.Itoa(site.StatusCode))
 	}
-	if (site.Status == "DOWN" || site.Status == "SSL EXP") && site.LastError != "" {
+	if (site.Status == models.StatusDown || site.Status == models.StatusSSLExp) && site.LastError != "" {
 		chain := connectionChain(site.LastError, site.Type, site.StatusCode, strings.HasPrefix(site.URL, "https"))
 		if len(chain) > 0 {
 			b.WriteString("\n")
@@ -163,8 +164,14 @@ func (m Model) viewDetailPanel() string {
 	probeResults := m.engine.GetProbeResults(site.ID)
 	if len(probeResults) > 0 {
 		nodeIDs := make([]string, 0, len(probeResults))
 		for id := range probeResults {
 			nodeIDs = append(nodeIDs, id)
 		}
 		sort.Strings(nodeIDs)
 		b.WriteString("\n" + m.st.subtleStyle.Render("  PROBE RESULTS") + "\n")
-		for nodeID, result := range probeResults {
+		for _, nodeID := range nodeIDs {
 			result := probeResults[nodeID]
 			status := m.st.specialStyle.Render("UP")
 			if !result.IsUp {
 				status = m.st.dangerStyle.Render("DN")
@@ -189,7 +196,7 @@ func (m Model) viewDetailPanel() string {
 		for i, sc := range stateChanges {
 			ago := fmtDuration(time.Since(sc.ChangedAt))
 			arrow := m.st.subtleStyle.Render(sc.FromStatus) + " → "
-			if sc.ToStatus == "UP" {
+			if sc.ToStatus == string(models.StatusUp) {
 				arrow += m.st.specialStyle.Render(sc.ToStatus)
 			} else {
 				arrow += m.st.dangerStyle.Render(sc.ToStatus)
@@ -198,7 +205,7 @@ func (m Model) viewDetailPanel() string {
 			if dur := computeOutageDuration(stateChanges, i); dur > 0 {
 				line += "  " + m.st.warnStyle.Render("outage "+fmtDuration(dur))
 			}
-			if sc.ErrorReason != "" && sc.ToStatus != "UP" {
+			if sc.ErrorReason != "" && sc.ToStatus != string(models.StatusUp) {
 				line += "  " + m.st.dangerStyle.Render(sc.ErrorReason)
 			}
 			b.WriteString(line + "\n")
@@ -207,9 +214,8 @@ func (m Model) viewDetailPanel() string {
 	}
 	b.WriteString(m.divider() + "\n")
 	const sparkWidth = 40
 	if site.Type == "push" {
-		b.WriteString("  " + m.zones.Mark("spark-heartbeat", m.heartbeatSparkline(hist.Statuses, sparkWidth, "")))
+		b.WriteString("  " + m.zones.Mark("spark-heartbeat", m.heartbeatSparkline(hist.Statuses, detailSparkWidth, nil)))
 		if len(hist.Statuses) > 0 {
 			up := 0
 			for _, s := range hist.Statuses {
@@ -222,7 +228,7 @@ func (m Model) viewDetailPanel() string {
 				up, len(hist.Statuses))
 		}
 	} else {
-		b.WriteString("  " + m.zones.Mark("spark-latency", m.latencySparkline(hist.Latencies, hist.Statuses, sparkWidth, "")))
+		b.WriteString("  " + m.zones.Mark("spark-latency", m.latencySparkline(hist.Latencies, hist.Statuses, detailSparkWidth, nil)))
 		var minL, maxL, total time.Duration
 		count := 0
 		for i, l := range hist.Latencies {
@@ -249,12 +255,12 @@ func (m Model) viewDetailPanel() string {
 	}
 	if m.sparkTooltipIdx >= 0 {
-		b.WriteString("\n" + m.renderSparkTooltip(site, hist, sparkWidth))
+		b.WriteString("\n" + m.renderSparkTooltip(site, hist, detailSparkWidth))
 	}
 	b.WriteString("\n")
 	b.WriteString(m.divider() + "\n")
-	b.WriteString(m.st.subtleStyle.Render("  [i/Esc] Back  [e] Edit  [h] History  [s] SLA  [click] Inspect  [q] Quit"))
+	b.WriteString(m.st.subtleStyle.Render("  [q/Esc] Back  [e] Edit  [h] History  [s] SLA  [click] Inspect"))
 	return lipgloss.NewStyle().Padding(1, 2).Render(b.String())
 }
@@ -17,14 +17,14 @@ type historyStats struct {
 func computeOutageDuration(changes []models.StateChange, idx int) time.Duration {
 	sc := changes[idx]
-	if sc.ToStatus != "UP" {
+	if sc.ToStatus != string(models.StatusUp) {
 		return 0
 	}
 	if idx+1 >= len(changes) {
 		return 0
 	}
 	prev := changes[idx+1]
-	if prev.ToStatus == "UP" {
+	if prev.ToStatus == string(models.StatusUp) {
 		return 0
 	}
 	dur := sc.ChangedAt.Sub(prev.ChangedAt)
@@ -122,11 +122,11 @@ func (m Model) buildHistoryContent() string {
 		arrow := m.st.subtleStyle.Render(sc.FromStatus) + " → "
 		switch sc.ToStatus {
-		case "UP":
+		case string(models.StatusUp):
 			arrow += m.st.specialStyle.Render(sc.ToStatus)
-		case "LATE":
+		case string(models.StatusLate):
 			arrow += m.st.warnStyle.Render(sc.ToStatus)
-		case "STALE":
+		case string(models.StatusStale):
 			arrow += m.st.staleStyle.Render(sc.ToStatus)
 		default:
 			arrow += m.st.dangerStyle.Render(sc.ToStatus)
@@ -138,7 +138,7 @@ func (m Model) buildHistoryContent() string {
 		}
 		reason := ""
-		if sc.ErrorReason != "" && sc.ToStatus != "UP" {
+		if sc.ErrorReason != "" && sc.ToStatus != string(models.StatusUp) {
 			reason = m.st.dangerStyle.Render(limitStr(sc.ErrorReason, reasonWidth))
 		}