1 Commit

Author SHA1 Message Date
3f7a4c2255 test: image-pull validation (one good, one bad)
Some checks failed
CI / Terraform fmt + validate (pull_request) Successful in 21s
CI / Nomad job spec validate (pull_request) Successful in 22s
CI / Docker image pull validation (pull_request) Failing after 16s
2026-04-19 18:20:20 +10:00
15 changed files with 14 additions and 66 deletions

View File

@@ -58,10 +58,8 @@ job "pgadmin" {
] ]
check { check {
name = "alive"
type = "http" type = "http"
path = "/" path = "/"
port = "http"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
} }

View File

@@ -7,10 +7,6 @@ job "postgres" {
connect { connect {
sidecar_service {} sidecar_service {}
} }
# Note: TCP checks are not valid for Connect-enabled services (runs through
# Envoy sidecar). Postgres is a single-writer DB that we never canary, so
# observable health via Consul is lower priority than other services.
} }
task "postgres" { task "postgres" {

View File

@@ -33,10 +33,8 @@ job "authelia" {
} }
check { check {
name = "alive"
type = "http" type = "http"
path = "/health" path = "/health"
port = "http"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
} }

View File

@@ -35,8 +35,7 @@ job "traefik" {
check { check {
name = "alive" name = "alive"
type = "http" type = "tcp"
path = "/ping"
port = "api" port = "api"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
@@ -86,9 +85,6 @@ api:
dashboard: true dashboard: true
insecure: true insecure: true
ping:
entryPoint: traefik
providers: providers:
file: file:
directory: "/etc/traefik/configs/" directory: "/etc/traefik/configs/"

View File

@@ -54,10 +54,8 @@ EOH
] ]
check { check {
name = "alive"
type = "http" type = "http"
path = "/" path = "/"
port = "http"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
} }
@@ -80,10 +78,8 @@ EOH
} }
check { check {
name = "alive"
type = "http" type = "http"
path = "/" path = "/"
port = "http"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
} }

View File

@@ -32,10 +32,8 @@ job "gitea" {
] ]
check { check {
name = "alive"
type = "http" type = "http"
path = "/api/healthz" path = "/"
port = "http"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
} }

View File

@@ -30,8 +30,7 @@ job "glance" {
check { check {
name = "alive" name = "alive"
type = "http" type = "tcp"
path = "/"
port = "http" port = "http"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"

View File

@@ -28,11 +28,10 @@ job "jellyfin" {
check { check {
name = "alive" name = "alive"
type = "http" type = "tcp"
path = "/health"
port = "http" port = "http"
interval = "10s" interval = "10s"
timeout = "5s" timeout = "2s"
} }
} }

View File

@@ -33,10 +33,8 @@ job "ntfy" {
] ]
check { check {
name = "alive"
type = "http" type = "http"
path = "/healthz" path = "/healthz"
port = "http"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
} }

View File

@@ -31,10 +31,8 @@ job "openreader" {
] ]
check { check {
name = "alive"
type = "http" type = "http"
path = "/" path = "/"
port = "http"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
} }
@@ -50,10 +48,8 @@ job "openreader" {
} }
check { check {
name = "alive"
type = "http" type = "http"
path = "/" path = "/"
port = "http"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
} }
@@ -63,7 +59,7 @@ job "openreader" {
driver = "docker" driver = "docker"
config { config {
image = "ghcr.io/richardr1126/openreader:v2.1.2" image = "ghcr.io/richardr1126/openreader:v99.99.99"
ports = ["http"] ports = ["http"]
} }

View File

@@ -34,9 +34,8 @@ job "prowlarr" {
] ]
check { check {
name = "alive"
type = "http" type = "http"
path = "/ping" path = "/"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
} }
@@ -52,9 +51,8 @@ job "prowlarr" {
} }
check { check {
name = "alive"
type = "http" type = "http"
path = "/ping" path = "/"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
} }

View File

@@ -37,9 +37,8 @@ job "sonarr" {
] ]
check { check {
name = "alive"
type = "http" type = "http"
path = "/ping" path = "/"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
} }
@@ -55,9 +54,8 @@ job "sonarr" {
} }
check { check {
name = "alive"
type = "http" type = "http"
path = "/ping" path = "/"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
} }

View File

@@ -16,10 +16,8 @@ job "transfer" {
] ]
check { check {
name = "alive"
type = "http" type = "http"
path = "/" path = "/"
port = "http"
interval = "10s" interval = "10s"
timeout = "2s" timeout = "2s"
} }

View File

@@ -21,26 +21,6 @@ job "unifi-network" {
UNIFI_STDOUT = "true" UNIFI_STDOUT = "true"
} }
# Register in Consul so Traefik and health checks can find it.
# address_mode=driver uses the macvlan IP (192.168.1.50) rather than the host IP.
service {
name = "unifi-network"
port = 8443
address_mode = "driver"
# TCP/HTTP checks from the Consul agent can't reach the macvlan IP (host↔macvlan
# isolation). Use a script check instead — it runs inside the container via
# docker exec and connects to localhost:8443 directly.
check {
name = "alive"
type = "script"
command = "/usr/bin/curl"
args = ["-sk", "--max-time", "5", "-o", "/dev/null", "https://localhost:8443"]
interval = "30s"
timeout = "10s"
}
}
volume_mount { volume_mount {
volume = "unraid_appdata_unifi_network" volume = "unraid_appdata_unifi_network"
destination = "/unifi" # Expected root directory (contains data, log, cert subdirs) destination = "/unifi" # Expected root directory (contains data, log, cert subdirs)

View File

@@ -188,8 +188,8 @@ Most jobs already have Consul health checks — these can use `health_check = "c
| frigate | ✅ | ✅ `single-node-writer` | ⚠️ same — rolling | | frigate | ✅ | ✅ `single-node-writer` | ⚠️ same — rolling |
| glance | ✅ | no | ✅ yes | | glance | ✅ | no | ✅ yes |
| transfer | ✅ | ✅ `single-node-writer` | ⚠️ rolling | | transfer | ✅ | ✅ `single-node-writer` | ⚠️ rolling |
| openreader | `/` | ✅ `single-node-writer` | ⚠️ rolling | | openreader | | ✅ `single-node-writer` | ⚠️ add check first, then rolling |
| unifi | ✅ script | ✅ `single-node-writer` | ⚠️ rolling | | unifi | | ✅ `single-node-writer` | ⚠️ add check first, then rolling |
| traefik | (ingress) | ✅ | ⚠️ rolling — downtime risk, promote quickly | | traefik | (ingress) | ✅ | ⚠️ rolling — downtime risk, promote quickly |
| authelia | (ingress) | ✅ | ✅ stateless config, canary fine | | authelia | (ingress) | ✅ | ✅ stateless config, canary fine |
| renovate | batch job | n/a | n/a — no deployment model | | renovate | batch job | n/a | n/a — no deployment model |
@@ -298,8 +298,8 @@ exit 1
- [x] **Phase 1c**: Add Nomad validate step — add `NOMAD_ADDR` + read-only `NOMAD_TOKEN` to Gitea secrets - [x] **Phase 1c**: Add Nomad validate step — add `NOMAD_ADDR` + read-only `NOMAD_TOKEN` to Gitea secrets
- [x] **Phase 2**: Add image pull validation step to the workflow - [x] **Phase 2**: Add image pull validation step to the workflow
- [ ] **Phase 3a**: Add `update` stanzas to ntfy and glance (simplest, no volume conflict) - [ ] **Phase 3a**: Add `update` stanzas to ntfy and glance (simplest, no volume conflict)
- [ ] **Phase 3b**: Add rolling `update` stanzas to remaining service jobs (jellyfin, sonarr, prowlarr, deluge, gitea, immich, transfer, frigate, openreader, unifi, authelia, traefik) - [ ] **Phase 3b**: Add rolling `update` stanzas to remaining service jobs (jellyfin, sonarr, etc.)
- [x] **Phase 3c**: Add health checks to openreader and unifi before adding update stanzas - [ ] **Phase 3c**: Add health checks to openreader and unifi before adding update stanzas
- [ ] **Phase 4a**: Add on-push workflow that runs `terraform apply -auto-approve` using full credential set - [ ] **Phase 4a**: Add on-push workflow that runs `terraform apply -auto-approve` using full credential set
- [ ] **Phase 4b**: Add deployment promotion/revert polling script - [ ] **Phase 4b**: Add deployment promotion/revert polling script
- [ ] **Phase 4c**: Wire ntfy notifications for promote/revert outcomes - [ ] **Phase 4c**: Wire ntfy notifications for promote/revert outcomes