# veza/infra/ansible/roles/pgbackrest/defaults/main.yml

# pgBackRest defaults — Postgres backup + WAL archive to MinIO/S3.
# https://pgbackrest.org
#
# v1.0.9 Day 8 — RPO target ≈ 5 min (WAL archive interval), RTO
# target < 30 min (the dr-drill timing budget). Backup cadence:
#   - full   : weekly (Sunday 02:00 UTC)
#   - diff   : daily Mon-Sat 02:00 UTC
#   - WAL    : continuous (archive_command after every WAL file)
---
# PostgreSQL major version.
# NOTE(review): unlike every other variable in this file, this one is
# not prefixed with `pgbackrest_`; presumably it is shared with the
# role that installs Postgres — confirm that both agree on the value.
postgres_version: 16

# Repository — MinIO is S3-compatible. The bucket is provisioned by
# the minio_distributed role (W3 day 12); until then operators
# create it manually with `mc mb minio/veza-pgbackrest`.
pgbackrest_repo_type: s3
pgbackrest_repo_s3_endpoint: 'minio.lxd:9000'
# MinIO ignores the region, but pgBackRest requires the field to be set.
pgbackrest_repo_s3_region: us-east-1
pgbackrest_repo_s3_bucket: veza-pgbackrest
# MinIO speaks path-style by default.
pgbackrest_repo_s3_uri_style: path
# Lab MinIO uses self-signed certs; flip to true once Let's Encrypt
# is wired.
pgbackrest_repo_s3_verify_tls: false
pgbackrest_repo_path: '/'
pgbackrest_repo_cipher_type: aes-256-cbc

# Stanza — pgBackRest's name for the backup/archive configuration of
# one Postgres cluster. v1.0.9 uses a single stanza per environment
# (one formation = one stanza). Environments that run more than one
# cluster override this with a suffixed stanza name per cluster.
pgbackrest_stanza: veza

# Retention — keep 4 full backups (≈ 1 month at weekly cadence).
# Differential retention is set explicitly to 7 (roughly one week at
# the daily Mon-Sat cadence); it is NOT left implicit. In pgBackRest,
# incrementals expire together with the differential they depend on,
# and everything expires once its parent full does.
# Archive retention is 4, matching the full-backup count.
# NOTE(review): assumes these map 1:1 onto `repo1-retention-full`,
# `repo1-retention-diff` and `repo1-retention-archive`, and that
# `repo1-retention-archive-type` stays at its default (`full`), so WAL
# is kept for every retained full and PITR works across the whole
# window — confirm against the pgbackrest.conf template.
pgbackrest_repo_retention_full: 4
pgbackrest_repo_retention_diff: 7
pgbackrest_repo_retention_archive: 4

# Compression — Zstandard at level 3 trades CPU for ~50% smaller
# archive vs gz@6. The CPU budget is fine on the R720; bandwidth to
# MinIO is the scarcer resource.
#
# pgBackRest's `compress-type` option spells Zstandard as `zst`
# (accepted values: none, bz2, gz, lz4, zst); `zstd` is not a valid
# value and is rejected when the configuration is parsed.
# NOTE(review): assumes the config template passes this variable
# through verbatim as `compress-type` — confirm.
pgbackrest_compress_type: zst
pgbackrest_compress_level: 3

# Process count — parallel WAL push + parallel backup. 4 is right
# for the 12-core R720 with concurrent backend traffic; bump in
# `group_vars/<env>` for dedicated-host backups.
# NOTE(review): pgBackRest only pushes WAL in parallel when
# asynchronous archiving (`archive-async`) is enabled — confirm the
# config template sets it, otherwise this value presumably affects
# backup/restore only.
pgbackrest_process_max: 4

# Secrets — each value is read from the matching `vault_*` variable
# and falls back to an obvious CHANGEME placeholder when that variable
# is undefined. The role refuses to apply while a placeholder is still
# in place, which prevents a "live" rollout pointing at the wrong S3
# keys.
pgbackrest_repo_s3_key: >-
  {{ vault_pgbackrest_s3_key | default('CHANGEME-PGBR-KEY') }}
pgbackrest_repo_s3_key_secret: >-
  {{ vault_pgbackrest_s3_key_secret | default('CHANGEME-PGBR-SECRET') }}
pgbackrest_repo_cipher_pass: >-
  {{ vault_pgbackrest_cipher_pass | default('CHANGEME-PGBR-CIPHER') }}

# Schedule — systemd timers (preferred over cron for journald
# integration). Override per env in group_vars.
#
# systemd evaluates calendar expressions in the host's local timezone
# unless one is given, so the documented 02:00 UTC cadence is pinned
# with an explicit `UTC` suffix instead of relying on every host
# running with TZ=UTC.
# NOTE(review): assumes these strings are rendered verbatim into the
# timer units' `OnCalendar=` — confirm against the unit templates.
pgbackrest_schedule_full: "Sun *-*-* 02:00:00 UTC"
pgbackrest_schedule_diff: "Mon..Sat *-*-* 02:00:00 UTC"

# Drill schedule — weekly RTO check, runs from any host with
# `incus` access. `dr-drill.sh` writes a textfile metric the
# node_exporter scrapes; the Prometheus alert
# BackupRestoreDrillFailed fires when the timestamp gets stale
# (> 8 days = a week's drill missed entirely).
# Pinned to UTC as well so the drill stays on the same time base as
# the Sunday full backup (two hours after it starts).
pgbackrest_drill_schedule: "Sun *-*-* 04:00:00 UTC"
pgbackrest_drill_metrics_file: /var/lib/node_exporter/textfile_collector/pgbackrest_drill.prom