fjelltopp
diff --git a/‎deploy/sync/Dockerfile.sync‎
Lines changed: 27 additions & 0 deletions b/‎deploy/sync/Dockerfile.sync‎
Lines changed: 27 additions & 0 deletions
diff --git a/‎deploy/sync/cronjob.yaml‎
Lines changed: 77 additions & 0 deletions b/‎deploy/sync/cronjob.yaml‎
Lines changed: 77 additions & 0 deletions
diff --git a/‎deploy/sync/secrets.yaml.template‎
Lines changed: 50 additions & 0 deletions b/‎deploy/sync/secrets.yaml.template‎
Lines changed: 50 additions & 0 deletions
@@ -0,0 +1,27 @@
+# Image for the nightly prod -> staging sync CronJob.
+# Target: adracr.azurecr.io/adr-sync
+#
+# Bundles the CLI tools installed below (PostgreSQL 16 client, azcopy, kubectl)
+# together with sync.py, which is the container entrypoint.
+#
+# Build args:
+#   KUBECTL_VERSION  kubectl release to install, e.g. v1.30.2. Empty (default)
+#                    resolves the upstream "stable" release at build time.
+#
+# NOTE(review): no USER is set, so the entrypoint runs as root. Consider a
+# non-root user once sync.py's filesystem requirements are confirmed.
+FROM ubuntu:24.04
+
+# Build-time only: an ARG keeps apt noninteractive during the build without
+# leaving DEBIAN_FRONTEND set in the runtime environment.
+ARG DEBIAN_FRONTEND=noninteractive
+ARG KUBECTL_VERSION=""
+
+# One layer, so the apt lists and the azcopy tarball are deleted in the same
+# layer that created them. --no-install-recommends keeps optional packages out
+# of the image. kubectl is checked against its published SHA-256 before it is
+# made executable, so a truncated or corrupted download fails the build.
+RUN apt-get update -qq && apt-get install -y -qq --no-install-recommends \
+        ca-certificates curl gnupg lsb-release tar python3 python3-pip python3-requests \
+    && install -d /usr/share/postgresql-common/pgdg \
+    && curl -fsSL https://www.postgresql.org/media/keys/ACCC4CF8.asc \
+        -o /usr/share/postgresql-common/pgdg/apt.postgresql.org.asc \
+    && echo "deb [signed-by=/usr/share/postgresql-common/pgdg/apt.postgresql.org.asc] https://apt.postgresql.org/pub/repos/apt $(lsb_release -cs)-pgdg main" \
+        > /etc/apt/sources.list.d/pgdg.list \
+    && apt-get update -qq \
+    && apt-get install -y -qq --no-install-recommends postgresql-client-16 \
+    && curl -fsSL https://aka.ms/downloadazcopy-v10-linux -o /tmp/azcopy.tgz \
+    && tar -xzf /tmp/azcopy.tgz -C /tmp \
+    && install /tmp/azcopy_linux_*/azcopy /usr/local/bin/azcopy \
+    && kubectl_version="${KUBECTL_VERSION:-$(curl -fsSL https://dl.k8s.io/release/stable.txt)}" \
+    && kubectl_url="https://dl.k8s.io/release/${kubectl_version}/bin/linux/amd64/kubectl" \
+    && curl -fsSL -o /usr/local/bin/kubectl "${kubectl_url}" \
+    && echo "$(curl -fsSL "${kubectl_url}.sha256")  /usr/local/bin/kubectl" | sha256sum --check \
+    && chmod +x /usr/local/bin/kubectl \
+    && rm -rf /var/lib/apt/lists/* /tmp/azcopy*
+
+# COPY followed by chmod (rather than COPY --chmod) so the build does not
+# depend on BuildKit being enabled.
+COPY sync.py /usr/local/bin/sync.py
+RUN chmod +x /usr/local/bin/sync.py
+
+# Exec form: python3 runs as PID 1 and receives signals directly.
+ENTRYPOINT ["python3", "/usr/local/bin/sync.py"]
@@ -0,0 +1,77 @@
+# Nightly prod -> staging sync CronJob.
+# Apply with: kubectl apply -f deploy/sync/cronjob.yaml
+# Manual one-off run: kubectl create job --from=cronjob/adr-sync adr-sync-manual-$(date +%s) -n adr-s
+# CronJob that runs the adr-sync image once a day in the adr-s namespace.
+apiVersion: batch/v1
+kind: CronJob
+metadata:
+  namespace: adr-s
+  name: adr-sync
+spec:
+  timeZone: 'Etc/UTC'
+  schedule: '0 1 * * *'  # 01:00 UTC daily
+  # Forbid: a scheduled run is skipped while the previous Job is still running.
+  concurrencyPolicy: Forbid
+  failedJobsHistoryLimit: 7
+  successfulJobsHistoryLimit: 3
+  jobTemplate:
+    spec:
+      activeDeadlineSeconds: 14400  # 4 hours; datastore restore alone is ~90 min
+      backoffLimit: 0  # don't retry — re-run manually after fixing
+      template:
+        spec:
+          serviceAccountName: adr-sync  # needs `kubectl exec` on the ckan deployment
+          restartPolicy: Never
+          containers:
+            - name: sync
+              image: adracr.azurecr.io/adr-sync:latest
+              imagePullPolicy: Always
+              # Plain settings are listed here; credentials come from the
+              # adr-sync-secrets Secret via envFrom.
+              env:
+                - name: CKAN_NAMESPACE
+                  value: 'adr-s'
+                - name: CKAN_DEPLOYMENT
+                  value: 'deploy/ckan'
+              envFrom:
+                - secretRef:
+                    name: adr-sync-secrets
+              resources:
+                limits: {cpu: '2', memory: '4Gi'}
+                requests: {cpu: '500m', memory: '1Gi'}
+---
+# ServiceAccount named by the adr-sync CronJob's serviceAccountName.
+kind: ServiceAccount
+apiVersion: v1
+metadata:
+  namespace: adr-s
+  name: adr-sync
+---
+# Namespaced permissions (adr-s only) for the adr-sync Role.
+kind: Role
+apiVersion: rbac.authorization.k8s.io/v1
+metadata:
+  namespace: adr-s
+  name: adr-sync
+rules:
+  # Read and patch Deployments.
+  - apiGroups:
+      - apps
+    resources:
+      - deployments
+    verbs:
+      - get
+      - patch
+  # Read and modify the Deployment scale subresource.
+  - apiGroups:
+      - apps
+    resources:
+      - deployments/scale
+    verbs:
+      - get
+      - patch
+      - update
+  # Pods and the pods/exec subresource in the core ("") API group.
+  # NOTE(review): `create` in this rule applies to plain `pods` as well as
+  # `pods/exec` — confirm the sync really needs to create pods; if not,
+  # split this into two rules.
+  - apiGroups:
+      - ""
+    resources:
+      - pods
+      - pods/exec
+    verbs:
+      - get
+      - list
+      - create
+      - watch
+---
+# Binds the adr-sync Role to the adr-sync ServiceAccount in adr-s.
+kind: RoleBinding
+apiVersion: rbac.authorization.k8s.io/v1
+metadata:
+  namespace: adr-s
+  name: adr-sync
+roleRef:
+  kind: Role
+  name: adr-sync
+  apiGroup: rbac.authorization.k8s.io
+subjects:
+  - namespace: adr-s
+    name: adr-sync
+    kind: ServiceAccount
@@ -0,0 +1,50 @@
+# Template for the k8s Secret consumed by the adr-sync CronJob.
+#
+# Do NOT commit a populated copy. Either:
+#   1. Use sealed-secrets / external-secrets and commit the encrypted form.
+#   2. Apply manually with `kubectl apply -f` from a local copy that lives
+#      only on the operator's machine.
+#
+# All values are strings. The SAS tokens should be issued with the minimum
+# necessary permissions:
+#   - PROD_LFS_SAS:        read+list on adr-p-datalake
+#   - SNAPSHOTS_SAS:       read+list+write+delete on snapshots (full)
+#   - STAGING_LFS_SAS:     read+list+write+delete on adr-s-datalake
+#
+# Auth0 M2M scopes: read:users create:users (for users-exports job).
+# Use the canonical tenant domain (not the custom domain) for AUTH0_PROD_DOMAIN —
+# the Management API token endpoint validates against the canonical hostname.
+apiVersion: v1
+kind: Secret
+type: Opaque
+metadata:
+  namespace: adr-s
+  name: adr-sync-secrets
+# Every value below is a placeholder; replace it in the local or encrypted copy.
+stringData:
+  # Postgres: connect as ckan_admin (or an equivalent role) that can reach
+  # BOTH the ckan and datastore databases. The sync derives the datastore
+  # URL by swapping the path component. Do NOT use the limited `datastore`
+  # role here; it can't SELECT the UUID-named resource tables.
+  PROD_CKAN_PG_URL: 'postgresql://ckan_admin:PASS@adr-p-eun-db001.postgres.database.azure.com/ckan?sslmode=require'
+  STAGING_CKAN_PG_URL: 'postgresql://ckan_admin:PASS@adr-s-eun-db001.postgres.database.azure.com/ckan?sslmode=require'
+
+  # Storage: one account / container / SAS triple per location.
+  SNAPSHOTS_ACCOUNT: 'adrsnapshotsta'
+  SNAPSHOTS_CONTAINER: 'snapshots'
+  SNAPSHOTS_SAS: 'sv=...&sig=...'  # full rwl(d) on the container
+  PROD_LFS_ACCOUNT: 'adrpeunsta'
+  PROD_LFS_CONTAINER: 'adr-p-datalake'
+  PROD_LFS_SAS: 'sv=...&sig=...'  # read+list only
+  STAGING_LFS_ACCOUNT: 'adrseunsta'
+  STAGING_LFS_CONTAINER: 'adr-s-datalake'
+  STAGING_LFS_SAS: 'sv=...&sig=...'  # rwl(d)
+
+  # Auth0: single tenant, M2M credentials for the users-exports backup job.
+  # The AUTH0_PROD_* names are kept for backward compatibility with earlier
+  # secret revisions; there is no AUTH0_DEV_* anymore because prod and
+  # staging share one tenant.
+  AUTH0_PROD_DOMAIN: 'dev-udfgla0l.eu.auth0.com'  # canonical, not the vanity custom domain
+  AUTH0_PROD_CLIENT_ID: '...'
+  AUTH0_PROD_CLIENT_SECRET: '...'
+
+  # Slack (optional — omit to disable notifications)
+  SLACK_WEBHOOK_URL: 'https://hooks.slack.com/services/...'