Compare commits
17 Commits
sprint44/c
...
runners/bl
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
ec78175526 | ||
|
|
2cc91b6df0 | ||
| 0d2090fe81 | |||
|
|
bc3548e715 | ||
| 74333cc26b | |||
|
|
7310fb88c2 | ||
| 148bc87b9a | |||
|
|
2a1e842100 | ||
| bc28430d24 | |||
|
|
cc92272217 | ||
| d6f4468a9c | |||
|
|
2f796a2ebd | ||
| 1f1f6823db | |||
|
|
b92f74b63a | ||
|
|
cb7f7dbc4d | ||
|
|
03126d5584 | ||
|
|
495e884c41 |
448
apps/authentik/authentik.yaml
Normal file
448
apps/authentik/authentik.yaml
Normal file
@@ -0,0 +1,448 @@
|
||||
# Authentik OIDC backend
|
||||
# ArgoCD-managed. BlueJay Lab.
|
||||
#
|
||||
# Stack:
|
||||
# - PostgreSQL 16 StatefulSet (single replica, Longhorn RWO 5Gi)
|
||||
# - Redis 7 Deployment (no persistence — session/cache only)
|
||||
# - Authentik server + worker Deployments (image ghcr.io/goauthentik/server:2024.12.3)
|
||||
# - Media PVC shared between server + worker (Longhorn RWO 2Gi)
|
||||
# - Certificate via step-ca-acme ClusterIssuer
|
||||
# - Traefik IngressRoute at id.iamworkin.lan
|
||||
#
|
||||
# Secrets come from 1Password item "authentik-credentials" (IAmWorkin vault, id y6i74ch22q5wvm7znquq4nhhcu)
|
||||
# via the OnePasswordItem CRD, materialized into k8s Secret authentik/authentik-credentials.
|
||||
#
|
||||
# Why the discovery URL is /application/o/pimanager/ : Authentik issues per-application OIDC providers.
|
||||
# The pimanager OIDC application/provider is created after the cluster pods are healthy (manual or
|
||||
# via API once the bootstrap token is available — see Notes substrate).
|
||||
|
||||
---
|
||||
apiVersion: v1
|
||||
kind: Namespace
|
||||
metadata:
|
||||
name: authentik
|
||||
labels:
|
||||
app.kubernetes.io/part-of: bluejay-infra
|
||||
|
||||
---
|
||||
# 1Password operator pulls the authentik-credentials item into a k8s Secret of the same name.
|
||||
# Field labels in 1P become Secret keys: AUTHENTIK_SECRET_KEY, POSTGRES_PASSWORD, REDIS_PASSWORD,
|
||||
# BOOTSTRAP_ADMIN_PASSWORD, BOOTSTRAP_ADMIN_TOKEN, BOOTSTRAP_ADMIN_EMAIL.
|
||||
apiVersion: onepassword.com/v1
|
||||
kind: OnePasswordItem
|
||||
metadata:
|
||||
name: authentik-credentials
|
||||
namespace: authentik
|
||||
spec:
|
||||
itemPath: "vaults/IAmWorkin/items/authentik-credentials"
|
||||
|
||||
---
|
||||
# Shared media volume for server + worker pods.
|
||||
apiVersion: v1
|
||||
kind: PersistentVolumeClaim
|
||||
metadata:
|
||||
name: authentik-media
|
||||
namespace: authentik
|
||||
spec:
|
||||
storageClassName: longhorn
|
||||
accessModes: [ReadWriteOnce]
|
||||
resources:
|
||||
requests:
|
||||
storage: 2Gi
|
||||
|
||||
---
|
||||
# PostgreSQL 16 StatefulSet — Authentik's primary store.
|
||||
apiVersion: apps/v1
|
||||
kind: StatefulSet
|
||||
metadata:
|
||||
name: authentik-postgres
|
||||
namespace: authentik
|
||||
labels:
|
||||
app: authentik-postgres
|
||||
argocd.argoproj.io/instance: infra-authentik
|
||||
spec:
|
||||
persistentVolumeClaimRetentionPolicy:
|
||||
whenDeleted: Retain
|
||||
whenScaled: Retain
|
||||
podManagementPolicy: OrderedReady
|
||||
serviceName: authentik-postgres
|
||||
replicas: 1
|
||||
revisionHistoryLimit: 10
|
||||
selector:
|
||||
matchLabels:
|
||||
app: authentik-postgres
|
||||
template:
|
||||
metadata:
|
||||
labels:
|
||||
app: authentik-postgres
|
||||
spec:
|
||||
containers:
|
||||
- name: postgres
|
||||
image: postgres:16-alpine
|
||||
ports:
|
||||
- containerPort: 5432
|
||||
name: postgres
|
||||
env:
|
||||
- name: POSTGRES_USER
|
||||
value: authentik
|
||||
- name: POSTGRES_PASSWORD
|
||||
valueFrom:
|
||||
secretKeyRef:
|
||||
name: authentik-credentials
|
||||
key: POSTGRES_PASSWORD
|
||||
- name: POSTGRES_DB
|
||||
value: authentik
|
||||
- name: POSTGRES_INITDB_ARGS
|
||||
value: "--encoding=UTF-8 --lc-collate=C --lc-ctype=C"
|
||||
- name: PGDATA
|
||||
value: /var/lib/postgresql/data/pgdata
|
||||
readinessProbe:
|
||||
exec:
|
||||
command: ["pg_isready", "-U", "authentik"]
|
||||
initialDelaySeconds: 5
|
||||
periodSeconds: 5
|
||||
livenessProbe:
|
||||
exec:
|
||||
command: ["pg_isready", "-U", "authentik"]
|
||||
initialDelaySeconds: 30
|
||||
periodSeconds: 30
|
||||
resources:
|
||||
requests: { cpu: 100m, memory: 256Mi }
|
||||
limits: { cpu: 1000m, memory: 1Gi }
|
||||
volumeMounts:
|
||||
- name: pgdata
|
||||
mountPath: /var/lib/postgresql/data
|
||||
volumeClaimTemplates:
|
||||
- metadata:
|
||||
name: pgdata
|
||||
spec:
|
||||
storageClassName: longhorn
|
||||
accessModes: [ReadWriteOnce]
|
||||
volumeMode: Filesystem
|
||||
resources:
|
||||
requests:
|
||||
storage: 5Gi
|
||||
|
||||
---
|
||||
apiVersion: v1
|
||||
kind: Service
|
||||
metadata:
|
||||
name: authentik-postgres
|
||||
namespace: authentik
|
||||
spec:
|
||||
clusterIP: None
|
||||
selector:
|
||||
app: authentik-postgres
|
||||
ports:
|
||||
- name: postgres
|
||||
port: 5432
|
||||
targetPort: 5432
|
||||
|
||||
---
|
||||
# Redis 7 — session storage + Celery broker. No persistence needed (cache).
|
||||
apiVersion: apps/v1
|
||||
kind: Deployment
|
||||
metadata:
|
||||
name: authentik-redis
|
||||
namespace: authentik
|
||||
labels:
|
||||
app: authentik-redis
|
||||
argocd.argoproj.io/instance: infra-authentik
|
||||
spec:
|
||||
replicas: 1
|
||||
strategy:
|
||||
type: Recreate
|
||||
selector:
|
||||
matchLabels:
|
||||
app: authentik-redis
|
||||
template:
|
||||
metadata:
|
||||
labels:
|
||||
app: authentik-redis
|
||||
spec:
|
||||
containers:
|
||||
- name: redis
|
||||
image: redis:7-alpine
|
||||
args:
|
||||
- "--save"
|
||||
- ""
|
||||
- "--appendonly"
|
||||
- "no"
|
||||
- "--requirepass"
|
||||
- "$(REDIS_PASSWORD)"
|
||||
env:
|
||||
- name: REDIS_PASSWORD
|
||||
valueFrom:
|
||||
secretKeyRef:
|
||||
name: authentik-credentials
|
||||
key: REDIS_PASSWORD
|
||||
ports:
|
||||
- containerPort: 6379
|
||||
name: redis
|
||||
readinessProbe:
|
||||
tcpSocket: { port: 6379 }
|
||||
initialDelaySeconds: 5
|
||||
periodSeconds: 5
|
||||
livenessProbe:
|
||||
tcpSocket: { port: 6379 }
|
||||
initialDelaySeconds: 30
|
||||
periodSeconds: 30
|
||||
resources:
|
||||
requests: { cpu: 50m, memory: 64Mi }
|
||||
limits: { cpu: 500m, memory: 256Mi }
|
||||
|
||||
---
|
||||
apiVersion: v1
|
||||
kind: Service
|
||||
metadata:
|
||||
name: authentik-redis
|
||||
namespace: authentik
|
||||
spec:
|
||||
selector:
|
||||
app: authentik-redis
|
||||
ports:
|
||||
- name: redis
|
||||
port: 6379
|
||||
targetPort: 6379
|
||||
|
||||
---
|
||||
# Authentik server Deployment — HTTP frontend on :9000.
|
||||
apiVersion: apps/v1
|
||||
kind: Deployment
|
||||
metadata:
|
||||
name: authentik-server
|
||||
namespace: authentik
|
||||
labels:
|
||||
app: authentik-server
|
||||
argocd.argoproj.io/instance: infra-authentik
|
||||
spec:
|
||||
replicas: 1
|
||||
strategy:
|
||||
type: Recreate # shares /media RWO PVC with worker
|
||||
selector:
|
||||
matchLabels:
|
||||
app: authentik-server
|
||||
template:
|
||||
metadata:
|
||||
labels:
|
||||
app: authentik-server
|
||||
spec:
|
||||
securityContext:
|
||||
# Authentik image runs as uid 1000 "authentik" but the Longhorn PVC mounts
|
||||
# root:root by default. fsGroup recursively chgrp + chmod g+rwx so the
|
||||
# non-root container can mkdir /media/public during the tenant_files migration.
|
||||
fsGroup: 1000
|
||||
containers:
|
||||
- name: server
|
||||
image: ghcr.io/goauthentik/server:2024.12.3
|
||||
args: ["server"]
|
||||
ports:
|
||||
- containerPort: 9000
|
||||
name: http
|
||||
- containerPort: 9443
|
||||
name: https
|
||||
env:
|
||||
- name: AUTHENTIK_SECRET_KEY
|
||||
valueFrom:
|
||||
secretKeyRef:
|
||||
name: authentik-credentials
|
||||
key: AUTHENTIK_SECRET_KEY
|
||||
- name: AUTHENTIK_REDIS__HOST
|
||||
value: authentik-redis
|
||||
- name: AUTHENTIK_REDIS__PASSWORD
|
||||
valueFrom:
|
||||
secretKeyRef:
|
||||
name: authentik-credentials
|
||||
key: REDIS_PASSWORD
|
||||
- name: AUTHENTIK_POSTGRESQL__HOST
|
||||
value: authentik-postgres
|
||||
- name: AUTHENTIK_POSTGRESQL__NAME
|
||||
value: authentik
|
||||
- name: AUTHENTIK_POSTGRESQL__USER
|
||||
value: authentik
|
||||
- name: AUTHENTIK_POSTGRESQL__PASSWORD
|
||||
valueFrom:
|
||||
secretKeyRef:
|
||||
name: authentik-credentials
|
||||
key: POSTGRES_PASSWORD
|
||||
- name: AUTHENTIK_BOOTSTRAP_PASSWORD
|
||||
valueFrom:
|
||||
secretKeyRef:
|
||||
name: authentik-credentials
|
||||
key: BOOTSTRAP_ADMIN_PASSWORD
|
||||
- name: AUTHENTIK_BOOTSTRAP_TOKEN
|
||||
valueFrom:
|
||||
secretKeyRef:
|
||||
name: authentik-credentials
|
||||
key: BOOTSTRAP_ADMIN_TOKEN
|
||||
- name: AUTHENTIK_BOOTSTRAP_EMAIL
|
||||
valueFrom:
|
||||
secretKeyRef:
|
||||
name: authentik-credentials
|
||||
key: BOOTSTRAP_ADMIN_EMAIL
|
||||
- name: AUTHENTIK_DISABLE_UPDATE_CHECK
|
||||
value: "true"
|
||||
- name: AUTHENTIK_ERROR_REPORTING__ENABLED
|
||||
value: "false"
|
||||
- name: AUTHENTIK_LOG_LEVEL
|
||||
value: info
|
||||
# First-boot Authentik can take 3+ min on the migration phase
|
||||
# (waiting on DB lock while worker also runs migrations). Initial
|
||||
# delays are generous so kubelet doesn't kill the pod mid-migration;
|
||||
# periodSeconds keeps post-startup probing responsive.
|
||||
readinessProbe:
|
||||
httpGet:
|
||||
path: /-/health/ready/
|
||||
port: 9000
|
||||
initialDelaySeconds: 60
|
||||
periodSeconds: 10
|
||||
timeoutSeconds: 5
|
||||
failureThreshold: 12
|
||||
livenessProbe:
|
||||
httpGet:
|
||||
path: /-/health/live/
|
||||
port: 9000
|
||||
initialDelaySeconds: 300
|
||||
periodSeconds: 30
|
||||
timeoutSeconds: 10
|
||||
failureThreshold: 3
|
||||
startupProbe:
|
||||
httpGet:
|
||||
path: /-/health/live/
|
||||
port: 9000
|
||||
initialDelaySeconds: 30
|
||||
periodSeconds: 15
|
||||
timeoutSeconds: 10
|
||||
failureThreshold: 40 # 30s + 40*15s = 10.5 min budget
|
||||
resources:
|
||||
requests: { cpu: 150m, memory: 512Mi }
|
||||
limits: { cpu: 1500m, memory: 1Gi }
|
||||
volumeMounts:
|
||||
- name: media
|
||||
mountPath: /media
|
||||
volumes:
|
||||
- name: media
|
||||
persistentVolumeClaim:
|
||||
claimName: authentik-media
|
||||
|
||||
---
|
||||
# Authentik worker Deployment — runs Celery background tasks.
|
||||
apiVersion: apps/v1
|
||||
kind: Deployment
|
||||
metadata:
|
||||
name: authentik-worker
|
||||
namespace: authentik
|
||||
labels:
|
||||
app: authentik-worker
|
||||
argocd.argoproj.io/instance: infra-authentik
|
||||
spec:
|
||||
replicas: 1
|
||||
strategy:
|
||||
type: Recreate # shares /media RWO PVC with server
|
||||
selector:
|
||||
matchLabels:
|
||||
app: authentik-worker
|
||||
template:
|
||||
metadata:
|
||||
labels:
|
||||
app: authentik-worker
|
||||
spec:
|
||||
securityContext:
|
||||
# Same as server pod — non-root uid 1000 needs PVC group write.
|
||||
fsGroup: 1000
|
||||
containers:
|
||||
- name: worker
|
||||
image: ghcr.io/goauthentik/server:2024.12.3
|
||||
args: ["worker"]
|
||||
env:
|
||||
- name: AUTHENTIK_SECRET_KEY
|
||||
valueFrom:
|
||||
secretKeyRef:
|
||||
name: authentik-credentials
|
||||
key: AUTHENTIK_SECRET_KEY
|
||||
- name: AUTHENTIK_REDIS__HOST
|
||||
value: authentik-redis
|
||||
- name: AUTHENTIK_REDIS__PASSWORD
|
||||
valueFrom:
|
||||
secretKeyRef:
|
||||
name: authentik-credentials
|
||||
key: REDIS_PASSWORD
|
||||
- name: AUTHENTIK_POSTGRESQL__HOST
|
||||
value: authentik-postgres
|
||||
- name: AUTHENTIK_POSTGRESQL__NAME
|
||||
value: authentik
|
||||
- name: AUTHENTIK_POSTGRESQL__USER
|
||||
value: authentik
|
||||
- name: AUTHENTIK_POSTGRESQL__PASSWORD
|
||||
valueFrom:
|
||||
secretKeyRef:
|
||||
name: authentik-credentials
|
||||
key: POSTGRES_PASSWORD
|
||||
- name: AUTHENTIK_DISABLE_UPDATE_CHECK
|
||||
value: "true"
|
||||
- name: AUTHENTIK_ERROR_REPORTING__ENABLED
|
||||
value: "false"
|
||||
- name: AUTHENTIK_LOG_LEVEL
|
||||
value: info
|
||||
resources:
|
||||
requests: { cpu: 100m, memory: 256Mi }
|
||||
limits: { cpu: 1000m, memory: 768Mi }
|
||||
volumeMounts:
|
||||
- name: media
|
||||
mountPath: /media
|
||||
volumes:
|
||||
- name: media
|
||||
persistentVolumeClaim:
|
||||
claimName: authentik-media
|
||||
|
||||
---
|
||||
apiVersion: v1
|
||||
kind: Service
|
||||
metadata:
|
||||
name: authentik-server
|
||||
namespace: authentik
|
||||
spec:
|
||||
selector:
|
||||
app: authentik-server
|
||||
ports:
|
||||
- name: http
|
||||
port: 9000
|
||||
targetPort: 9000
|
||||
- name: https
|
||||
port: 9443
|
||||
targetPort: 9443
|
||||
|
||||
---
|
||||
# step-ca leaf certificate for id.iamworkin.lan.
|
||||
# step-ca container resolver uses pfSense Unbound, so the public A record for id.iamworkin.lan
|
||||
# MUST exist before this Certificate is applied (cert-manager HTTP-01 will silently 2h-backoff
|
||||
# otherwise). Added 2026-05-25 via scripts/pfsense-add-id-host.py.
|
||||
apiVersion: cert-manager.io/v1
|
||||
kind: Certificate
|
||||
metadata:
|
||||
name: authentik-tls
|
||||
namespace: authentik
|
||||
spec:
|
||||
secretName: authentik-tls
|
||||
dnsNames:
|
||||
- id.iamworkin.lan
|
||||
issuerRef:
|
||||
name: step-ca-acme
|
||||
kind: ClusterIssuer
|
||||
|
||||
---
|
||||
apiVersion: traefik.io/v1alpha1
|
||||
kind: IngressRoute
|
||||
metadata:
|
||||
name: authentik
|
||||
namespace: authentik
|
||||
spec:
|
||||
entryPoints: [websecure]
|
||||
routes:
|
||||
- match: Host(`id.iamworkin.lan`)
|
||||
kind: Rule
|
||||
services:
|
||||
- name: authentik-server
|
||||
port: 9000
|
||||
tls:
|
||||
secretName: authentik-tls
|
||||
@@ -1,33 +0,0 @@
|
||||
# FlowerCore Remote Desktop - session pod resource defaults
|
||||
#
|
||||
# Namespace-level LimitRange for Sprint 44 Phase 1. This defends the
|
||||
# fc-desktop namespace from unbounded container requests while the
|
||||
# per-tenant advisory FairShareEvaluator lands in FlowerCore.RemoteDesktop.
|
||||
apiVersion: v1
|
||||
kind: LimitRange
|
||||
metadata:
|
||||
name: fc-desktop-pod-defaults
|
||||
namespace: fc-desktop
|
||||
labels:
|
||||
app.kubernetes.io/name: fc-desktop
|
||||
app.kubernetes.io/part-of: remotedesktop
|
||||
app.kubernetes.io/component: capacity-guard
|
||||
app.kubernetes.io/managed-by: argocd
|
||||
flowercore.io/owner: infra
|
||||
annotations:
|
||||
flowercore.io/phase: sprint-44-cx-9-phase-a
|
||||
spec:
|
||||
limits:
|
||||
- type: Container
|
||||
default:
|
||||
cpu: "1.0"
|
||||
memory: "2Gi"
|
||||
defaultRequest:
|
||||
cpu: "500m"
|
||||
memory: "1Gi"
|
||||
max:
|
||||
cpu: "2.0"
|
||||
memory: "4Gi"
|
||||
min:
|
||||
cpu: "100m"
|
||||
memory: "128Mi"
|
||||
@@ -1,36 +0,0 @@
|
||||
# FlowerCore Remote Desktop - namespace ResourceQuota (GitOps-managed)
|
||||
#
|
||||
# Adopts the live fc-desktop-session-cap object created during the
|
||||
# 2026-05-19 prewarm-cascade triage. Sprint 44 Phase 1 keeps the pod,
|
||||
# CPU, and memory guard unchanged, then adds storage/PVC backstops from
|
||||
# the fc-desktop CPU expansion substrate.
|
||||
#
|
||||
# Two-phase deploy note:
|
||||
# Phase A: apply this ResourceQuota and limitrange.yaml with the current
|
||||
# FlowerCore.RemoteDesktop image.
|
||||
# Phase B: bump the service image only after the RemoteDesktop service
|
||||
# admission/fair-share code lands in that repo.
|
||||
apiVersion: v1
|
||||
kind: ResourceQuota
|
||||
metadata:
|
||||
name: fc-desktop-session-cap
|
||||
namespace: fc-desktop
|
||||
labels:
|
||||
app.kubernetes.io/name: fc-desktop
|
||||
app.kubernetes.io/part-of: remotedesktop
|
||||
app.kubernetes.io/component: capacity-guard
|
||||
app.kubernetes.io/managed-by: argocd
|
||||
flowercore.io/owner: infra
|
||||
annotations:
|
||||
flowercore.io/rationale: |
|
||||
Operator-requested limit 2026-05-19: cluster CPU exhausted by RD
|
||||
pool prewarm cascade. Preserve count/pods=15 plus requests.cpu=8
|
||||
and requests.memory=16Gi until capacity expansion lands.
|
||||
flowercore.io/phase: sprint-44-cx-9-phase-a
|
||||
spec:
|
||||
hard:
|
||||
count/pods: "15"
|
||||
requests.cpu: "8"
|
||||
requests.memory: "16Gi"
|
||||
requests.storage: "500Gi"
|
||||
persistentvolumeclaims: "30"
|
||||
@@ -12,6 +12,15 @@ ENV PATH="/home/runner/_tool/Ruby/${RUBY_MINOR}/x64/bin:/opt/runner-toolcache/Ru
|
||||
|
||||
USER root
|
||||
|
||||
# Bake the IAmWorkin step-ca root CA into the system trust store. Without
|
||||
# this, .NET HttpClient calls from CI tests against *.iamworkin.lan
|
||||
# (e.g. https://selenium.iamworkin.lan/session) fail with `PartialChain`
|
||||
# because the runner image's default Ubuntu trust bundle doesn't include
|
||||
# our internal Root CA. update-ca-certificates regenerates
|
||||
# /etc/ssl/certs/ca-certificates.crt, which OpenSSL + .NET on Linux read
|
||||
# automatically — no SSL_CERT_FILE env var needed.
|
||||
COPY step-ca-root.crt /usr/local/share/ca-certificates/iamworkin-step-ca-root.crt
|
||||
|
||||
RUN apt-get update \
|
||||
&& DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \
|
||||
autoconf \
|
||||
@@ -31,6 +40,7 @@ RUN apt-get update \
|
||||
pkg-config \
|
||||
uuid-dev \
|
||||
zlib1g-dev \
|
||||
&& update-ca-certificates \
|
||||
&& curl -fsSL "https://github.com/rbenv/ruby-build/archive/refs/tags/${RUBY_BUILD_VERSION}.tar.gz" -o /tmp/ruby-build.tar.gz \
|
||||
&& mkdir -p /tmp/ruby-build \
|
||||
&& tar -xzf /tmp/ruby-build.tar.gz --strip-components=1 -C /tmp/ruby-build \
|
||||
|
||||
@@ -7,7 +7,7 @@ Deployments with `kubectl`; update this manifest and let ArgoCD reconcile.
|
||||
|
||||
All repo-scoped Linux runners use:
|
||||
|
||||
- `localhost/fc-github-runner:v20260520-ruby3.3.11`, derived from
|
||||
- `localhost/fc-github-runner:v20260525-ruby3.3.11-stepca`, derived from
|
||||
`myoung34/github-runner:latest`
|
||||
- `ACCESS_TOKEN` from the `github-runner-token` Secret
|
||||
- `RUN_AS_ROOT=false`
|
||||
@@ -40,14 +40,26 @@ still mounts an `emptyDir` over `/home/runner`, so the `setup-runner-home` init
|
||||
container copies the baked toolcache from `/opt/runner-toolcache/Ruby` into
|
||||
`/home/runner/_tool/Ruby` before the runner container starts.
|
||||
|
||||
The IAmWorkin step-ca root CA is also baked into the system trust store
|
||||
(`/usr/local/share/ca-certificates/iamworkin-step-ca-root.crt`, registered by
|
||||
`update-ca-certificates`). Without it, .NET HttpClient calls from CI tests
|
||||
against `*.iamworkin.lan` (e.g. `https://selenium.iamworkin.lan/session`)
|
||||
fail with `PartialChain`. To refresh the bundled cert when the root rotates,
|
||||
re-extract from the cluster and overwrite `step-ca-root.crt`:
|
||||
|
||||
```bash
|
||||
kubectl get secret -n cert-manager step-ca-root \
|
||||
-o jsonpath='{.data.ca\.crt}' | base64 -d > step-ca-root.crt
|
||||
```
|
||||
|
||||
```bash
|
||||
cd apps/github-runner
|
||||
podman build -t localhost/fc-github-runner:v20260520-ruby3.3.11 .
|
||||
podman run --rm localhost/fc-github-runner:v20260520-ruby3.3.11 ruby -v
|
||||
podman run --rm localhost/fc-github-runner:v20260520-ruby3.3.11 \
|
||||
podman build -t localhost/fc-github-runner:v20260525-ruby3.3.11-stepca .
|
||||
podman run --rm localhost/fc-github-runner:v20260525-ruby3.3.11-stepca ruby -v
|
||||
podman run --rm localhost/fc-github-runner:v20260525-ruby3.3.11-stepca \
|
||||
test -f /opt/runner-toolcache/Ruby/3.3/x64.complete
|
||||
podman save localhost/fc-github-runner:v20260520-ruby3.3.11 \
|
||||
-o fc-github-runner-v20260520-ruby3.3.11.tar
|
||||
podman save localhost/fc-github-runner:v20260525-ruby3.3.11-stepca \
|
||||
-o fc-github-runner-v20260525-ruby3.3.11-stepca.tar
|
||||
```
|
||||
|
||||
Import the saved image on every schedulable RKE2 node before ArgoCD rolls the
|
||||
@@ -55,9 +67,9 @@ Deployments:
|
||||
|
||||
```bash
|
||||
for node in rke2-server rke2-agent1 rke2-agent2; do
|
||||
scp fc-github-runner-v20260520-ruby3.3.11.tar "$node:/tmp/"
|
||||
ssh "$node" 'sudo ctr -a /run/k3s/containerd/containerd.sock -n k8s.io images rm localhost/fc-github-runner:v20260520-ruby3.3.11 || true'
|
||||
ssh "$node" 'sudo ctr -a /run/k3s/containerd/containerd.sock -n k8s.io images import /tmp/fc-github-runner-v20260520-ruby3.3.11.tar'
|
||||
scp fc-github-runner-v20260525-ruby3.3.11-stepca.tar "$node:/tmp/"
|
||||
ssh "$node" 'sudo ctr -a /run/k3s/containerd/containerd.sock -n k8s.io images rm localhost/fc-github-runner:v20260525-ruby3.3.11-stepca || true'
|
||||
ssh "$node" 'sudo ctr -a /run/k3s/containerd/containerd.sock -n k8s.io images import /tmp/fc-github-runner-v20260525-ruby3.3.11-stepca.tar'
|
||||
done
|
||||
```
|
||||
|
||||
|
||||
@@ -22,7 +22,7 @@
|
||||
# NUGET_PACKAGES, XDG_CACHE_HOME, and RUNNER_TOOL_CACHE are all pointed at
|
||||
# writable mounted paths under /home/runner so actions/setup-dotnet does not
|
||||
# attempt to install into /usr/share/dotnet.
|
||||
# Ruby 3.3.11 is baked into localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
# Ruby 3.3.11 is baked into localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
# under /opt/runner-toolcache; setup-runner-home copies it into
|
||||
# /home/runner/_tool because the runner-home emptyDir masks image content
|
||||
# under /home/runner at runtime.
|
||||
@@ -157,7 +157,7 @@ spec:
|
||||
# honors the deeper mount.
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -178,7 +178,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
# GitHub org/repo targeting.
|
||||
@@ -334,7 +334,7 @@ spec:
|
||||
# rather than re-applied per repo as flipped lanes land.
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -355,7 +355,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -472,7 +472,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -493,7 +493,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -604,7 +604,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -625,7 +625,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -736,7 +736,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -757,7 +757,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -868,7 +868,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -889,7 +889,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -976,7 +976,10 @@ metadata:
|
||||
flowercore.io/runner-repo: print-web
|
||||
flowercore.io/github-repo: FlowerCore.Print.Web
|
||||
spec:
|
||||
replicas: 2
|
||||
# Sprint 33 morning-routine (2026-05-25): bumped 2 → 3 because help-screenshots
|
||||
# AAT job holds a runner 30+ min, causing head-of-line blocking on parallel PRs.
|
||||
# 12 runs in trailing 5d.
|
||||
replicas: 3
|
||||
selector:
|
||||
matchLabels:
|
||||
app.kubernetes.io/name: github-runner-print-web
|
||||
@@ -1000,7 +1003,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -1021,7 +1024,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -1132,7 +1135,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -1153,7 +1156,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -1264,7 +1267,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -1285,7 +1288,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -1396,7 +1399,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -1417,7 +1420,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -1530,7 +1533,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -1551,7 +1554,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -1664,7 +1667,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -1685,7 +1688,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -1723,13 +1726,17 @@ spec:
|
||||
key: credential
|
||||
- name: RUN_AS_ROOT
|
||||
value: "false"
|
||||
# Bumped 2026-05-25: previous 4Gi limit caused OOMKill (exit 137)
|
||||
# mid-`dotnet test` on TtsReader's 1000+ test suite. PR #21 CI flapped
|
||||
# twice with "runner lost communication" before the K8s side
|
||||
# symptoms surfaced. 8Gi gives ~30% headroom over peak observed.
|
||||
resources:
|
||||
requests:
|
||||
cpu: "500m"
|
||||
memory: "1Gi"
|
||||
memory: "2Gi"
|
||||
limits:
|
||||
cpu: "2000m"
|
||||
memory: "4Gi"
|
||||
memory: "8Gi"
|
||||
volumeMounts:
|
||||
- name: runner-home
|
||||
mountPath: /home/runner
|
||||
@@ -1774,7 +1781,8 @@ metadata:
|
||||
flowercore.io/runner-repo: knowledge
|
||||
flowercore.io/github-repo: FlowerCore.Knowledge
|
||||
spec:
|
||||
replicas: 2
|
||||
# Sprint 33 morning-routine (2026-05-25): dropped 2 → 1 — zero CI runs in trailing 14d.
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app.kubernetes.io/name: github-runner-knowledge
|
||||
@@ -1798,7 +1806,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -1819,7 +1827,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -1907,7 +1915,8 @@ metadata:
|
||||
flowercore.io/runner-repo: llm-bridge
|
||||
flowercore.io/github-repo: FlowerCore.LlmBridge
|
||||
spec:
|
||||
replicas: 2
|
||||
# Sprint 33 morning-routine (2026-05-25): dropped 2 → 1 — zero CI runs in trailing 14d.
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app.kubernetes.io/name: github-runner-llm-bridge
|
||||
@@ -1931,7 +1940,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -1952,7 +1961,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -2040,7 +2049,8 @@ metadata:
|
||||
flowercore.io/runner-repo: media
|
||||
flowercore.io/github-repo: FlowerCore.Media
|
||||
spec:
|
||||
replicas: 2
|
||||
# Sprint 33 morning-routine (2026-05-25): dropped 2 → 1 — zero CI runs in trailing 14d.
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app.kubernetes.io/name: github-runner-media
|
||||
@@ -2064,7 +2074,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -2085,7 +2095,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -2173,7 +2183,8 @@ metadata:
|
||||
flowercore.io/runner-repo: presentations
|
||||
flowercore.io/github-repo: FlowerCore.Presentations
|
||||
spec:
|
||||
replicas: 2
|
||||
# Sprint 33 morning-routine (2026-05-25): dropped 2 → 1 — only 6 CI runs in trailing 14d.
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app.kubernetes.io/name: github-runner-presentations
|
||||
@@ -2197,7 +2208,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -2218,7 +2229,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -2330,7 +2341,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -2351,7 +2362,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -2439,7 +2450,8 @@ metadata:
|
||||
flowercore.io/runner-repo: dns
|
||||
flowercore.io/github-repo: FlowerCore.DNS
|
||||
spec:
|
||||
replicas: 2
|
||||
# Sprint 33 morning-routine (2026-05-25): dropped 2 → 1 — zero CI runs in trailing 14d.
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app.kubernetes.io/name: github-runner-dns
|
||||
@@ -2463,7 +2475,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -2484,7 +2496,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -2596,7 +2608,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -2617,7 +2629,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -2729,7 +2741,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -2750,7 +2762,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -2862,7 +2874,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -2883,7 +2895,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -2995,7 +3007,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -3016,7 +3028,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -3128,7 +3140,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -3149,7 +3161,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -3237,7 +3249,8 @@ metadata:
|
||||
flowercore.io/runner-repo: intranet-web
|
||||
flowercore.io/github-repo: FlowerCore.Intranet.Web
|
||||
spec:
|
||||
replicas: 2
|
||||
# Sprint 33 morning-routine (2026-05-25): dropped 2 → 1 — zero CI runs in trailing 14d.
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app.kubernetes.io/name: github-runner-intranet-web
|
||||
@@ -3261,7 +3274,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -3282,7 +3295,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -3370,7 +3383,8 @@ metadata:
|
||||
flowercore.io/runner-repo: provisioning
|
||||
flowercore.io/github-repo: FlowerCore.Provisioning
|
||||
spec:
|
||||
replicas: 2
|
||||
# Sprint 33 morning-routine (2026-05-25): dropped 2 → 1 — only 3 CI runs in trailing 14d.
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app.kubernetes.io/name: github-runner-provisioning
|
||||
@@ -3394,7 +3408,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -3415,7 +3429,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -3503,7 +3517,8 @@ metadata:
|
||||
flowercore.io/runner-repo: redis
|
||||
flowercore.io/github-repo: FlowerCore.Redis
|
||||
spec:
|
||||
replicas: 2
|
||||
# Sprint 33 morning-routine (2026-05-25): dropped 2 → 1 — only 3 CI runs in trailing 14d.
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app.kubernetes.io/name: github-runner-redis
|
||||
@@ -3527,7 +3542,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -3548,7 +3563,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -3636,7 +3651,8 @@ metadata:
|
||||
flowercore.io/runner-repo: message-board
|
||||
flowercore.io/github-repo: FlowerCore.MessageBoard
|
||||
spec:
|
||||
replicas: 2
|
||||
# Sprint 33 morning-routine (2026-05-25): dropped 2 → 1 — only 3 CI runs in trailing 14d.
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app.kubernetes.io/name: github-runner-message-board
|
||||
@@ -3660,7 +3676,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -3681,7 +3697,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -3769,7 +3785,8 @@ metadata:
|
||||
flowercore.io/runner-repo: menu-board
|
||||
flowercore.io/github-repo: FlowerCore.MenuBoard
|
||||
spec:
|
||||
replicas: 2
|
||||
# Sprint 33 morning-routine (2026-05-25): dropped 2 → 1 — only 3 CI runs in trailing 14d.
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app.kubernetes.io/name: github-runner-menu-board
|
||||
@@ -3793,7 +3810,7 @@ spec:
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
@@ -3814,7 +3831,7 @@ spec:
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260520-ruby3.3.11
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
@@ -3884,9 +3901,277 @@ spec:
|
||||
- name: tmp
|
||||
emptyDir: {}
|
||||
restartPolicy: Always
|
||||
---
|
||||
# Runner for FlowerCore.PiManager. Two replicas use per-pod emptyDir caches, so
|
||||
# backlog can drain without sharing a ReadWriteOnce PVC. Added 2026-05-25 to
|
||||
# close the runner-fleet gap that left run 26417714843 queued for 5h.
|
||||
apiVersion: apps/v1
|
||||
kind: Deployment
|
||||
metadata:
|
||||
name: github-runner-pimanager
|
||||
namespace: github-runner
|
||||
labels:
|
||||
app.kubernetes.io/name: github-runner-pimanager
|
||||
app.kubernetes.io/component: runner
|
||||
app.kubernetes.io/part-of: flowercore
|
||||
app.kubernetes.io/managed-by: argocd
|
||||
flowercore.io/created-by: argocd
|
||||
flowercore.io/runner-repo: pimanager
|
||||
flowercore.io/github-repo: FlowerCore.PiManager
|
||||
spec:
|
||||
replicas: 2
|
||||
selector:
|
||||
matchLabels:
|
||||
app.kubernetes.io/name: github-runner-pimanager
|
||||
strategy:
|
||||
type: Recreate
|
||||
template:
|
||||
metadata:
|
||||
labels:
|
||||
app.kubernetes.io/name: github-runner-pimanager
|
||||
app.kubernetes.io/component: runner
|
||||
app.kubernetes.io/part-of: flowercore
|
||||
flowercore.io/created-by: argocd
|
||||
flowercore.io/runner-repo: pimanager
|
||||
flowercore.io/github-repo: FlowerCore.PiManager
|
||||
spec:
|
||||
serviceAccountName: github-runner
|
||||
securityContext:
|
||||
runAsNonRoot: true
|
||||
runAsUser: 1001
|
||||
runAsGroup: 1001
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
- -c
|
||||
- |
|
||||
set -e
|
||||
mkdir -p /home/runner/.dotnet /home/runner/.nuget/packages /home/runner/.nuget/NuGet /home/runner/.cache /home/runner/_tool
|
||||
if [ -d /opt/runner-toolcache/Ruby ] && [ ! -d /home/runner/_tool/Ruby ]; then
|
||||
cp -a /opt/runner-toolcache/Ruby /home/runner/_tool/
|
||||
fi
|
||||
chown -R 1001:1001 /home/runner/.dotnet /home/runner/.nuget /home/runner/.cache /home/runner/_tool
|
||||
chmod -R 755 /home/runner/.dotnet /home/runner/.nuget /home/runner/.cache /home/runner/_tool
|
||||
securityContext:
|
||||
runAsUser: 0
|
||||
runAsNonRoot: false
|
||||
volumeMounts:
|
||||
- name: runner-home
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
value: "https://github.com/astoltz/FlowerCore.PiManager"
|
||||
- name: RUNNER_NAME_PREFIX
|
||||
value: "rke2-linux-pimanager"
|
||||
- name: RUNNER_WORKDIR
|
||||
value: "/tmp/runner/work"
|
||||
- name: EPHEMERAL
|
||||
value: "true"
|
||||
- name: LABELS
|
||||
value: "self-hosted,linux,fc-build-linux"
|
||||
- name: HOME
|
||||
value: "/home/runner"
|
||||
- name: DOTNET_INSTALL_DIR
|
||||
value: "/home/runner/.dotnet"
|
||||
- name: DOTNET_CLI_TELEMETRY_OPTOUT
|
||||
value: "1"
|
||||
- name: DOTNET_NOLOGO
|
||||
value: "1"
|
||||
- name: DOTNET_GENERATE_ASPNET_CERTIFICATE
|
||||
value: "false"
|
||||
- name: DOTNET_CLI_HOME
|
||||
value: "/home/runner"
|
||||
- name: NUGET_PACKAGES
|
||||
value: "/home/runner/.nuget/packages"
|
||||
- name: XDG_CACHE_HOME
|
||||
value: "/home/runner/.cache"
|
||||
- name: RUNNER_TOOL_CACHE
|
||||
value: "/home/runner/_tool"
|
||||
- name: ACCESS_TOKEN
|
||||
valueFrom:
|
||||
secretKeyRef:
|
||||
name: github-runner-token
|
||||
key: credential
|
||||
- name: RUN_AS_ROOT
|
||||
value: "false"
|
||||
resources:
|
||||
requests:
|
||||
cpu: "500m"
|
||||
memory: "1Gi"
|
||||
limits:
|
||||
cpu: "2000m"
|
||||
memory: "4Gi"
|
||||
volumeMounts:
|
||||
- name: runner-home
|
||||
mountPath: /home/runner
|
||||
- name: nuget-cache
|
||||
mountPath: /home/runner/.nuget/packages
|
||||
- name: tmp
|
||||
mountPath: /tmp
|
||||
livenessProbe:
|
||||
exec:
|
||||
command:
|
||||
- /bin/sh
|
||||
- -c
|
||||
- "pgrep -f Runner.Listener > /dev/null"
|
||||
initialDelaySeconds: 30
|
||||
periodSeconds: 30
|
||||
failureThreshold: 3
|
||||
volumes:
|
||||
- name: runner-home
|
||||
emptyDir: {}
|
||||
- name: nuget-cache
|
||||
emptyDir:
|
||||
sizeLimit: 2Gi
|
||||
- name: tmp
|
||||
emptyDir: {}
|
||||
restartPolicy: Always
|
||||
---
|
||||
# Runner for FlowerCore.Updater. Two replicas use per-pod emptyDir caches, so
|
||||
# backlog can drain without sharing a ReadWriteOnce PVC. Added 2026-05-26 to
|
||||
# close the runner-fleet gap that left the repo with only the offline
|
||||
# windows-sandbox runner and no Linux PR-CI capacity for future workflows.
|
||||
apiVersion: apps/v1
|
||||
kind: Deployment
|
||||
metadata:
|
||||
name: github-runner-updater
|
||||
namespace: github-runner
|
||||
labels:
|
||||
app.kubernetes.io/name: github-runner-updater
|
||||
app.kubernetes.io/component: runner
|
||||
app.kubernetes.io/part-of: flowercore
|
||||
app.kubernetes.io/managed-by: argocd
|
||||
flowercore.io/created-by: argocd
|
||||
flowercore.io/runner-repo: updater
|
||||
flowercore.io/github-repo: FlowerCore.Updater
|
||||
spec:
|
||||
replicas: 2
|
||||
selector:
|
||||
matchLabels:
|
||||
app.kubernetes.io/name: github-runner-updater
|
||||
strategy:
|
||||
type: Recreate
|
||||
template:
|
||||
metadata:
|
||||
labels:
|
||||
app.kubernetes.io/name: github-runner-updater
|
||||
app.kubernetes.io/component: runner
|
||||
app.kubernetes.io/part-of: flowercore
|
||||
flowercore.io/created-by: argocd
|
||||
flowercore.io/runner-repo: updater
|
||||
flowercore.io/github-repo: FlowerCore.Updater
|
||||
spec:
|
||||
serviceAccountName: github-runner
|
||||
securityContext:
|
||||
runAsNonRoot: true
|
||||
runAsUser: 1001
|
||||
runAsGroup: 1001
|
||||
fsGroup: 1001
|
||||
initContainers:
|
||||
- name: setup-runner-home
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
command:
|
||||
- sh
|
||||
- -c
|
||||
- |
|
||||
set -e
|
||||
mkdir -p /home/runner/.dotnet /home/runner/.nuget/packages /home/runner/.nuget/NuGet /home/runner/.cache /home/runner/_tool
|
||||
if [ -d /opt/runner-toolcache/Ruby ] && [ ! -d /home/runner/_tool/Ruby ]; then
|
||||
cp -a /opt/runner-toolcache/Ruby /home/runner/_tool/
|
||||
fi
|
||||
chown -R 1001:1001 /home/runner/.dotnet /home/runner/.nuget /home/runner/.cache /home/runner/_tool
|
||||
chmod -R 755 /home/runner/.dotnet /home/runner/.nuget /home/runner/.cache /home/runner/_tool
|
||||
securityContext:
|
||||
runAsUser: 0
|
||||
runAsNonRoot: false
|
||||
volumeMounts:
|
||||
- name: runner-home
|
||||
mountPath: /home/runner
|
||||
containers:
|
||||
- name: runner
|
||||
image: localhost/fc-github-runner:v20260525-ruby3.3.11-stepca
|
||||
imagePullPolicy: Never
|
||||
env:
|
||||
- name: REPO_URL
|
||||
value: "https://github.com/astoltz/FlowerCore.Updater"
|
||||
- name: RUNNER_NAME_PREFIX
|
||||
value: "rke2-linux-updater"
|
||||
- name: RUNNER_WORKDIR
|
||||
value: "/tmp/runner/work"
|
||||
- name: EPHEMERAL
|
||||
value: "true"
|
||||
- name: LABELS
|
||||
value: "self-hosted,linux,fc-build-linux"
|
||||
- name: HOME
|
||||
value: "/home/runner"
|
||||
- name: DOTNET_INSTALL_DIR
|
||||
value: "/home/runner/.dotnet"
|
||||
- name: DOTNET_CLI_TELEMETRY_OPTOUT
|
||||
value: "1"
|
||||
- name: DOTNET_NOLOGO
|
||||
value: "1"
|
||||
- name: DOTNET_GENERATE_ASPNET_CERTIFICATE
|
||||
value: "false"
|
||||
- name: DOTNET_CLI_HOME
|
||||
value: "/home/runner"
|
||||
- name: NUGET_PACKAGES
|
||||
value: "/home/runner/.nuget/packages"
|
||||
- name: XDG_CACHE_HOME
|
||||
value: "/home/runner/.cache"
|
||||
- name: RUNNER_TOOL_CACHE
|
||||
value: "/home/runner/_tool"
|
||||
- name: ACCESS_TOKEN
|
||||
valueFrom:
|
||||
secretKeyRef:
|
||||
name: github-runner-token
|
||||
key: credential
|
||||
- name: RUN_AS_ROOT
|
||||
value: "false"
|
||||
resources:
|
||||
requests:
|
||||
cpu: "500m"
|
||||
memory: "1Gi"
|
||||
limits:
|
||||
cpu: "2000m"
|
||||
memory: "4Gi"
|
||||
volumeMounts:
|
||||
- name: runner-home
|
||||
mountPath: /home/runner
|
||||
- name: nuget-cache
|
||||
mountPath: /home/runner/.nuget/packages
|
||||
- name: tmp
|
||||
mountPath: /tmp
|
||||
livenessProbe:
|
||||
exec:
|
||||
command:
|
||||
- /bin/sh
|
||||
- -c
|
||||
- "pgrep -f Runner.Listener > /dev/null"
|
||||
initialDelaySeconds: 30
|
||||
periodSeconds: 30
|
||||
failureThreshold: 3
|
||||
volumes:
|
||||
- name: runner-home
|
||||
emptyDir: {}
|
||||
- name: nuget-cache
|
||||
emptyDir:
|
||||
sizeLimit: 2Gi
|
||||
- name: tmp
|
||||
emptyDir: {}
|
||||
restartPolicy: Always
|
||||
|
||||
# Long-tail runner pattern:
|
||||
#
|
||||
# Sprint 32 added the final 16 long-tail repo-scoped Deployments above. Keep
|
||||
# Common as the only PVC-backed runner at replicas: 1. Any future multi-replica
|
||||
# runner must use per-pod emptyDir caches, not a shared ReadWriteOnce PVC.
|
||||
# 2026-05-25: PiManager added (was missed in the Sprint 32 long-tail sweep).
|
||||
|
||||
12
apps/github-runner/step-ca-root.crt
Normal file
12
apps/github-runner/step-ca-root.crt
Normal file
@@ -0,0 +1,12 @@
|
||||
-----BEGIN CERTIFICATE-----
|
||||
MIIBxDCCAWqgAwIBAgIRAPY357G6ow6zMAL5+4bS2kkwCgYIKoZIzj0EAwIwQDEa
|
||||
MBgGA1UEChMRSUFtV29ya2luIEFDTUUgQ0ExIjAgBgNVBAMTGUlBbVdvcmtpbiBB
|
||||
Q01FIENBIFJvb3QgQ0EwHhcNMjYwMzA4MTgwNzExWhcNMzYwMzA1MTgwNzExWjBA
|
||||
MRowGAYDVQQKExFJQW1Xb3JraW4gQUNNRSBDQTEiMCAGA1UEAxMZSUFtV29ya2lu
|
||||
IEFDTUUgQ0EgUm9vdCBDQTBZMBMGByqGSM49AgEGCCqGSM49AwEHA0IABJ2n04X1
|
||||
JZo5Zdq/i1Idv8+fqwZyAzBh7whbqj0SWsJL8UWRabCMqYCs7+dXO0xRSzqkwFDL
|
||||
x+vooOai8RgRNhajRTBDMA4GA1UdDwEB/wQEAwIBBjASBgNVHRMBAf8ECDAGAQH/
|
||||
AgEBMB0GA1UdDgQWBBRnuPPQR6iM/H6vOluiU3Sygayz8jAKBggqhkjOPQQDAgNI
|
||||
ADBFAiEArQK9dYPGmAZsdYnjziuFVVE5NKZUcceYvGfGC+tLXUsCIAudF2zJrCRq
|
||||
3mK50ZZET/fwTkJwiEF4824mjP8p1CKM
|
||||
-----END CERTIFICATE-----
|
||||
@@ -24,7 +24,16 @@
|
||||
# (10.0.57.16:5200), public internet 80/443 (excluding RFC1918), and
|
||||
# fc-signage:5190 for the signage AAT lane.
|
||||
# - Ingress: Traefik (4444 + 8089 ACME-solver-style), intra-pod,
|
||||
# telephony / gitea / fc-system / fc-signage namespaces on 4444.
|
||||
# telephony / gitea / fc-system / fc-signage / github-runner namespaces
|
||||
# on 4444.
|
||||
#
|
||||
# 2026-05-25: added github-runner ingress on 4444 so CI jobs running in
|
||||
# self-hosted runner pods (e.g. FlowerCore.Print.Web `help-screenshots`)
|
||||
# can reach the grid. Without this allow, the session POST to
|
||||
# `selenium-hub.selenium.svc.cluster.local:4444` was DNAT'd to the hub
|
||||
# pod IP and then dropped at the Calico ingress hook — Selenium UI showed
|
||||
# 0/4 sessions while the .NET HTTP client timed out at 60s. Same family
|
||||
# as `feedback_netpol_dnat_backend_port`, wrong-source-namespace flavor.
|
||||
apiVersion: networking.k8s.io/v1
|
||||
kind: NetworkPolicy
|
||||
metadata:
|
||||
@@ -203,6 +212,13 @@ spec:
|
||||
ports:
|
||||
- port: 4444
|
||||
protocol: TCP
|
||||
- from:
|
||||
- namespaceSelector:
|
||||
matchLabels:
|
||||
kubernetes.io/metadata.name: github-runner
|
||||
ports:
|
||||
- port: 4444
|
||||
protocol: TCP
|
||||
podSelector: {}
|
||||
policyTypes:
|
||||
- Ingress
|
||||
|
||||
427
apps/selenium/selenium-grid.yaml
Normal file
427
apps/selenium/selenium-grid.yaml
Normal file
@@ -0,0 +1,427 @@
|
||||
# Selenium Grid 4 — RKE2 deployment
|
||||
#
|
||||
# Hub + chrome + firefox + edge browser nodes serving fleet-wide AAT runs from
|
||||
# the GitHub Actions self-hosted runners. ArgoCD owns this namespace from
|
||||
# 2026-05-25 (`infra-selenium` Application; previously these resources were
|
||||
# orphan kubectl-applied since 2026-03-15).
|
||||
#
|
||||
# Endpoints:
|
||||
# - Internal cluster: http://selenium-hub.selenium.svc.cluster.local:4444
|
||||
# - LAN LoadBalancer (MetalLB): http://10.0.56.208:4444
|
||||
# - Traefik public: https://selenium.iamworkin.lan
|
||||
#
|
||||
# Browser maxSessions:
|
||||
# - chrome 2 (bumped from 1 on 2026-05-25 morning-routine — AAT-heavy
|
||||
# Print.Web help-screenshots was the global bottleneck;
|
||||
# see commit history for ops/runner-replica-rightsize)
|
||||
# - firefox 1
|
||||
# - edge 1
|
||||
#
|
||||
# Screenshots + video recording write to NFS via the chrome video sidecar.
|
||||
# See: CLAUDE.md "Selenium Grid & Visual AAT Testing" + bluejay-infra ADR notes.
|
||||
---
|
||||
apiVersion: v1
|
||||
kind: Service
|
||||
metadata:
|
||||
labels:
|
||||
app: selenium-hub
|
||||
app.kubernetes.io/name: selenium-hub
|
||||
app.kubernetes.io/part-of: selenium-grid
|
||||
name: selenium-hub
|
||||
namespace: selenium
|
||||
spec:
|
||||
ports:
|
||||
- name: web
|
||||
port: 4444
|
||||
targetPort: 4444
|
||||
- name: publish
|
||||
port: 4442
|
||||
targetPort: 4442
|
||||
- name: subscribe
|
||||
port: 4443
|
||||
targetPort: 4443
|
||||
selector:
|
||||
app: selenium-hub
|
||||
type: ClusterIP
|
||||
---
|
||||
apiVersion: v1
|
||||
kind: Service
|
||||
metadata:
|
||||
annotations:
|
||||
metallb.io/ip-allocated-from-pool: bluejay-pool
|
||||
metallb.universe.tf/loadBalancerIPs: 10.0.56.208
|
||||
labels:
|
||||
app: selenium-hub
|
||||
component: external-access
|
||||
name: selenium-hub-external
|
||||
namespace: selenium
|
||||
spec:
|
||||
clusterIP: 10.43.90.147
|
||||
clusterIPs:
|
||||
- 10.43.90.147
|
||||
externalTrafficPolicy: Local
|
||||
healthCheckNodePort: 32213
|
||||
ports:
|
||||
- name: web
|
||||
nodePort: 32411
|
||||
port: 4444
|
||||
targetPort: 4444
|
||||
- name: publish
|
||||
nodePort: 32068
|
||||
port: 4442
|
||||
targetPort: 4442
|
||||
- name: subscribe
|
||||
nodePort: 31000
|
||||
port: 4443
|
||||
targetPort: 4443
|
||||
selector:
|
||||
app: selenium-hub
|
||||
type: LoadBalancer
|
||||
---
|
||||
apiVersion: apps/v1
|
||||
kind: Deployment
|
||||
metadata:
|
||||
labels:
|
||||
app: selenium-hub
|
||||
app.kubernetes.io/name: selenium-hub
|
||||
app.kubernetes.io/part-of: selenium-grid
|
||||
name: selenium-hub
|
||||
namespace: selenium
|
||||
spec:
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app: selenium-hub
|
||||
template:
|
||||
metadata:
|
||||
labels:
|
||||
app: selenium-hub
|
||||
app.kubernetes.io/name: selenium-hub
|
||||
app.kubernetes.io/part-of: selenium-grid
|
||||
spec:
|
||||
containers:
|
||||
- env:
|
||||
- name: SE_NODE_SESSION_TIMEOUT
|
||||
value: '300'
|
||||
- name: SE_SESSION_REQUEST_TIMEOUT
|
||||
value: '300'
|
||||
- name: SE_SESSION_RETRY_INTERVAL
|
||||
value: '5'
|
||||
- name: JAVA_OPTS
|
||||
value: -Xmx512m
|
||||
image: selenium/hub:4.27.0
|
||||
livenessProbe:
|
||||
httpGet:
|
||||
path: /wd/hub/status
|
||||
port: 4444
|
||||
initialDelaySeconds: 30
|
||||
periodSeconds: 15
|
||||
timeoutSeconds: 5
|
||||
name: selenium-hub
|
||||
ports:
|
||||
- containerPort: 4444
|
||||
name: web
|
||||
- containerPort: 4442
|
||||
name: publish
|
||||
- containerPort: 4443
|
||||
name: subscribe
|
||||
readinessProbe:
|
||||
httpGet:
|
||||
path: /wd/hub/status
|
||||
port: 4444
|
||||
initialDelaySeconds: 10
|
||||
periodSeconds: 5
|
||||
timeoutSeconds: 5
|
||||
# Hub baseline working set ~766Mi on 2026-05-25 (75% of prior 1Gi
|
||||
# limit). Bump to 1.5Gi / 1Gi to keep ~50% headroom; matches the
|
||||
# stampede-buffer pattern documented for multus
|
||||
# (feedback_k8s_cni_multus_sizing). CPU left alone — observed 54m
|
||||
# against a 500m limit, no contention.
|
||||
resources:
|
||||
limits:
|
||||
cpu: 500m
|
||||
memory: 1536Mi
|
||||
requests:
|
||||
cpu: 250m
|
||||
memory: 1Gi
|
||||
---
|
||||
apiVersion: apps/v1
|
||||
kind: Deployment
|
||||
metadata:
|
||||
labels:
|
||||
app: selenium-node-chrome
|
||||
app.kubernetes.io/name: selenium-node-chrome
|
||||
app.kubernetes.io/part-of: selenium-grid
|
||||
name: selenium-node-chrome
|
||||
namespace: selenium
|
||||
spec:
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app: selenium-node-chrome
|
||||
template:
|
||||
metadata:
|
||||
labels:
|
||||
app: selenium-node-chrome
|
||||
app.kubernetes.io/name: selenium-node-chrome
|
||||
app.kubernetes.io/part-of: selenium-grid
|
||||
spec:
|
||||
containers:
|
||||
- env:
|
||||
- name: SE_EVENT_BUS_HOST
|
||||
value: selenium-hub
|
||||
- name: SE_EVENT_BUS_PUBLISH_PORT
|
||||
value: '4442'
|
||||
- name: SE_EVENT_BUS_SUBSCRIBE_PORT
|
||||
value: '4443'
|
||||
- name: SE_NODE_MAX_SESSIONS
|
||||
value: '2'
|
||||
- name: SE_NODE_OVERRIDE_MAX_SESSIONS
|
||||
value: 'false'
|
||||
- name: SE_VNC_NO_PASSWORD
|
||||
value: '1'
|
||||
- name: SE_SCREEN_WIDTH
|
||||
value: '1920'
|
||||
- name: SE_SCREEN_HEIGHT
|
||||
value: '1080'
|
||||
- name: SE_NODE_SESSION_TIMEOUT
|
||||
value: '300'
|
||||
image: selenium/node-chrome:4.27.0
|
||||
livenessProbe:
|
||||
httpGet:
|
||||
path: /status
|
||||
port: 5555
|
||||
initialDelaySeconds: 30
|
||||
periodSeconds: 15
|
||||
name: selenium-chrome
|
||||
ports:
|
||||
- containerPort: 5555
|
||||
name: node
|
||||
readinessProbe:
|
||||
httpGet:
|
||||
path: /status
|
||||
port: 5555
|
||||
initialDelaySeconds: 15
|
||||
periodSeconds: 5
|
||||
# Chromium-based browser node. Bumped from 1Gi -> 2Gi (req 512Mi
|
||||
# -> 1Gi) on 2026-05-25 — Edge had 51 OOMKills in 5d on the
|
||||
# original 1Gi cap (~1 OOM every 2.4h), and Chrome at maxSessions=2
|
||||
# was running 684Mi idle on the same cap. Matches the Firefox node's
|
||||
# tested-stable 2Gi limit. CPU unchanged.
|
||||
resources:
|
||||
limits:
|
||||
cpu: '1'
|
||||
memory: 2Gi
|
||||
requests:
|
||||
cpu: 500m
|
||||
memory: 1Gi
|
||||
volumeMounts:
|
||||
- mountPath: /dev/shm
|
||||
name: dshm
|
||||
- env:
|
||||
- name: DISPLAY_CONTAINER_NAME
|
||||
value: localhost
|
||||
- name: SE_SCREEN_WIDTH
|
||||
value: '1920'
|
||||
- name: SE_SCREEN_HEIGHT
|
||||
value: '1080'
|
||||
- name: SE_VIDEO_FILE_NAME
|
||||
value: auto
|
||||
- name: SE_VIDEO_UPLOAD_ENABLED
|
||||
value: 'false'
|
||||
image: selenium/video:ffmpeg-7.1-20250101
|
||||
name: video
|
||||
resources:
|
||||
limits:
|
||||
cpu: 500m
|
||||
memory: 768Mi
|
||||
requests:
|
||||
cpu: 250m
|
||||
memory: 384Mi
|
||||
volumeMounts:
|
||||
- mountPath: /videos
|
||||
name: selenium-videos
|
||||
volumes:
|
||||
- emptyDir:
|
||||
medium: Memory
|
||||
sizeLimit: 2Gi
|
||||
name: dshm
|
||||
- emptyDir:
|
||||
sizeLimit: 5Gi
|
||||
name: selenium-videos
|
||||
---
|
||||
apiVersion: apps/v1
|
||||
kind: Deployment
|
||||
metadata:
|
||||
labels:
|
||||
app: selenium-node-firefox
|
||||
app.kubernetes.io/name: selenium-node-firefox
|
||||
app.kubernetes.io/part-of: selenium-grid
|
||||
name: selenium-node-firefox
|
||||
namespace: selenium
|
||||
spec:
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app: selenium-node-firefox
|
||||
template:
|
||||
metadata:
|
||||
labels:
|
||||
app: selenium-node-firefox
|
||||
app.kubernetes.io/name: selenium-node-firefox
|
||||
app.kubernetes.io/part-of: selenium-grid
|
||||
spec:
|
||||
containers:
|
||||
- env:
|
||||
- name: SE_EVENT_BUS_HOST
|
||||
value: selenium-hub
|
||||
- name: SE_EVENT_BUS_PUBLISH_PORT
|
||||
value: '4442'
|
||||
- name: SE_EVENT_BUS_SUBSCRIBE_PORT
|
||||
value: '4443'
|
||||
- name: SE_NODE_MAX_SESSIONS
|
||||
value: '1'
|
||||
- name: SE_NODE_OVERRIDE_MAX_SESSIONS
|
||||
value: 'true'
|
||||
- name: SE_VNC_NO_PASSWORD
|
||||
value: '1'
|
||||
- name: SE_START_VNC
|
||||
value: 'false'
|
||||
- name: SE_SCREEN_WIDTH
|
||||
value: '1920'
|
||||
- name: SE_SCREEN_HEIGHT
|
||||
value: '1080'
|
||||
- name: SE_NODE_SESSION_TIMEOUT
|
||||
value: '300'
|
||||
image: selenium/node-firefox:4.27.0
|
||||
livenessProbe:
|
||||
failureThreshold: 5
|
||||
httpGet:
|
||||
path: /status
|
||||
port: 5555
|
||||
initialDelaySeconds: 30
|
||||
periodSeconds: 15
|
||||
timeoutSeconds: 5
|
||||
name: selenium-firefox
|
||||
ports:
|
||||
- containerPort: 5555
|
||||
name: node
|
||||
readinessProbe:
|
||||
failureThreshold: 5
|
||||
httpGet:
|
||||
path: /status
|
||||
port: 5555
|
||||
initialDelaySeconds: 15
|
||||
periodSeconds: 5
|
||||
timeoutSeconds: 5
|
||||
resources:
|
||||
limits:
|
||||
cpu: '1'
|
||||
memory: 2Gi
|
||||
requests:
|
||||
cpu: 500m
|
||||
memory: 1Gi
|
||||
volumeMounts:
|
||||
- mountPath: /dev/shm
|
||||
name: dshm
|
||||
volumes:
|
||||
- emptyDir:
|
||||
medium: Memory
|
||||
sizeLimit: 2Gi
|
||||
name: dshm
|
||||
---
|
||||
apiVersion: apps/v1
|
||||
kind: Deployment
|
||||
metadata:
|
||||
labels:
|
||||
app: selenium-node-edge
|
||||
app.kubernetes.io/name: selenium-node-edge
|
||||
app.kubernetes.io/part-of: selenium-grid
|
||||
name: selenium-node-edge
|
||||
namespace: selenium
|
||||
spec:
|
||||
replicas: 1
|
||||
selector:
|
||||
matchLabels:
|
||||
app: selenium-node-edge
|
||||
template:
|
||||
metadata:
|
||||
labels:
|
||||
app: selenium-node-edge
|
||||
app.kubernetes.io/name: selenium-node-edge
|
||||
app.kubernetes.io/part-of: selenium-grid
|
||||
spec:
|
||||
containers:
|
||||
- env:
|
||||
- name: SE_EVENT_BUS_HOST
|
||||
value: selenium-hub
|
||||
- name: SE_EVENT_BUS_PUBLISH_PORT
|
||||
value: '4442'
|
||||
- name: SE_EVENT_BUS_SUBSCRIBE_PORT
|
||||
value: '4443'
|
||||
- name: SE_NODE_MAX_SESSIONS
|
||||
value: '1'
|
||||
- name: SE_NODE_OVERRIDE_MAX_SESSIONS
|
||||
value: 'true'
|
||||
- name: SE_VNC_NO_PASSWORD
|
||||
value: '1'
|
||||
- name: SE_SCREEN_WIDTH
|
||||
value: '1920'
|
||||
- name: SE_SCREEN_HEIGHT
|
||||
value: '1080'
|
||||
- name: SE_NODE_SESSION_TIMEOUT
|
||||
value: '300'
|
||||
image: selenium/node-edge:4.27.0
|
||||
livenessProbe:
|
||||
httpGet:
|
||||
path: /status
|
||||
port: 5555
|
||||
initialDelaySeconds: 30
|
||||
periodSeconds: 15
|
||||
name: selenium-edge
|
||||
ports:
|
||||
- containerPort: 5555
|
||||
name: node
|
||||
readinessProbe:
|
||||
httpGet:
|
||||
path: /status
|
||||
port: 5555
|
||||
initialDelaySeconds: 15
|
||||
periodSeconds: 5
|
||||
# Chromium-based browser node. Bumped from 1Gi -> 2Gi (req 512Mi
|
||||
# -> 1Gi) on 2026-05-25 — Edge had 51 OOMKills in 5d on the
|
||||
# original 1Gi cap (~1 OOM every 2.4h), and Chrome at maxSessions=2
|
||||
# was running 684Mi idle on the same cap. Matches the Firefox node's
|
||||
# tested-stable 2Gi limit. CPU unchanged.
|
||||
resources:
|
||||
limits:
|
||||
cpu: '1'
|
||||
memory: 2Gi
|
||||
requests:
|
||||
cpu: 500m
|
||||
memory: 1Gi
|
||||
volumeMounts:
|
||||
- mountPath: /dev/shm
|
||||
name: dshm
|
||||
volumes:
|
||||
- emptyDir:
|
||||
medium: Memory
|
||||
sizeLimit: 2Gi
|
||||
name: dshm
|
||||
---
|
||||
apiVersion: traefik.io/v1alpha1
|
||||
kind: IngressRoute
|
||||
metadata:
|
||||
name: selenium-hub
|
||||
namespace: selenium
|
||||
spec:
|
||||
entryPoints:
|
||||
- websecure
|
||||
routes:
|
||||
- kind: Rule
|
||||
match: Host(`selenium.iamworkin.lan`)
|
||||
services:
|
||||
- name: selenium-hub
|
||||
port: 4444
|
||||
tls:
|
||||
secretName: selenium-tls
|
||||
@@ -1,285 +0,0 @@
|
||||
using FluentAssertions;
|
||||
using YamlDotNet.RepresentationModel;
|
||||
using Xunit;
|
||||
|
||||
namespace BluejayInfraLint.Tests;
|
||||
|
||||
[Trait("Category", "Unit")]
|
||||
public sealed class FcDesktopCapacityPolicyTests
|
||||
{
|
||||
private static readonly ManifestInventory Inventory = ManifestInventory.Load();
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_AppDirectoryMustExist()
|
||||
{
|
||||
Directory.Exists(Path.Combine(Inventory.BluejayRoot, "apps", "fc-desktop"))
|
||||
.Should()
|
||||
.BeTrue();
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_MustHaveExactlyOneResourceQuota()
|
||||
{
|
||||
FcDesktopDocuments()
|
||||
.Where(document => document.Kind == "ResourceQuota")
|
||||
.Should()
|
||||
.ContainSingle();
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_ResourceQuotaMustAdoptLiveSessionCapObject()
|
||||
{
|
||||
var quota = ResourceQuota();
|
||||
|
||||
quota.RelativePath.Should().Be("fc-desktop/resourcequota.yaml");
|
||||
quota.Name.Should().Be("fc-desktop-session-cap");
|
||||
quota.Namespace.Should().Be("fc-desktop");
|
||||
}
|
||||
|
||||
[Theory]
|
||||
[InlineData("count/pods", "15")]
|
||||
[InlineData("requests.cpu", "8")]
|
||||
[InlineData("requests.memory", "16Gi")]
|
||||
[InlineData("requests.storage", "500Gi")]
|
||||
[InlineData("persistentvolumeclaims", "30")]
|
||||
public void FcDesktop_ResourceQuotaMustDeclarePhaseOneHardLimits(string key, string value)
|
||||
{
|
||||
ResourceQuota().Scalar("spec", "hard", key).Should().Be(value);
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_ResourceQuotaMustCarryTraceableLabels()
|
||||
{
|
||||
ResourceQuotaLabels()
|
||||
.Should()
|
||||
.Contain(new Dictionary<string, string>
|
||||
{
|
||||
["app.kubernetes.io/name"] = "fc-desktop",
|
||||
["app.kubernetes.io/part-of"] = "remotedesktop",
|
||||
["app.kubernetes.io/component"] = "capacity-guard",
|
||||
["app.kubernetes.io/managed-by"] = "argocd",
|
||||
["flowercore.io/owner"] = "infra",
|
||||
});
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_ResourceQuotaMustUseRequestsKeysForComputeCap()
|
||||
{
|
||||
var hardKeys = HardLimitKeys(ResourceQuota());
|
||||
|
||||
hardKeys.Should().Contain(new[] { "requests.cpu", "requests.memory" });
|
||||
hardKeys.Should().NotContain(new[] { "cpu", "memory" });
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_ResourceQuotaMustAvoidDestructiveArgoAnnotations()
|
||||
{
|
||||
var quota = ResourceQuota();
|
||||
|
||||
quota.Scalar("metadata", "annotations", "argocd.argoproj.io/hook").Should().BeNull();
|
||||
quota.Scalar("metadata", "annotations", "argocd.argoproj.io/hook-delete-policy").Should().BeNull();
|
||||
|
||||
var syncOptions = quota.Scalar("metadata", "annotations", "argocd.argoproj.io/sync-options") ?? string.Empty;
|
||||
syncOptions.Should().NotContain("Force=true");
|
||||
syncOptions.Should().NotContain("Replace=true");
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_ResourceQuotaMustRecordPhaseAInfraOnlyScope()
|
||||
{
|
||||
ResourceQuota().Scalar("metadata", "annotations", "flowercore.io/phase")
|
||||
.Should()
|
||||
.Be("sprint-44-cx-9-phase-a");
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_MustHaveExactlyOneLimitRange()
|
||||
{
|
||||
FcDesktopDocuments()
|
||||
.Where(document => document.Kind == "LimitRange")
|
||||
.Should()
|
||||
.ContainSingle();
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_LimitRangeMustLiveBesideResourceQuota()
|
||||
{
|
||||
var limitRange = LimitRange();
|
||||
|
||||
limitRange.RelativePath.Should().Be("fc-desktop/limitrange.yaml");
|
||||
limitRange.Name.Should().Be("fc-desktop-pod-defaults");
|
||||
limitRange.Namespace.Should().Be("fc-desktop");
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_LimitRangeMustHaveSingleContainerRule()
|
||||
{
|
||||
var limit = LimitRangeRule();
|
||||
|
||||
LimitRange().MappingSequence("spec", "limits").Should().ContainSingle();
|
||||
ManifestNodeExtensions.Scalar(limit, "type").Should().Be("Container");
|
||||
}
|
||||
|
||||
[Theory]
|
||||
[InlineData("default", "cpu", "1.0")]
|
||||
[InlineData("default", "memory", "2Gi")]
|
||||
[InlineData("defaultRequest", "cpu", "500m")]
|
||||
[InlineData("defaultRequest", "memory", "1Gi")]
|
||||
[InlineData("max", "cpu", "2.0")]
|
||||
[InlineData("max", "memory", "4Gi")]
|
||||
[InlineData("min", "cpu", "100m")]
|
||||
[InlineData("min", "memory", "128Mi")]
|
||||
public void FcDesktop_LimitRangeMustDeclarePerPodShape(string section, string key, string value)
|
||||
{
|
||||
ManifestNodeExtensions.Scalar(LimitRangeRule(), section, key).Should().Be(value);
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_LimitRangeMustCarryTraceableLabels()
|
||||
{
|
||||
LimitRangeLabels()
|
||||
.Should()
|
||||
.Contain(new Dictionary<string, string>
|
||||
{
|
||||
["app.kubernetes.io/name"] = "fc-desktop",
|
||||
["app.kubernetes.io/part-of"] = "remotedesktop",
|
||||
["app.kubernetes.io/component"] = "capacity-guard",
|
||||
["app.kubernetes.io/managed-by"] = "argocd",
|
||||
["flowercore.io/owner"] = "infra",
|
||||
});
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_LimitRangeMustAvoidDestructiveArgoAnnotations()
|
||||
{
|
||||
var limitRange = LimitRange();
|
||||
|
||||
limitRange.Scalar("metadata", "annotations", "argocd.argoproj.io/hook").Should().BeNull();
|
||||
limitRange.Scalar("metadata", "annotations", "argocd.argoproj.io/hook-delete-policy").Should().BeNull();
|
||||
|
||||
var syncOptions = limitRange.Scalar("metadata", "annotations", "argocd.argoproj.io/sync-options") ?? string.Empty;
|
||||
syncOptions.Should().NotContain("Force=true");
|
||||
syncOptions.Should().NotContain("Replace=true");
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_LimitRangeMustRecordPhaseAInfraOnlyScope()
|
||||
{
|
||||
LimitRange().Scalar("metadata", "annotations", "flowercore.io/phase")
|
||||
.Should()
|
||||
.Be("sprint-44-cx-9-phase-a");
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_BluejayInfraMustNotOwnDeploymentOrService()
|
||||
{
|
||||
FcDesktopDocuments()
|
||||
.Select(document => document.Kind)
|
||||
.Should()
|
||||
.NotContain(new[] { "Deployment", "Service" });
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_BluejayInfraMustOnlyOwnInfraResourceKinds()
|
||||
{
|
||||
var allowedKinds = new HashSet<string>(StringComparer.Ordinal)
|
||||
{
|
||||
"Certificate",
|
||||
"IngressRoute",
|
||||
"NetworkPolicy",
|
||||
"ResourceQuota",
|
||||
"LimitRange",
|
||||
};
|
||||
|
||||
FcDesktopDocuments()
|
||||
.Select(document => document.Kind)
|
||||
.Should()
|
||||
.OnlyContain(kind => allowedKinds.Contains(kind));
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_NetworkPolicySetMustRemainPresent()
|
||||
{
|
||||
FcDesktopDocuments()
|
||||
.Where(document => document.Kind == "NetworkPolicy")
|
||||
.Select(document => document.Name)
|
||||
.Should()
|
||||
.BeEquivalentTo(
|
||||
"desktop-isolation",
|
||||
"fc-desktop-default-deny",
|
||||
"remotedesktop-web-isolation",
|
||||
"cm-acme-http-solver-allow");
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDesktop_TlsIngressMustRemainOwnedByInfra()
|
||||
{
|
||||
FcDesktopDocuments()
|
||||
.Should()
|
||||
.Contain(document => document.Kind == "Certificate" && document.Name == "remotedesktop-web-tls")
|
||||
.And
|
||||
.Contain(document => document.Kind == "IngressRoute" && document.Name == "remotedesktop-web");
|
||||
}
|
||||
|
||||
private static IReadOnlyList<ManifestDocument> FcDesktopDocuments()
|
||||
{
|
||||
return Inventory.Documents
|
||||
.Where(document => document.RelativePath.StartsWith("fc-desktop/", StringComparison.Ordinal))
|
||||
.ToList();
|
||||
}
|
||||
|
||||
private static ManifestDocument ResourceQuota()
|
||||
{
|
||||
return FcDesktopDocuments()
|
||||
.Single(document => document.Kind == "ResourceQuota");
|
||||
}
|
||||
|
||||
private static ManifestDocument LimitRange()
|
||||
{
|
||||
return FcDesktopDocuments()
|
||||
.Single(document => document.Kind == "LimitRange");
|
||||
}
|
||||
|
||||
private static YamlMappingNode LimitRangeRule()
|
||||
{
|
||||
return LimitRange()
|
||||
.MappingSequence("spec", "limits")
|
||||
.Single();
|
||||
}
|
||||
|
||||
private static IReadOnlySet<string> HardLimitKeys(ManifestDocument document)
|
||||
{
|
||||
var hard = ManifestNodeExtensions.Mapping(document.Root, "spec", "hard")
|
||||
?? throw new InvalidOperationException($"{document.Descriptor} is missing spec.hard.");
|
||||
|
||||
return hard.Children.Keys
|
||||
.OfType<YamlScalarNode>()
|
||||
.Select(key => key.Value)
|
||||
.Where(value => !string.IsNullOrWhiteSpace(value))
|
||||
.Cast<string>()
|
||||
.ToHashSet(StringComparer.Ordinal);
|
||||
}
|
||||
|
||||
private static IReadOnlyDictionary<string, string> ResourceQuotaLabels()
|
||||
{
|
||||
return Labels(ResourceQuota());
|
||||
}
|
||||
|
||||
private static IReadOnlyDictionary<string, string> LimitRangeLabels()
|
||||
{
|
||||
return Labels(LimitRange());
|
||||
}
|
||||
|
||||
private static IReadOnlyDictionary<string, string> Labels(ManifestDocument document)
|
||||
{
|
||||
var labels = ManifestNodeExtensions.Mapping(document.Root, "metadata", "labels")
|
||||
?? throw new InvalidOperationException($"{document.Descriptor} is missing metadata.labels.");
|
||||
|
||||
return labels.Children
|
||||
.Where(entry => entry.Key is YamlScalarNode && entry.Value is YamlScalarNode)
|
||||
.ToDictionary(
|
||||
entry => ((YamlScalarNode)entry.Key).Value ?? string.Empty,
|
||||
entry => ((YamlScalarNode)entry.Value).Value ?? string.Empty,
|
||||
StringComparer.Ordinal);
|
||||
}
|
||||
}
|
||||
@@ -67,6 +67,7 @@ public sealed class FleetManifestLintTests
|
||||
["github-runner-chat"] = "https://github.com/astoltz/FlowerCore.Chat",
|
||||
["github-runner-mysql"] = "https://github.com/astoltz/FlowerCore.MySQL",
|
||||
["github-runner-kiosk-linux"] = "https://github.com/astoltz/FlowerCore.Kiosk.Linux",
|
||||
["github-runner-updater"] = "https://github.com/astoltz/FlowerCore.Updater",
|
||||
};
|
||||
|
||||
private static readonly HashSet<string> ScaledLinuxRunnerDeployments = new(StringComparer.Ordinal)
|
||||
@@ -80,6 +81,7 @@ public sealed class FleetManifestLintTests
|
||||
"github-runner-chat",
|
||||
"github-runner-mysql",
|
||||
"github-runner-kiosk-linux",
|
||||
"github-runner-updater",
|
||||
};
|
||||
|
||||
private static readonly IReadOnlyDictionary<string, string> WritableRunnerEnv = new Dictionary<string, string>(StringComparer.Ordinal)
|
||||
@@ -234,7 +236,7 @@ public sealed class FleetManifestLintTests
|
||||
{
|
||||
deployments.Should().ContainKey(expectedRunner.Key);
|
||||
|
||||
var container = RunnerContainer(deployments[expectedRunner.Key]);
|
||||
var container = deployments[expectedRunner.Key].MainContainerMappings().Should().ContainSingle().Subject;
|
||||
EnvValue(container, "REPO_URL").Should().Be(expectedRunner.Value);
|
||||
EnvValue(container, "EPHEMERAL").Should().Be("true");
|
||||
EnvValue(container, "LABELS").Should().Be("self-hosted,linux,fc-build-linux");
|
||||
@@ -250,7 +252,7 @@ public sealed class FleetManifestLintTests
|
||||
{
|
||||
foreach (var deployment in GitHubRunnerDeployments().Values)
|
||||
{
|
||||
var container = RunnerContainer(deployment);
|
||||
var container = deployment.MainContainerMappings().Should().ContainSingle().Subject;
|
||||
|
||||
foreach (var expectedEnv in WritableRunnerEnv)
|
||||
{
|
||||
@@ -277,7 +279,10 @@ public sealed class FleetManifestLintTests
|
||||
foreach (var deploymentName in ScaledLinuxRunnerDeployments)
|
||||
{
|
||||
var deployment = deployments[deploymentName];
|
||||
ReplicaCount(deployment).Should().Be(2);
|
||||
// Scaled runners must have >= 2 replicas (avoid single-pod bottleneck).
|
||||
// Individual deployments may be tuned upward per CI activity — see
|
||||
// "runners: right-size replica counts per 14d CI activity (#24)".
|
||||
ReplicaCount(deployment).Should().BeGreaterOrEqualTo(2, $"{deploymentName} is in the scaled set and must run with at least 2 replicas");
|
||||
|
||||
var volumes = deployment.MappingSequence("spec", "template", "spec", "volumes");
|
||||
var claimNames = volumes
|
||||
@@ -303,6 +308,108 @@ public sealed class FleetManifestLintTests
|
||||
.Be("github-runner-nuget-cache");
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void Runners_MustNotPinToOperatorWorkstationHosts()
|
||||
{
|
||||
// CRITICAL SAFETY (operator directive 2026-05-26): BLUEJAY-WS is the
|
||||
// operator's primary workstation — host of the 1Password Connect
|
||||
// bearer token, fcadmin SSH keys to noc1, signing CA private keys,
|
||||
// and source for every FC repo. A self-hosted GitHub Actions runner
|
||||
// there would execute arbitrary PR code with that local access.
|
||||
// Build-side analog of the Sprint 9 NEW safe-account exclusion gate
|
||||
// (Puppet GPO/AppLocker/WDAC/audit-forwarder modules refuse to apply
|
||||
// on BLUEJAY-WS). This lint asserts no GitHub-runner Deployment in
|
||||
// apps/github-runner/ pins to a forbidden operator-workstation host
|
||||
// via nodeName, nodeSelector, nodeAffinity, or tolerations.
|
||||
// Existing legacy `bluejay-ws-sandbox-1` GitHub-registered runner is
|
||||
// out of scope here (it's a runtime registration, not a K8s
|
||||
// Deployment) — see CLAUDE.md "Common Mistakes" entry and
|
||||
// feedback_bluejay_ws_never_public_runner.md.
|
||||
var forbiddenHostPatterns = new[]
|
||||
{
|
||||
"bluejay-ws",
|
||||
"BLUEJAY-WS",
|
||||
"bluejay-ws.iamworkin.lan",
|
||||
"iamworkin-ws",
|
||||
};
|
||||
|
||||
bool ContainsForbidden(string? value) =>
|
||||
!string.IsNullOrWhiteSpace(value)
|
||||
&& forbiddenHostPatterns.Any(pattern => value!.Contains(pattern, StringComparison.OrdinalIgnoreCase));
|
||||
|
||||
var violations = GitHubRunnerDeployments().Values.SelectMany(deployment =>
|
||||
{
|
||||
var local = new List<string>();
|
||||
var podSpec = ManifestNodeExtensions.Mapping(deployment.Root, "spec", "template", "spec");
|
||||
if (podSpec is null)
|
||||
{
|
||||
return local;
|
||||
}
|
||||
|
||||
// nodeName: pins the pod to a specific node by name.
|
||||
var nodeName = ManifestNodeExtensions.Scalar(podSpec, "nodeName");
|
||||
if (ContainsForbidden(nodeName))
|
||||
{
|
||||
local.Add($"{deployment.Name} sets nodeName='{nodeName}' which targets a forbidden operator-workstation host.");
|
||||
}
|
||||
|
||||
// nodeSelector: dict of label → value pinning the pod to nodes
|
||||
// carrying matching labels. Examples that would trip this:
|
||||
// kubernetes.io/hostname: bluejay-ws
|
||||
// flowercore.io/host: bluejay-ws.iamworkin.lan
|
||||
var nodeSelector = ManifestNodeExtensions.Mapping(podSpec, "nodeSelector");
|
||||
if (nodeSelector is not null)
|
||||
{
|
||||
foreach (var entry in nodeSelector.Children)
|
||||
{
|
||||
var key = entry.Key is YamlScalarNode keyScalar ? keyScalar.Value : null;
|
||||
var value = entry.Value is YamlScalarNode valueScalar ? valueScalar.Value : null;
|
||||
if (ContainsForbidden(value))
|
||||
{
|
||||
local.Add($"{deployment.Name} has nodeSelector entry '{key}: {value}' which targets a forbidden operator-workstation host.");
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// nodeAffinity: matchExpressions over node labels.
|
||||
foreach (var term in ManifestNodeExtensions.MappingSequence(podSpec, "affinity", "nodeAffinity", "requiredDuringSchedulingIgnoredDuringExecution", "nodeSelectorTerms"))
|
||||
{
|
||||
foreach (var expr in ManifestNodeExtensions.MappingSequence(term, "matchExpressions"))
|
||||
{
|
||||
var key = ManifestNodeExtensions.Scalar(expr, "key");
|
||||
foreach (var valueNode in ManifestNodeExtensions.ScalarSequence(expr, "values"))
|
||||
{
|
||||
if (ContainsForbidden(valueNode))
|
||||
{
|
||||
local.Add($"{deployment.Name} has nodeAffinity matchExpression '{key}' value '{valueNode}' which targets a forbidden operator-workstation host.");
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// tolerations: scheduling onto a tainted operator-workstation
|
||||
// node would let the runner run there. Forbid any toleration
|
||||
// value that names the workstation.
|
||||
foreach (var toleration in ManifestNodeExtensions.MappingSequence(podSpec, "tolerations"))
|
||||
{
|
||||
var key = ManifestNodeExtensions.Scalar(toleration, "key");
|
||||
var value = ManifestNodeExtensions.Scalar(toleration, "value");
|
||||
if (ContainsForbidden(key))
|
||||
{
|
||||
local.Add($"{deployment.Name} has toleration key '{key}' which targets a forbidden operator-workstation host.");
|
||||
}
|
||||
if (ContainsForbidden(value))
|
||||
{
|
||||
local.Add($"{deployment.Name} has toleration value '{value}' which targets a forbidden operator-workstation host.");
|
||||
}
|
||||
}
|
||||
|
||||
return local;
|
||||
}).ToList();
|
||||
|
||||
violations.Should().BeEmpty("BLUEJAY-WS / iamworkin-ws must never host a fleet GitHub Actions runner; see CLAUDE.md 'Registering BLUEJAY-WS as a fleet GitHub Actions runner' and feedback_bluejay_ws_never_public_runner.md");
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void Monitoring_MustAlertWhenLinuxRunnerDeploymentIsUnavailable()
|
||||
{
|
||||
@@ -430,6 +537,7 @@ public sealed class FleetManifestLintTests
|
||||
var expectedFiles = new[]
|
||||
{
|
||||
"1password-item.yaml",
|
||||
"argocd-application.yaml",
|
||||
"certificate-web.yaml",
|
||||
"clusterrole-operator.yaml",
|
||||
"clusterrolebinding-operator.yaml",
|
||||
@@ -585,15 +693,17 @@ public sealed class FleetManifestLintTests
|
||||
}
|
||||
|
||||
[Fact]
|
||||
public void FcDeviceManagement_MustRelyOnApplicationSetDiscovery()
|
||||
public void FcDeviceManagement_ArgocdApplicationMustMatchApplicationSetDiscoveryConventions()
|
||||
{
|
||||
FcDeviceManagementDocuments()
|
||||
.Should()
|
||||
.NotContain(document => document.Kind == "Application", "the root ApplicationSet owns apps/fc-devicemgmt discovery");
|
||||
var application = FcDeviceManagementDocuments()
|
||||
.Single(document => document.Kind == "Application" && document.Name == "infra-fc-devicemgmt");
|
||||
|
||||
FcDeviceManagementDocuments()
|
||||
application.Namespace.Should().Be("argocd");
|
||||
application.Scalar("spec", "source", "repoURL")
|
||||
.Should()
|
||||
.Contain(document => document.Kind == "Namespace" && document.Name == "fc-devicemgmt");
|
||||
.Be("http://gitea-clusterip.gitea.svc.cluster.local:3000/bluejay/bluejay-infra.git");
|
||||
application.Scalar("spec", "source", "path").Should().Be("apps/fc-devicemgmt");
|
||||
application.Scalar("spec", "destination", "namespace").Should().Be("fc-devicemgmt");
|
||||
}
|
||||
|
||||
private static IEnumerable<string> ProbeViolations(
|
||||
@@ -628,12 +738,6 @@ public sealed class FleetManifestLintTests
|
||||
.ToDictionary(document => document.Name, StringComparer.Ordinal);
|
||||
}
|
||||
|
||||
private static YamlMappingNode RunnerContainer(ManifestDocument deployment)
|
||||
{
|
||||
return deployment.ContainerMappings()
|
||||
.Single(container => string.Equals(ManifestNodeExtensions.Scalar(container, "name"), "runner", StringComparison.Ordinal));
|
||||
}
|
||||
|
||||
private static int ReplicaCount(ManifestDocument document)
|
||||
{
|
||||
return int.TryParse(document.Scalar("spec", "replicas"), out var replicas) ? replicas : 1;
|
||||
@@ -893,6 +997,22 @@ internal sealed record ManifestDocument(
|
||||
.ToList();
|
||||
}
|
||||
|
||||
// MainContainerMappings excludes initContainers. Use this when asserting
|
||||
// properties of the primary container (env, image, volumeMounts) where an
|
||||
// initContainer would be a false-positive match — e.g. the GitHub runner
|
||||
// image's `setup-runner-home` initContainer should not count toward the
|
||||
// single-container assertions on the runner deployments.
|
||||
public IReadOnlyList<YamlMappingNode> MainContainerMappings()
|
||||
{
|
||||
var podSpec = PodSpec();
|
||||
if (podSpec is null)
|
||||
{
|
||||
return Array.Empty<YamlMappingNode>();
|
||||
}
|
||||
|
||||
return ManifestNodeExtensions.MappingSequence(podSpec, "containers").ToList();
|
||||
}
|
||||
|
||||
public IReadOnlyList<ContainerSpec> ContainerSpecs()
|
||||
{
|
||||
return ContainerMappings()
|
||||
|
||||
Reference in New Issue
Block a user