From 4c5fdde787461652da8abdec6a38ca10c30ce7be Mon Sep 17 00:00:00 2001
From: Ronni Baslund
Date: Mon, 8 Jun 2026 22:56:21 +0200
Subject: [PATCH] fix(infra): docker:24-dind + capacity 2 (fix moby cgroup-v2
 teardown deadlock that hung 'Complete job')

---
Reviewer note: this patch was recovered from a copy whose line breaks and
indentation had been collapsed. The hunk line counts below match their
headers, but the leading whitespace of the YAML lines is reconstructed;
run `git apply --check` (or apply with `--ignore-whitespace`) to confirm
it matches the target file before applying.

 infrastructure/production/fleet/ci/gitea-runner.yaml | 12 ++++++++----
 1 file changed, 8 insertions(+), 4 deletions(-)

diff --git a/infrastructure/production/fleet/ci/gitea-runner.yaml b/infrastructure/production/fleet/ci/gitea-runner.yaml
index 8bee05c..ec694dd 100644
--- a/infrastructure/production/fleet/ci/gitea-runner.yaml
+++ b/infrastructure/production/fleet/ci/gitea-runner.yaml
@@ -37,9 +37,10 @@ data:
     log:
       level: info
     runner:
-      # Run several jobs at once (the 4-app typecheck matrix + image builds)
-      # instead of one-at-a-time. The AX41 has headroom.
-      capacity: 4
+      # Some parallelism without overloading the single shared dind daemon
+      # (concurrent container teardowns trigger moby's cgroup-v2 removal
+      # deadlock). 2 is a safe balance on this node.
+      capacity: 2
       timeout: 3h
       labels:
         - "ubuntu-latest:docker://catthehacker/ubuntu:act-22.04"
@@ -101,7 +102,10 @@ spec:
             - name: runner-config
               mountPath: /config
         - name: dind
-          image: docker:27-dind
+          # docker:24-dind — moby 24 avoids the cgroup-v2 container-removal
+          # deadlock seen on 27 ("removal of container … is already in
+          # progress" looping → "Complete job" hangs).
+          image: docker:24-dind
           securityContext:
             privileged: true
           env: