From c0460fcde7051a8d07612ec2a17718d3c3019bb0 Mon Sep 17 00:00:00 2001 From: Aleksandr Nogikh Date: Tue, 21 Oct 2025 14:37:49 +0200 Subject: syz-cluster: set workflow step retry strategy When a triage or build step coincides with a cron job that polls for new kernel trees, the step often fails because the git command notices that the repository is being updated. In this case, the step logs an error and exits with status=1. Argo Workflows offers functionality to retry such steps up to a specified number of times, with exponentially increasing backoff. Configure the build and triage step templates to retry up to 3 times, waiting 5 and then 10 minutes between the retries. --- syz-cluster/workflow/build-step/workflow-template.yaml | 4 ++++ syz-cluster/workflow/triage-step/workflow-template.yaml | 4 ++++ 2 files changed, 8 insertions(+) (limited to 'syz-cluster') diff --git a/syz-cluster/workflow/build-step/workflow-template.yaml b/syz-cluster/workflow/build-step/workflow-template.yaml index 76edbf037..b7b343745 100644 --- a/syz-cluster/workflow/build-step/workflow-template.yaml +++ b/syz-cluster/workflow/build-step/workflow-template.yaml @@ -8,6 +8,10 @@ metadata: spec: templates: - name: build-step + retryStrategy: + limit: "3" + backoff: + duration: "5m" inputs: parameters: - name: findings diff --git a/syz-cluster/workflow/triage-step/workflow-template.yaml b/syz-cluster/workflow/triage-step/workflow-template.yaml index 37427cf73..126d6c775 100644 --- a/syz-cluster/workflow/triage-step/workflow-template.yaml +++ b/syz-cluster/workflow/triage-step/workflow-template.yaml @@ -8,6 +8,10 @@ metadata: spec: templates: - name: triage-step + retryStrategy: + limit: "3" + backoff: + duration: "5m" initContainers: - name: setup-overlays image: alpine/git:latest -- cgit mrf-deployment