#!/usr/bin/env bash
#  vim:ts=4:sts=4:sw=4:et
#
#  Author: Hari Sekhon
#  Date: 2020-04-01 18:59:00 +0100 (Wed, 01 Apr 2020)
#
#  https://github.com/harisekhon/bash-tools
#
#  License: see accompanying Hari Sekhon LICENSE file
#
#  If you're using my code you're welcome to connect with me on LinkedIn and optionally send me feedback to help steer this or other code I publish
#
#  https://www.linkedin.com/in/harisekhon
#

# API references for the endpoints this script calls:
#
# https://buildkite.com/docs/apis/rest-api/builds
#
# https://buildkite.com/docs/apis/rest-api/jobs

# Strict mode: abort on command failure, on unset variables and on a failure
# in any stage of a pipeline
set -euo pipefail

# Set DEBUG to any non-empty value to trace every command
[ -n "${DEBUG:-}" ] && set -x

# Absolute directory containing this script, used to locate the library and
# the sibling buildkite_api.sh regardless of the caller's working directory
srcdir="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"

# shellcheck disable=SC1090
. "$srcdir/lib/utils.sh"

# used by usage() in lib/utils.sh
# shellcheck disable=SC2034
usage_description="
Triggers job retries jobs within builds where Failed status was due to a dead or timed out agent, using the BuildKite API

This is slightly better than retrying the failed builds because it restarts those builds from point of agent failure and replaces the Failed status with the real final status

Really BuildKite should auto-retry in this scenario, which can be configured but is not the default, and this script is a quick workaround to retry failed jobs

https://forum.buildkite.community/t/reschedule-builds-on-other-agents-rather-than-fail-builds-when-agents-time-out-or-are-killed-machine-shut-down-or-put-to-sleep/1388

Can optionally specify a pipeline to retry only failed jobs in builds for that pipeline
"

# Argument synopsis: a single optional pipeline
# shellcheck disable=SC2034
usage_args="[<pipeline>]"

# help_usage is not defined in this file - presumably provided by lib/utils.sh
# (confirm there); it is handed the full command line
help_usage "$@"

# Optional first argument: restrict the search to builds of this pipeline
pipeline="${1:-}"

# Default: list builds without restricting to a pipeline
url_path="/builds"

if [ -n "$pipeline" ]; then
    # Same /organizations/{organization}/pipelines/<slug> prefix as the retry
    # call below; the {organization} token is passed through verbatim to
    # buildkite_api.sh (presumably substituted there - confirm in that script)
    url_path="/organizations/{organization}/pipelines/$pipeline/builds"
fi

# jq filter: for every build in state "failed", emit one TSV row
#
#   <build number> <job id> <pipeline slug>
#
# per job whose exit_status is -1. The build is bound to $build before
# descending into .jobs[] so that a build with several matching jobs yields
# several well-formed 3-column rows, rather than one row with extra id columns
# or duplicated rows.
#
# $build is a jq variable, not a shell variable, hence the single quotes
# shellcheck disable=SC2016
dead_agent_jobs_filter='
    .[] |
    select(.state == "failed") |
    . as $build |
    .jobs[] |
    select(.exit_status == -1) |
    [$build.number, .id, $build.pipeline.slug] |
    @tsv
'

# List builds, extract the matching jobs, then retry each one
"$srcdir/buildkite_api.sh" "$url_path" |
jq -r "$dead_agent_jobs_filter" |
while read -r build_number job_id pipeline_slug; do
    # timestamp is not defined in this file - presumably a logging helper from
    # lib/utils.sh (confirm there)
    timestamp "retrying '$pipeline_slug' build '$build_number' job '$job_id'"
    # The response body is discarded; only the exit status matters here
    "$srcdir/buildkite_api.sh" "/organizations/{organization}/pipelines/$pipeline_slug/builds/$build_number/jobs/$job_id/retry" -X PUT >/dev/null
done