shuffle-tests-across-shards #109

Workflow file for this run

.github/workflows/shuffle-tests-across-shards.yml at 9aad890

	name: shuffle-tests-across-shards

	on:
	# gh api repos/getsentry/sentry/actions/workflows/shuffle-tests-across-shards.yml/dispatches -f ref=shuffle-tests-across-shards
	workflow_dispatch:
	inputs:
	seed:
	description: The seed for the test ordering (all shards must share the same seed)
	required: false

	# run every 30 minutes between 6PM-9AM PST
	schedule:
	- cron: '/30 2-17 * *'

	jobs:
	backend-test:
	name: run backend tests
	runs-on: ubuntu-24.04
	timeout-minutes: 60
	permissions:
	contents: read
	issues: write
	strategy:
	# This helps not having to run multiple jobs because one fails, thus, reducing resource usage
	# and reducing the risk that one of many runs would turn red again (read: intermittent tests)
	fail-fast: false
	matrix:
	# XXX: When updating this, make sure you also update MATRIX_INSTANCE_TOTAL.
	instance: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10]

	env:
	# XXX: `MATRIX_INSTANCE_TOTAL` must be hardcoded to the length of `strategy.matrix.instance`.
	MATRIX_INSTANCE_TOTAL: 11
	SENTRY_SHUFFLE_TESTS: 1
	# All shards must share the same seed; github.run_id is consistent across matrix instances
	SENTRY_SHUFFLE_TESTS_SEED: ${{ inputs.seed \|\| github.run_id }}

	steps:
	- uses: actions/checkout@692973e3d937129bcbf40652eb9f2f61becf3332 # v4.1.7

	- name: Setup sentry env
	uses: ./.github/actions/setup-sentry
	id: setup
	with:
	mode: backend-ci

	- name: Run backend test (${{ steps.setup.outputs.matrix-instance-number }} of ${{ steps.setup.outputs.matrix-instance-total }})
	id: run-tests
	continue-on-error: true
	run: \|
	python3 -b -m pytest \
	--exitfirst \
	tests \
	--reuse-db \
	--ignore tests/acceptance \
	--ignore tests/apidocs \
	--ignore tests/js \
	--ignore tests/tools \
	--ignore tests/relay_integration \
	--ignore tests/symbolicator

	- name: Truncate testids
	if: steps.run-tests.outcome == 'failure' && hashFiles('/tmp/failing-testid') != ''
	run: \|
	# Keep only tests up to and including the failing test;
	# tests that run after it cannot be polluting it.
	read -r FAILING_TESTID < /tmp/failing-testid
	head -n "$(grep -nF "$FAILING_TESTID" /tmp/testids-full \| head -1 \| cut -d: -f1)" /tmp/testids-full > /tmp/testids

	- uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4
	if: steps.run-tests.outcome == 'failure' && hashFiles('/tmp/failing-testid') != ''
	with:
	name: testids-${{ matrix.instance }}
	path: /tmp/testids

	- name: Detect test pollution
	if: steps.run-tests.outcome == 'failure' && hashFiles('/tmp/failing-testid') != ''
	env:
	# just so we get realtime output since detect-test-pollution doesn't print much
	PYTHONUNBUFFERED: 1
	run: \|
	read -r FAILING_TESTID < /tmp/failing-testid
	python .github/workflows/scripts/detect-test-pollution.py \
	--failing-test "$FAILING_TESTID" \
	--testids-file /tmp/testids \
	\| tee /tmp/detect-test-pollution-output
	read -r POLLUTING_TESTID < <(tail -1 /tmp/detect-test-pollution-output)
	echo "detected test pollution: \`pytest $POLLUTING_TESTID $FAILING_TESTID\`" >> "$GITHUB_STEP_SUMMARY"
	echo "sentry sha: ${{ github.sha }}" >> "$GITHUB_STEP_SUMMARY"

	- name: Create GitHub issue
	if: steps.run-tests.outcome == 'failure' && hashFiles('/tmp/failing-testid') != ''
	run: \|
	gh issue create \
	--title "Test pollution: $FAILING_TESTID" \
	--label test-pollution \
	--body "$(cat "$GITHUB_STEP_SUMMARY")"

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

shuffle-tests-across-shards #109

Workflow file

shuffle-tests-across-shards #109

Uh oh!

Workflow file for this run