Add backend selective testing workflow

rbro112 · rbro112 · commit 74eba04118fc · 2025-12-29T12:20:00.000-08:00
diff --git a/.github/workflows/backend_selective_testing.yml b/.github/workflows/backend_selective_testing.yml
@@ -0,0 +1,83 @@
+# Runs the backend test suite on pull requests, restricted to the tests that a
+# previously recorded coverage database associates with the changed files.
+name: backend - selective
+
+on:
+  pull_request:
+
+# Cancel in progress workflows on pull_requests.
+# https://docs.github.com/en/actions/using-jobs/using-concurrency#example-using-a-fallback-value
+concurrency:
+  group: ${{ github.workflow }}-${{ github.head_ref || github.run_id }}
+  cancel-in-progress: true
+
+jobs:
+  backend-test-selective:
+    name: backend test (selective)
+    runs-on: ubuntu-24.04
+    timeout-minutes: 60
+    permissions:
+      contents: read
+      id-token: write
+      actions: read # used for DIM metadata and for downloading the coverage artifact
+    strategy:
+      fail-fast: false
+      matrix:
+        instance:
+          [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21]
+
+    env:
+      # Must stay equal to the number of entries in matrix.instance above.
+      MATRIX_INSTANCE_TOTAL: 22
+
+    steps:
+      - uses: actions/checkout@692973e3d937129bcbf40652eb9f2f61becf3332 # v4.1.7
+
+      - name: Setup sentry env
+        uses: ./.github/actions/setup-sentry
+        id: setup
+        with:
+          mode: backend-ci
+
+      # TODO: Gcloud
+      # NOTE(review): download-artifact treats `path` as a destination directory,
+      # so `.coverage` will be a directory holding the artifact's files. Confirm
+      # that COVERAGE_DB_PATH below points at the SQLite file inside it.
+      - name: Download coverage database
+        uses: actions/download-artifact@v4
+        with:
+          name: pycoverage-sqlite-combined-20529759656
+          path: .coverage
+          run-id: 20529759656
+          # `run-id` is only honoured when a token is supplied; without it the
+          # action looks for the artifact in the current run and fails.
+          github-token: ${{ github.token }}
+
+      - name: Get changed files
+        id: changed-files
+        uses: tj-actions/changed-files@24d32ffd492484c1d75e0c0b894501ddb9d30d62
+        with:
+          # The pytest hook splits CHANGED_FILES on commas, so override the
+          # action's default space separator.
+          separator: ","
+
+      - name: List all changed files
+        env:
+          ALL_CHANGED_FILES: ${{ steps.changed-files.outputs.all_changed_files }}
+        run: |
+          IFS=',' read -ra changed_files <<< "${ALL_CHANGED_FILES}"
+          for file in "${changed_files[@]}"; do
+              echo "$file was changed"
+          done
+
+      - name: Run backend tests (${{ steps.setup.outputs.matrix-instance-number }} of ${{ steps.setup.outputs.matrix-instance-total }})
+        id: run_backend_tests
+        run: make test-python-ci
+        env:
+          SELECTIVE_TESTING_ENABLED: true
+          CHANGED_FILES: ${{ steps.changed-files.outputs.all_changed_files }}
+          COVERAGE_DB_PATH: .coverage
+
+      - name: Inspect failure
+        if: failure()
+        run: |
+          if command -v devservices; then
+            devservices logs
+          fi
+
+    #   - name: Collect test data
+    #     uses: ./.github/actions/collect-test-data
+    #     if: ${{ !cancelled() }}
+    #     with:
+    #       artifact_path: .artifacts/pytest.json # TODO
+    #       gcs_bucket: ${{ secrets.COLLECT_TEST_DATA_GCS_BUCKET }}
+    #       gcp_project_id: ${{ secrets.COLLECT_TEST_DATA_GCP_PROJECT_ID }}
+    #       workload_identity_provider: ${{ secrets.SENTRY_GCP_DEV_WORKLOAD_IDENTITY_POOL }}
+    #       service_account_email: ${{ secrets.COLLECT_TEST_DATA_SERVICE_ACCOUNT_EMAIL }}
+    #       matrix_instance_number: ${{ steps.setup.outputs.matrix-instance-number }}
diff --git a/src/sentry/preprod/size_analysis/compare.py b/src/sentry/preprod/size_analysis/compare.py
@@ -155,6 +155,8 @@ def compare_size_analysis(
         base_download_size=base_size_analysis.max_download_size,
     )
 
+    # Placeholder
+
     # Compare insights only if we're not skipping the comparison
     insight_diff_items = []
     if not skip_diff_item_comparison:
diff --git a/src/sentry/testutils/pytest/selective_testing.py b/src/sentry/testutils/pytest/selective_testing.py
@@ -0,0 +1,103 @@
+from __future__ import annotations
+
+import os
+import sqlite3
+import sys
+
+
+def _file_executed(bitblob: bytes) -> bool:
+    """
+    Returns True if any line in the file was executed (bitblob has any bits set).
+    """
+    return any(b != 0 for b in bitblob)
+
+
+def get_affected_tests_from_coverage(db_path: str, source_files: list[str]) -> set[str] | None:
+    """
+    Query the coverage database to find which tests executed code in the given source files.
+
+    Args:
+        db_path: Path to the .coverage SQLite database
+        source_files: List of source file paths that have changed
+
+    Returns:
+        Set of test file paths (e.g., 'tests/sentry/api/test_foo.py'),
+        or None if the database doesn't exist or there's an error.
+    """
+    if not os.path.exists(db_path):
+        return None
+
+    try:
+        conn = sqlite3.connect(db_path)
+        cur = conn.cursor()
+
+        test_contexts = set()
+
+        for file_path in source_files:
+            # Query for test contexts that executed this file
+            cur.execute(
+                """
+                SELECT c.context, lb.numbits
+                FROM line_bits lb
+                JOIN file f    ON lb.file_id = f.id
+                JOIN context c ON lb.context_id = c.id
+                WHERE f.path LIKE '%' || ?
+                  AND c.context != ''
+            """,
+                (f"/{file_path}",),
+            )
+
+            for context, bitblob in cur.fetchall():
+                if _file_executed(bitblob):
+                    test_contexts.add(context)
+
+        conn.close()
+
+        # Extract test file paths from contexts
+        # Context format: 'tests/foo/bar.py::TestClass::test_function'
+        test_files = set()
+        for context in test_contexts:
+            test_file = context.split("::", 1)[0]
+            test_files.add(test_file)
+
+        return test_files
+
+    except (sqlite3.Error, Exception) as e:
+        # Log the error but don't fail the test run
+        print(f"Warning: Could not query coverage database: {e}", file=sys.stderr)
+        return None
+
+
+def filter_items_by_coverage(items, changed_files: list[str], coverage_db_path: str):
+    """
+    Filter pytest items to only include tests affected by the changed files.
+
+    Args:
+        items: List of pytest.Item objects to filter
+        changed_files: List of source files that have changed
+        coverage_db_path: Path to the coverage database
+
+    Returns:
+        Tuple of (selected_items, discarded_items, affected_test_files)
+        where affected_test_files is the set of test files found in coverage data,
+        or None if coverage data could not be loaded.
+    """
+    affected_test_files = get_affected_tests_from_coverage(coverage_db_path, changed_files)
+
+    if affected_test_files is None:
+        # Could not load coverage data, return all items as selected
+        return list(items), [], None
+
+    # Filter items to only include tests from affected files
+    selected_items = []
+    discarded_items = []
+
+    for item in items:
+        # Extract test file path from nodeid (e.g., 'tests/foo.py::TestClass::test_func')
+        test_file = item.nodeid.split("::", 1)[0]
+        if test_file in affected_test_files:
+            selected_items.append(item)
+        else:
+            discarded_items.append(item)
+
+    return selected_items, discarded_items, affected_test_files
diff --git a/src/sentry/testutils/pytest/sentry.py b/src/sentry/testutils/pytest/sentry.py
@@ -18,6 +18,7 @@
 
 from sentry.runner.importer import install_plugin_apps
 from sentry.silo.base import SiloMode
+from sentry.testutils.pytest.selective_testing import filter_items_by_coverage
 from sentry.testutils.region import TestEnvRegionDirectory
 from sentry.testutils.silo import monkey_patch_single_process_silo_mode_state
 from sentry.types import region
@@ -388,6 +389,43 @@ def _shuffle_d(dct: dict[K, V]) -> dict[K, V]:
 def pytest_collection_modifyitems(config: pytest.Config, items: list[pytest.Item]) -> None:
     """After collection, we need to select tests based on group and group strategy"""
 
+    initial_discard = []
+
+    # Selective testing based on coverage data
+    if os.environ.get("SELECTIVE_TESTING_ENABLED"):
+        changed_files_str = os.environ.get("CHANGED_FILES", "")
+        coverage_db_path = os.environ.get("COVERAGE_DB_PATH", ".coverage.combined")
+
+        if changed_files_str:
+            # Parse changed files from comma-separated string
+            changed_files = [f.strip() for f in changed_files_str.split(",") if f.strip()]
+
+            config.get_terminal_writer().line(
+                f"Selective testing enabled for {len(changed_files)} changed file(s)"
+            )
+
+            # Filter tests using coverage data
+            selected_items, discarded_items, affected_test_files = filter_items_by_coverage(
+                items, changed_files, coverage_db_path
+            )
+
+            if affected_test_files is not None:
+                config.get_terminal_writer().line(
+                    f"Found {len(affected_test_files)} affected test file(s) from coverage data"
+                )
+                config.get_terminal_writer().line(
+                    f"Selected {len(selected_items)}/{len(items)} tests based on coverage"
+                )
+
+                # Update items with filtered list
+                items[:] = selected_items
+                initial_discard = discarded_items
+            else:
+                config.get_terminal_writer().line(
+                    "Warning: Could not load coverage data, running all tests"
+                )
+
+    # Existing grouping logic (unchanged)
     total_groups = int(os.environ.get("TOTAL_TEST_GROUPS", 1))
     current_group = int(os.environ.get("TEST_GROUP", 0))
     grouping_strategy = os.environ.get("TEST_GROUP_STRATEGY", "scope")
@@ -420,9 +458,12 @@ def pytest_collection_modifyitems(config: pytest.Config, items: list[pytest.Item
         config.get_terminal_writer().line(f"SENTRY_SHUFFLE_TESTS_SEED: {seed}")
         _shuffle(items, random.Random(seed))
 
+    # Combine discards from both selective testing and grouping
+    all_discarded = initial_discard + discard
+
     # This only needs to be done if there are items to be de-selected
-    if len(discard) > 0:
-        config.hook.pytest_deselected(items=discard)
+    if len(all_discarded) > 0:
+        config.hook.pytest_deselected(items=all_discarded)
 
 
 def pytest_xdist_setupnodes() -> None:

Original file line number	Diff line number	Diff line change
`@@ -155,6 +155,8 @@ def compare_size_analysis(`
`155`	`155`	`base_download_size=base_size_analysis.max_download_size,`
`156`	`156`	`)`
`157`	`157`
	`158`	`+ # Placeholder`
	`159`	`+`
`158`	`160`	`# Compare insights only if we're not skipping the comparison`
`159`	`161`	`insight_diff_items = []`
`160`	`162`	`if not skip_diff_item_comparison:`