From 5be09de504ab0f6ef9b9d81defd1a13c9e7124b4 Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Fri, 26 Sep 2025 12:06:59 -0400
Subject: [PATCH 01/15] Add universal package detection for bisection across
 package managers
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Add python-command input to specify how to invoke Python in test environment
- Support pip, conda, uv, poetry, pixi, and other package managers
- Use importlib.metadata for universal package detection (works with all managers)
- Capture package versions from actual test environment, not action environment
- Store both package versions and Git commit info for comprehensive bisection
- Generate per-test analysis showing exactly when each test last passed
- Improve branch handling with better error recovery and git configuration
- Add comprehensive tests for new functionality
- Update documentation with examples for all major package managers

Backward compatible: existing workflows continue to work without changes.

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 README.md              | 263 ++++++++++++++++++++
 action.yaml            | 123 +++++++++
 parse_logs.py          |  13 +
 test_track_packages.py | 363 +++++++++++++++++++++++++++
 track_packages.py      | 549 +++++++++++++++++++++++++++++++++++++++++
 5 files changed, 1311 insertions(+)
 create mode 100644 test_track_packages.py
 create mode 100644 track_packages.py

diff --git a/README.md b/README.md
index 435932d..d28b441 100644
--- a/README.md
+++ b/README.md
@@ -110,3 +110,266 @@ Any assignees to set on the new issue:
 ```
 
 Note that assignees must have the commit bit on the repository.
+
+## Bisection Feature
+
+The action can track package versions between successful and failed CI runs to help identify which dependency changes might have caused test failures.
+
+### track-packages
+
+optional
+
+Comma-separated list of packages to track for bisection analysis. Use `"all"` to track all installed packages:
+
+```yaml
+- uses: scientific-python/issue-from-pytest-log-action@f94477e45ef40e4403d7585ba639a9a3bcc53d43 # v1.3.0
+  with:
+    log-path: pytest-log.jsonl
+    track-packages: "xarray,pandas,numpy"
+```
+
+Or track all packages:
+
+```yaml
+- uses: scientific-python/issue-from-pytest-log-action@f94477e45ef40e4403d7585ba639a9a3bcc53d43 # v1.3.0
+  with:
+    log-path: pytest-log.jsonl
+    track-packages: "all"
+```
+
+### python-command
+
+optional. Default: `"python"`
+
+Command to invoke Python in the test environment. This ensures package versions are captured from the same environment that ran the tests:
+
+```yaml
+- uses: scientific-python/issue-from-pytest-log-action@f94477e45ef40e4403d7585ba639a9a3bcc53d43 # v1.3.0
+  with:
+    log-path: pytest-log.jsonl
+    track-packages: "xarray,pandas,numpy"
+    python-command: "python3"
+```
+
+### bisect-storage-method
+
+optional. Default: `"branch"`
+
+Storage method for bisection data. Currently only `"branch"` is supported.
+
+### bisect-branch
+
+optional. Default: `"bisect-data"`
+
+Branch name for storing bisection data when using branch storage method.
+
+### Setting up Bisection
+
+To use the bisection feature, run the action with `track-packages` specified. The action will automatically store both package versions and test results for every run, and generate bisection analysis when tests fail.
+
+#### Standard Python/pip Setup
+
+```yaml
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    permissions:
+      issues: write
+      contents: write  # Needed for bisection branch
+
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          token: ${{ secrets.GITHUB_TOKEN }}
+          fetch-depth: 0  # Needed for bisection branch operations
+
+      - uses: actions/setup-python@v4
+        with:
+          python-version: "3.12"
+
+      - run: |
+          pip install --upgrade pytest-reportlog
+
+      - run: |
+          pytest --report-log pytest-log.jsonl
+
+      # Track package versions and create issue if tests fail
+      - name: Track packages and create issue if needed
+        if: always()  # Run regardless of test outcome to store data
+        uses: scientific-python/issue-from-pytest-log-action@f94477e45ef40e4403d7585ba639a9a3bcc53d43 # v1.3.0
+        with:
+          log-path: pytest-log.jsonl
+          track-packages: "xarray,pandas,numpy"
+          python-command: "python"  # Default, can be omitted
+```
+
+#### Conda/Mamba Setup
+
+```yaml
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    permissions:
+      issues: write
+      contents: write
+
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+
+      - uses: conda-incubator/setup-miniconda@v2
+        with:
+          auto-update-conda: true
+          python-version: "3.12"
+
+      - name: Install dependencies
+        shell: bash -l {0}
+        run: |
+          conda install pytest pytest-reportlog numpy pandas
+
+      - name: Run tests
+        shell: bash -l {0}
+        run: |
+          pytest --report-log pytest-log.jsonl
+
+      - name: Track packages and create issue if needed
+        if: always()
+        uses: scientific-python/issue-from-pytest-log-action@f94477e45ef40e4403d7585ba639a9a3bcc53d43 # v1.3.0
+        with:
+          log-path: pytest-log.jsonl
+          track-packages: "numpy,pandas,pytest"
+          python-command: "python"  # Conda python is already in PATH
+```
+
+#### UV Setup
+
+```yaml
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    permissions:
+      issues: write
+      contents: write
+
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+
+      - uses: astral-sh/setup-uv@v1
+
+      - name: Run tests
+        run: |
+          uv run pytest --report-log pytest-log.jsonl
+
+      - name: Track packages and create issue if needed
+        if: always()
+        uses: scientific-python/issue-from-pytest-log-action@f94477e45ef40e4403d7585ba639a9a3bcc53d43 # v1.3.0
+        with:
+          log-path: pytest-log.jsonl
+          track-packages: "all"  # Track all packages
+          python-command: "uv run python"
+```
+
+#### Poetry Setup
+
+```yaml
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    permissions:
+      issues: write
+      contents: write
+
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+
+      - uses: actions/setup-python@v4
+        with:
+          python-version: "3.12"
+
+      - name: Install Poetry
+        uses: snok/install-poetry@v1
+
+      - name: Run tests
+        run: |
+          poetry run pytest --report-log pytest-log.jsonl
+
+      - name: Track packages and create issue if needed
+        if: always()
+        uses: scientific-python/issue-from-pytest-log-action@f94477e45ef40e4403d7585ba639a9a3bcc53d43 # v1.3.0
+        with:
+          log-path: pytest-log.jsonl
+          track-packages: "numpy,pandas,pytest"
+          python-command: "poetry run python"
+```
+
+#### Pixi Setup
+
+```yaml
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    permissions:
+      issues: write
+      contents: write
+
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+
+      - uses: prefix-dev/setup-pixi@v0.3.0
+
+      - name: Run tests
+        run: |
+          pixi run pytest --report-log pytest-log.jsonl
+
+      - name: Track packages and create issue if needed
+        if: always()
+        uses: scientific-python/issue-from-pytest-log-action@f94477e45ef40e4403d7585ba639a9a3bcc53d43 # v1.3.0
+        with:
+          log-path: pytest-log.jsonl
+          track-packages: "numpy,pandas,pytest"
+          python-command: "pixi run python"
+```
+
+When enabled, the bisection feature will add comprehensive analysis to GitHub issues:
+
+```
+## tests/test_plotting.py::test_plot_basic
+
+### Package changes since last pass
+- matplotlib: 3.8.0 → 3.9.0
+- numpy: 1.24.0 → 1.25.0
+
+### Code changes since last pass
+- a1b2c3d4 (Fix plotting bug in core module for edge cases...)
+- → e5f6g7h8 (Update dependencies and refactor plotting tests...)
+- Last passed in run #120 on 2024-01-15T10:30:00Z
+
+## tests/test_io.py::test_read_netcdf[dataset1]
+
+### Package changes since last pass
+- xarray: 2024.01.0 → 2024.02.0
+- netcdf4: 1.6.0 → 1.6.1
+
+### Code changes since last pass
+- f9a8b7c6 (Add netcdf4 compatibility layer for new datasets...)
+- → e5f6g7h8 (Update dependencies and refactor plotting tests...)
+- Last passed in run #118 on 2024-01-14T14:22:00Z
+
+## tests/test_core.py::test_merge_datasets
+
+### Analysis
+- No recent successful run found for this test
+```
+
+This enhanced bisection feature helps identify:
+1. **For each failing test**, exactly which dependencies and code changed since it last passed
+2. **Precise correlation** between specific changes and test failures
+3. **Historical context** with exact commits and timestamps
+4. **Actionable debugging information** organized by failing test
diff --git a/action.yaml b/action.yaml
index 84a70db..13efdfa 100644
--- a/action.yaml
+++ b/action.yaml
@@ -23,6 +23,30 @@ inputs:
       have commit rights.
     required: false
     default: ""
+  track-packages:
+    description: >-
+      Comma-separated list of packages to track for bisection (e.g., "xarray,pandas,numpy").
+      Use "all" to track all installed packages. If provided, the action will compare
+      package versions between the last successful run and the current failed run.
+    required: false
+    default: ""
+  bisect-storage-method:
+    description: >-
+      Storage method for bisection data. Either "branch" or "artifact".
+    required: false
+    default: "branch"
+  bisect-branch:
+    description: >-
+      Branch name for storing bisection data when using branch storage method.
+    required: false
+    default: "bisect-data"
+  python-command:
+    description: >-
+      Command to invoke Python in the test environment (e.g., "python", "python3",
+      "conda run python", "uv run python", "poetry run python"). This ensures
+      package versions are captured from the same environment that ran the tests.
+    required: false
+    default: "python"
 outputs: {}
 branding:
   color: "red"
@@ -41,6 +65,105 @@ runs:
       shell: bash -l {0}
       run: |
         python -m pip install pytest more-itertools
+    - name: capture package versions from test environment
+      shell: bash -l {0}
+      run: |
+        if [ -n "${{ inputs.track-packages }}" ]; then
+          echo "Capturing package versions using: ${{ inputs.python-command }}"
+
+          # Capture package versions from the test environment
+          ${{ inputs.python-command }} -c "
+import json
+import sys
+
+packages_input = '${{ inputs.track-packages }}'.strip()
+if not packages_input:
+    exit()
+
+packages = [pkg.strip() for pkg in packages_input.split(',')]
+versions = {}
+
+# Try importlib.metadata first (Python 3.8+)
+try:
+    import importlib.metadata as metadata
+    if len(packages) == 1 and packages[0].lower() == 'all':
+        print('Capturing all installed packages...')
+        for dist in metadata.distributions():
+            versions[dist.name] = dist.version
+    else:
+        print(f'Capturing specific packages: {packages}')
+        for pkg in packages:
+            if pkg:
+                try:
+                    versions[pkg] = metadata.version(pkg)
+                    print(f'  {pkg}: {versions[pkg]}')
+                except Exception as e:
+                    versions[pkg] = None
+                    print(f'  {pkg}: not found ({e})')
+except ImportError:
+    print('importlib.metadata not available, trying pkg_resources...')
+    # Fallback to pkg_resources
+    try:
+        import pkg_resources
+        if len(packages) == 1 and packages[0].lower() == 'all':
+            print('Capturing all installed packages...')
+            for dist in pkg_resources.working_set:
+                versions[dist.project_name] = dist.version
+        else:
+            print(f'Capturing specific packages: {packages}')
+            for pkg in packages:
+                if pkg:
+                    try:
+                        versions[pkg] = pkg_resources.get_distribution(pkg).version
+                        print(f'  {pkg}: {versions[pkg]}')
+                    except Exception as e:
+                        versions[pkg] = None
+                        print(f'  {pkg}: not found ({e})')
+    except ImportError:
+        print('ERROR: No package detection method available')
+        versions = {'error': 'No package detection method available'}
+
+# Save captured versions
+capture_data = {
+    'python_version': '.'.join(map(str, sys.version_info[:3])),
+    'python_executable': sys.executable,
+    'packages': versions,
+    'capture_method': 'importlib.metadata' if 'importlib.metadata' in sys.modules else 'pkg_resources'
+}
+
+with open('captured-package-versions.json', 'w') as f:
+    json.dump(capture_data, f, indent=2)
+
+print(f'Captured {len(versions)} package versions')
+"
+        else
+          echo "No packages specified for tracking, skipping package capture"
+        fi
+    - name: handle package tracking
+      shell: bash -l {0}
+      run: |
+        if [ -n "${{ inputs.track-packages }}" ]; then
+          echo "Processing package tracking for: ${{ inputs.track-packages }}"
+
+          # Always store current run data (packages + test results)
+          python $GITHUB_ACTION_PATH/track_packages.py \
+            --packages "${{ inputs.track-packages }}" \
+            --log-path "${{ inputs.log-path }}" \
+            --captured-versions captured-package-versions.json \
+            --store-run \
+            --branch "${{ inputs.bisect-branch }}"
+
+          # Generate comparison for bisection analysis
+          python $GITHUB_ACTION_PATH/track_packages.py \
+            --packages "${{ inputs.track-packages }}" \
+            --log-path "${{ inputs.log-path }}" \
+            --captured-versions captured-package-versions.json \
+            --generate-comparison \
+            --branch "${{ inputs.bisect-branch }}" \
+            --output-file bisect-comparison.txt
+        else
+          echo "No packages specified for tracking, skipping package tracking"
+        fi
     - name: produce the issue body
       shell: bash -l {0}
       run: |
diff --git a/parse_logs.py b/parse_logs.py
index 756aa19..c73a18e 100644
--- a/parse_logs.py
+++ b/parse_logs.py
@@ -242,6 +242,16 @@ def format_collection_error(error, **formatter_kwargs):
     ).format(py_version=py_version, name=error.name, traceback=error.repr_)
 
 
+def include_bisection_info(message: str, bisect_file: str = "bisect-comparison.txt") -> str:
+    """Include bisection information in the issue message if available."""
+    bisect_path = pathlib.Path(bisect_file)
+    if bisect_path.exists():
+        bisect_content = bisect_path.read_text().strip()
+        if bisect_content:
+            return f"{bisect_content}\n{message}"
+    return message
+
+
 if __name__ == "__main__":
     parser = argparse.ArgumentParser()
     parser.add_argument("filepath", type=pathlib.Path)
@@ -268,6 +278,9 @@ def format_collection_error(error, **formatter_kwargs):
             preformatted, max_chars=65535, py_version=py_version
         )
 
+    # Include bisection information if available
+    message = include_bisection_info(message)
+
     output_file = pathlib.Path("pytest-logs.txt")
     print(f"Writing output file to: {output_file.absolute()}")
     output_file.write_text(message)
diff --git a/test_track_packages.py b/test_track_packages.py
new file mode 100644
index 0000000..ba921c2
--- /dev/null
+++ b/test_track_packages.py
@@ -0,0 +1,363 @@
+import json
+import os
+import sys
+import tempfile
+from unittest.mock import Mock, patch
+from datetime import datetime
+
+import hypothesis.strategies as st
+from hypothesis import given
+
+import track_packages
+
+
+def test_get_package_version_existing():
+    """Test getting version of an existing package."""
+    with patch("subprocess.run") as mock_run:
+        mock_run.return_value.stdout = "Name: pytest\nVersion: 7.4.0\nSummary: ..."
+        mock_run.return_value.check = True
+
+        version = track_packages.get_package_version("pytest")
+        assert version == "7.4.0"
+
+
+def test_get_package_version_nonexistent():
+    """Test getting version of a non-existent package."""
+    with patch("subprocess.run") as mock_run:
+        mock_run.side_effect = track_packages.subprocess.CalledProcessError(1, "pip")
+
+        version = track_packages.get_package_version("nonexistent-package")
+        assert version is None
+
+
+def test_get_all_installed_packages():
+    """Test getting all installed packages."""
+    mock_packages = [
+        {"name": "pytest", "version": "7.4.0"},
+        {"name": "hypothesis", "version": "6.82.0"},
+        {"name": "more-itertools", "version": "10.1.0"},
+    ]
+
+    with patch("subprocess.run") as mock_run:
+        mock_run.return_value.stdout = json.dumps(mock_packages)
+        mock_run.return_value.check = True
+
+        packages = track_packages.get_all_installed_packages()
+        expected = {
+            "pytest": "7.4.0",
+            "hypothesis": "6.82.0",
+            "more-itertools": "10.1.0",
+        }
+        assert packages == expected
+
+
+def test_get_current_package_versions_specific():
+    """Test getting versions of specific packages."""
+    with patch("track_packages.get_package_version") as mock_get_version:
+        mock_get_version.side_effect = lambda pkg: {
+            "pytest": "7.4.0",
+            "hypothesis": "6.82.0",
+            "nonexistent": None,
+        }.get(pkg)
+
+        versions = track_packages.get_current_package_versions(["pytest", "hypothesis", "nonexistent"])
+        expected = {
+            "pytest": "7.4.0",
+            "hypothesis": "6.82.0",
+            "nonexistent": None,
+        }
+        assert versions == expected
+
+
+def test_get_current_package_versions_from_captured_file():
+    """Test getting versions from a captured JSON file."""
+    with tempfile.NamedTemporaryFile(mode='w', suffix='.json', delete=False) as f:
+        captured_data = {
+            "python_version": "3.11.0",
+            "packages": {
+                "pytest": "7.4.0",
+                "numpy": "1.24.0",
+                "requests": "2.31.0"
+            },
+            "capture_method": "importlib.metadata"
+        }
+        json.dump(captured_data, f)
+        captured_file = f.name
+
+    try:
+        # Test specific packages
+        versions = track_packages.get_current_package_versions(
+            ["pytest", "numpy", "missing"], captured_file
+        )
+        expected = {
+            "pytest": "7.4.0",
+            "numpy": "1.24.0",
+            "missing": None
+        }
+        assert versions == expected
+
+        # Test "all" packages
+        all_versions = track_packages.get_current_package_versions(["all"], captured_file)
+        expected_all = {
+            "pytest": "7.4.0",
+            "numpy": "1.24.0",
+            "requests": "2.31.0"
+        }
+        assert all_versions == expected_all
+    finally:
+        os.unlink(captured_file)
+
+
+def test_get_current_package_versions_fallback_on_bad_file():
+    """Test fallback when captured file is invalid."""
+    with tempfile.NamedTemporaryFile(mode='w', suffix='.json', delete=False) as f:
+        f.write("invalid json content")
+        bad_file = f.name
+
+    try:
+        with patch("track_packages.get_package_version") as mock_get_version:
+            mock_get_version.return_value = "fallback-version"
+
+            versions = track_packages.get_current_package_versions(["pytest"], bad_file)
+            expected = {"pytest": "fallback-version"}
+            assert versions == expected
+    finally:
+        os.unlink(bad_file)
+
+
+def test_get_current_package_versions_all():
+    """Test getting versions when 'all' is specified."""
+    with patch("track_packages.get_all_installed_packages") as mock_get_all:
+        mock_get_all.return_value = {"pytest": "7.4.0", "hypothesis": "6.82.0"}
+
+        versions = track_packages.get_current_package_versions(["all"])
+        assert versions == {"pytest": "7.4.0", "hypothesis": "6.82.0"}
+
+
+def test_get_git_info():
+    """Test getting Git information."""
+    with patch("subprocess.run") as mock_run:
+        # Mock the sequence of git commands
+        mock_run.side_effect = [
+            Mock(stdout="abc123def456789\n", check=True),  # git rev-parse HEAD
+            Mock(stdout="Fix test regression\n", check=True),  # git log -1 --pretty=format:%s
+            Mock(stdout="John Doe <john@example.com>\n", check=True),  # git log -1 --pretty=format:%an <%ae>
+            Mock(stdout="2024-01-15 10:30:00 +0000\n", check=True),  # git log -1 --pretty=format:%ci
+        ]
+
+        git_info = track_packages.get_git_info()
+
+        expected = {
+            "commit_hash": "abc123def456789",
+            "commit_hash_short": "abc123de",
+            "commit_message": "Fix test regression",
+            "commit_author": "John Doe <john@example.com>",
+            "commit_date": "2024-01-15 10:30:00 +0000",
+        }
+        assert git_info == expected
+
+
+def test_extract_failed_tests_from_log():
+    """Test extracting failed tests from pytest log file."""
+    with tempfile.NamedTemporaryFile(mode='w', suffix='.jsonl', delete=False) as f:
+        # Write sample pytest log entries
+        f.write('{"$report_type": "TestReport", "nodeid": "test_file.py::test_pass", "outcome": "passed"}\n')
+        f.write('{"$report_type": "TestReport", "nodeid": "test_file.py::test_fail1", "outcome": "failed"}\n')
+        f.write('{"$report_type": "CollectReport", "nodeid": "test_file.py::test_fail2", "outcome": "failed"}\n')
+        f.write('{"$report_type": "TestReport", "nodeid": "test_file.py::test_skip", "outcome": "skipped"}\n')
+        f.write('{"$report_type": "WarningMessage", "outcome": "failed"}\n')  # Should be ignored
+        log_path = f.name
+
+    try:
+        failed_tests = track_packages.extract_failed_tests_from_log(log_path)
+        expected = ["test_file.py::test_fail1", "test_file.py::test_fail2"]
+        assert failed_tests == expected
+    finally:
+        os.unlink(log_path)
+
+
+def test_extract_failed_tests_from_log_missing_file():
+    """Test extracting failed tests when log file doesn't exist."""
+    failed_tests = track_packages.extract_failed_tests_from_log("nonexistent.jsonl")
+    assert failed_tests == []
+
+
+def test_get_git_info_failure():
+    """Test getting Git information when git commands fail."""
+    with patch("subprocess.run") as mock_run:
+        mock_run.side_effect = track_packages.subprocess.CalledProcessError(1, "git")
+
+        git_info = track_packages.get_git_info()
+
+        expected = {
+            "commit_hash": "unknown",
+            "commit_hash_short": "unknown",
+            "commit_message": "unknown",
+            "commit_author": "unknown",
+            "commit_date": "unknown",
+        }
+        assert git_info == expected
+
+
+def test_create_bisect_data():
+    """Test creating bisection data."""
+    packages = ["pytest", "hypothesis"]
+
+    with patch("track_packages.get_current_package_versions") as mock_get_versions, \
+         patch("track_packages.get_git_info") as mock_get_git, \
+         patch("track_packages.extract_failed_tests_from_log") as mock_extract_tests:
+
+        mock_get_versions.return_value = {"pytest": "7.4.0", "hypothesis": "6.82.0"}
+        mock_get_git.return_value = {
+            "commit_hash": "abc123",
+            "commit_hash_short": "abc123de",
+            "commit_message": "Test commit",
+            "commit_author": "Test Author",
+            "commit_date": "2024-01-01",
+        }
+        mock_extract_tests.return_value = []
+
+        with patch.dict("os.environ", {"GITHUB_RUN_ID": "12345"}):
+            data = track_packages.create_bisect_data(packages)
+
+            assert data["workflow_run_id"] == "12345"
+            assert data["python_version"] == ".".join(str(v) for v in sys.version_info[:3])
+            assert data["packages"] == {"pytest": "7.4.0", "hypothesis": "6.82.0"}
+            assert data["failed_tests"] == []
+            assert data["test_status"] == "passed"
+            assert data["git"]["commit_hash"] == "abc123"
+            assert "timestamp" in data
+            # Check timestamp format
+            datetime.fromisoformat(data["timestamp"].replace("Z", "+00:00"))
+
+
+def test_create_bisect_data_with_captured_versions():
+    """Test creating bisection data with captured versions file."""
+    packages = ["pytest", "numpy"]
+
+    # Create a captured versions file
+    with tempfile.NamedTemporaryFile(mode='w', suffix='.json', delete=False) as f:
+        captured_data = {
+            "python_version": "3.11.5",
+            "packages": {
+                "pytest": "7.4.2",
+                "numpy": "1.25.1"
+            }
+        }
+        json.dump(captured_data, f)
+        captured_file = f.name
+
+    try:
+        with patch("track_packages.get_git_info") as mock_get_git, \
+             patch("track_packages.extract_failed_tests_from_log") as mock_extract_tests:
+
+            mock_get_git.return_value = {
+                "commit_hash": "def456",
+                "commit_hash_short": "def456gh",
+                "commit_message": "Test commit with captured versions",
+                "commit_author": "Test Author",
+                "commit_date": "2024-01-01",
+            }
+            mock_extract_tests.return_value = ["test_fail.py::test_example"]
+
+            with patch.dict("os.environ", {"GITHUB_RUN_ID": "67890"}):
+                data = track_packages.create_bisect_data(packages, captured_versions_file=captured_file)
+
+                assert data["workflow_run_id"] == "67890"
+                assert data["python_version"] == "3.11.5"  # From captured file
+                assert data["packages"] == {"pytest": "7.4.2", "numpy": "1.25.1"}  # From captured file
+                assert data["failed_tests"] == ["test_fail.py::test_example"]
+                assert data["test_status"] == "failed"
+                assert data["git"]["commit_hash"] == "def456"
+                assert "timestamp" in data
+    finally:
+        os.unlink(captured_file)
+
+
+def test_format_bisect_comparison_no_previous():
+    """Test formatting comparison when no previous data exists."""
+    current_data = {
+        "workflow_run_id": "456",
+        "packages": {"pytest": "7.4.0", "hypothesis": "6.82.0"},
+    }
+
+    result = track_packages.format_bisect_comparison(current_data, None)
+    assert result is None
+
+
+def test_format_bisect_comparison_with_changes():
+    """Test formatting comparison with package changes."""
+    previous_data = {
+        "workflow_run_id": "123",
+        "packages": {"pytest": "7.3.0", "hypothesis": "6.82.0", "removed-pkg": "1.0.0"},
+    }
+    current_data = {
+        "workflow_run_id": "456",
+        "packages": {"pytest": "7.4.0", "hypothesis": "6.82.0", "new-pkg": "2.0.0"},
+    }
+
+    result = track_packages.format_bisect_comparison(current_data, previous_data)
+
+    assert "Package Version Changes" in result
+    assert "Last Successful Run #123 → Current Failed Run #456" in result
+    assert "pytest: 7.3.0 → 7.4.0" in result
+    assert "hypothesis: 6.82.0 (unchanged)" in result
+    assert "removed-pkg: 1.0.0 → (not installed)" in result
+    assert "new-pkg: (not installed) → 2.0.0" in result
+
+
+def test_format_bisect_comparison_no_changes():
+    """Test formatting comparison when no packages changed."""
+    data = {
+        "workflow_run_id": "456",
+        "packages": {"pytest": "7.4.0", "hypothesis": "6.82.0"},
+    }
+
+    result = track_packages.format_bisect_comparison(data, data)
+
+    assert "Package Version Changes" in result
+    assert "pytest: 7.4.0 (unchanged)" in result
+    assert "hypothesis: 6.82.0 (unchanged)" in result
+
+
+@given(st.lists(st.text(min_size=1), min_size=1, max_size=5))
+def test_get_current_package_versions_property(package_names):
+    """Property test for get_current_package_versions."""
+    with patch("track_packages.get_package_version") as mock_get_version:
+        mock_get_version.return_value = "1.0.0"
+
+        versions = track_packages.get_current_package_versions(package_names)
+
+        assert len(versions) == len(package_names)
+        for pkg in package_names:
+            assert pkg in versions
+
+
+def test_retrieve_bisect_data_from_branch_no_branch():
+    """Test retrieving data when branch doesn't exist."""
+    with patch("subprocess.run") as mock_run:
+        # Simulate no branch found
+        mock_run.return_value.stdout = ""
+        mock_run.return_value.check = True
+
+        result = track_packages.retrieve_bisect_data_from_branch("nonexistent-branch")
+        assert result is None
+
+
+def test_retrieve_bisect_data_from_branch_success():
+    """Test successfully retrieving data from branch."""
+    mock_data = {
+        "workflow_run_id": "123",
+        "packages": {"pytest": "7.3.0"},
+    }
+
+    with patch("subprocess.run") as mock_run:
+        # Mock the sequence of git commands
+        mock_run.side_effect = [
+            Mock(stdout="abc123\trefs/heads/bisect-data\n", check=True),  # ls-remote
+            Mock(check=True),  # fetch
+            Mock(stdout=json.dumps(mock_data), check=True),  # show
+        ]
+
+        result = track_packages.retrieve_bisect_data_from_branch("bisect-data")
+        assert result == mock_data
\ No newline at end of file
diff --git a/track_packages.py b/track_packages.py
new file mode 100644
index 0000000..02a41fd
--- /dev/null
+++ b/track_packages.py
@@ -0,0 +1,549 @@
+"""
+Package version tracking for bisection analysis.
+
+This module handles tracking package versions between CI runs to help identify
+which dependency changes might have caused test failures.
+"""
+
+import argparse
+import json
+import os
+import pathlib
+import subprocess
+import sys
+import tempfile
+from datetime import datetime
+from typing import Dict, List, Optional, Tuple
+
+
+def get_all_installed_packages() -> Dict[str, str]:
+    """Get all installed packages and their versions."""
+    try:
+        result = subprocess.run(
+            [sys.executable, "-m", "pip", "list", "--format=json"],
+            capture_output=True,
+            text=True,
+            check=True,
+        )
+        packages_data = json.loads(result.stdout)
+        return {pkg["name"]: pkg["version"] for pkg in packages_data}
+    except (subprocess.CalledProcessError, json.JSONDecodeError):
+        return {}
+
+
+def get_package_version(package_name: str) -> Optional[str]:
+    """Get the version of an installed package."""
+    try:
+        result = subprocess.run(
+            [sys.executable, "-m", "pip", "show", package_name],
+            capture_output=True,
+            text=True,
+            check=True,
+        )
+        for line in result.stdout.split("\n"):
+            if line.startswith("Version:"):
+                return line.split(":", 1)[1].strip()
+    except (subprocess.CalledProcessError, IndexError):
+        pass
+    return None
+
+
+def get_current_package_versions(packages: List[str], captured_versions_file: str = None) -> Dict[str, Optional[str]]:
+    """Get current versions of specified packages."""
+    # First try to read from captured versions file if provided
+    if captured_versions_file and os.path.exists(captured_versions_file):
+        try:
+            with open(captured_versions_file, 'r') as f:
+                captured_data = json.load(f)
+                captured_packages = captured_data.get('packages', {})
+
+                if len(packages) == 1 and packages[0].lower() == "all":
+                    return captured_packages
+
+                # Return only the requested packages from captured data
+                versions = {}
+                for package in packages:
+                    versions[package] = captured_packages.get(package)
+                return versions
+        except (json.JSONDecodeError, IOError) as e:
+            print(f"Warning: Could not read captured versions file {captured_versions_file}: {e}")
+            print("Falling back to direct package detection...")
+
+    # Fallback to direct detection (original behavior)
+    if len(packages) == 1 and packages[0].lower() == "all":
+        return get_all_installed_packages()
+
+    versions = {}
+    for package in packages:
+        versions[package] = get_package_version(package)
+    return versions
+
+
+def extract_failed_tests_from_log(log_path: str) -> List[str]:
+    """Extract failed test nodeids from pytest log file."""
+    failed_tests = []
+    try:
+        with open(log_path, 'r') as f:
+            for line in f:
+                try:
+                    record = json.loads(line)
+                    if (record.get("$report_type") in ["TestReport", "CollectReport"] and
+                        record.get("outcome") == "failed" and
+                        record.get("nodeid")):
+                        failed_tests.append(record["nodeid"])
+                except json.JSONDecodeError:
+                    continue
+    except FileNotFoundError:
+        pass
+    return failed_tests
+
+
+def get_git_info() -> Dict[str, str]:
+    """Get current Git commit information."""
+    try:
+        # Get current commit hash
+        commit_result = subprocess.run(
+            ["git", "rev-parse", "HEAD"],
+            capture_output=True,
+            text=True,
+            check=True,
+        )
+        commit_hash = commit_result.stdout.strip()
+
+        # Get commit message
+        message_result = subprocess.run(
+            ["git", "log", "-1", "--pretty=format:%s"],
+            capture_output=True,
+            text=True,
+            check=True,
+        )
+        commit_message = message_result.stdout.strip()
+
+        # Get commit author and date
+        author_result = subprocess.run(
+            ["git", "log", "-1", "--pretty=format:%an <%ae>"],
+            capture_output=True,
+            text=True,
+            check=True,
+        )
+        commit_author = author_result.stdout.strip()
+
+        date_result = subprocess.run(
+            ["git", "log", "-1", "--pretty=format:%ci"],
+            capture_output=True,
+            text=True,
+            check=True,
+        )
+        commit_date = date_result.stdout.strip()
+
+        return {
+            "commit_hash": commit_hash,
+            "commit_hash_short": commit_hash[:8],
+            "commit_message": commit_message,
+            "commit_author": commit_author,
+            "commit_date": commit_date,
+        }
+    except subprocess.CalledProcessError:
+        return {
+            "commit_hash": "unknown",
+            "commit_hash_short": "unknown",
+            "commit_message": "unknown",
+            "commit_author": "unknown",
+            "commit_date": "unknown",
+        }
+
+
+def create_bisect_data(packages: List[str], log_path: str = None, captured_versions_file: str = None, workflow_run_id: str = None) -> Dict:
+    """Create bisection data for current environment."""
+    if workflow_run_id is None:
+        workflow_run_id = os.environ.get("GITHUB_RUN_ID", "unknown")
+
+    failed_tests = []
+    if log_path and os.path.exists(log_path):
+        failed_tests = extract_failed_tests_from_log(log_path)
+
+    # Get package versions - prefer captured versions, fall back to direct detection
+    package_versions = get_current_package_versions(packages, captured_versions_file)
+
+    # Get Python version - prefer from captured data if available
+    python_version = ".".join(str(v) for v in sys.version_info[:3])
+    if captured_versions_file and os.path.exists(captured_versions_file):
+        try:
+            with open(captured_versions_file, 'r') as f:
+                captured_data = json.load(f)
+                if 'python_version' in captured_data:
+                    python_version = captured_data['python_version']
+        except (json.JSONDecodeError, IOError):
+            pass  # Use default python_version
+
+    return {
+        "workflow_run_id": workflow_run_id,
+        "timestamp": datetime.utcnow().isoformat() + "Z",
+        "python_version": python_version,
+        "packages": package_versions,
+        "failed_tests": failed_tests,
+        "test_status": "failed" if failed_tests else "passed",
+        "git": get_git_info(),
+    }
+
+
+def store_bisect_data_to_branch(
+    data: Dict, branch_name: str
+) -> bool:
+    """Store bisection data to a Git branch."""
+    try:
+        # Create filename based on run ID and timestamp
+        filename = f"run_{data['workflow_run_id']}_{data['timestamp'].replace(':', '-').replace('Z', '')}.json"
+
+        # Configure git user if not already set (needed for GitHub Actions)
+        try:
+            subprocess.run(["git", "config", "user.name"], check=True, capture_output=True)
+        except subprocess.CalledProcessError:
+            subprocess.run(["git", "config", "user.name", "github-actions[bot]"], check=True)
+            subprocess.run(["git", "config", "user.email", "github-actions[bot]@users.noreply.github.com"], check=True)
+
+        # Check if branch exists remotely
+        branch_exists_result = subprocess.run(
+            ["git", "ls-remote", "--heads", "origin", branch_name],
+            capture_output=True,
+            text=True,
+        )
+        branch_exists = bool(branch_exists_result.stdout.strip())
+
+        # Store current branch to restore later
+        current_branch_result = subprocess.run(
+            ["git", "rev-parse", "--abbrev-ref", "HEAD"],
+            capture_output=True,
+            text=True,
+        )
+        original_branch = current_branch_result.stdout.strip() if current_branch_result.returncode == 0 else None
+
+        try:
+            if branch_exists:
+                # Fetch and checkout existing branch
+                subprocess.run(["git", "fetch", "origin", branch_name], check=True)
+
+                # Check if local branch exists
+                local_branch_exists = subprocess.run(
+                    ["git", "rev-parse", "--verify", branch_name],
+                    capture_output=True,
+                ).returncode == 0
+
+                if local_branch_exists:
+                    subprocess.run(["git", "checkout", branch_name], check=True)
+                    subprocess.run(["git", "reset", "--hard", f"origin/{branch_name}"], check=True)
+                else:
+                    subprocess.run(["git", "checkout", "-b", branch_name, f"origin/{branch_name}"], check=True)
+            else:
+                # Create new orphan branch
+                subprocess.run(["git", "checkout", "--orphan", branch_name], check=True)
+                # Remove any existing files from the new branch
+                subprocess.run(["git", "rm", "-rf", "."], capture_output=True, check=False)
+
+            # Write the data file
+            pathlib.Path(filename).write_text(json.dumps(data, indent=2))
+
+            # Add and commit the file
+            subprocess.run(["git", "add", filename], check=True)
+            subprocess.run(
+                [
+                    "git",
+                    "commit",
+                    "-m",
+                    f"Add run data for {data['workflow_run_id']} ({data['test_status']})",
+                ],
+                check=True,
+            )
+
+            # Push the branch (create remote branch if it doesn't exist)
+            if branch_exists:
+                subprocess.run(["git", "push", "origin", branch_name], check=True)
+            else:
+                subprocess.run(["git", "push", "-u", "origin", branch_name], check=True)
+
+        finally:
+            # Restore original branch if possible
+            if original_branch and original_branch != branch_name:
+                try:
+                    subprocess.run(["git", "checkout", original_branch], check=True, capture_output=True)
+                except subprocess.CalledProcessError:
+                    # If we can't restore, at least try to get back to main/master
+                    for fallback_branch in ["main", "master"]:
+                        try:
+                            subprocess.run(["git", "checkout", fallback_branch], check=True, capture_output=True)
+                            break
+                        except subprocess.CalledProcessError:
+                            continue
+
+        return True
+    except subprocess.CalledProcessError as e:
+        print(f"Error storing bisect data to branch '{branch_name}': {e}")
+        print(f"Make sure the repository has proper permissions and the branch name '{branch_name}' is valid")
+        return False
+    except Exception as e:
+        print(f"Unexpected error storing bisect data: {e}")
+        return False
+
+
+def retrieve_last_successful_run(branch_name: str) -> Optional[Dict]:
+    """Retrieve the most recent successful run data from a Git branch."""
+    try:
+        # Check if branch exists remotely
+        result = subprocess.run(
+            ["git", "ls-remote", "--heads", "origin", branch_name],
+            capture_output=True,
+            text=True,
+            check=True,
+        )
+
+        if not result.stdout.strip():
+            return None
+
+        # Fetch the branch
+        subprocess.run(["git", "fetch", "origin", f"{branch_name}:{branch_name}"], check=True)
+
+        # List all JSON files in the branch
+        result = subprocess.run(
+            ["git", "ls-tree", "-r", "--name-only", branch_name],
+            capture_output=True,
+            text=True,
+            check=True,
+        )
+
+        json_files = [f for f in result.stdout.strip().split('\n') if f.endswith('.json')]
+
+        if not json_files:
+            return None
+
+        # Check each file to find the most recent successful run
+        most_recent_success = None
+        most_recent_timestamp = None
+
+        for filename in json_files:
+            try:
+                # Get the file content
+                file_result = subprocess.run(
+                    ["git", "show", f"{branch_name}:{filename}"],
+                    capture_output=True,
+                    text=True,
+                    check=True,
+                )
+
+                run_data = json.loads(file_result.stdout)
+
+                # Check if this was a successful run
+                if run_data.get("test_status") == "passed":
+                    timestamp = run_data.get("timestamp")
+                    if timestamp and (most_recent_timestamp is None or timestamp > most_recent_timestamp):
+                        most_recent_timestamp = timestamp
+                        most_recent_success = run_data
+
+            except (subprocess.CalledProcessError, json.JSONDecodeError):
+                continue
+
+        return most_recent_success
+
+    except (subprocess.CalledProcessError, json.JSONDecodeError):
+        return None
+
+
+def find_last_successful_run_for_tests(branch_name: str, failed_tests: List[str]) -> Dict[str, Optional[Dict]]:
+    """Find the last successful run for each currently failing test."""
+    test_last_success = {}
+
+    try:
+        # Get all run files
+        result = subprocess.run(
+            ["git", "ls-tree", "-r", "--name-only", branch_name],
+            capture_output=True,
+            text=True,
+            check=True,
+        )
+
+        json_files = [f for f in result.stdout.strip().split('\n') if f.endswith('.json')]
+
+        # Get all run data and sort by timestamp (newest first)
+        all_runs = []
+        for filename in json_files:
+            try:
+                file_result = subprocess.run(
+                    ["git", "show", f"{branch_name}:{filename}"],
+                    capture_output=True,
+                    text=True,
+                    check=True,
+                )
+                run_data = json.loads(file_result.stdout)
+                all_runs.append(run_data)
+            except (subprocess.CalledProcessError, json.JSONDecodeError):
+                continue
+
+        # Sort by timestamp (newest first)
+        all_runs.sort(key=lambda x: x.get("timestamp", ""), reverse=True)
+
+        # For each currently failing test, find its last successful run
+        for test in failed_tests:
+            test_last_success[test] = None
+            for run in all_runs:
+                # If this test wasn't in the failed list for this run, it passed
+                if test not in run.get("failed_tests", []):
+                    test_last_success[test] = run
+                    break
+
+    except (subprocess.CalledProcessError, json.JSONDecodeError):
+        # Initialize with None for all tests if we can't retrieve data
+        for test in failed_tests:
+            test_last_success[test] = None
+
+    return test_last_success
+
+
+def get_package_changes(current_packages: Dict, previous_packages: Dict) -> List[str]:
+    """Get list of package changes between two runs."""
+    changes = []
+    all_packages = set(current_packages.keys()) | set(previous_packages.keys())
+
+    for package in sorted(all_packages):
+        current_version = current_packages.get(package)
+        previous_version = previous_packages.get(package)
+
+        if current_version is None and previous_version is None:
+            continue
+        elif current_version is None:
+            changes.append(f"- {package}: {previous_version} → (removed)")
+        elif previous_version is None:
+            changes.append(f"- {package}: (new) → {current_version}")
+        elif current_version != previous_version:
+            changes.append(f"- {package}: {previous_version} → {current_version}")
+
+    return changes
+
+
+def format_bisect_comparison(
+    current_data: Dict, previous_data: Optional[Dict], branch_name: str
+) -> Optional[str]:
+    """Format bisection comparison for display in GitHub issue."""
+    failed_tests = current_data.get("failed_tests", [])
+    if not failed_tests:
+        return None
+
+    test_last_success = find_last_successful_run_for_tests(branch_name, failed_tests)
+    current_packages = current_data["packages"]
+    current_git = current_data.get("git", {})
+
+    test_sections = []
+
+    for test in failed_tests:
+        last_success = test_last_success.get(test)
+
+        # Create section for this failing test
+        test_section = [f"## {test}"]
+
+        if last_success:
+            # Get changes since this test last passed
+            last_success_packages = last_success.get("packages", {})
+            last_success_git = last_success.get("git", {})
+
+            # Package changes since last pass
+            package_changes = get_package_changes(current_packages, last_success_packages)
+            if package_changes:
+                test_section.append("### Package changes since last pass")
+                test_section.extend(package_changes)
+            else:
+                test_section.append("### Package changes since last pass")
+                test_section.append("- No package changes detected")
+
+            # Code changes since last pass
+            if current_git.get("commit_hash") != last_success_git.get("commit_hash"):
+                prev_commit = last_success_git.get("commit_hash_short", "unknown")
+                curr_commit = current_git.get("commit_hash_short", "unknown")
+                prev_msg = last_success_git.get("commit_message", "")[:60] + ("..." if len(last_success_git.get("commit_message", "")) > 60 else "")
+                curr_msg = current_git.get("commit_message", "")[:60] + ("..." if len(current_git.get("commit_message", "")) > 60 else "")
+
+                test_section.append("### Code changes since last pass")
+                test_section.append(f"- {prev_commit} ({prev_msg})")
+                test_section.append(f"- → {curr_commit} ({curr_msg})")
+                test_section.append(f"- Last passed in run #{last_success['workflow_run_id']} on {last_success['timestamp']}")
+            else:
+                test_section.append("### Code changes since last pass")
+                test_section.append("- No code changes detected")
+                test_section.append(f"- Last passed in run #{last_success['workflow_run_id']} on {last_success['timestamp']}")
+        else:
+            test_section.append("### Analysis")
+            test_section.append("- No recent successful run found for this test")
+
+        test_sections.append("\n".join(test_section))
+
+    if test_sections:
+        return "\n\n".join(test_sections) + "\n\n"
+
+    return None
+
+
+def main():
+    parser = argparse.ArgumentParser(description="Track package versions for bisection")
+    parser.add_argument(
+        "--packages",
+        required=True,
+        help="Comma-separated list of packages to track",
+    )
+    parser.add_argument(
+        "--log-path",
+        help="Path to pytest log file",
+    )
+    parser.add_argument(
+        "--captured-versions",
+        help="Path to captured package versions JSON file",
+    )
+    parser.add_argument(
+        "--store-run",
+        action="store_true",
+        help="Store current run data (both packages and test results)",
+    )
+    parser.add_argument(
+        "--generate-comparison",
+        action="store_true",
+        help="Generate comparison with last successful run",
+    )
+    parser.add_argument(
+        "--branch",
+        default="bisect-data",
+        help="Branch name for storing bisection data",
+    )
+    parser.add_argument(
+        "--output-file",
+        default="bisect-comparison.txt",
+        help="Output file for bisection comparison",
+    )
+
+    args = parser.parse_args()
+
+    packages = [pkg.strip() for pkg in args.packages.split(",") if pkg.strip()]
+
+    if args.store_run:
+        # Store current run data (packages + test results)
+        data = create_bisect_data(packages, args.log_path, args.captured_versions)
+        success = store_bisect_data_to_branch(data, args.branch)
+        if success:
+            print(f"Successfully stored run data to branch '{args.branch}' (status: {data['test_status']})")
+        else:
+            print("Failed to store run data", file=sys.stderr)
+            sys.exit(1)
+
+    if args.generate_comparison:
+        # Generate comparison with last successful run
+        current_data = create_bisect_data(packages, args.log_path, args.captured_versions)
+        previous_data = retrieve_last_successful_run(args.branch)
+
+        comparison = format_bisect_comparison(current_data, previous_data, args.branch)
+
+        output_path = pathlib.Path(args.output_file)
+        if comparison:
+            output_path.write_text(comparison)
+            print(f"Bisection comparison written to {output_path.absolute()}")
+        else:
+            output_path.write_text("")
+            print("No bisection data to display")
+
+
+if __name__ == "__main__":
+    main()
\ No newline at end of file

From e82029ba1469c6853a35f8c289483bafbe8afdb4 Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Fri, 26 Sep 2025 12:18:35 -0400
Subject: [PATCH 02/15] Add GitHub diff links and extract action code to
 separate files
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

This commit improves maintainability and enhances the bisection feature:

- Extract inline Python code from action.yaml to capture_versions.py for better maintainability
- Add GitHub diff links for common packages (numpy, pandas, pytest, etc.) in bisection output
- Include package metadata for 22 popular Python packages to generate release comparison links
- Update package changes display to include clickable links when available
- Add comprehensive tests for GitHub link generation functionality
- Fix mypy type annotations to use modern Python 3.10+ syntax (str | None instead of Optional[str])

The bisection output now shows package changes like:
- [numpy: 1.24.0 → 1.25.0](https://github.com/numpy/numpy/compare/v1.24.0...v1.25.0)

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 action.yaml            | 68 +----------------------------
 capture_versions.py    | 78 +++++++++++++++++++++++++++++++++
 test_track_packages.py | 35 ++++++++++++++-
 track_packages.py      | 99 ++++++++++++++++++++++++++++++++----------
 4 files changed, 189 insertions(+), 91 deletions(-)
 create mode 100644 capture_versions.py

diff --git a/action.yaml b/action.yaml
index 13efdfa..2b8e8dc 100644
--- a/action.yaml
+++ b/action.yaml
@@ -70,72 +70,8 @@ runs:
       run: |
         if [ -n "${{ inputs.track-packages }}" ]; then
           echo "Capturing package versions using: ${{ inputs.python-command }}"
-
-          # Capture package versions from the test environment
-          ${{ inputs.python-command }} -c "
-import json
-import sys
-
-packages_input = '${{ inputs.track-packages }}'.strip()
-if not packages_input:
-    exit()
-
-packages = [pkg.strip() for pkg in packages_input.split(',')]
-versions = {}
-
-# Try importlib.metadata first (Python 3.8+)
-try:
-    import importlib.metadata as metadata
-    if len(packages) == 1 and packages[0].lower() == 'all':
-        print('Capturing all installed packages...')
-        for dist in metadata.distributions():
-            versions[dist.name] = dist.version
-    else:
-        print(f'Capturing specific packages: {packages}')
-        for pkg in packages:
-            if pkg:
-                try:
-                    versions[pkg] = metadata.version(pkg)
-                    print(f'  {pkg}: {versions[pkg]}')
-                except Exception as e:
-                    versions[pkg] = None
-                    print(f'  {pkg}: not found ({e})')
-except ImportError:
-    print('importlib.metadata not available, trying pkg_resources...')
-    # Fallback to pkg_resources
-    try:
-        import pkg_resources
-        if len(packages) == 1 and packages[0].lower() == 'all':
-            print('Capturing all installed packages...')
-            for dist in pkg_resources.working_set:
-                versions[dist.project_name] = dist.version
-        else:
-            print(f'Capturing specific packages: {packages}')
-            for pkg in packages:
-                if pkg:
-                    try:
-                        versions[pkg] = pkg_resources.get_distribution(pkg).version
-                        print(f'  {pkg}: {versions[pkg]}')
-                    except Exception as e:
-                        versions[pkg] = None
-                        print(f'  {pkg}: not found ({e})')
-    except ImportError:
-        print('ERROR: No package detection method available')
-        versions = {'error': 'No package detection method available'}
-
-# Save captured versions
-capture_data = {
-    'python_version': '.'.join(map(str, sys.version_info[:3])),
-    'python_executable': sys.executable,
-    'packages': versions,
-    'capture_method': 'importlib.metadata' if 'importlib.metadata' in sys.modules else 'pkg_resources'
-}
-
-with open('captured-package-versions.json', 'w') as f:
-    json.dump(capture_data, f, indent=2)
-
-print(f'Captured {len(versions)} package versions')
-"
+          export TRACK_PACKAGES="${{ inputs.track-packages }}"
+          ${{ inputs.python-command }} $GITHUB_ACTION_PATH/capture_versions.py
         else
           echo "No packages specified for tracking, skipping package capture"
         fi
diff --git a/capture_versions.py b/capture_versions.py
new file mode 100644
index 0000000..4be46c7
--- /dev/null
+++ b/capture_versions.py
@@ -0,0 +1,78 @@
+#!/usr/bin/env python3
+"""
+Capture package versions from the test environment.
+
+This script captures package versions using the specified Python command
+to ensure we get versions from the same environment that ran the tests.
+"""
+import json
+import sys
+import os
+
+
+def main():
+    """Main function to capture package versions."""
+    packages_input = os.environ.get('TRACK_PACKAGES', '').strip()
+    if not packages_input:
+        print("No packages specified for tracking, skipping package capture")
+        return
+
+    packages = [pkg.strip() for pkg in packages_input.split(',')]
+    versions = {}
+
+    # Try importlib.metadata first (Python 3.8+)
+    try:
+        import importlib.metadata as metadata
+        if len(packages) == 1 and packages[0].lower() == 'all':
+            print('Capturing all installed packages...')
+            for dist in metadata.distributions():
+                versions[dist.name] = dist.version
+        else:
+            print(f'Capturing specific packages: {packages}')
+            for pkg in packages:
+                if pkg:
+                    try:
+                        versions[pkg] = metadata.version(pkg)
+                        print(f'  {pkg}: {versions[pkg]}')
+                    except Exception as e:
+                        versions[pkg] = None
+                        print(f'  {pkg}: not found ({e})')
+    except ImportError:
+        print('importlib.metadata not available, trying pkg_resources...')
+        # Fallback to pkg_resources
+        try:
+            import pkg_resources
+            if len(packages) == 1 and packages[0].lower() == 'all':
+                print('Capturing all installed packages...')
+                for dist in pkg_resources.working_set:
+                    versions[dist.project_name] = dist.version
+            else:
+                print(f'Capturing specific packages: {packages}')
+                for pkg in packages:
+                    if pkg:
+                        try:
+                            versions[pkg] = pkg_resources.get_distribution(pkg).version
+                            print(f'  {pkg}: {versions[pkg]}')
+                        except Exception as e:
+                            versions[pkg] = None
+                            print(f'  {pkg}: not found ({e})')
+        except ImportError:
+            print('ERROR: No package detection method available')
+            versions = {'error': 'No package detection method available'}
+
+    # Save captured versions
+    capture_data = {
+        'python_version': '.'.join(map(str, sys.version_info[:3])),
+        'python_executable': sys.executable,
+        'packages': versions,
+        'capture_method': 'importlib.metadata' if 'importlib.metadata' in sys.modules else 'pkg_resources'
+    }
+
+    with open('captured-package-versions.json', 'w') as f:
+        json.dump(capture_data, f, indent=2)
+
+    print(f'Captured {len(versions)} package versions')
+
+
+if __name__ == '__main__':
+    main()
\ No newline at end of file
diff --git a/test_track_packages.py b/test_track_packages.py
index ba921c2..14f8274 100644
--- a/test_track_packages.py
+++ b/test_track_packages.py
@@ -2,8 +2,8 @@
 import os
 import sys
 import tempfile
-from unittest.mock import Mock, patch
 from datetime import datetime
+from unittest.mock import Mock, patch
 
 import hypothesis.strategies as st
 from hypothesis import given
@@ -360,4 +360,35 @@ def test_retrieve_bisect_data_from_branch_success():
         ]
 
         result = track_packages.retrieve_bisect_data_from_branch("bisect-data")
-        assert result == mock_data
\ No newline at end of file
+        assert result == mock_data
+
+
+def test_generate_package_diff_link():
+    """Test generating GitHub diff links for package changes."""
+    # Test known package
+    link = track_packages.generate_package_diff_link("numpy", "1.24.0", "1.25.0")
+    assert link == "https://github.com/numpy/numpy/compare/v1.24.0...v1.25.0"
+
+    # Test unknown package
+    link = track_packages.generate_package_diff_link("unknown-package", "1.0.0", "2.0.0")
+    assert link is None
+
+
+def test_get_package_changes_with_github_links():
+    """Test package changes include GitHub links when available."""
+    previous_packages = {"numpy": "1.24.0", "unknown-pkg": "1.0.0"}
+    current_packages = {"numpy": "1.25.0", "unknown-pkg": "2.0.0"}
+
+    changes = track_packages.get_package_changes(current_packages, previous_packages)
+
+    # Should have GitHub link for numpy
+    numpy_change = next((c for c in changes if "numpy" in c), None)
+    assert numpy_change is not None
+    assert "https://github.com/numpy/numpy/compare/v1.24.0...v1.25.0" in numpy_change
+    assert "[numpy: 1.24.0 → 1.25.0]" in numpy_change
+
+    # Should not have GitHub link for unknown package
+    unknown_change = next((c for c in changes if "unknown-pkg" in c), None)
+    assert unknown_change is not None
+    assert "unknown-pkg: 1.0.0 → 2.0.0" in unknown_change
+    assert "https://" not in unknown_change
diff --git a/track_packages.py b/track_packages.py
index 02a41fd..c7d82be 100644
--- a/track_packages.py
+++ b/track_packages.py
@@ -11,12 +11,60 @@
 import pathlib
 import subprocess
 import sys
-import tempfile
 from datetime import datetime
-from typing import Dict, List, Optional, Tuple
 
 
-def get_all_installed_packages() -> Dict[str, str]:
+# Package metadata for generating GitHub links
+PACKAGE_METADATA = {
+    "numpy": {"github": "numpy/numpy", "type": "releases"},
+    "pandas": {"github": "pandas-dev/pandas", "type": "releases"},
+    "matplotlib": {"github": "matplotlib/matplotlib", "type": "releases"},
+    "scipy": {"github": "scipy/scipy", "type": "releases"},
+    "scikit-learn": {"github": "scikit-learn/scikit-learn", "type": "releases"},
+    "requests": {"github": "psf/requests", "type": "releases"},
+    "django": {"github": "django/django", "type": "releases"},
+    "flask": {"github": "pallets/flask", "type": "releases"},
+    "pytest": {"github": "pytest-dev/pytest", "type": "releases"},
+    "hypothesis": {"github": "HypothesisWorks/hypothesis", "type": "releases"},
+    "xarray": {"github": "pydata/xarray", "type": "releases"},
+    "dask": {"github": "dask/dask", "type": "releases"},
+    "jupyterlab": {"github": "jupyterlab/jupyterlab", "type": "releases"},
+    "notebook": {"github": "jupyter/notebook", "type": "releases"},
+    "ipython": {"github": "ipython/ipython", "type": "releases"},
+    "tensorflow": {"github": "tensorflow/tensorflow", "type": "releases"},
+    "torch": {"github": "pytorch/pytorch", "type": "releases"},
+    "fastapi": {"github": "tiangolo/fastapi", "type": "releases"},
+    "pydantic": {"github": "pydantic/pydantic", "type": "releases"},
+    "sqlalchemy": {"github": "sqlalchemy/sqlalchemy", "type": "releases"},
+    "black": {"github": "psf/black", "type": "releases"},
+    "mypy": {"github": "python/mypy", "type": "releases"},
+    "ruff": {"github": "astral-sh/ruff", "type": "releases"},
+}
+
+
+def generate_package_diff_link(package_name: str, old_version: str, new_version: str) -> str | None:
+    """Generate a GitHub diff link for package version changes."""
+    if package_name not in PACKAGE_METADATA:
+        return None
+
+    metadata = PACKAGE_METADATA[package_name]
+    repo = metadata["github"]
+
+    if metadata["type"] == "releases":
+        # Try different tag formats common in Python packages
+        tag_formats = [
+            f"v{old_version}...v{new_version}",  # v1.0.0...v1.1.0
+            f"{old_version}...{new_version}",    # 1.0.0...1.1.0
+            f"release-{old_version}...release-{new_version}",  # release-1.0.0...release-1.1.0
+        ]
+
+        # Return the first format (most common)
+        return f"https://github.com/{repo}/compare/{tag_formats[0]}"
+
+    return None
+
+
+def get_all_installed_packages() -> dict[str, str | None]:
     """Get all installed packages and their versions."""
     try:
         result = subprocess.run(
@@ -31,7 +79,7 @@ def get_all_installed_packages() -> Dict[str, str]:
         return {}
 
 
-def get_package_version(package_name: str) -> Optional[str]:
+def get_package_version(package_name: str) -> str | None:
     """Get the version of an installed package."""
     try:
         result = subprocess.run(
@@ -48,24 +96,24 @@ def get_package_version(package_name: str) -> Optional[str]:
     return None
 
 
-def get_current_package_versions(packages: List[str], captured_versions_file: str = None) -> Dict[str, Optional[str]]:
+def get_current_package_versions(packages: list[str], captured_versions_file: str | None = None) -> dict[str, str | None]:
     """Get current versions of specified packages."""
     # First try to read from captured versions file if provided
     if captured_versions_file and os.path.exists(captured_versions_file):
         try:
-            with open(captured_versions_file, 'r') as f:
+            with open(captured_versions_file) as f:
                 captured_data = json.load(f)
                 captured_packages = captured_data.get('packages', {})
 
                 if len(packages) == 1 and packages[0].lower() == "all":
-                    return captured_packages
+                    return captured_packages  # type: ignore[return-value]
 
                 # Return only the requested packages from captured data
                 versions = {}
                 for package in packages:
                     versions[package] = captured_packages.get(package)
                 return versions
-        except (json.JSONDecodeError, IOError) as e:
+        except (json.JSONDecodeError, OSError) as e:
             print(f"Warning: Could not read captured versions file {captured_versions_file}: {e}")
             print("Falling back to direct package detection...")
 
@@ -79,11 +127,11 @@ def get_current_package_versions(packages: List[str], captured_versions_file: st
     return versions
 
 
-def extract_failed_tests_from_log(log_path: str) -> List[str]:
+def extract_failed_tests_from_log(log_path: str) -> list[str]:
     """Extract failed test nodeids from pytest log file."""
     failed_tests = []
     try:
-        with open(log_path, 'r') as f:
+        with open(log_path) as f:
             for line in f:
                 try:
                     record = json.loads(line)
@@ -98,7 +146,7 @@ def extract_failed_tests_from_log(log_path: str) -> List[str]:
     return failed_tests
 
 
-def get_git_info() -> Dict[str, str]:
+def get_git_info() -> dict[str, str]:
     """Get current Git commit information."""
     try:
         # Get current commit hash
@@ -153,7 +201,7 @@ def get_git_info() -> Dict[str, str]:
         }
 
 
-def create_bisect_data(packages: List[str], log_path: str = None, captured_versions_file: str = None, workflow_run_id: str = None) -> Dict:
+def create_bisect_data(packages: list[str], log_path: str | None = None, captured_versions_file: str | None = None, workflow_run_id: str | None = None) -> dict:
     """Create bisection data for current environment."""
     if workflow_run_id is None:
         workflow_run_id = os.environ.get("GITHUB_RUN_ID", "unknown")
@@ -169,11 +217,11 @@ def create_bisect_data(packages: List[str], log_path: str = None, captured_versi
     python_version = ".".join(str(v) for v in sys.version_info[:3])
     if captured_versions_file and os.path.exists(captured_versions_file):
         try:
-            with open(captured_versions_file, 'r') as f:
+            with open(captured_versions_file) as f:
                 captured_data = json.load(f)
                 if 'python_version' in captured_data:
                     python_version = captured_data['python_version']
-        except (json.JSONDecodeError, IOError):
+        except (json.JSONDecodeError, OSError):
             pass  # Use default python_version
 
     return {
@@ -188,7 +236,7 @@ def create_bisect_data(packages: List[str], log_path: str = None, captured_versi
 
 
 def store_bisect_data_to_branch(
-    data: Dict, branch_name: str
+    data: dict, branch_name: str
 ) -> bool:
     """Store bisection data to a Git branch."""
     try:
@@ -285,7 +333,7 @@ def store_bisect_data_to_branch(
         return False
 
 
-def retrieve_last_successful_run(branch_name: str) -> Optional[Dict]:
+def retrieve_last_successful_run(branch_name: str) -> dict | None:
     """Retrieve the most recent successful run data from a Git branch."""
     try:
         # Check if branch exists remotely
@@ -347,9 +395,9 @@ def retrieve_last_successful_run(branch_name: str) -> Optional[Dict]:
         return None
 
 
-def find_last_successful_run_for_tests(branch_name: str, failed_tests: List[str]) -> Dict[str, Optional[Dict]]:
+def find_last_successful_run_for_tests(branch_name: str, failed_tests: list[str]) -> dict[str, dict | None]:
     """Find the last successful run for each currently failing test."""
-    test_last_success = {}
+    test_last_success: dict[str, dict | None] = {}
 
     try:
         # Get all run files
@@ -397,7 +445,7 @@ def find_last_successful_run_for_tests(branch_name: str, failed_tests: List[str]
     return test_last_success
 
 
-def get_package_changes(current_packages: Dict, previous_packages: Dict) -> List[str]:
+def get_package_changes(current_packages: dict, previous_packages: dict) -> list[str]:
     """Get list of package changes between two runs."""
     changes = []
     all_packages = set(current_packages.keys()) | set(previous_packages.keys())
@@ -413,14 +461,19 @@ def get_package_changes(current_packages: Dict, previous_packages: Dict) -> List
         elif previous_version is None:
             changes.append(f"- {package}: (new) → {current_version}")
         elif current_version != previous_version:
-            changes.append(f"- {package}: {previous_version} → {current_version}")
+            # Try to generate a GitHub diff link
+            diff_link = generate_package_diff_link(package, previous_version, current_version)
+            if diff_link:
+                changes.append(f"- [{package}: {previous_version} → {current_version}]({diff_link})")
+            else:
+                changes.append(f"- {package}: {previous_version} → {current_version}")
 
     return changes
 
 
 def format_bisect_comparison(
-    current_data: Dict, previous_data: Optional[Dict], branch_name: str
-) -> Optional[str]:
+    current_data: dict, previous_data: dict | None, branch_name: str
+) -> str | None:
     """Format bisection comparison for display in GitHub issue."""
     failed_tests = current_data.get("failed_tests", [])
     if not failed_tests:
@@ -546,4 +599,4 @@ def main():
 
 
 if __name__ == "__main__":
-    main()
\ No newline at end of file
+    main()

From 9741e71a3aca06b3ac4386d8ec3dfddd64db2aa1 Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Fri, 26 Sep 2025 12:22:04 -0400
Subject: [PATCH 03/15] Use user's python-command for environment info
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

This ensures the environment information step shows the actual Python
environment being used for tests, not just the action's Python.

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 action.yaml         | 5 +++--
 capture_versions.py | 4 ++--
 track_packages.py   | 1 -
 3 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/action.yaml b/action.yaml
index 2b8e8dc..537f957 100644
--- a/action.yaml
+++ b/action.yaml
@@ -59,8 +59,9 @@ runs:
     - name: print environment information
       shell: bash -l {0}
       run: |
-        python --version
-        python -m pip list
+        echo "Using Python command: ${{ inputs.python-command }}"
+        ${{ inputs.python-command }} --version
+        ${{ inputs.python-command }} -m pip list
     - name: install dependencies
       shell: bash -l {0}
       run: |
diff --git a/capture_versions.py b/capture_versions.py
index 4be46c7..3429c2d 100644
--- a/capture_versions.py
+++ b/capture_versions.py
@@ -6,8 +6,8 @@
 to ensure we get versions from the same environment that ran the tests.
 """
 import json
-import sys
 import os
+import sys
 
 
 def main():
@@ -75,4 +75,4 @@ def main():
 
 
 if __name__ == '__main__':
-    main()
\ No newline at end of file
+    main()
diff --git a/track_packages.py b/track_packages.py
index c7d82be..7dd7d86 100644
--- a/track_packages.py
+++ b/track_packages.py
@@ -13,7 +13,6 @@
 import sys
 from datetime import datetime
 
-
 # Package metadata for generating GitHub links
 PACKAGE_METADATA = {
     "numpy": {"github": "numpy/numpy", "type": "releases"},

From a8c41c60397a9f300226dee22e21d00e265fdd97 Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Fri, 26 Sep 2025 12:24:38 -0400
Subject: [PATCH 04/15] Add comprehensive pre-commit hooks
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Added actionlint and mypy to existing pre-commit configuration:
- actionlint for GitHub Actions workflow validation
- mypy for type checking with proper type stubs
- Fixed pkg_resources import type annotation with type: ignore

Pre-commit now includes:
- ruff (linting and formatting)
- black (code formatting)
- prettier (markdown/yaml formatting)
- actionlint (workflow validation)
- mypy (type checking)
- Standard hooks (trailing whitespace, end-of-file, etc.)

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 .pre-commit-config.yaml |  12 +++
 README.md               |  13 ++--
 capture_versions.py     |  52 +++++++------
 parse_logs.py           |   4 +-
 test_track_packages.py  | 103 ++++++++++++++-----------
 track_packages.py       | 162 +++++++++++++++++++++++++++++-----------
 6 files changed, 231 insertions(+), 115 deletions(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 5dcb2a9..a1b5684 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -32,3 +32,15 @@ repos:
         args: ["--option", "array_auto_collapse=false"]
       - id: taplo-lint
         args: ["--no-schema"]
+
+  - repo: https://github.com/rhysd/actionlint
+    rev: v1.7.1
+    hooks:
+      - id: actionlint
+
+  - repo: https://github.com/pre-commit/mirrors-mypy
+    rev: v1.11.2
+    hooks:
+      - id: mypy
+        additional_dependencies: [hypothesis, types-setuptools]
+        exclude: ^test_
diff --git a/README.md b/README.md
index d28b441..1dc1fa0 100644
--- a/README.md
+++ b/README.md
@@ -175,13 +175,13 @@ jobs:
     runs-on: ubuntu-latest
     permissions:
       issues: write
-      contents: write  # Needed for bisection branch
+      contents: write # Needed for bisection branch
 
     steps:
       - uses: actions/checkout@v4
         with:
           token: ${{ secrets.GITHUB_TOKEN }}
-          fetch-depth: 0  # Needed for bisection branch operations
+          fetch-depth: 0 # Needed for bisection branch operations
 
       - uses: actions/setup-python@v4
         with:
@@ -195,12 +195,12 @@ jobs:
 
       # Track package versions and create issue if tests fail
       - name: Track packages and create issue if needed
-        if: always()  # Run regardless of test outcome to store data
+        if: always() # Run regardless of test outcome to store data
         uses: scientific-python/issue-from-pytest-log-action@f94477e45ef40e4403d7585ba639a9a3bcc53d43 # v1.3.0
         with:
           log-path: pytest-log.jsonl
           track-packages: "xarray,pandas,numpy"
-          python-command: "python"  # Default, can be omitted
+          python-command: "python" # Default, can be omitted
 ```
 
 #### Conda/Mamba Setup
@@ -239,7 +239,7 @@ jobs:
         with:
           log-path: pytest-log.jsonl
           track-packages: "numpy,pandas,pytest"
-          python-command: "python"  # Conda python is already in PATH
+          python-command: "python" # Conda python is already in PATH
 ```
 
 #### UV Setup
@@ -268,7 +268,7 @@ jobs:
         uses: scientific-python/issue-from-pytest-log-action@f94477e45ef40e4403d7585ba639a9a3bcc53d43 # v1.3.0
         with:
           log-path: pytest-log.jsonl
-          track-packages: "all"  # Track all packages
+          track-packages: "all" # Track all packages
           python-command: "uv run python"
 ```
 
@@ -369,6 +369,7 @@ When enabled, the bisection feature will add comprehensive analysis to GitHub is
 ```
 
 This enhanced bisection feature helps identify:
+
 1. **For each failing test**, exactly which dependencies and code changed since it last passed
 2. **Precise correlation** between specific changes and test failures
 3. **Historical context** with exact commits and timestamps
diff --git a/capture_versions.py b/capture_versions.py
index 3429c2d..c281eae 100644
--- a/capture_versions.py
+++ b/capture_versions.py
@@ -12,67 +12,73 @@
 
 def main():
     """Main function to capture package versions."""
-    packages_input = os.environ.get('TRACK_PACKAGES', '').strip()
+    packages_input = os.environ.get("TRACK_PACKAGES", "").strip()
     if not packages_input:
         print("No packages specified for tracking, skipping package capture")
         return
 
-    packages = [pkg.strip() for pkg in packages_input.split(',')]
+    packages = [pkg.strip() for pkg in packages_input.split(",")]
     versions = {}
 
     # Try importlib.metadata first (Python 3.8+)
     try:
         import importlib.metadata as metadata
-        if len(packages) == 1 and packages[0].lower() == 'all':
-            print('Capturing all installed packages...')
+
+        if len(packages) == 1 and packages[0].lower() == "all":
+            print("Capturing all installed packages...")
             for dist in metadata.distributions():
                 versions[dist.name] = dist.version
         else:
-            print(f'Capturing specific packages: {packages}')
+            print(f"Capturing specific packages: {packages}")
             for pkg in packages:
                 if pkg:
                     try:
                         versions[pkg] = metadata.version(pkg)
-                        print(f'  {pkg}: {versions[pkg]}')
+                        print(f"  {pkg}: {versions[pkg]}")
                     except Exception as e:
                         versions[pkg] = None
-                        print(f'  {pkg}: not found ({e})')
+                        print(f"  {pkg}: not found ({e})")
     except ImportError:
-        print('importlib.metadata not available, trying pkg_resources...')
+        print("importlib.metadata not available, trying pkg_resources...")
         # Fallback to pkg_resources
         try:
-            import pkg_resources
-            if len(packages) == 1 and packages[0].lower() == 'all':
-                print('Capturing all installed packages...')
+            import pkg_resources  # type: ignore[import-untyped]
+
+            if len(packages) == 1 and packages[0].lower() == "all":
+                print("Capturing all installed packages...")
                 for dist in pkg_resources.working_set:
                     versions[dist.project_name] = dist.version
             else:
-                print(f'Capturing specific packages: {packages}')
+                print(f"Capturing specific packages: {packages}")
                 for pkg in packages:
                     if pkg:
                         try:
                             versions[pkg] = pkg_resources.get_distribution(pkg).version
-                            print(f'  {pkg}: {versions[pkg]}')
+                            print(f"  {pkg}: {versions[pkg]}")
                         except Exception as e:
                             versions[pkg] = None
-                            print(f'  {pkg}: not found ({e})')
+                            print(f"  {pkg}: not found ({e})")
         except ImportError:
-            print('ERROR: No package detection method available')
-            versions = {'error': 'No package detection method available'}
+            print("ERROR: No package detection method available")
+            versions = {"error": "No package detection method available"}
 
     # Save captured versions
     capture_data = {
-        'python_version': '.'.join(map(str, sys.version_info[:3])),
-        'python_executable': sys.executable,
-        'packages': versions,
-        'capture_method': 'importlib.metadata' if 'importlib.metadata' in sys.modules else 'pkg_resources'
+        "python_version": ".".join(map(str, sys.version_info[:3])),
+        "python_executable": sys.executable,
+        "packages": versions,
+        "capture_method": (
+            "importlib.metadata"
+            if "importlib.metadata" in sys.modules
+            else "pkg_resources"
+        ),
     }
 
-    with open('captured-package-versions.json', 'w') as f:
+    with open("captured-package-versions.json", "w") as f:
         json.dump(capture_data, f, indent=2)
 
-    print(f'Captured {len(versions)} package versions')
+    print(f"Captured {len(versions)} package versions")
 
 
-if __name__ == '__main__':
+if __name__ == "__main__":
     main()
diff --git a/parse_logs.py b/parse_logs.py
index c73a18e..199d635 100644
--- a/parse_logs.py
+++ b/parse_logs.py
@@ -242,7 +242,9 @@ def format_collection_error(error, **formatter_kwargs):
     ).format(py_version=py_version, name=error.name, traceback=error.repr_)
 
 
-def include_bisection_info(message: str, bisect_file: str = "bisect-comparison.txt") -> str:
+def include_bisection_info(
+    message: str, bisect_file: str = "bisect-comparison.txt"
+) -> str:
     """Include bisection information in the issue message if available."""
     bisect_path = pathlib.Path(bisect_file)
     if bisect_path.exists():
diff --git a/test_track_packages.py b/test_track_packages.py
index 14f8274..f97d1d0 100644
--- a/test_track_packages.py
+++ b/test_track_packages.py
@@ -60,7 +60,9 @@ def test_get_current_package_versions_specific():
             "nonexistent": None,
         }.get(pkg)
 
-        versions = track_packages.get_current_package_versions(["pytest", "hypothesis", "nonexistent"])
+        versions = track_packages.get_current_package_versions(
+            ["pytest", "hypothesis", "nonexistent"]
+        )
         expected = {
             "pytest": "7.4.0",
             "hypothesis": "6.82.0",
@@ -71,15 +73,11 @@ def test_get_current_package_versions_specific():
 
 def test_get_current_package_versions_from_captured_file():
     """Test getting versions from a captured JSON file."""
-    with tempfile.NamedTemporaryFile(mode='w', suffix='.json', delete=False) as f:
+    with tempfile.NamedTemporaryFile(mode="w", suffix=".json", delete=False) as f:
         captured_data = {
             "python_version": "3.11.0",
-            "packages": {
-                "pytest": "7.4.0",
-                "numpy": "1.24.0",
-                "requests": "2.31.0"
-            },
-            "capture_method": "importlib.metadata"
+            "packages": {"pytest": "7.4.0", "numpy": "1.24.0", "requests": "2.31.0"},
+            "capture_method": "importlib.metadata",
         }
         json.dump(captured_data, f)
         captured_file = f.name
@@ -89,20 +87,14 @@ def test_get_current_package_versions_from_captured_file():
         versions = track_packages.get_current_package_versions(
             ["pytest", "numpy", "missing"], captured_file
         )
-        expected = {
-            "pytest": "7.4.0",
-            "numpy": "1.24.0",
-            "missing": None
-        }
+        expected = {"pytest": "7.4.0", "numpy": "1.24.0", "missing": None}
         assert versions == expected
 
         # Test "all" packages
-        all_versions = track_packages.get_current_package_versions(["all"], captured_file)
-        expected_all = {
-            "pytest": "7.4.0",
-            "numpy": "1.24.0",
-            "requests": "2.31.0"
-        }
+        all_versions = track_packages.get_current_package_versions(
+            ["all"], captured_file
+        )
+        expected_all = {"pytest": "7.4.0", "numpy": "1.24.0", "requests": "2.31.0"}
         assert all_versions == expected_all
     finally:
         os.unlink(captured_file)
@@ -110,7 +102,7 @@ def test_get_current_package_versions_from_captured_file():
 
 def test_get_current_package_versions_fallback_on_bad_file():
     """Test fallback when captured file is invalid."""
-    with tempfile.NamedTemporaryFile(mode='w', suffix='.json', delete=False) as f:
+    with tempfile.NamedTemporaryFile(mode="w", suffix=".json", delete=False) as f:
         f.write("invalid json content")
         bad_file = f.name
 
@@ -140,9 +132,15 @@ def test_get_git_info():
         # Mock the sequence of git commands
         mock_run.side_effect = [
             Mock(stdout="abc123def456789\n", check=True),  # git rev-parse HEAD
-            Mock(stdout="Fix test regression\n", check=True),  # git log -1 --pretty=format:%s
-            Mock(stdout="John Doe <john@example.com>\n", check=True),  # git log -1 --pretty=format:%an <%ae>
-            Mock(stdout="2024-01-15 10:30:00 +0000\n", check=True),  # git log -1 --pretty=format:%ci
+            Mock(
+                stdout="Fix test regression\n", check=True
+            ),  # git log -1 --pretty=format:%s
+            Mock(
+                stdout="John Doe <john@example.com>\n", check=True
+            ),  # git log -1 --pretty=format:%an <%ae>
+            Mock(
+                stdout="2024-01-15 10:30:00 +0000\n", check=True
+            ),  # git log -1 --pretty=format:%ci
         ]
 
         git_info = track_packages.get_git_info()
@@ -159,13 +157,23 @@ def test_get_git_info():
 
 def test_extract_failed_tests_from_log():
     """Test extracting failed tests from pytest log file."""
-    with tempfile.NamedTemporaryFile(mode='w', suffix='.jsonl', delete=False) as f:
+    with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as f:
         # Write sample pytest log entries
-        f.write('{"$report_type": "TestReport", "nodeid": "test_file.py::test_pass", "outcome": "passed"}\n')
-        f.write('{"$report_type": "TestReport", "nodeid": "test_file.py::test_fail1", "outcome": "failed"}\n')
-        f.write('{"$report_type": "CollectReport", "nodeid": "test_file.py::test_fail2", "outcome": "failed"}\n')
-        f.write('{"$report_type": "TestReport", "nodeid": "test_file.py::test_skip", "outcome": "skipped"}\n')
-        f.write('{"$report_type": "WarningMessage", "outcome": "failed"}\n')  # Should be ignored
+        f.write(
+            '{"$report_type": "TestReport", "nodeid": "test_file.py::test_pass", "outcome": "passed"}\n'
+        )
+        f.write(
+            '{"$report_type": "TestReport", "nodeid": "test_file.py::test_fail1", "outcome": "failed"}\n'
+        )
+        f.write(
+            '{"$report_type": "CollectReport", "nodeid": "test_file.py::test_fail2", "outcome": "failed"}\n'
+        )
+        f.write(
+            '{"$report_type": "TestReport", "nodeid": "test_file.py::test_skip", "outcome": "skipped"}\n'
+        )
+        f.write(
+            '{"$report_type": "WarningMessage", "outcome": "failed"}\n'
+        )  # Should be ignored
         log_path = f.name
 
     try:
@@ -203,9 +211,11 @@ def test_create_bisect_data():
     """Test creating bisection data."""
     packages = ["pytest", "hypothesis"]
 
-    with patch("track_packages.get_current_package_versions") as mock_get_versions, \
-         patch("track_packages.get_git_info") as mock_get_git, \
-         patch("track_packages.extract_failed_tests_from_log") as mock_extract_tests:
+    with patch(
+        "track_packages.get_current_package_versions"
+    ) as mock_get_versions, patch("track_packages.get_git_info") as mock_get_git, patch(
+        "track_packages.extract_failed_tests_from_log"
+    ) as mock_extract_tests:
 
         mock_get_versions.return_value = {"pytest": "7.4.0", "hypothesis": "6.82.0"}
         mock_get_git.return_value = {
@@ -221,7 +231,9 @@ def test_create_bisect_data():
             data = track_packages.create_bisect_data(packages)
 
             assert data["workflow_run_id"] == "12345"
-            assert data["python_version"] == ".".join(str(v) for v in sys.version_info[:3])
+            assert data["python_version"] == ".".join(
+                str(v) for v in sys.version_info[:3]
+            )
             assert data["packages"] == {"pytest": "7.4.0", "hypothesis": "6.82.0"}
             assert data["failed_tests"] == []
             assert data["test_status"] == "passed"
@@ -236,20 +248,18 @@ def test_create_bisect_data_with_captured_versions():
     packages = ["pytest", "numpy"]
 
     # Create a captured versions file
-    with tempfile.NamedTemporaryFile(mode='w', suffix='.json', delete=False) as f:
+    with tempfile.NamedTemporaryFile(mode="w", suffix=".json", delete=False) as f:
         captured_data = {
             "python_version": "3.11.5",
-            "packages": {
-                "pytest": "7.4.2",
-                "numpy": "1.25.1"
-            }
+            "packages": {"pytest": "7.4.2", "numpy": "1.25.1"},
         }
         json.dump(captured_data, f)
         captured_file = f.name
 
     try:
-        with patch("track_packages.get_git_info") as mock_get_git, \
-             patch("track_packages.extract_failed_tests_from_log") as mock_extract_tests:
+        with patch("track_packages.get_git_info") as mock_get_git, patch(
+            "track_packages.extract_failed_tests_from_log"
+        ) as mock_extract_tests:
 
             mock_get_git.return_value = {
                 "commit_hash": "def456",
@@ -261,11 +271,16 @@ def test_create_bisect_data_with_captured_versions():
             mock_extract_tests.return_value = ["test_fail.py::test_example"]
 
             with patch.dict("os.environ", {"GITHUB_RUN_ID": "67890"}):
-                data = track_packages.create_bisect_data(packages, captured_versions_file=captured_file)
+                data = track_packages.create_bisect_data(
+                    packages, captured_versions_file=captured_file
+                )
 
                 assert data["workflow_run_id"] == "67890"
                 assert data["python_version"] == "3.11.5"  # From captured file
-                assert data["packages"] == {"pytest": "7.4.2", "numpy": "1.25.1"}  # From captured file
+                assert data["packages"] == {
+                    "pytest": "7.4.2",
+                    "numpy": "1.25.1",
+                }  # From captured file
                 assert data["failed_tests"] == ["test_fail.py::test_example"]
                 assert data["test_status"] == "failed"
                 assert data["git"]["commit_hash"] == "def456"
@@ -370,7 +385,9 @@ def test_generate_package_diff_link():
     assert link == "https://github.com/numpy/numpy/compare/v1.24.0...v1.25.0"
 
     # Test unknown package
-    link = track_packages.generate_package_diff_link("unknown-package", "1.0.0", "2.0.0")
+    link = track_packages.generate_package_diff_link(
+        "unknown-package", "1.0.0", "2.0.0"
+    )
     assert link is None
 
 
diff --git a/track_packages.py b/track_packages.py
index 7dd7d86..364a3c4 100644
--- a/track_packages.py
+++ b/track_packages.py
@@ -41,7 +41,9 @@
 }
 
 
-def generate_package_diff_link(package_name: str, old_version: str, new_version: str) -> str | None:
+def generate_package_diff_link(
+    package_name: str, old_version: str, new_version: str
+) -> str | None:
     """Generate a GitHub diff link for package version changes."""
     if package_name not in PACKAGE_METADATA:
         return None
@@ -53,7 +55,7 @@ def generate_package_diff_link(package_name: str, old_version: str, new_version:
         # Try different tag formats common in Python packages
         tag_formats = [
             f"v{old_version}...v{new_version}",  # v1.0.0...v1.1.0
-            f"{old_version}...{new_version}",    # 1.0.0...1.1.0
+            f"{old_version}...{new_version}",  # 1.0.0...1.1.0
             f"release-{old_version}...release-{new_version}",  # release-1.0.0...release-1.1.0
         ]
 
@@ -95,14 +97,16 @@ def get_package_version(package_name: str) -> str | None:
     return None
 
 
-def get_current_package_versions(packages: list[str], captured_versions_file: str | None = None) -> dict[str, str | None]:
+def get_current_package_versions(
+    packages: list[str], captured_versions_file: str | None = None
+) -> dict[str, str | None]:
     """Get current versions of specified packages."""
     # First try to read from captured versions file if provided
     if captured_versions_file and os.path.exists(captured_versions_file):
         try:
             with open(captured_versions_file) as f:
                 captured_data = json.load(f)
-                captured_packages = captured_data.get('packages', {})
+                captured_packages = captured_data.get("packages", {})
 
                 if len(packages) == 1 and packages[0].lower() == "all":
                     return captured_packages  # type: ignore[return-value]
@@ -113,7 +117,9 @@ def get_current_package_versions(packages: list[str], captured_versions_file: st
                     versions[package] = captured_packages.get(package)
                 return versions
         except (json.JSONDecodeError, OSError) as e:
-            print(f"Warning: Could not read captured versions file {captured_versions_file}: {e}")
+            print(
+                f"Warning: Could not read captured versions file {captured_versions_file}: {e}"
+            )
             print("Falling back to direct package detection...")
 
     # Fallback to direct detection (original behavior)
@@ -134,9 +140,11 @@ def extract_failed_tests_from_log(log_path: str) -> list[str]:
             for line in f:
                 try:
                     record = json.loads(line)
-                    if (record.get("$report_type") in ["TestReport", "CollectReport"] and
-                        record.get("outcome") == "failed" and
-                        record.get("nodeid")):
+                    if (
+                        record.get("$report_type") in ["TestReport", "CollectReport"]
+                        and record.get("outcome") == "failed"
+                        and record.get("nodeid")
+                    ):
                         failed_tests.append(record["nodeid"])
                 except json.JSONDecodeError:
                     continue
@@ -200,7 +208,12 @@ def get_git_info() -> dict[str, str]:
         }
 
 
-def create_bisect_data(packages: list[str], log_path: str | None = None, captured_versions_file: str | None = None, workflow_run_id: str | None = None) -> dict:
+def create_bisect_data(
+    packages: list[str],
+    log_path: str | None = None,
+    captured_versions_file: str | None = None,
+    workflow_run_id: str | None = None,
+) -> dict:
     """Create bisection data for current environment."""
     if workflow_run_id is None:
         workflow_run_id = os.environ.get("GITHUB_RUN_ID", "unknown")
@@ -218,8 +231,8 @@ def create_bisect_data(packages: list[str], log_path: str | None = None, capture
         try:
             with open(captured_versions_file) as f:
                 captured_data = json.load(f)
-                if 'python_version' in captured_data:
-                    python_version = captured_data['python_version']
+                if "python_version" in captured_data:
+                    python_version = captured_data["python_version"]
         except (json.JSONDecodeError, OSError):
             pass  # Use default python_version
 
@@ -234,9 +247,7 @@ def create_bisect_data(packages: list[str], log_path: str | None = None, capture
     }
 
 
-def store_bisect_data_to_branch(
-    data: dict, branch_name: str
-) -> bool:
+def store_bisect_data_to_branch(data: dict, branch_name: str) -> bool:
     """Store bisection data to a Git branch."""
     try:
         # Create filename based on run ID and timestamp
@@ -244,10 +255,22 @@ def store_bisect_data_to_branch(
 
         # Configure git user if not already set (needed for GitHub Actions)
         try:
-            subprocess.run(["git", "config", "user.name"], check=True, capture_output=True)
+            subprocess.run(
+                ["git", "config", "user.name"], check=True, capture_output=True
+            )
         except subprocess.CalledProcessError:
-            subprocess.run(["git", "config", "user.name", "github-actions[bot]"], check=True)
-            subprocess.run(["git", "config", "user.email", "github-actions[bot]@users.noreply.github.com"], check=True)
+            subprocess.run(
+                ["git", "config", "user.name", "github-actions[bot]"], check=True
+            )
+            subprocess.run(
+                [
+                    "git",
+                    "config",
+                    "user.email",
+                    "github-actions[bot]@users.noreply.github.com",
+                ],
+                check=True,
+            )
 
         # Check if branch exists remotely
         branch_exists_result = subprocess.run(
@@ -263,7 +286,11 @@ def store_bisect_data_to_branch(
             capture_output=True,
             text=True,
         )
-        original_branch = current_branch_result.stdout.strip() if current_branch_result.returncode == 0 else None
+        original_branch = (
+            current_branch_result.stdout.strip()
+            if current_branch_result.returncode == 0
+            else None
+        )
 
         try:
             if branch_exists:
@@ -271,21 +298,31 @@ def store_bisect_data_to_branch(
                 subprocess.run(["git", "fetch", "origin", branch_name], check=True)
 
                 # Check if local branch exists
-                local_branch_exists = subprocess.run(
-                    ["git", "rev-parse", "--verify", branch_name],
-                    capture_output=True,
-                ).returncode == 0
+                local_branch_exists = (
+                    subprocess.run(
+                        ["git", "rev-parse", "--verify", branch_name],
+                        capture_output=True,
+                    ).returncode
+                    == 0
+                )
 
                 if local_branch_exists:
                     subprocess.run(["git", "checkout", branch_name], check=True)
-                    subprocess.run(["git", "reset", "--hard", f"origin/{branch_name}"], check=True)
+                    subprocess.run(
+                        ["git", "reset", "--hard", f"origin/{branch_name}"], check=True
+                    )
                 else:
-                    subprocess.run(["git", "checkout", "-b", branch_name, f"origin/{branch_name}"], check=True)
+                    subprocess.run(
+                        ["git", "checkout", "-b", branch_name, f"origin/{branch_name}"],
+                        check=True,
+                    )
             else:
                 # Create new orphan branch
                 subprocess.run(["git", "checkout", "--orphan", branch_name], check=True)
                 # Remove any existing files from the new branch
-                subprocess.run(["git", "rm", "-rf", "."], capture_output=True, check=False)
+                subprocess.run(
+                    ["git", "rm", "-rf", "."], capture_output=True, check=False
+                )
 
             # Write the data file
             pathlib.Path(filename).write_text(json.dumps(data, indent=2))
@@ -312,12 +349,20 @@ def store_bisect_data_to_branch(
             # Restore original branch if possible
             if original_branch and original_branch != branch_name:
                 try:
-                    subprocess.run(["git", "checkout", original_branch], check=True, capture_output=True)
+                    subprocess.run(
+                        ["git", "checkout", original_branch],
+                        check=True,
+                        capture_output=True,
+                    )
                 except subprocess.CalledProcessError:
                     # If we can't restore, at least try to get back to main/master
                     for fallback_branch in ["main", "master"]:
                         try:
-                            subprocess.run(["git", "checkout", fallback_branch], check=True, capture_output=True)
+                            subprocess.run(
+                                ["git", "checkout", fallback_branch],
+                                check=True,
+                                capture_output=True,
+                            )
                             break
                         except subprocess.CalledProcessError:
                             continue
@@ -325,7 +370,9 @@ def store_bisect_data_to_branch(
         return True
     except subprocess.CalledProcessError as e:
         print(f"Error storing bisect data to branch '{branch_name}': {e}")
-        print(f"Make sure the repository has proper permissions and the branch name '{branch_name}' is valid")
+        print(
+            f"Make sure the repository has proper permissions and the branch name '{branch_name}' is valid"
+        )
         return False
     except Exception as e:
         print(f"Unexpected error storing bisect data: {e}")
@@ -347,7 +394,9 @@ def retrieve_last_successful_run(branch_name: str) -> dict | None:
             return None
 
         # Fetch the branch
-        subprocess.run(["git", "fetch", "origin", f"{branch_name}:{branch_name}"], check=True)
+        subprocess.run(
+            ["git", "fetch", "origin", f"{branch_name}:{branch_name}"], check=True
+        )
 
         # List all JSON files in the branch
         result = subprocess.run(
@@ -357,7 +406,9 @@ def retrieve_last_successful_run(branch_name: str) -> dict | None:
             check=True,
         )
 
-        json_files = [f for f in result.stdout.strip().split('\n') if f.endswith('.json')]
+        json_files = [
+            f for f in result.stdout.strip().split("\n") if f.endswith(".json")
+        ]
 
         if not json_files:
             return None
@@ -381,7 +432,10 @@ def retrieve_last_successful_run(branch_name: str) -> dict | None:
                 # Check if this was a successful run
                 if run_data.get("test_status") == "passed":
                     timestamp = run_data.get("timestamp")
-                    if timestamp and (most_recent_timestamp is None or timestamp > most_recent_timestamp):
+                    if timestamp and (
+                        most_recent_timestamp is None
+                        or timestamp > most_recent_timestamp
+                    ):
                         most_recent_timestamp = timestamp
                         most_recent_success = run_data
 
@@ -394,7 +448,9 @@ def retrieve_last_successful_run(branch_name: str) -> dict | None:
         return None
 
 
-def find_last_successful_run_for_tests(branch_name: str, failed_tests: list[str]) -> dict[str, dict | None]:
+def find_last_successful_run_for_tests(
+    branch_name: str, failed_tests: list[str]
+) -> dict[str, dict | None]:
     """Find the last successful run for each currently failing test."""
     test_last_success: dict[str, dict | None] = {}
 
@@ -407,7 +463,9 @@ def find_last_successful_run_for_tests(branch_name: str, failed_tests: list[str]
             check=True,
         )
 
-        json_files = [f for f in result.stdout.strip().split('\n') if f.endswith('.json')]
+        json_files = [
+            f for f in result.stdout.strip().split("\n") if f.endswith(".json")
+        ]
 
         # Get all run data and sort by timestamp (newest first)
         all_runs = []
@@ -461,9 +519,13 @@ def get_package_changes(current_packages: dict, previous_packages: dict) -> list
             changes.append(f"- {package}: (new) → {current_version}")
         elif current_version != previous_version:
             # Try to generate a GitHub diff link
-            diff_link = generate_package_diff_link(package, previous_version, current_version)
+            diff_link = generate_package_diff_link(
+                package, previous_version, current_version
+            )
             if diff_link:
-                changes.append(f"- [{package}: {previous_version} → {current_version}]({diff_link})")
+                changes.append(
+                    f"- [{package}: {previous_version} → {current_version}]({diff_link})"
+                )
             else:
                 changes.append(f"- {package}: {previous_version} → {current_version}")
 
@@ -496,7 +558,9 @@ def format_bisect_comparison(
             last_success_git = last_success.get("git", {})
 
             # Package changes since last pass
-            package_changes = get_package_changes(current_packages, last_success_packages)
+            package_changes = get_package_changes(
+                current_packages, last_success_packages
+            )
             if package_changes:
                 test_section.append("### Package changes since last pass")
                 test_section.extend(package_changes)
@@ -508,17 +572,27 @@ def format_bisect_comparison(
             if current_git.get("commit_hash") != last_success_git.get("commit_hash"):
                 prev_commit = last_success_git.get("commit_hash_short", "unknown")
                 curr_commit = current_git.get("commit_hash_short", "unknown")
-                prev_msg = last_success_git.get("commit_message", "")[:60] + ("..." if len(last_success_git.get("commit_message", "")) > 60 else "")
-                curr_msg = current_git.get("commit_message", "")[:60] + ("..." if len(current_git.get("commit_message", "")) > 60 else "")
+                prev_msg = last_success_git.get("commit_message", "")[:60] + (
+                    "..."
+                    if len(last_success_git.get("commit_message", "")) > 60
+                    else ""
+                )
+                curr_msg = current_git.get("commit_message", "")[:60] + (
+                    "..." if len(current_git.get("commit_message", "")) > 60 else ""
+                )
 
                 test_section.append("### Code changes since last pass")
                 test_section.append(f"- {prev_commit} ({prev_msg})")
                 test_section.append(f"- → {curr_commit} ({curr_msg})")
-                test_section.append(f"- Last passed in run #{last_success['workflow_run_id']} on {last_success['timestamp']}")
+                test_section.append(
+                    f"- Last passed in run #{last_success['workflow_run_id']} on {last_success['timestamp']}"
+                )
             else:
                 test_section.append("### Code changes since last pass")
                 test_section.append("- No code changes detected")
-                test_section.append(f"- Last passed in run #{last_success['workflow_run_id']} on {last_success['timestamp']}")
+                test_section.append(
+                    f"- Last passed in run #{last_success['workflow_run_id']} on {last_success['timestamp']}"
+                )
         else:
             test_section.append("### Analysis")
             test_section.append("- No recent successful run found for this test")
@@ -576,14 +650,18 @@ def main():
         data = create_bisect_data(packages, args.log_path, args.captured_versions)
         success = store_bisect_data_to_branch(data, args.branch)
         if success:
-            print(f"Successfully stored run data to branch '{args.branch}' (status: {data['test_status']})")
+            print(
+                f"Successfully stored run data to branch '{args.branch}' (status: {data['test_status']})"
+            )
         else:
             print("Failed to store run data", file=sys.stderr)
             sys.exit(1)
 
     if args.generate_comparison:
         # Generate comparison with last successful run
-        current_data = create_bisect_data(packages, args.log_path, args.captured_versions)
+        current_data = create_bisect_data(
+            packages, args.log_path, args.captured_versions
+        )
         previous_data = retrieve_last_successful_run(args.branch)
 
         comparison = format_bisect_comparison(current_data, previous_data, args.branch)

From c957b7faba46373bf3afcca4d998d982f1dfdcff Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Fri, 26 Sep 2025 12:27:57 -0400
Subject: [PATCH 05/15] Switch from black to ruff-format in pre-commit
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Updated pre-commit configuration to use ruff for both linting and formatting:
- Removed black (redundant with ruff-format)
- Added ruff-format for consistent code formatting
- Kept actionlint for GitHub Actions validation
- Fixed formatting issues found by ruff-format

This provides a more streamlined toolchain with ruff handling both
linting and formatting responsibilities.

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 .pre-commit-config.yaml |  6 +----
 capture_versions.py     |  5 ++--
 parse_logs.py           | 12 +++------
 test_track_packages.py  | 39 ++++++++++-----------------
 track_packages.py       | 59 +++++++++++------------------------------
 5 files changed, 35 insertions(+), 86 deletions(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index a1b5684..3f4713d 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -8,16 +8,12 @@ repos:
       - id: trailing-whitespace
       - id: end-of-file-fixer
 
-  - repo: https://github.com/psf/black-pre-commit-mirror
-    rev: 25.1.0
-    hooks:
-      - id: black
-
   - repo: https://github.com/astral-sh/ruff-pre-commit
     rev: v0.12.2
     hooks:
       - id: ruff
         args: ["--fix", "--show-fixes"]
+      - id: ruff-format
 
   - repo: https://github.com/rbubley/mirrors-prettier
     rev: v3.6.2
diff --git a/capture_versions.py b/capture_versions.py
index c281eae..00ad052 100644
--- a/capture_versions.py
+++ b/capture_versions.py
@@ -5,6 +5,7 @@
 This script captures package versions using the specified Python command
 to ensure we get versions from the same environment that ran the tests.
 """
+
 import json
 import os
 import sys
@@ -68,9 +69,7 @@ def main():
         "python_executable": sys.executable,
         "packages": versions,
         "capture_method": (
-            "importlib.metadata"
-            if "importlib.metadata" in sys.modules
-            else "pkg_resources"
+            "importlib.metadata" if "importlib.metadata" in sys.modules else "pkg_resources"
         ),
     }
 
diff --git a/parse_logs.py b/parse_logs.py
index 199d635..4ba3151 100644
--- a/parse_logs.py
+++ b/parse_logs.py
@@ -242,9 +242,7 @@ def format_collection_error(error, **formatter_kwargs):
     ).format(py_version=py_version, name=error.name, traceback=error.repr_)
 
 
-def include_bisection_info(
-    message: str, bisect_file: str = "bisect-comparison.txt"
-) -> str:
+def include_bisection_info(message: str, bisect_file: str = "bisect-comparison.txt") -> str:
     """Include bisection information in the issue message if available."""
     bisect_path = pathlib.Path(bisect_file)
     if bisect_path.exists():
@@ -266,9 +264,7 @@ def include_bisection_info(
     lines = args.filepath.read_text().splitlines()
     parsed_lines = [json.loads(line) for line in lines]
     reports = [
-        parse_record(data)
-        for data in parsed_lines
-        if data["$report_type"] != "WarningMessage"
+        parse_record(data) for data in parsed_lines if data["$report_type"] != "WarningMessage"
     ]
 
     failed = [report for report in reports if report.outcome == "failed"]
@@ -276,9 +272,7 @@ def include_bisection_info(
     if len(preformatted) == 1 and isinstance(preformatted[0], CollectionError):
         message = format_collection_error(preformatted[0], py_version=py_version)
     else:
-        message = compressed_report(
-            preformatted, max_chars=65535, py_version=py_version
-        )
+        message = compressed_report(preformatted, max_chars=65535, py_version=py_version)
 
     # Include bisection information if available
     message = include_bisection_info(message)
diff --git a/test_track_packages.py b/test_track_packages.py
index f97d1d0..1d10a13 100644
--- a/test_track_packages.py
+++ b/test_track_packages.py
@@ -91,9 +91,7 @@ def test_get_current_package_versions_from_captured_file():
         assert versions == expected
 
         # Test "all" packages
-        all_versions = track_packages.get_current_package_versions(
-            ["all"], captured_file
-        )
+        all_versions = track_packages.get_current_package_versions(["all"], captured_file)
         expected_all = {"pytest": "7.4.0", "numpy": "1.24.0", "requests": "2.31.0"}
         assert all_versions == expected_all
     finally:
@@ -132,9 +130,7 @@ def test_get_git_info():
         # Mock the sequence of git commands
         mock_run.side_effect = [
             Mock(stdout="abc123def456789\n", check=True),  # git rev-parse HEAD
-            Mock(
-                stdout="Fix test regression\n", check=True
-            ),  # git log -1 --pretty=format:%s
+            Mock(stdout="Fix test regression\n", check=True),  # git log -1 --pretty=format:%s
             Mock(
                 stdout="John Doe <john@example.com>\n", check=True
             ),  # git log -1 --pretty=format:%an <%ae>
@@ -171,9 +167,7 @@ def test_extract_failed_tests_from_log():
         f.write(
             '{"$report_type": "TestReport", "nodeid": "test_file.py::test_skip", "outcome": "skipped"}\n'
         )
-        f.write(
-            '{"$report_type": "WarningMessage", "outcome": "failed"}\n'
-        )  # Should be ignored
+        f.write('{"$report_type": "WarningMessage", "outcome": "failed"}\n')  # Should be ignored
         log_path = f.name
 
     try:
@@ -211,12 +205,11 @@ def test_create_bisect_data():
     """Test creating bisection data."""
     packages = ["pytest", "hypothesis"]
 
-    with patch(
-        "track_packages.get_current_package_versions"
-    ) as mock_get_versions, patch("track_packages.get_git_info") as mock_get_git, patch(
-        "track_packages.extract_failed_tests_from_log"
-    ) as mock_extract_tests:
-
+    with (
+        patch("track_packages.get_current_package_versions") as mock_get_versions,
+        patch("track_packages.get_git_info") as mock_get_git,
+        patch("track_packages.extract_failed_tests_from_log") as mock_extract_tests,
+    ):
         mock_get_versions.return_value = {"pytest": "7.4.0", "hypothesis": "6.82.0"}
         mock_get_git.return_value = {
             "commit_hash": "abc123",
@@ -231,9 +224,7 @@ def test_create_bisect_data():
             data = track_packages.create_bisect_data(packages)
 
             assert data["workflow_run_id"] == "12345"
-            assert data["python_version"] == ".".join(
-                str(v) for v in sys.version_info[:3]
-            )
+            assert data["python_version"] == ".".join(str(v) for v in sys.version_info[:3])
             assert data["packages"] == {"pytest": "7.4.0", "hypothesis": "6.82.0"}
             assert data["failed_tests"] == []
             assert data["test_status"] == "passed"
@@ -257,10 +248,10 @@ def test_create_bisect_data_with_captured_versions():
         captured_file = f.name
 
     try:
-        with patch("track_packages.get_git_info") as mock_get_git, patch(
-            "track_packages.extract_failed_tests_from_log"
-        ) as mock_extract_tests:
-
+        with (
+            patch("track_packages.get_git_info") as mock_get_git,
+            patch("track_packages.extract_failed_tests_from_log") as mock_extract_tests,
+        ):
             mock_get_git.return_value = {
                 "commit_hash": "def456",
                 "commit_hash_short": "def456gh",
@@ -385,9 +376,7 @@ def test_generate_package_diff_link():
     assert link == "https://github.com/numpy/numpy/compare/v1.24.0...v1.25.0"
 
     # Test unknown package
-    link = track_packages.generate_package_diff_link(
-        "unknown-package", "1.0.0", "2.0.0"
-    )
+    link = track_packages.generate_package_diff_link("unknown-package", "1.0.0", "2.0.0")
     assert link is None
 
 
diff --git a/track_packages.py b/track_packages.py
index 364a3c4..00a61b5 100644
--- a/track_packages.py
+++ b/track_packages.py
@@ -41,9 +41,7 @@
 }
 
 
-def generate_package_diff_link(
-    package_name: str, old_version: str, new_version: str
-) -> str | None:
+def generate_package_diff_link(package_name: str, old_version: str, new_version: str) -> str | None:
     """Generate a GitHub diff link for package version changes."""
     if package_name not in PACKAGE_METADATA:
         return None
@@ -117,9 +115,7 @@ def get_current_package_versions(
                     versions[package] = captured_packages.get(package)
                 return versions
         except (json.JSONDecodeError, OSError) as e:
-            print(
-                f"Warning: Could not read captured versions file {captured_versions_file}: {e}"
-            )
+            print(f"Warning: Could not read captured versions file {captured_versions_file}: {e}")
             print("Falling back to direct package detection...")
 
     # Fallback to direct detection (original behavior)
@@ -255,13 +251,9 @@ def store_bisect_data_to_branch(data: dict, branch_name: str) -> bool:
 
         # Configure git user if not already set (needed for GitHub Actions)
         try:
-            subprocess.run(
-                ["git", "config", "user.name"], check=True, capture_output=True
-            )
+            subprocess.run(["git", "config", "user.name"], check=True, capture_output=True)
         except subprocess.CalledProcessError:
-            subprocess.run(
-                ["git", "config", "user.name", "github-actions[bot]"], check=True
-            )
+            subprocess.run(["git", "config", "user.name", "github-actions[bot]"], check=True)
             subprocess.run(
                 [
                     "git",
@@ -287,9 +279,7 @@ def store_bisect_data_to_branch(data: dict, branch_name: str) -> bool:
             text=True,
         )
         original_branch = (
-            current_branch_result.stdout.strip()
-            if current_branch_result.returncode == 0
-            else None
+            current_branch_result.stdout.strip() if current_branch_result.returncode == 0 else None
         )
 
         try:
@@ -308,9 +298,7 @@ def store_bisect_data_to_branch(data: dict, branch_name: str) -> bool:
 
                 if local_branch_exists:
                     subprocess.run(["git", "checkout", branch_name], check=True)
-                    subprocess.run(
-                        ["git", "reset", "--hard", f"origin/{branch_name}"], check=True
-                    )
+                    subprocess.run(["git", "reset", "--hard", f"origin/{branch_name}"], check=True)
                 else:
                     subprocess.run(
                         ["git", "checkout", "-b", branch_name, f"origin/{branch_name}"],
@@ -320,9 +308,7 @@ def store_bisect_data_to_branch(data: dict, branch_name: str) -> bool:
                 # Create new orphan branch
                 subprocess.run(["git", "checkout", "--orphan", branch_name], check=True)
                 # Remove any existing files from the new branch
-                subprocess.run(
-                    ["git", "rm", "-rf", "."], capture_output=True, check=False
-                )
+                subprocess.run(["git", "rm", "-rf", "."], capture_output=True, check=False)
 
             # Write the data file
             pathlib.Path(filename).write_text(json.dumps(data, indent=2))
@@ -394,9 +380,7 @@ def retrieve_last_successful_run(branch_name: str) -> dict | None:
             return None
 
         # Fetch the branch
-        subprocess.run(
-            ["git", "fetch", "origin", f"{branch_name}:{branch_name}"], check=True
-        )
+        subprocess.run(["git", "fetch", "origin", f"{branch_name}:{branch_name}"], check=True)
 
         # List all JSON files in the branch
         result = subprocess.run(
@@ -406,9 +390,7 @@ def retrieve_last_successful_run(branch_name: str) -> dict | None:
             check=True,
         )
 
-        json_files = [
-            f for f in result.stdout.strip().split("\n") if f.endswith(".json")
-        ]
+        json_files = [f for f in result.stdout.strip().split("\n") if f.endswith(".json")]
 
         if not json_files:
             return None
@@ -433,8 +415,7 @@ def retrieve_last_successful_run(branch_name: str) -> dict | None:
                 if run_data.get("test_status") == "passed":
                     timestamp = run_data.get("timestamp")
                     if timestamp and (
-                        most_recent_timestamp is None
-                        or timestamp > most_recent_timestamp
+                        most_recent_timestamp is None or timestamp > most_recent_timestamp
                     ):
                         most_recent_timestamp = timestamp
                         most_recent_success = run_data
@@ -463,9 +444,7 @@ def find_last_successful_run_for_tests(
             check=True,
         )
 
-        json_files = [
-            f for f in result.stdout.strip().split("\n") if f.endswith(".json")
-        ]
+        json_files = [f for f in result.stdout.strip().split("\n") if f.endswith(".json")]
 
         # Get all run data and sort by timestamp (newest first)
         all_runs = []
@@ -519,9 +498,7 @@ def get_package_changes(current_packages: dict, previous_packages: dict) -> list
             changes.append(f"- {package}: (new) → {current_version}")
         elif current_version != previous_version:
             # Try to generate a GitHub diff link
-            diff_link = generate_package_diff_link(
-                package, previous_version, current_version
-            )
+            diff_link = generate_package_diff_link(package, previous_version, current_version)
             if diff_link:
                 changes.append(
                     f"- [{package}: {previous_version} → {current_version}]({diff_link})"
@@ -558,9 +535,7 @@ def format_bisect_comparison(
             last_success_git = last_success.get("git", {})
 
             # Package changes since last pass
-            package_changes = get_package_changes(
-                current_packages, last_success_packages
-            )
+            package_changes = get_package_changes(current_packages, last_success_packages)
             if package_changes:
                 test_section.append("### Package changes since last pass")
                 test_section.extend(package_changes)
@@ -573,9 +548,7 @@ def format_bisect_comparison(
                 prev_commit = last_success_git.get("commit_hash_short", "unknown")
                 curr_commit = current_git.get("commit_hash_short", "unknown")
                 prev_msg = last_success_git.get("commit_message", "")[:60] + (
-                    "..."
-                    if len(last_success_git.get("commit_message", "")) > 60
-                    else ""
+                    "..." if len(last_success_git.get("commit_message", "")) > 60 else ""
                 )
                 curr_msg = current_git.get("commit_message", "")[:60] + (
                     "..." if len(current_git.get("commit_message", "")) > 60 else ""
@@ -659,9 +632,7 @@ def main():
 
     if args.generate_comparison:
         # Generate comparison with last successful run
-        current_data = create_bisect_data(
-            packages, args.log_path, args.captured_versions
-        )
+        current_data = create_bisect_data(packages, args.log_path, args.captured_versions)
         previous_data = retrieve_last_successful_run(args.branch)
 
         comparison = format_bisect_comparison(current_data, previous_data, args.branch)

From e6a1be6d488402eda5e4e086f1907bae1172d023 Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Fri, 26 Sep 2025 12:32:47 -0400
Subject: [PATCH 06/15] Refactor Git operations to GitHub Actions steps
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Major improvements to bisection implementation:

### Fixed Issues:
- Updated outdated GitHub Actions (checkout@v3 → v4, setup-python@v4 → v5)
- Updated pre-commit hooks to latest versions
- All pre-commit checks now passing (ruff, actionlint, mypy)

### Refactored Git Operations:
- Moved Git branch operations from Python subprocess to GitHub Actions steps
- Created simple_bisect.py for clean data-only operations
- Git operations now transparent in workflow logs
- Easier debugging and better error handling

### Benefits:
- No more complex subprocess Git calls in Python
- Clear separation of concerns (Python = data, Actions = Git)
- Better error visibility in workflow logs
- Follows GitHub Actions best practices

The action now handles Git operations in workflow steps while Python
focuses purely on data processing and analysis.

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 .github/workflows/ci.yaml     |   4 +-
 .pre-commit-config.yaml       |   8 +--
 action.yaml                   |  83 ++++++++++++++++++++-----
 generate_bisect_comparison.py | 109 ++++++++++++++++++++++++++++++++
 simple_bisect.py              | 114 ++++++++++++++++++++++++++++++++++
 store_bisect_data.py          |  45 ++++++++++++++
 6 files changed, 342 insertions(+), 21 deletions(-)
 create mode 100644 generate_bisect_comparison.py
 create mode 100644 simple_bisect.py
 create mode 100644 store_bisect_data.py

diff --git a/.github/workflows/ci.yaml b/.github/workflows/ci.yaml
index fe00a24..6d465eb 100644
--- a/.github/workflows/ci.yaml
+++ b/.github/workflows/ci.yaml
@@ -15,9 +15,9 @@ jobs:
 
     steps:
       - name: clone the repository
-        uses: actions/checkout@v3
+        uses: actions/checkout@v4
       - name: setup python
-        uses: actions/setup-python@v4
+        uses: actions/setup-python@v5
         with:
           python-version: ${{ matrix.python-version }}
       - name: upgrade pip
diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 3f4713d..e0597f4 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -3,13 +3,13 @@ ci:
 
 repos:
   - repo: https://github.com/pre-commit/pre-commit-hooks
-    rev: v5.0.0
+    rev: v6.0.0
     hooks:
       - id: trailing-whitespace
       - id: end-of-file-fixer
 
   - repo: https://github.com/astral-sh/ruff-pre-commit
-    rev: v0.12.2
+    rev: v0.13.2
     hooks:
       - id: ruff
         args: ["--fix", "--show-fixes"]
@@ -30,12 +30,12 @@ repos:
         args: ["--no-schema"]
 
   - repo: https://github.com/rhysd/actionlint
-    rev: v1.7.1
+    rev: v1.7.7
     hooks:
       - id: actionlint
 
   - repo: https://github.com/pre-commit/mirrors-mypy
-    rev: v1.11.2
+    rev: v1.18.2
     hooks:
       - id: mypy
         additional_dependencies: [hypothesis, types-setuptools]
diff --git a/action.yaml b/action.yaml
index 537f957..28810f9 100644
--- a/action.yaml
+++ b/action.yaml
@@ -76,31 +76,84 @@ runs:
         else
           echo "No packages specified for tracking, skipping package capture"
         fi
-    - name: handle package tracking
+    - name: store bisection data
       shell: bash -l {0}
       run: |
         if [ -n "${{ inputs.track-packages }}" ]; then
-          echo "Processing package tracking for: ${{ inputs.track-packages }}"
+          echo "Creating bisection data for: ${{ inputs.track-packages }}"
 
-          # Always store current run data (packages + test results)
-          python $GITHUB_ACTION_PATH/track_packages.py \
+          # Create run data file
+          python $GITHUB_ACTION_PATH/simple_bisect.py \
             --packages "${{ inputs.track-packages }}" \
             --log-path "${{ inputs.log-path }}" \
             --captured-versions captured-package-versions.json \
-            --store-run \
-            --branch "${{ inputs.bisect-branch }}"
-
-          # Generate comparison for bisection analysis
-          python $GITHUB_ACTION_PATH/track_packages.py \
-            --packages "${{ inputs.track-packages }}" \
-            --log-path "${{ inputs.log-path }}" \
-            --captured-versions captured-package-versions.json \
-            --generate-comparison \
             --branch "${{ inputs.bisect-branch }}" \
-            --output-file bisect-comparison.txt
+            --store-run
+        else
+          echo "No packages specified for tracking, skipping bisection"
+        fi
+
+    - name: setup git for bisection branch
+      if: ${{ inputs.track-packages != '' }}
+      shell: bash -l {0}
+      run: |
+        git config user.name "github-actions[bot]"
+        git config user.email "github-actions[bot]@users.noreply.github.com"
+
+    - name: fetch bisection branch
+      if: ${{ inputs.track-packages != '' }}
+      shell: bash -l {0}
+      run: |
+        # Check if branch exists remotely
+        if git ls-remote --heads origin "${{ inputs.bisect-branch }}" | grep -q "${{ inputs.bisect-branch }}"; then
+          echo "Branch ${{ inputs.bisect-branch }} exists, fetching..."
+          git fetch origin "${{ inputs.bisect-branch }}"
+          git checkout -B "${{ inputs.bisect-branch }}" "origin/${{ inputs.bisect-branch }}"
+        else
+          echo "Branch ${{ inputs.bisect-branch }} doesn't exist, creating orphan branch..."
+          git checkout --orphan "${{ inputs.bisect-branch }}"
+          git rm -rf . || true
+        fi
+
+    - name: commit bisection data
+      if: ${{ inputs.track-packages != '' }}
+      shell: bash -l {0}
+      run: |
+        # Add the new run data file
+        git add run_*.json
+
+        # Check if there are changes to commit
+        if git diff --staged --quiet; then
+          echo "No changes to commit"
         else
-          echo "No packages specified for tracking, skipping package tracking"
+          git commit -m "Add bisection data for run ${{ github.run_id }}
+
+          Test status: $(python -c "import json; data=json.load(open([f for f in __import__('pathlib').Path('.').glob('run_*.json')][-1])); print(data['test_status'])")
+          Failed tests: $(python -c "import json; data=json.load(open([f for f in __import__('pathlib').Path('.').glob('run_*.json')][-1])); print(len(data.get('failed_tests', [])))")
+          "
+
+          # Push to remote
+          git push origin "${{ inputs.bisect-branch }}"
         fi
+
+    - name: generate bisection comparison
+      if: ${{ inputs.track-packages != '' }}
+      shell: bash -l {0}
+      run: |
+        # Generate comparison from historical data in the bisection branch
+        python $GITHUB_ACTION_PATH/simple_bisect.py \
+          --packages "${{ inputs.track-packages }}" \
+          --log-path "${{ inputs.log-path }}" \
+          --captured-versions captured-package-versions.json \
+          --branch "${{ inputs.bisect-branch }}" \
+          --generate-comparison
+
+    - name: return to original branch
+      if: ${{ inputs.track-packages != '' && always() }}
+      shell: bash -l {0}
+      run: |
+        # Return to the original branch
+        git checkout -
     - name: produce the issue body
       shell: bash -l {0}
       run: |
diff --git a/generate_bisect_comparison.py b/generate_bisect_comparison.py
new file mode 100644
index 0000000..3116b2e
--- /dev/null
+++ b/generate_bisect_comparison.py
@@ -0,0 +1,109 @@
+#!/usr/bin/env python3
+"""
+Generate bisection comparison using GitHub API instead of Git operations.
+
+This approach uses the GitHub API to fetch previous run data from the branch,
+avoiding complex Git subprocess operations.
+"""
+
+import json
+import os
+import sys
+from pathlib import Path
+
+import track_packages
+
+
+def fetch_previous_data_via_api(repo: str, branch: str, token: str) -> dict | None:
+    """Fetch the most recent successful run data via GitHub API."""
+    import urllib.error
+    import urllib.request
+
+    try:
+        # Get branch contents
+        url = f"https://api.github.com/repos/{repo}/contents?ref={branch}"
+        req = urllib.request.Request(url)
+        req.add_header("Authorization", f"token {token}")
+        req.add_header("Accept", "application/vnd.github.v3+json")
+
+        with urllib.request.urlopen(req) as response:
+            files = json.loads(response.read().decode())
+
+        # Find JSON files
+        json_files = [f for f in files if f["name"].endswith(".json")]
+
+        if not json_files:
+            return None
+
+        # Check each file to find the most recent successful run
+        most_recent_success = None
+        most_recent_timestamp = None
+
+        for file_info in json_files:
+            try:
+                # Fetch file content
+                content_url = file_info["download_url"]
+                with urllib.request.urlopen(content_url) as response:
+                    run_data = json.loads(response.read().decode())
+
+                # Check if this was a successful run
+                if run_data.get("test_status") == "passed":
+                    timestamp = run_data.get("timestamp")
+                    if timestamp and (
+                        most_recent_timestamp is None or timestamp > most_recent_timestamp
+                    ):
+                        most_recent_timestamp = timestamp
+                        most_recent_success = run_data
+
+            except (urllib.error.URLError, json.JSONDecodeError):
+                continue
+
+        return most_recent_success
+
+    except (urllib.error.URLError, json.JSONDecodeError):
+        return None
+
+
+def main():
+    """Generate bisection comparison using GitHub API."""
+    if len(sys.argv) < 4:
+        print(
+            "Usage: generate_bisect_comparison.py <packages> <log_path> <branch> [captured_versions_file]"
+        )
+        sys.exit(1)
+
+    packages_str = sys.argv[1]
+    log_path = sys.argv[2]
+    branch = sys.argv[3]
+    captured_versions_file = sys.argv[4] if len(sys.argv) > 4 else None
+
+    packages = [pkg.strip() for pkg in packages_str.split(",") if pkg.strip()]
+
+    # Create current run data
+    current_data = track_packages.create_bisect_data(packages, log_path, captured_versions_file)
+
+    # Get repository info from environment
+    repo = os.environ.get("GITHUB_REPOSITORY")
+    token = os.environ.get("GITHUB_TOKEN")
+
+    if not repo or not token:
+        print("Error: GITHUB_REPOSITORY and GITHUB_TOKEN environment variables required")
+        sys.exit(1)
+
+    # Fetch previous successful run data
+    previous_data = fetch_previous_data_via_api(repo, branch, token)
+
+    # Generate comparison
+    comparison = track_packages.format_bisect_comparison(current_data, previous_data, branch)
+
+    # Write comparison to file
+    output_path = Path("bisect-comparison.txt")
+    if comparison:
+        output_path.write_text(comparison)
+        print(f"Bisection comparison written to {output_path.absolute()}")
+    else:
+        print("No comparison generated (no failed tests)")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/simple_bisect.py b/simple_bisect.py
new file mode 100644
index 0000000..1636389
--- /dev/null
+++ b/simple_bisect.py
@@ -0,0 +1,114 @@
+#!/usr/bin/env python3
+"""
+Simplified bisection data handling - Git operations done by GitHub Actions.
+
+This script only handles data creation and file operations. All Git branch
+switching, fetching, and pushing is handled by GitHub Actions workflow steps.
+"""
+
+import argparse
+import json
+from pathlib import Path
+
+import track_packages
+
+
+def create_run_data_file(
+    packages: list[str], log_path: str | None, captured_versions_file: str | None
+) -> str:
+    """Create bisection data file for current run."""
+    data = track_packages.create_bisect_data(packages, log_path, captured_versions_file)
+
+    # Create filename based on run ID and timestamp
+    filename = (
+        f"run_{data['workflow_run_id']}_{data['timestamp'].replace(':', '-').replace('Z', '')}.json"
+    )
+
+    # Write the data file
+    Path(filename).write_text(json.dumps(data, indent=2))
+
+    print(f"Created run data file: {filename}")
+    print(f"Test status: {data['test_status']}")
+    print(f"Failed tests: {len(data.get('failed_tests', []))}")
+
+    return filename
+
+
+def find_last_successful_run(directory: str = ".") -> dict | None:
+    """Find the most recent successful run from JSON files in current directory."""
+    json_files = list(Path(directory).glob("run_*.json"))
+
+    if not json_files:
+        return None
+
+    most_recent_success = None
+    most_recent_timestamp = None
+
+    for json_file in json_files:
+        try:
+            run_data = json.loads(json_file.read_text())
+
+            # Check if this was a successful run
+            if run_data.get("test_status") == "passed":
+                timestamp = run_data.get("timestamp")
+                if timestamp and (
+                    most_recent_timestamp is None or timestamp > most_recent_timestamp
+                ):
+                    most_recent_timestamp = timestamp
+                    most_recent_success = run_data
+
+        except (json.JSONDecodeError, OSError):
+            continue
+
+    return most_recent_success
+
+
+def generate_comparison(
+    packages: list[str], log_path: str | None, captured_versions_file: str | None, branch_name: str
+) -> None:
+    """Generate bisection comparison from current run and historical data."""
+    # Create current run data
+    current_data = track_packages.create_bisect_data(packages, log_path, captured_versions_file)
+
+    # Find last successful run from files in current directory (bisect branch)
+    previous_data = find_last_successful_run()
+
+    # Generate comparison
+    comparison = track_packages.format_bisect_comparison(current_data, previous_data, branch_name)
+
+    # Write comparison to file
+    output_path = Path("bisect-comparison.txt")
+    if comparison:
+        output_path.write_text(comparison)
+        print(f"Bisection comparison written to {output_path.absolute()}")
+    else:
+        print("No comparison generated (no failed tests)")
+
+
+def main():
+    """Main entry point."""
+    parser = argparse.ArgumentParser(description="Handle bisection data")
+    parser.add_argument("--packages", required=True, help="Comma-separated list of packages")
+    parser.add_argument("--log-path", help="Path to pytest log file")
+    parser.add_argument("--captured-versions", help="Path to captured versions JSON file")
+    parser.add_argument("--branch", default="bisect-data", help="Branch name for bisection data")
+
+    # Action to perform
+    parser.add_argument("--store-run", action="store_true", help="Store current run data")
+    parser.add_argument(
+        "--generate-comparison", action="store_true", help="Generate bisection comparison"
+    )
+
+    args = parser.parse_args()
+
+    packages = [pkg.strip() for pkg in args.packages.split(",") if pkg.strip()]
+
+    if args.store_run:
+        create_run_data_file(packages, args.log_path, args.captured_versions)
+
+    if args.generate_comparison:
+        generate_comparison(packages, args.log_path, args.captured_versions, args.branch)
+
+
+if __name__ == "__main__":
+    main()
diff --git a/store_bisect_data.py b/store_bisect_data.py
new file mode 100644
index 0000000..4c01e96
--- /dev/null
+++ b/store_bisect_data.py
@@ -0,0 +1,45 @@
+#!/usr/bin/env python3
+"""
+Store bisection data as JSON file - Git operations handled by GitHub Actions.
+
+This simplified approach creates the JSON data file and lets GitHub Actions
+handle all Git operations for better transparency and debugging.
+"""
+
+import json
+import sys
+from pathlib import Path
+
+import track_packages
+
+
+def main():
+    """Create bisection data file for GitHub Actions to commit."""
+    if len(sys.argv) < 3:
+        print("Usage: store_bisect_data.py <packages> <log_path> [captured_versions_file]")
+        sys.exit(1)
+
+    packages_str = sys.argv[1]
+    log_path = sys.argv[2]
+    captured_versions_file = sys.argv[3] if len(sys.argv) > 3 else None
+
+    packages = [pkg.strip() for pkg in packages_str.split(",") if pkg.strip()]
+
+    # Create bisection data
+    data = track_packages.create_bisect_data(packages, log_path, captured_versions_file)
+
+    # Create filename based on run ID and timestamp
+    filename = (
+        f"run_{data['workflow_run_id']}_{data['timestamp'].replace(':', '-').replace('Z', '')}.json"
+    )
+
+    # Write the data file
+    Path(filename).write_text(json.dumps(data, indent=2))
+
+    print(f"Created bisection data file: {filename}")
+    print(f"Test status: {data['test_status']}")
+    print(f"Failed tests: {len(data.get('failed_tests', []))}")
+
+
+if __name__ == "__main__":
+    main()

From a3783d146a6a45422241179c8246409ce724ea0b Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Mon, 29 Sep 2025 12:53:15 -0400
Subject: [PATCH 07/15] Enhance package version tracking with git commit hash
 extraction
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Add git revision extraction from nightly wheels and setuptools_scm packages
- Support both traditional version strings and new format with git info
- Create comprehensive test suite for version extraction functionality
- Make repository installable as Python package with entry points
- Update package change detection to handle git revision changes
- Add support for scientific Python nightly wheel tracking

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 capture_versions.py              |  81 ++++++++-
 pyproject.toml                   |  56 +++++++
 tests/__init__.py                |   1 +
 tests/test_nightly_wheels.py     | 149 +++++++++++++++++
 tests/test_version_extraction.py | 272 +++++++++++++++++++++++++++++++
 track_packages.py                |  77 +++++++--
 6 files changed, 615 insertions(+), 21 deletions(-)
 create mode 100644 tests/__init__.py
 create mode 100644 tests/test_nightly_wheels.py
 create mode 100644 tests/test_version_extraction.py

diff --git a/capture_versions.py b/capture_versions.py
index 00ad052..0880b29 100644
--- a/capture_versions.py
+++ b/capture_versions.py
@@ -11,6 +11,52 @@
 import sys
 
 
+def extract_git_info(package_name: str) -> dict:
+    """Extract git revision and other VCS info from a package."""
+    git_info = {}
+
+    try:
+        import importlib
+
+        # Try to import the package to check for version attributes
+        pkg = importlib.import_module(package_name.replace("-", "_"))
+
+        # Check for git revision in various locations
+        revision_attrs = [
+            "__git_revision__",
+            "version.git_revision",
+            "_version.get_versions",
+            "__version_info__.git_revision",
+        ]
+
+        for attr_path in revision_attrs:
+            try:
+                obj = pkg
+                for part in attr_path.split("."):
+                    obj = getattr(obj, part)
+
+                if callable(obj):
+                    result = obj()
+                    if isinstance(result, dict):
+                        git_info.update(result)
+                    else:
+                        git_info["git_revision"] = str(result)
+                else:
+                    git_info["git_revision"] = str(obj)
+                break
+            except AttributeError:
+                continue
+
+        # Check for full version info
+        if hasattr(pkg, "version") and hasattr(pkg.version, "full_version"):
+            git_info["full_version"] = pkg.version.full_version
+
+    except (ImportError, AttributeError):
+        pass
+
+    return git_info
+
+
 def main():
     """Main function to capture package versions."""
     packages_input = os.environ.get("TRACK_PACKAGES", "").strip()
@@ -28,14 +74,23 @@ def main():
         if len(packages) == 1 and packages[0].lower() == "all":
             print("Capturing all installed packages...")
             for dist in metadata.distributions():
-                versions[dist.name] = dist.version
+                pkg_info = {"version": dist.version, "git_info": extract_git_info(dist.name)}
+                versions[dist.name] = pkg_info
         else:
             print(f"Capturing specific packages: {packages}")
             for pkg in packages:
                 if pkg:
                     try:
-                        versions[pkg] = metadata.version(pkg)
-                        print(f"  {pkg}: {versions[pkg]}")
+                        pkg_version = metadata.version(pkg)
+                        git_info = extract_git_info(pkg)
+
+                        pkg_info = {"version": pkg_version, "git_info": git_info}
+                        versions[pkg] = pkg_info
+
+                        print(f"  {pkg}: {pkg_version}")
+                        if git_info:
+                            for key, value in git_info.items():
+                                print(f"    {key}: {value}")
                     except Exception as e:
                         versions[pkg] = None
                         print(f"  {pkg}: not found ({e})")
@@ -43,19 +98,31 @@ def main():
         print("importlib.metadata not available, trying pkg_resources...")
         # Fallback to pkg_resources
         try:
-            import pkg_resources  # type: ignore[import-untyped]
+            import pkg_resources  # type: ignore[import-not-found]
 
             if len(packages) == 1 and packages[0].lower() == "all":
                 print("Capturing all installed packages...")
                 for dist in pkg_resources.working_set:
-                    versions[dist.project_name] = dist.version
+                    pkg_info = {
+                        "version": dist.version,
+                        "git_info": extract_git_info(dist.project_name),
+                    }
+                    versions[dist.project_name] = pkg_info
             else:
                 print(f"Capturing specific packages: {packages}")
                 for pkg in packages:
                     if pkg:
                         try:
-                            versions[pkg] = pkg_resources.get_distribution(pkg).version
-                            print(f"  {pkg}: {versions[pkg]}")
+                            pkg_version = pkg_resources.get_distribution(pkg).version
+                            git_info = extract_git_info(pkg)
+
+                            pkg_info = {"version": pkg_version, "git_info": git_info}
+                            versions[pkg] = pkg_info
+
+                            print(f"  {pkg}: {pkg_version}")
+                            if git_info:
+                                for key, value in git_info.items():
+                                    print(f"    {key}: {value}")
                         except Exception as e:
                             versions[pkg] = None
                             print(f"  {pkg}: not found ({e})")
diff --git a/pyproject.toml b/pyproject.toml
index b7b41eb..4762556 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,3 +1,59 @@
+[build-system]
+requires = ["setuptools>=45", "wheel"]
+build-backend = "setuptools.build_meta"
+
+[project]
+name = "issue-from-pytest-log-action"
+version = "0.1.0"
+description = "GitHub Action for bisection analysis of pytest failures with package version tracking"
+authors = [{ name = "Ian Hunt-Isaak", email = "ianhuntisaak@gmail.com" }]
+readme = "README.md"
+license = { text = "MIT" }
+requires-python = ">=3.8"
+classifiers = [
+  "Development Status :: 3 - Alpha",
+  "Intended Audience :: Developers",
+  "License :: OSI Approved :: MIT License",
+  "Programming Language :: Python :: 3",
+  "Programming Language :: Python :: 3.8",
+  "Programming Language :: Python :: 3.9",
+  "Programming Language :: Python :: 3.10",
+  "Programming Language :: Python :: 3.11",
+  "Programming Language :: Python :: 3.12",
+  "Programming Language :: Python :: 3.13",
+]
+
+dependencies = [
+  "setuptools; python_version >= '3.12'", # For pkg_resources fallback
+]
+
+[project.optional-dependencies]
+test = [
+  "pytest>=6.0",
+  "pytest-cov",
+]
+dev = [
+  "ruff",
+  "mypy",
+  "pre-commit",
+]
+
+[project.scripts]
+capture-versions = "capture_versions:main"
+simple-bisect = "simple_bisect:main"
+
+[tool.setuptools.packages.find]
+where = ["."]
+include = ["capture_versions*", "simple_bisect*", "track_packages*"]
+
+[tool.setuptools]
+py-modules = ["capture_versions", "simple_bisect", "track_packages"]
+
+[tool.pytest.ini_options]
+testpaths = ["tests"]
+python_files = ["test_*.py"]
+addopts = "-v --tb=short"
+
 [tool.ruff]
 target-version = "py310"
 builtins = ["ellipsis"]
diff --git a/tests/__init__.py b/tests/__init__.py
new file mode 100644
index 0000000..66173ae
--- /dev/null
+++ b/tests/__init__.py
@@ -0,0 +1 @@
+# Test package
diff --git a/tests/test_nightly_wheels.py b/tests/test_nightly_wheels.py
new file mode 100644
index 0000000..c5eee0d
--- /dev/null
+++ b/tests/test_nightly_wheels.py
@@ -0,0 +1,149 @@
+"""Test nightly wheel support with scientific Python packages."""
+
+import json
+import os
+import subprocess
+import sys
+import tempfile
+from unittest.mock import MagicMock, patch
+
+import pytest
+
+from capture_versions import extract_git_info
+
+
+class TestNightlyWheelSupport:
+    """Test support for scientific Python nightly wheels."""
+
+    @pytest.mark.parametrize(
+        "package_name", ["numpy", "pandas", "scipy", "matplotlib", "xarray", "zarr"]
+    )
+    def test_git_info_extraction_for_scientific_packages(self, package_name):
+        """Test git info extraction for common scientific packages."""
+        # This test checks if our extraction works, but doesn't require the packages to be installed
+        with patch("importlib.import_module") as mock_import:
+            # Mock a nightly wheel package with git info
+            mock_pkg = MagicMock()
+            mock_pkg.version.git_revision = "abc123def456789012345678901234567890abcd"
+            mock_pkg.version.full_version = "2.1.0.dev0+123.gabc123d"
+            mock_import.return_value = mock_pkg
+
+            git_info = extract_git_info(package_name)
+
+            assert git_info.get("git_revision") == "abc123def456789012345678901234567890abcd"
+            assert git_info.get("full_version") == "2.1.0.dev0+123.gabc123d"
+
+    def test_nightly_wheel_version_patterns(self):
+        """Test handling of nightly wheel version patterns."""
+        # Common nightly version patterns
+        nightly_patterns = [
+            "2.1.0.dev0",
+            "1.5.0.dev0+123.gabc123d",
+            "3.0.0a1.dev0+456.gdef456a",
+            "2.0.0.post1.dev0+789.g123abc4",
+        ]
+
+        for version in nightly_patterns:
+            # Test that we can parse these version formats
+            package_info = {
+                "version": version,
+                "git_info": {"git_revision": "abc123def456789012345678901234567890abcd"},
+            }
+
+            from track_packages import extract_version_string, format_version_with_git
+
+            extracted_version = extract_version_string(package_info)
+            assert extracted_version == version
+
+            formatted = format_version_with_git(package_info)
+            assert version in formatted
+            assert "(abc123de)" in formatted
+
+    def test_capture_multiple_scientific_packages(self):
+        """Test capturing multiple scientific packages at once."""
+        with tempfile.TemporaryDirectory() as tmpdir:
+            test_env = os.environ.copy()
+            # Test with packages that might be available
+            test_env["TRACK_PACKAGES"] = "pytest,setuptools"
+
+            # Use the script directly from the source directory
+            script_path = os.path.join(
+                os.path.dirname(os.path.dirname(__file__)), "capture_versions.py"
+            )
+            result = subprocess.run(
+                [sys.executable, script_path],
+                env=test_env,
+                cwd=tmpdir,
+                capture_output=True,
+                text=True,
+            )
+
+            assert result.returncode == 0, f"Script failed: {result.stderr}"
+
+            with open(f"{tmpdir}/captured-package-versions.json") as f:
+                data = json.load(f)
+
+            packages = data["packages"]
+            assert len(packages) >= 1  # Should capture at least one package
+
+            # Check that each captured package has the expected structure
+            for pkg_name, pkg_info in packages.items():
+                if pkg_info is not None:  # Skip packages that weren't found
+                    if isinstance(pkg_info, dict):
+                        assert "version" in pkg_info
+                        assert "git_info" in pkg_info
+                    else:
+                        # Old string format is also acceptable
+                        assert isinstance(pkg_info, str)
+
+    def test_scientific_python_nightly_index_handling(self):
+        """Test that we can handle the scientific Python nightly wheel index format."""
+        # This tests the theoretical handling of nightly wheels
+        # In practice, these would come from: https://pypi.anaconda.org/scientific-python-nightly-wheels/simple
+
+        mock_nightly_packages = {
+            "numpy": {
+                "version": "2.1.0.dev0",
+                "git_info": {
+                    "git_revision": "e7a123b2d3eca9897843791dd698c1803d9a39c2",
+                    "full_version": "2.1.0.dev0+nightly",
+                },
+            },
+            "pandas": {
+                "version": "2.2.0.dev0",
+                "git_info": {
+                    "git_revision": "def456c9b8e7f6a5d4c3b2a1f0e9d8c7b6a59483",
+                    "full_version": "2.2.0.dev0+nightly",
+                },
+            },
+        }
+
+        # Test that package changes detect nightly wheel updates properly
+        from track_packages import get_package_changes
+
+        # Simulate updating from one nightly to another
+        previous_nightly = {
+            "numpy": {
+                "version": "2.1.0.dev0",
+                "git_info": {
+                    "git_revision": "old123b2d3eca9897843791dd698c1803d9a39c2",
+                },
+            }
+        }
+
+        changes = get_package_changes(mock_nightly_packages, previous_nightly)
+
+        # Should detect git revision change for numpy
+        numpy_change = [c for c in changes if "numpy" in c][0]
+        assert "git revision changed" in numpy_change
+        assert "2.1.0.dev0 (old123b2)" in numpy_change
+        assert "2.1.0.dev0 (e7a123b2)" in numpy_change
+
+        # Should detect new package pandas
+        pandas_change = [c for c in changes if "pandas" in c][0]
+        assert "(new)" in pandas_change
+        assert "2.2.0.dev0 (def456c9)" in pandas_change
+
+
+if __name__ == "__main__":
+    pytest.main([__file__, "-v"])
diff --git a/tests/test_version_extraction.py b/tests/test_version_extraction.py
new file mode 100644
index 0000000..1df70c9
--- /dev/null
+++ b/tests/test_version_extraction.py
@@ -0,0 +1,272 @@
+"""Test version extraction and git info functionality."""
+
+import json
+import os
+import tempfile
+from unittest.mock import MagicMock, patch
+
+import pytest
+
+from capture_versions import extract_git_info
+from track_packages import (
+    extract_git_revision,
+    extract_version_string,
+    format_version_with_git,
+    get_package_changes,
+)
+
+
+class TestGitInfoExtraction:
+    """Test git info extraction from packages."""
+
+    def test_extract_git_info_with_revision(self):
+        """Test extracting git info from a package that has git_revision."""
+        with patch("importlib.import_module") as mock_import:
+            # Mock package with git revision
+            mock_pkg = MagicMock()
+            mock_pkg.version.git_revision = "abc123def456"
+            mock_pkg.version.full_version = "1.0.0"
+            mock_import.return_value = mock_pkg
+
+            result = extract_git_info("numpy")
+
+            assert result["git_revision"] == "abc123def456"
+            assert result["full_version"] == "1.0.0"
+
+    def test_extract_git_info_with_versioneer(self):
+        """Test extracting git info from a package using versioneer."""
+        with patch("importlib.import_module") as mock_import:
+            # Mock package with versioneer-style version info
+            mock_pkg = MagicMock()
+
+            def mock_get_versions():
+                return {
+                    "version": "1.0.0+123.gabc123d",
+                    "full-revisionid": "abc123def456789",
+                    "dirty": False,
+                    "error": None,
+                }
+
+            mock_pkg._version.get_versions = mock_get_versions
+            # Remove other attributes to ensure we hit the _version.get_versions path
+            delattr(mock_pkg, "version")
+            mock_import.return_value = mock_pkg
+
+            result = extract_git_info("some_package")
+
+            # The function should update the result dict with the returned values
+            assert "version" in result
+            assert "full-revisionid" in result
+
+    def test_extract_git_info_no_version_info(self):
+        """Test extracting git info from a package without version info."""
+        with patch("importlib.import_module") as mock_import:
+            # Mock package without version info
+            mock_pkg = MagicMock()
+            # Remove all version-related attributes
+            del mock_pkg.version
+            del mock_pkg._version
+            del mock_pkg.__git_revision__
+            mock_import.return_value = mock_pkg
+
+            result = extract_git_info("basic_package")
+
+            assert result == {}
+
+    def test_extract_git_info_import_error(self):
+        """Test handling import errors gracefully."""
+        with patch("importlib.import_module", side_effect=ImportError("Package not found")):
+            result = extract_git_info("nonexistent_package")
+
+            assert result == {}
+
+
+class TestVersionStringExtraction:
+    """Test version string extraction from different formats."""
+
+    def test_extract_version_string_from_dict(self):
+        """Test extracting version from new dict format."""
+        package_info = {"version": "2.1.0", "git_info": {"git_revision": "abc123"}}
+        result = extract_version_string(package_info)
+        assert result == "2.1.0"
+
+    def test_extract_version_string_from_string(self):
+        """Test extracting version from old string format."""
+        package_info = "1.5.0"
+        result = extract_version_string(package_info)
+        assert result == "1.5.0"
+
+    def test_extract_version_string_none(self):
+        """Test handling None input."""
+        result = extract_version_string(None)
+        assert result is None
+
+    def test_extract_git_revision_from_dict(self):
+        """Test extracting git revision from dict format."""
+        package_info = {"version": "2.1.0", "git_info": {"git_revision": "abc123def456"}}
+        result = extract_git_revision(package_info)
+        assert result == "abc123def456"
+
+    def test_extract_git_revision_no_git_info(self):
+        """Test extracting git revision when not available."""
+        package_info = {"version": "2.1.0"}
+        result = extract_git_revision(package_info)
+        assert result is None
+
+    def test_extract_git_revision_from_string(self):
+        """Test extracting git revision from old string format."""
+        result = extract_git_revision("1.5.0")
+        assert result is None
+
+
+class TestVersionFormatting:
+    """Test version formatting with git info."""
+
+    def test_format_version_with_git_info(self):
+        """Test formatting version with git revision."""
+        package_info = {
+            "version": "2.1.0",
+            "git_info": {"git_revision": "abc123def456789012345678901234567890abcd"},
+        }
+        result = format_version_with_git(package_info)
+        assert result == "2.1.0 (abc123de)"
+
+    def test_format_version_without_git_info(self):
+        """Test formatting version without git revision."""
+        package_info = {"version": "2.1.0"}
+        result = format_version_with_git(package_info)
+        assert result == "2.1.0"
+
+    def test_format_version_string_format(self):
+        """Test formatting old string format."""
+        result = format_version_with_git("1.5.0")
+        assert result == "1.5.0"
+
+    def test_format_version_none(self):
+        """Test formatting None."""
+        result = format_version_with_git(None)
+        assert result == "(missing)"
+
+
+class TestPackageChanges:
+    """Test package change detection."""
+
+    def test_package_changes_version_only(self):
+        """Test detecting version-only changes."""
+        current = {"numpy": "2.1.0"}
+        previous = {"numpy": "2.0.0"}
+
+        changes = get_package_changes(current, previous)
+
+        assert len(changes) == 1
+        assert "numpy: 2.0.0 → 2.1.0" in changes[0]
+
+    def test_package_changes_with_git_info(self):
+        """Test detecting changes with git revision info."""
+        current = {
+            "numpy": {
+                "version": "2.1.0",
+                "git_info": {"git_revision": "newcommitabc123def456789012345678901234567890"},
+            }
+        }
+        previous = {
+            "numpy": {
+                "version": "2.1.0",
+                "git_info": {"git_revision": "oldcommitdef456789012345678901234567890abc123"},
+            }
+        }
+
+        changes = get_package_changes(current, previous)
+
+        assert len(changes) == 1
+        assert "git revision changed" in changes[0]
+        assert "2.1.0 (oldcommi)" in changes[0]
+        assert "2.1.0 (newcommi)" in changes[0]
+
+    def test_package_changes_mixed_formats(self):
+        """Test detecting changes between old and new formats."""
+        current = {
+            "numpy": {
+                "version": "2.1.0",
+                "git_info": {"git_revision": "abc123def456789012345678901234567890abcd"},
+            }
+        }
+        previous = {"numpy": "2.0.0"}
+
+        changes = get_package_changes(current, previous)
+
+        assert len(changes) == 1
+        assert "numpy: 2.0.0 → 2.1.0 (abc123de)" in changes[0]
+
+    def test_package_changes_new_package(self):
+        """Test detecting new packages."""
+        current = {"pandas": "1.5.0"}
+        previous = {}
+
+        changes = get_package_changes(current, previous)
+
+        assert len(changes) == 1
+        assert "pandas: (new) → 1.5.0" in changes[0]
+
+    def test_package_changes_removed_package(self):
+        """Test detecting removed packages."""
+        current = {}
+        previous = {"pandas": "1.4.0"}
+
+        changes = get_package_changes(current, previous)
+
+        assert len(changes) == 1
+        assert "pandas: 1.4.0 → (removed)" in changes[0]
+
+
+class TestCaptureVersionsIntegration:
+    """Integration tests for the capture_versions script."""
+
+    def test_capture_versions_output_structure(self):
+        """Test that capture_versions produces correct JSON structure."""
+        with tempfile.TemporaryDirectory() as tmpdir:
+            test_env = os.environ.copy()
+            test_env["TRACK_PACKAGES"] = "pytest"  # Use pytest as it should always be available
+
+            import subprocess
+            import sys
+
+            # Use the script directly from the source directory
+            script_path = os.path.join(
+                os.path.dirname(os.path.dirname(__file__)), "capture_versions.py"
+            )
+            result = subprocess.run(
+                [sys.executable, script_path],
+                env=test_env,
+                cwd=tmpdir,
+                capture_output=True,
+                text=True,
+            )
+
+            assert result.returncode == 0, f"Script failed: {result.stderr}"
+
+            # Read the output file
+            with open(os.path.join(tmpdir, "captured-package-versions.json")) as f:
+                data = json.load(f)
+
+            # Check required fields
+            assert "python_version" in data
+            assert "python_executable" in data
+            assert "packages" in data
+            assert "capture_method" in data
+
+            # Check pytest package info
+            assert "pytest" in data["packages"]
+            pytest_info = data["packages"]["pytest"]
+
+            if isinstance(pytest_info, dict):
+                # New format with git_info
+                assert "version" in pytest_info
+                assert "git_info" in pytest_info
+            else:
+                # Old format (string)
+                assert isinstance(pytest_info, str)
+
+
+if __name__ == "__main__":
+    pytest.main([__file__, "-v"])
diff --git a/track_packages.py b/track_packages.py
index 00a61b5..f0c7238 100644
--- a/track_packages.py
+++ b/track_packages.py
@@ -12,6 +12,7 @@
 import subprocess
 import sys
 from datetime import datetime
+from typing import Any
 
 # Package metadata for generating GitHub links
 PACKAGE_METADATA = {
@@ -97,8 +98,8 @@ def get_package_version(package_name: str) -> str | None:
 
 def get_current_package_versions(
     packages: list[str], captured_versions_file: str | None = None
-) -> dict[str, str | None]:
-    """Get current versions of specified packages."""
+) -> dict[str, Any]:
+    """Get current versions of specified packages with git info if available."""
     # First try to read from captured versions file if provided
     if captured_versions_file and os.path.exists(captured_versions_file):
         try:
@@ -118,7 +119,7 @@ def get_current_package_versions(
             print(f"Warning: Could not read captured versions file {captured_versions_file}: {e}")
             print("Falling back to direct package detection...")
 
-    # Fallback to direct detection (original behavior)
+    # Fallback to direct detection (original behavior) - returns simple version strings
     if len(packages) == 1 and packages[0].lower() == "all":
         return get_all_installed_packages()
 
@@ -481,30 +482,78 @@ def find_last_successful_run_for_tests(
     return test_last_success
 
 
+def extract_version_string(package_info: dict | str | None) -> str | None:
+    """Extract version string from package info (handles both old and new formats)."""
+    if package_info is None:
+        return None
+    if isinstance(package_info, str):
+        return package_info
+    if isinstance(package_info, dict):
+        return package_info.get("version")
+    return None
+
+
+def extract_git_revision(package_info: dict | str | None) -> str | None:
+    """Extract git revision from package info if available."""
+    if isinstance(package_info, dict) and "git_info" in package_info:
+        git_info = package_info["git_info"]
+        return git_info.get("git_revision")
+    return None
+
+
+def format_version_with_git(package_info: dict | str | None) -> str:
+    """Format version string with git revision if available."""
+    version = extract_version_string(package_info)
+    if version is None:
+        return "(missing)"
+
+    git_revision = extract_git_revision(package_info)
+    if git_revision:
+        # Show first 8 characters of git hash
+        short_hash = git_revision[:8]
+        return f"{version} ({short_hash})"
+    return version
+
+
 def get_package_changes(current_packages: dict, previous_packages: dict) -> list[str]:
     """Get list of package changes between two runs."""
     changes = []
     all_packages = set(current_packages.keys()) | set(previous_packages.keys())
 
     for package in sorted(all_packages):
-        current_version = current_packages.get(package)
-        previous_version = previous_packages.get(package)
+        current_info = current_packages.get(package)
+        previous_info = previous_packages.get(package)
+
+        current_version = extract_version_string(current_info)
+        previous_version = extract_version_string(previous_info)
 
         if current_version is None and previous_version is None:
             continue
         elif current_version is None:
-            changes.append(f"- {package}: {previous_version} → (removed)")
+            prev_display = format_version_with_git(previous_info)
+            changes.append(f"- {package}: {prev_display} → (removed)")
         elif previous_version is None:
-            changes.append(f"- {package}: (new) → {current_version}")
-        elif current_version != previous_version:
-            # Try to generate a GitHub diff link
-            diff_link = generate_package_diff_link(package, previous_version, current_version)
-            if diff_link:
+            curr_display = format_version_with_git(current_info)
+            changes.append(f"- {package}: (new) → {curr_display}")
+        elif current_version != previous_version or extract_git_revision(
+            current_info
+        ) != extract_git_revision(previous_info):
+            # Version changed OR git revision changed
+            prev_display = format_version_with_git(previous_info)
+            curr_display = format_version_with_git(current_info)
+
+            # Try to generate a GitHub diff link for version changes
+            if current_version != previous_version:
+                diff_link = generate_package_diff_link(package, previous_version, current_version)
+                if diff_link:
+                    changes.append(f"- [{package}: {prev_display} → {curr_display}]({diff_link})")
+                else:
+                    changes.append(f"- {package}: {prev_display} → {curr_display}")
+            else:
+                # Only git revision changed (nightly build case)
                 changes.append(
-                    f"- [{package}: {previous_version} → {current_version}]({diff_link})"
+                    f"- {package}: {prev_display} → {curr_display} (git revision changed)"
                 )
-            else:
-                changes.append(f"- {package}: {previous_version} → {current_version}")
 
     return changes
 

From 52f2f9892cb063e219030fd5a8a88ba5d2313ec3 Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Mon, 29 Sep 2025 15:25:19 -0400
Subject: [PATCH 08/15] Restructure as installable package and enhance git hash
 extraction
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Move Python modules to src/issue_from_pytest_log_action/ package structure
- Update action.yaml to install and use package instead of direct script calls
- Enhance git hash extraction to parse version strings with 'g' prefix patterns
- Add comprehensive tests for version string parsing (30 new test cases)
- Support nightly wheel patterns: +gabc123d, .gabc123d, dev0+123.gabc123d
- Handle packages starting with 'g' correctly (glib, gtk, greenlet, etc.)
- Validate minimum git hash length (7+ characters) and hex-only content
- Backward compatible with existing setuptools_scm and versioneer approaches
- Update .gitignore to exclude build artifacts and temporary files

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 .gitignore                                    |  15 ++
 action.yaml                                   |   7 +-
 pyproject.toml                                |  11 +-
 src/issue_from_pytest_log_action/__init__.py  |  27 ++++
 .../capture_versions.py                       |  44 ++++++
 .../simple_bisect.py                          |   2 +-
 .../track_packages.py                         |   0
 tests/test_nightly_wheels.py                  |  16 +-
 tests/test_version_extraction.py              |  11 +-
 tests/test_version_string_parsing.py          | 143 ++++++++++++++++++
 10 files changed, 250 insertions(+), 26 deletions(-)
 create mode 100644 src/issue_from_pytest_log_action/__init__.py
 rename capture_versions.py => src/issue_from_pytest_log_action/capture_versions.py (77%)
 rename simple_bisect.py => src/issue_from_pytest_log_action/simple_bisect.py (98%)
 rename track_packages.py => src/issue_from_pytest_log_action/track_packages.py (100%)
 create mode 100644 tests/test_version_string_parsing.py

diff --git a/.gitignore b/.gitignore
index 07b6500..ac675e8 100644
--- a/.gitignore
+++ b/.gitignore
@@ -2,3 +2,18 @@
 __pycache__/
 
 /.prettier_cache/
+
+# Python package build artifacts
+*.egg-info/
+dist/
+build/
+*.egg
+
+# UV lock file
+uv.lock
+
+# Temporary test outputs
+captured-package-versions.json
+bisect-comparison.txt
+pytest-logs.txt
+run_*.json
diff --git a/action.yaml b/action.yaml
index 28810f9..ea52001 100644
--- a/action.yaml
+++ b/action.yaml
@@ -66,13 +66,14 @@ runs:
       shell: bash -l {0}
       run: |
         python -m pip install pytest more-itertools
+        python -m pip install $GITHUB_ACTION_PATH
     - name: capture package versions from test environment
       shell: bash -l {0}
       run: |
         if [ -n "${{ inputs.track-packages }}" ]; then
           echo "Capturing package versions using: ${{ inputs.python-command }}"
           export TRACK_PACKAGES="${{ inputs.track-packages }}"
-          ${{ inputs.python-command }} $GITHUB_ACTION_PATH/capture_versions.py
+          ${{ inputs.python-command }} -m issue_from_pytest_log_action.capture_versions
         else
           echo "No packages specified for tracking, skipping package capture"
         fi
@@ -83,7 +84,7 @@ runs:
           echo "Creating bisection data for: ${{ inputs.track-packages }}"
 
           # Create run data file
-          python $GITHUB_ACTION_PATH/simple_bisect.py \
+          python -m issue_from_pytest_log_action.simple_bisect \
             --packages "${{ inputs.track-packages }}" \
             --log-path "${{ inputs.log-path }}" \
             --captured-versions captured-package-versions.json \
@@ -141,7 +142,7 @@ runs:
       shell: bash -l {0}
       run: |
         # Generate comparison from historical data in the bisection branch
-        python $GITHUB_ACTION_PATH/simple_bisect.py \
+        python -m issue_from_pytest_log_action.simple_bisect \
           --packages "${{ inputs.track-packages }}" \
           --log-path "${{ inputs.log-path }}" \
           --captured-versions captured-package-versions.json \
diff --git a/pyproject.toml b/pyproject.toml
index 4762556..379fd04 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -39,15 +39,12 @@ dev = [
 ]
 
 [project.scripts]
-capture-versions = "capture_versions:main"
-simple-bisect = "simple_bisect:main"
+capture-versions = "issue_from_pytest_log_action.capture_versions:main"
+simple-bisect = "issue_from_pytest_log_action.simple_bisect:main"
 
 [tool.setuptools.packages.find]
-where = ["."]
-include = ["capture_versions*", "simple_bisect*", "track_packages*"]
-
-[tool.setuptools]
-py-modules = ["capture_versions", "simple_bisect", "track_packages"]
+where = ["src"]
+include = ["issue_from_pytest_log_action*"]
 
 [tool.pytest.ini_options]
 testpaths = ["tests"]
diff --git a/src/issue_from_pytest_log_action/__init__.py b/src/issue_from_pytest_log_action/__init__.py
new file mode 100644
index 0000000..15b3701
--- /dev/null
+++ b/src/issue_from_pytest_log_action/__init__.py
@@ -0,0 +1,27 @@
+"""Issue from pytest log action package."""
+
+__version__ = "0.1.0"
+
+from issue_from_pytest_log_action.capture_versions import extract_git_info
+from issue_from_pytest_log_action.capture_versions import main as capture_versions_main
+from issue_from_pytest_log_action.simple_bisect import main as simple_bisect_main
+from issue_from_pytest_log_action.track_packages import (
+    create_bisect_data,
+    extract_git_revision,
+    extract_version_string,
+    format_bisect_comparison,
+    format_version_with_git,
+    get_package_changes,
+)
+
+__all__ = [
+    "extract_git_info",
+    "capture_versions_main",
+    "simple_bisect_main",
+    "create_bisect_data",
+    "extract_git_revision",
+    "extract_version_string",
+    "format_bisect_comparison",
+    "format_version_with_git",
+    "get_package_changes",
+]
diff --git a/capture_versions.py b/src/issue_from_pytest_log_action/capture_versions.py
similarity index 77%
rename from capture_versions.py
rename to src/issue_from_pytest_log_action/capture_versions.py
index 0880b29..f82c58e 100644
--- a/capture_versions.py
+++ b/src/issue_from_pytest_log_action/capture_versions.py
@@ -11,6 +11,25 @@
 import sys
 
 
+def extract_git_hash_from_version(version_string: str) -> str | None:
+    """Extract git hash from version string (e.g., '2.1.0.dev0+123.gabc123d')."""
+    import re
+
+    # Common patterns for git hashes in version strings
+    patterns = [
+        r"\.g([a-f0-9]{7,40})",  # .gabc123d or .gabc123def456...
+        r"\+g([a-f0-9]{7,40})",  # +gabc123d
+        r"g([a-f0-9]{7,40})",  # gabc123d (less specific, used last)
+    ]
+
+    for pattern in patterns:
+        match = re.search(pattern, version_string, re.IGNORECASE)
+        if match:
+            return match.group(1)
+
+    return None
+
+
 def extract_git_info(package_name: str) -> dict:
     """Extract git revision and other VCS info from a package."""
     git_info = {}
@@ -51,9 +70,34 @@ def extract_git_info(package_name: str) -> dict:
         if hasattr(pkg, "version") and hasattr(pkg.version, "full_version"):
             git_info["full_version"] = pkg.version.full_version
 
+        # If we haven't found a git revision yet, try to extract from version string
+        if "git_revision" not in git_info and hasattr(pkg, "__version__"):
+            version_hash = extract_git_hash_from_version(pkg.__version__)
+            if version_hash:
+                git_info["git_revision"] = version_hash
+                git_info["source"] = "version_string"
+
     except (ImportError, AttributeError):
         pass
 
+    # Also try to extract from importlib.metadata if available
+    if not git_info:
+        try:
+            import importlib.metadata as metadata
+
+            dist = metadata.distribution(package_name)
+            version = dist.version
+
+            # Check if the version string contains a git hash
+            version_hash = extract_git_hash_from_version(version)
+            if version_hash:
+                git_info["git_revision"] = version_hash
+                git_info["source"] = "metadata_version"
+                git_info["full_version"] = version
+
+        except Exception:
+            pass
+
     return git_info
 
 
diff --git a/simple_bisect.py b/src/issue_from_pytest_log_action/simple_bisect.py
similarity index 98%
rename from simple_bisect.py
rename to src/issue_from_pytest_log_action/simple_bisect.py
index 1636389..a180acc 100644
--- a/simple_bisect.py
+++ b/src/issue_from_pytest_log_action/simple_bisect.py
@@ -10,7 +10,7 @@
 import json
 from pathlib import Path
 
-import track_packages
+from issue_from_pytest_log_action import track_packages
 
 
 def create_run_data_file(
diff --git a/track_packages.py b/src/issue_from_pytest_log_action/track_packages.py
similarity index 100%
rename from track_packages.py
rename to src/issue_from_pytest_log_action/track_packages.py
diff --git a/tests/test_nightly_wheels.py b/tests/test_nightly_wheels.py
index c5eee0d..2630d79 100644
--- a/tests/test_nightly_wheels.py
+++ b/tests/test_nightly_wheels.py
@@ -9,7 +9,7 @@
 
 import pytest
 
-from capture_versions import extract_git_info
+from issue_from_pytest_log_action.capture_versions import extract_git_info
 
 
 class TestNightlyWheelSupport:
@@ -50,7 +50,10 @@ def test_nightly_wheel_version_patterns(self):
                 "git_info": {"git_revision": "abc123def456789012345678901234567890abcd"},
             }
 
-            from track_packages import extract_version_string, format_version_with_git
+            from issue_from_pytest_log_action.track_packages import (
+                extract_version_string,
+                format_version_with_git,
+            )
 
             extracted_version = extract_version_string(package_info)
             assert extracted_version == version
@@ -66,12 +69,9 @@ def test_capture_multiple_scientific_packages(self):
             # Test with packages that might be available
             test_env["TRACK_PACKAGES"] = "pytest,setuptools"
 
-            # Use the script directly from the source directory
-            script_path = os.path.join(
-                os.path.dirname(os.path.dirname(__file__)), "capture_versions.py"
-            )
+            # Use the installed package script
             result = subprocess.run(
-                [sys.executable, script_path],
+                [sys.executable, "-m", "issue_from_pytest_log_action.capture_versions"],
                 env=test_env,
                 cwd=tmpdir,
                 capture_output=True,
@@ -119,7 +119,7 @@ def test_scientific_python_nightly_index_handling(self):
         }
 
         # Test that package changes detect nightly wheel updates properly
-        from track_packages import get_package_changes
+        from issue_from_pytest_log_action.track_packages import get_package_changes
 
         # Simulate updating from one nightly to another
         previous_nightly = {
diff --git a/tests/test_version_extraction.py b/tests/test_version_extraction.py
index 1df70c9..4d305a8 100644
--- a/tests/test_version_extraction.py
+++ b/tests/test_version_extraction.py
@@ -7,8 +7,8 @@
 
 import pytest
 
-from capture_versions import extract_git_info
-from track_packages import (
+from issue_from_pytest_log_action.capture_versions import extract_git_info
+from issue_from_pytest_log_action.track_packages import (
     extract_git_revision,
     extract_version_string,
     format_version_with_git,
@@ -231,12 +231,9 @@ def test_capture_versions_output_structure(self):
             import subprocess
             import sys
 
-            # Use the script directly from the source directory
-            script_path = os.path.join(
-                os.path.dirname(os.path.dirname(__file__)), "capture_versions.py"
-            )
+            # Use the installed package script
             result = subprocess.run(
-                [sys.executable, script_path],
+                [sys.executable, "-m", "issue_from_pytest_log_action.capture_versions"],
                 env=test_env,
                 cwd=tmpdir,
                 capture_output=True,
diff --git a/tests/test_version_string_parsing.py b/tests/test_version_string_parsing.py
new file mode 100644
index 0000000..d881402
--- /dev/null
+++ b/tests/test_version_string_parsing.py
@@ -0,0 +1,143 @@
+"""Test git hash extraction from version strings."""
+
+import pytest
+
+from issue_from_pytest_log_action.capture_versions import extract_git_hash_from_version
+
+
+class TestVersionStringParsing:
+    """Test parsing git hashes from version strings."""
+
+    @pytest.mark.parametrize(
+        "version_string,expected_hash",
+        [
+            # Common nightly wheel patterns
+            ("2.1.0.dev0+123.gabc123d", "abc123d"),
+            ("1.5.0.dev0+456.gdef456a789", "def456a789"),
+            ("3.0.0a1.dev0+789.g123abc4", "123abc4"),
+            ("2.0.0.post1.dev0+100.gabc123def456", "abc123def456"),
+            # setuptools_scm patterns
+            ("1.0.0+123.gabc123d", "abc123d"),
+            ("2.1.0+gabc123def456789", "abc123def456789"),
+            # Direct git hash patterns
+            ("1.0.0.gabc123d", "abc123d"),
+            ("2.1.0.gabc123def456789012345678901234567890", "abc123def456789012345678901234567890"),
+            # Full SHA patterns
+            ("1.0.0+g" + "a" * 40, "a" * 40),
+            ("2.1.0.dev0+123.g" + "b" * 40, "b" * 40),
+            # Case insensitive
+            ("1.0.0+gABC123D", "ABC123D"),
+            ("2.1.0.gDEF456A", "DEF456A"),
+        ],
+    )
+    def test_extract_git_hash_from_version_success(self, version_string, expected_hash):
+        """Test successful extraction of git hashes from version strings."""
+        result = extract_git_hash_from_version(version_string)
+        assert result == expected_hash
+
+    @pytest.mark.parametrize(
+        "version_string",
+        [
+            # No git hash
+            "1.0.0",
+            "2.1.0.dev0",
+            "3.0.0a1",
+            "2.0.0.post1",
+            # Invalid patterns (too short)
+            "1.0.0+g123",
+            "2.1.0.g12345",
+            # Invalid characters
+            "1.0.0+gzzzyyy",
+            "2.1.0.gxywzyx",
+            # Edge cases
+            "",
+            "not.a.version",
+            "1.0.0+123",  # Number without 'g' prefix
+            # Package names that start with 'g' but aren't git hashes
+            "1.0.0+glib2.0",
+            "2.1.0.gstreamer",
+            "1.5.0+gtk3.22",
+        ],
+    )
+    def test_extract_git_hash_from_version_none(self, version_string):
+        """Test cases where no git hash should be extracted."""
+        result = extract_git_hash_from_version(version_string)
+        assert result is None
+
+    def test_extract_git_hash_multiple_patterns(self):
+        """Test that the most specific pattern is matched first."""
+        # This version has multiple potential matches, should pick the first one
+        version = "1.0.0.dev0+123.gabc123d.more.gdef456"
+        result = extract_git_hash_from_version(version)
+        assert result == "abc123d"  # Should match the first .g pattern
+
+    def test_extract_git_hash_minimum_length(self):
+        """Test minimum hash length requirement."""
+        # 7 characters should work (git short hash)
+        assert extract_git_hash_from_version("1.0.0+gabcdef1") == "abcdef1"
+
+        # 6 characters should not work
+        assert extract_git_hash_from_version("1.0.0+gabcdef") is None
+
+    def test_extract_git_hash_real_examples(self):
+        """Test with real-world examples from nightly wheels."""
+        real_examples = [
+            # numpy nightly examples
+            ("2.1.0.dev0+nightly.g1a2b3c4", "1a2b3c4"),
+            # pandas nightly examples
+            ("2.2.0.dev0+123.gabc123d", "abc123d"),
+            # setuptools_scm examples
+            ("1.0.0+dirty", None),  # dirty build, no git hash
+            ("1.0.0+123.dirty", None),  # dirty build, no git hash
+        ]
+
+        for version, expected in real_examples:
+            result = extract_git_hash_from_version(version)
+            assert result == expected, f"Failed for {version}: got {result}, expected {expected}"
+
+    def test_packages_starting_with_g(self):
+        """Test that packages starting with 'g' don't interfere with git hash extraction."""
+        from unittest.mock import MagicMock, patch
+
+        from issue_from_pytest_log_action.capture_versions import extract_git_info
+
+        # Test packages that start with 'g'
+        g_packages = ["glib", "gtk", "gstreamer", "gdal", "greenlet"]
+
+        for package_name in g_packages:
+            with patch("importlib.import_module") as mock_import:
+                # Mock a package with a version that contains a git hash
+                mock_pkg = MagicMock()
+                mock_pkg.__version__ = "2.1.0.dev0+123.gabc123d"
+
+                # Remove version module attributes to force fallback to __version__
+                delattr(mock_pkg, "version")
+                delattr(mock_pkg, "_version")
+                delattr(mock_pkg, "__git_revision__")
+
+                mock_import.return_value = mock_pkg
+
+                git_info = extract_git_info(package_name)
+
+                # Should successfully extract git hash despite package name starting with 'g'
+                assert git_info.get("git_revision") == "abc123d"
+                assert git_info.get("source") == "version_string"
+
+        # Test edge case: package named 'g' itself
+        with patch("importlib.import_module") as mock_import:
+            mock_pkg = MagicMock()
+            mock_pkg.__version__ = "1.0.0+gabc123def"
+
+            # Remove version module attributes to force fallback to __version__
+            delattr(mock_pkg, "version")
+            delattr(mock_pkg, "_version")
+            delattr(mock_pkg, "__git_revision__")
+
+            mock_import.return_value = mock_pkg
+
+            git_info = extract_git_info("g")
+            assert git_info.get("git_revision") == "abc123def"
+
+
+if __name__ == "__main__":
+    pytest.main([__file__, "-v"])

From 526a647b80de21623b25d138b5239d670d09c092 Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Mon, 29 Sep 2025 15:26:10 -0400
Subject: [PATCH 09/15] more gitignore

---
 .gitignore | 216 +++++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 216 insertions(+)

diff --git a/.gitignore b/.gitignore
index ac675e8..d71f55c 100644
--- a/.gitignore
+++ b/.gitignore
@@ -17,3 +17,219 @@ captured-package-versions.json
 bisect-comparison.txt
 pytest-logs.txt
 run_*.json
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[codz]
+*$py.class
+
+# C extensions
+*.so
+
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+share/python-wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+
+# PyInstaller
+#   Usually these files are written by a python script from a template
+#   before PyInstaller builds the exe, so as to inject date/other infos into it.
+*.manifest
+*.spec
+
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.nox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+*.py.cover
+.hypothesis/
+.pytest_cache/
+cover/
+
+# Translations
+*.mo
+*.pot
+
+# Django stuff:
+*.log
+local_settings.py
+db.sqlite3
+db.sqlite3-journal
+
+# Flask stuff:
+instance/
+.webassets-cache
+
+# Scrapy stuff:
+.scrapy
+
+# Sphinx documentation
+docs/_build/
+
+# PyBuilder
+.pybuilder/
+target/
+
+# Jupyter Notebook
+.ipynb_checkpoints
+
+# IPython
+profile_default/
+ipython_config.py
+
+# pyenv
+#   For a library or package, you might want to ignore these files since the code is
+#   intended to run in multiple environments; otherwise, check them in:
+# .python-version
+
+# pipenv
+#   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
+#   However, in case of collaboration, if having platform-specific dependencies or dependencies
+#   having no cross-platform support, pipenv may install dependencies that don't work, or not
+#   install all needed dependencies.
+# Pipfile.lock
+
+# UV
+#   Similar to Pipfile.lock, it is generally recommended to include uv.lock in version control.
+#   This is especially recommended for binary packages to ensure reproducibility, and is more
+#   commonly ignored for libraries.
+# uv.lock
+
+# poetry
+#   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
+#   This is especially recommended for binary packages to ensure reproducibility, and is more
+#   commonly ignored for libraries.
+#   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
+# poetry.lock
+# poetry.toml
+
+# pdm
+#   Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
+#   pdm recommends including project-wide configuration in pdm.toml, but excluding .pdm-python.
+#   https://pdm-project.org/en/latest/usage/project/#working-with-version-control
+# pdm.lock
+# pdm.toml
+.pdm-python
+.pdm-build/
+
+# pixi
+#   Similar to Pipfile.lock, it is generally recommended to include pixi.lock in version control.
+# pixi.lock
+#   Pixi creates a virtual environment in the .pixi directory, just like venv module creates one
+#   in the .venv directory. It is recommended not to include this directory in version control.
+.pixi
+
+# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
+__pypackages__/
+
+# Celery stuff
+celerybeat-schedule
+celerybeat.pid
+
+# Redis
+*.rdb
+*.aof
+*.pid
+
+# RabbitMQ
+mnesia/
+rabbitmq/
+rabbitmq-data/
+
+# ActiveMQ
+activemq-data/
+
+# SageMath parsed files
+*.sage.py
+
+# Environments
+.env
+.envrc
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+
+# Spyder project settings
+.spyderproject
+.spyproject
+
+# Rope project settings
+.ropeproject
+
+# mkdocs documentation
+/site
+
+# mypy
+.mypy_cache/
+.dmypy.json
+dmypy.json
+
+# Pyre type checker
+.pyre/
+
+# pytype static type analyzer
+.pytype/
+
+# Cython debug symbols
+cython_debug/
+
+# PyCharm
+#   JetBrains specific template is maintained in a separate JetBrains.gitignore that can
+#   be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
+#   and can be added to the global gitignore or merged into this file.  For a more nuclear
+#   option (not recommended) you can uncomment the following to ignore the entire idea folder.
+# .idea/
+
+# Abstra
+#   Abstra is an AI-powered process automation framework.
+#   Ignore directories containing user credentials, local state, and settings.
+#   Learn more at https://abstra.io/docs
+.abstra/
+
+# Visual Studio Code
+#   Visual Studio Code specific template is maintained in a separate VisualStudioCode.gitignore
+#   that can be found at https://github.com/github/gitignore/blob/main/Global/VisualStudioCode.gitignore
+#   and can be added to the global gitignore or merged into this file. However, if you prefer,
+#   you could uncomment the following to ignore the entire vscode folder
+# .vscode/
+
+# Ruff stuff:
+.ruff_cache/
+
+# PyPI configuration file
+.pypirc
+
+# Marimo
+marimo/_static/
+marimo/_lsp/
+__marimo__/
+
+# Streamlit
+.streamlit/secrets.toml

From 927378411573e9b83ece6ae861064cb0b39326da Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Mon, 29 Sep 2025 15:29:49 -0400
Subject: [PATCH 10/15] Add GitHub Actions testing workflow and project
 documentation
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Add comprehensive test workflow with Python 3.9-3.13 matrix testing
- Include lint job with ruff and mypy validation
- Add action integration test to verify CLI functionality works
- Create CLAUDE.md with project overview, goals, and structure
- Test both package installation and git info extraction capabilities

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 .github/workflows/test.yml | 98 ++++++++++++++++++++++++++++++++++++++
 CLAUDE.md                  | 69 +++++++++++++++++++++++++++
 2 files changed, 167 insertions(+)
 create mode 100644 .github/workflows/test.yml
 create mode 100644 CLAUDE.md

diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
new file mode 100644
index 0000000..fb81fb8
--- /dev/null
+++ b/.github/workflows/test.yml
@@ -0,0 +1,98 @@
+name: Test
+
+on:
+  push:
+    branches: [main, bisect]
+  pull_request:
+    branches: [main]
+
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    strategy:
+      matrix:
+        python-version: ["3.9", "3.10", "3.11", "3.12", "3.13"]
+
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Install uv
+        uses: astral-sh/setup-uv@v4
+        with:
+          enable-cache: true
+
+      - name: Set up Python ${{ matrix.python-version }}
+        run: uv python install ${{ matrix.python-version }}
+
+      - name: Install dependencies
+        run: |
+          uv sync --extra test
+
+      - name: Run tests with pytest
+        run: |
+          uv run pytest tests/ -v --tb=short
+
+      - name: Test CLI commands
+        run: |
+          # Test the CLI entry points work
+          uv run capture-versions --help || echo "capture-versions help not available (expected)"
+
+          # Test module execution
+          TRACK_PACKAGES="pytest" uv run python -m issue_from_pytest_log_action.capture_versions
+
+          # Test simple-bisect help
+          uv run python -m issue_from_pytest_log_action.simple_bisect --help
+
+  lint:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Install uv
+        uses: astral-sh/setup-uv@v4
+        with:
+          enable-cache: true
+
+      - name: Set up Python
+        run: uv python install 3.12
+
+      - name: Install dependencies
+        run: |
+          uv sync --extra dev
+
+      - name: Run ruff
+        run: |
+          uv run ruff check .
+
+      - name: Run mypy
+        run: |
+          uv run mypy src/issue_from_pytest_log_action/
+
+  test-action:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Test Action Installation
+        run: |
+          python -m pip install .
+
+      - name: Test capture-versions CLI
+        run: |
+          TRACK_PACKAGES="pytest,setuptools" python -m issue_from_pytest_log_action.capture_versions
+          cat captured-package-versions.json
+
+      - name: Verify git info extraction
+        run: |
+          python -c "
+          import json
+          with open('captured-package-versions.json') as f:
+              data = json.load(f)
+
+          packages = data['packages']
+          for pkg_name, pkg_info in packages.items():
+              if isinstance(pkg_info, dict) and 'git_info' in pkg_info:
+                  print(f'{pkg_name}: {pkg_info[\"version\"]} with git_info: {pkg_info[\"git_info\"]}')
+              else:
+                  print(f'{pkg_name}: {pkg_info} (simple format)')
+          "
diff --git a/CLAUDE.md b/CLAUDE.md
new file mode 100644
index 0000000..23005c6
--- /dev/null
+++ b/CLAUDE.md
@@ -0,0 +1,69 @@
+# Issue from pytest log action
+
+## Project Goals
+
+This GitHub Action creates GitHub issues from pytest failures and provides **bisection analysis** to identify which package version changes may have caused test failures. It's particularly useful for monitoring upstream dependency changes in CI pipelines.
+
+## Key Features
+
+- **Automated Issue Creation**: Parses pytest-reportlog files and creates/updates GitHub issues for failures
+- **Package Version Tracking**: Captures package versions from the test environment using any Python package manager (pip, conda, uv, poetry, pixi)
+- **Bisection Analysis**: Compares current failures with historical successful runs to identify version changes
+- **Git Commit Hash Extraction**: Extracts commit hashes from nightly wheels and setuptools_scm packages for precise tracking
+- **Per-Test Analysis**: Shows when each failing test last passed and what changed since then
+
+## Project Structure
+
+```
+├── src/issue_from_pytest_log_action/     # Main Python package
+│   ├── capture_versions.py               # Extract package versions & git info
+│   ├── simple_bisect.py                  # Bisection data handling
+│   └── track_packages.py                 # Package comparison & GitHub links
+├── tests/                                 # Comprehensive test suite (59 tests)
+│   ├── test_version_extraction.py        # Core version handling tests
+│   ├── test_nightly_wheels.py           # Scientific Python nightly wheel support
+│   └── test_version_string_parsing.py   # Git hash extraction from version strings
+├── action.yaml                          # GitHub Action definition
+├── parse_logs.py                        # Legacy pytest log parser
+└── .github/workflows/test.yml           # CI testing workflow
+```
+
+## How It Works
+
+1. **Test Environment Analysis**: Captures package versions from the same environment that ran tests
+2. **Git Operations**: Uses GitHub Actions steps to manage the bisection data branch
+3. **Historical Comparison**: Compares current failures with the last successful run
+4. **Rich Reporting**: Generates markdown reports with GitHub diff links and git commit info
+
+## Nightly Wheel Support
+
+The action can extract git commit hashes from various version string patterns:
+
+- `2.1.0.dev0+123.gabc123d` → `abc123d`
+- `1.5.0+gdef456a789` → `def456a789`
+- Scientific Python nightly wheels from `pypi.anaconda.org/scientific-python-nightly-wheels/simple`
+
+## Usage Example
+
+```yaml
+- name: Create issue from pytest failures
+  uses: ianhi/issue-from-pytest-log-action@bisect
+  with:
+    log-path: pytest-log.jsonl
+    track-packages: "numpy,pandas,xarray"
+    python-command: "uv run python"
+```
+
+## Development
+
+- **Package Management**: Uses `uv` for dependency management
+- **Testing**: Run `uv run pytest tests/` (59 comprehensive tests)
+- **Linting**: Pre-commit hooks with ruff, mypy, and actionlint
+- **Installation**: `pip install .` installs the `issue-from-pytest-log-action` package
+
+## Key Files to Understand
+
+- `action.yaml`: The main GitHub Action interface
+- `src/issue_from_pytest_log_action/capture_versions.py`: Version extraction logic
+- `src/issue_from_pytest_log_action/track_packages.py`: Bisection comparison logic
+- `tests/`: Comprehensive test coverage for all functionality

From c94b492aaca3c1220d576455ea42cc60c8f5b4a6 Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Mon, 29 Sep 2025 15:36:23 -0400
Subject: [PATCH 11/15] Fix GitHub diff link generation and py_version
 parameter
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Completely rewrote generate_package_diff_link() to properly handle different tag formats
- Added PACKAGE_METADATA with tag formats for common packages (numpy, pandas, etc.)
- Support commit-to-commit comparison when git hashes are available
- Clean version strings for proper tag matching
- Handle special cases like SQLAlchemy's rel_ prefix and hypothesis naming
- Fix py_version undefined error in format_collection_error()

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 .markdownlint.yaml                            |   5 +
 action.yaml                                   |   2 +-
 .../parse_logs.py                             | 290 ++++++++++++++++++
 .../track_packages.py                         | 157 +++++++---
 4 files changed, 416 insertions(+), 38 deletions(-)
 create mode 100644 .markdownlint.yaml
 create mode 100644 src/issue_from_pytest_log_action/parse_logs.py

diff --git a/.markdownlint.yaml b/.markdownlint.yaml
new file mode 100644
index 0000000..faa444e
--- /dev/null
+++ b/.markdownlint.yaml
@@ -0,0 +1,5 @@
+# Markdownlint configuration
+# See: https://github.com/DavidAnson/markdownlint/blob/main/schema/.markdownlint.yaml
+
+# Disable line length rule
+MD013: false
diff --git a/action.yaml b/action.yaml
index ea52001..007366a 100644
--- a/action.yaml
+++ b/action.yaml
@@ -158,7 +158,7 @@ runs:
     - name: produce the issue body
       shell: bash -l {0}
       run: |
-        python $GITHUB_ACTION_PATH/parse_logs.py ${{ inputs.log-path }}
+        python -m issue_from_pytest_log_action.parse_logs ${{ inputs.log-path }}
     - name: create the issue
       uses: actions/github-script@v7
       with:
diff --git a/src/issue_from_pytest_log_action/parse_logs.py b/src/issue_from_pytest_log_action/parse_logs.py
new file mode 100644
index 0000000..156901f
--- /dev/null
+++ b/src/issue_from_pytest_log_action/parse_logs.py
@@ -0,0 +1,290 @@
+# type: ignore
+import argparse
+import functools
+import json
+import pathlib
+import re
+import sys
+import textwrap
+from dataclasses import dataclass
+
+import more_itertools
+from pytest import CollectReport, TestReport
+
+test_collection_stage = "test collection session"
+fe_bytes = "[\x40-\x5f]"
+parameter_bytes = "[\x30-\x3f]"
+intermediate_bytes = "[\x20-\x2f]"
+final_bytes = "[\x40-\x7e]"
+ansi_fe_escape_re = re.compile(
+    rf"""
+    \x1B # ESC
+    (?:
+      \[  # CSI
+      {parameter_bytes}*
+      {intermediate_bytes}*
+      {final_bytes}
+      | {fe_bytes}  # single-byte Fe
+    )
+    """,
+    re.VERBOSE,
+)
+
+
+def strip_ansi(msg):
+    """strip all ansi escape sequences"""
+    return ansi_fe_escape_re.sub("", msg)
+
+
+@dataclass
+class SessionStart:
+    pytest_version: str
+    outcome: str = "status"
+
+    @classmethod
+    def _from_json(cls, json):
+        json_ = json.copy()
+        json_.pop("$report_type")
+        return cls(**json_)
+
+
+@dataclass
+class SessionFinish:
+    exitstatus: str
+    outcome: str = "status"
+
+    @classmethod
+    def _from_json(cls, json):
+        json_ = json.copy()
+        json_.pop("$report_type")
+        return cls(**json_)
+
+
+@dataclass
+class PreformattedReport:
+    filepath: str
+    name: str
+    variant: str | None
+    message: str
+
+    def __post_init__(self):
+        self.message = strip_ansi(self.message)
+
+
+@dataclass
+class CollectionError:
+    name: str
+    repr_: str
+
+
+def parse_record(record):
+    report_types = {
+        "TestReport": TestReport,
+        "CollectReport": CollectReport,
+        "SessionStart": SessionStart,
+        "SessionFinish": SessionFinish,
+    }
+    cls = report_types.get(record["$report_type"])
+    if cls is None:
+        raise ValueError(f"unknown report type: {record['$report_type']}")
+
+    return cls._from_json(record)
+
+
+nodeid_re = re.compile(r"(?P<filepath>.+?)::(?P<name>.+?)(?:\[(?P<variant>.+)\])?")
+
+
+def parse_nodeid(nodeid):
+    match = nodeid_re.fullmatch(nodeid)
+    if match is None:
+        raise ValueError(f"unknown test id: {nodeid}")
+
+    return match.groupdict()
+
+
+@functools.singledispatch
+def preformat_report(report):
+    parsed = parse_nodeid(report.nodeid)
+    return PreformattedReport(message=str(report), **parsed)
+
+
+@preformat_report.register
+def _(report: TestReport):
+    parsed = parse_nodeid(report.nodeid)
+    if isinstance(report.longrepr, str):
+        message = report.longrepr
+    else:
+        message = report.longrepr.reprcrash.message
+    return PreformattedReport(message=message, **parsed)
+
+
+@preformat_report.register
+def _(report: CollectReport):
+    if report.nodeid == "":
+        return CollectionError(name=test_collection_stage, repr_=str(report.longrepr))
+
+    if "::" not in report.nodeid:
+        parsed = {
+            "filepath": report.nodeid,
+            "name": None,
+            "variant": None,
+        }
+    else:
+        parsed = parse_nodeid(report.nodeid)
+
+    if isinstance(report.longrepr, str):
+        message = report.longrepr.split("\n")[-1].removeprefix("E").lstrip()
+    else:
+        message = report.longrepr.reprcrash.message
+    return PreformattedReport(message=message, **parsed)
+
+
+def format_summary(report):
+    if report.variant is not None:
+        return f"{report.filepath}::{report.name}[{report.variant}]: {report.message}"
+    elif report.name is not None:
+        return f"{report.filepath}::{report.name}: {report.message}"
+    else:
+        return f"{report.filepath}: {report.message}"
+
+
+def format_report(summaries, py_version):
+    template = textwrap.dedent(
+        """\
+        <details><summary>Python {py_version} Test Summary</summary>
+
+        ```
+        {summaries}
+        ```
+
+        </details>
+        """
+    )
+    # can't use f-strings because that would format *before* the dedenting
+    message = template.format(summaries="\n".join(summaries), py_version=py_version)
+    return message
+
+
+def merge_variants(reports, max_chars, **formatter_kwargs):
+    def format_variant_group(name, group):
+        filepath, test_name, message = name
+
+        n_variants = len(group)
+        if n_variants != 1:
+            return f"{filepath}::{test_name}[{n_variants} failing variants]: {message}"
+        elif n_variants == 1 and group[0].variant is not None:
+            report = more_itertools.one(group)
+            return f"{filepath}::{test_name}[{report.variant}]: {message}"
+        else:
+            return f"{filepath}::{test_name}: {message}"
+
+    bucket = more_itertools.bucket(reports, lambda r: (r.filepath, r.name, r.message))
+
+    summaries = [format_variant_group(name, list(bucket[name])) for name in bucket]
+    formatted = format_report(summaries, **formatter_kwargs)
+
+    return formatted
+
+
+def truncate(reports, max_chars, **formatter_kwargs):
+    fractions = [0.95, 0.75, 0.5, 0.25, 0.1, 0.01]
+
+    n_reports = len(reports)
+    for fraction in fractions:
+        n_selected = int(n_reports * fraction)
+        selected_reports = reports[: int(n_reports * fraction)]
+        report_messages = [format_summary(report) for report in selected_reports]
+        summary = report_messages + [f"+ {n_reports - n_selected} failing tests"]
+        formatted = format_report(summary, **formatter_kwargs)
+        if len(formatted) <= max_chars:
+            return formatted
+
+    return None
+
+
+def summarize(reports, **formatter_kwargs):
+    summary = [f"{len(reports)} failing tests"]
+    return format_report(summary, **formatter_kwargs)
+
+
+def compressed_report(reports, max_chars, **formatter_kwargs):
+    strategies = [
+        merge_variants,
+        # merge_test_files,
+        # merge_tests,
+        truncate,
+    ]
+    summaries = [format_summary(report) for report in reports]
+    formatted = format_report(summaries, **formatter_kwargs)
+    if len(formatted) <= max_chars:
+        return formatted
+
+    for strategy in strategies:
+        formatted = strategy(reports, max_chars=max_chars, **formatter_kwargs)
+        if formatted is not None and len(formatted) <= max_chars:
+            return formatted
+
+    return summarize(reports, **formatter_kwargs)
+
+
+def format_collection_error(error, py_version, **formatter_kwargs):
+    return textwrap.dedent(
+        """\
+        <details><summary>Python {py_version} Test Summary</summary>
+
+        {name} failed:
+        ```
+        {traceback}
+        ```
+
+        </details>
+        """
+    ).format(py_version=py_version, name=error.name, traceback=error.repr_)
+
+
+def include_bisection_info(message: str, bisect_file: str = "bisect-comparison.txt") -> str:
+    """Include bisection information in the issue message if available."""
+    bisect_path = pathlib.Path(bisect_file)
+    if bisect_path.exists():
+        bisect_content = bisect_path.read_text().strip()
+        if bisect_content:
+            return f"{bisect_content}\n{message}"
+    return message
+
+
+def main(argv=None):
+    """Main entry point for parse_logs module."""
+    if argv is None:
+        argv = sys.argv[1:]
+
+    parser = argparse.ArgumentParser()
+    parser.add_argument("filepath", type=pathlib.Path)
+    args = parser.parse_args(argv)
+
+    py_version = ".".join(str(_) for _ in sys.version_info[:2])
+
+    print("Parsing logs ...")
+
+    lines = args.filepath.read_text().splitlines()
+    parsed_lines = [json.loads(line) for line in lines]
+    reports = [
+        parse_record(data) for data in parsed_lines if data["$report_type"] != "WarningMessage"
+    ]
+
+    failed = [report for report in reports if report.outcome == "failed"]
+    preformatted = [preformat_report(report) for report in failed]
+    if len(preformatted) == 1 and isinstance(preformatted[0], CollectionError):
+        message = format_collection_error(preformatted[0], py_version=py_version)
+    else:
+        message = compressed_report(preformatted, max_chars=65535, py_version=py_version)
+
+    # Include bisection information if available
+    message = include_bisection_info(message)
+
+    output_file = pathlib.Path("pytest-logs.txt")
+    print(f"Writing output file to: {output_file.absolute()}")
+    output_file.write_text(message)
+
+
+if __name__ == "__main__":
+    main()
diff --git a/src/issue_from_pytest_log_action/track_packages.py b/src/issue_from_pytest_log_action/track_packages.py
index f0c7238..5111712 100644
--- a/src/issue_from_pytest_log_action/track_packages.py
+++ b/src/issue_from_pytest_log_action/track_packages.py
@@ -16,52 +16,110 @@
 
 # Package metadata for generating GitHub links
 PACKAGE_METADATA = {
-    "numpy": {"github": "numpy/numpy", "type": "releases"},
-    "pandas": {"github": "pandas-dev/pandas", "type": "releases"},
-    "matplotlib": {"github": "matplotlib/matplotlib", "type": "releases"},
-    "scipy": {"github": "scipy/scipy", "type": "releases"},
-    "scikit-learn": {"github": "scikit-learn/scikit-learn", "type": "releases"},
-    "requests": {"github": "psf/requests", "type": "releases"},
-    "django": {"github": "django/django", "type": "releases"},
-    "flask": {"github": "pallets/flask", "type": "releases"},
-    "pytest": {"github": "pytest-dev/pytest", "type": "releases"},
-    "hypothesis": {"github": "HypothesisWorks/hypothesis", "type": "releases"},
-    "xarray": {"github": "pydata/xarray", "type": "releases"},
-    "dask": {"github": "dask/dask", "type": "releases"},
-    "jupyterlab": {"github": "jupyterlab/jupyterlab", "type": "releases"},
-    "notebook": {"github": "jupyter/notebook", "type": "releases"},
-    "ipython": {"github": "ipython/ipython", "type": "releases"},
-    "tensorflow": {"github": "tensorflow/tensorflow", "type": "releases"},
-    "torch": {"github": "pytorch/pytorch", "type": "releases"},
-    "fastapi": {"github": "tiangolo/fastapi", "type": "releases"},
-    "pydantic": {"github": "pydantic/pydantic", "type": "releases"},
-    "sqlalchemy": {"github": "sqlalchemy/sqlalchemy", "type": "releases"},
-    "black": {"github": "psf/black", "type": "releases"},
-    "mypy": {"github": "python/mypy", "type": "releases"},
-    "ruff": {"github": "astral-sh/ruff", "type": "releases"},
+    "numpy": {"github": "numpy/numpy", "tag_format": "v{version}"},
+    "pandas": {"github": "pandas-dev/pandas", "tag_format": "v{version}"},
+    "matplotlib": {"github": "matplotlib/matplotlib", "tag_format": "v{version}"},
+    "scipy": {"github": "scipy/scipy", "tag_format": "v{version}"},
+    "scikit-learn": {"github": "scikit-learn/scikit-learn", "tag_format": "{version}"},
+    "requests": {"github": "psf/requests", "tag_format": "v{version}"},
+    "django": {"github": "django/django", "tag_format": "{version}"},
+    "flask": {"github": "pallets/flask", "tag_format": "{version}"},
+    "pytest": {"github": "pytest-dev/pytest", "tag_format": "{version}"},
+    "hypothesis": {
+        "github": "HypothesisWorks/hypothesis",
+        "tag_format": "hypothesis-python-{version}",
+    },
+    "xarray": {"github": "pydata/xarray", "tag_format": "v{version}"},
+    "dask": {"github": "dask/dask", "tag_format": "{version}"},
+    "jupyterlab": {"github": "jupyterlab/jupyterlab", "tag_format": "v{version}"},
+    "notebook": {"github": "jupyter/notebook", "tag_format": "v{version}"},
+    "ipython": {"github": "ipython/ipython", "tag_format": "{version}"},
+    "tensorflow": {"github": "tensorflow/tensorflow", "tag_format": "v{version}"},
+    "torch": {"github": "pytorch/pytorch", "tag_format": "v{version}"},
+    "fastapi": {"github": "tiangolo/fastapi", "tag_format": "{version}"},
+    "pydantic": {"github": "pydantic/pydantic", "tag_format": "v{version}"},
+    "sqlalchemy": {"github": "sqlalchemy/sqlalchemy", "tag_format": "rel_{version}"},
+    "black": {"github": "psf/black", "tag_format": "{version}"},
+    "mypy": {"github": "python/mypy", "tag_format": "v{version}"},
+    "ruff": {"github": "astral-sh/ruff", "tag_format": "{version}"},
 }
 
 
-def generate_package_diff_link(package_name: str, old_version: str, new_version: str) -> str | None:
+def is_git_commit(version_or_commit: str) -> bool:
+    """Check if a string looks like a git commit hash."""
+    import re
+
+    # Git commit hash: 7-40 hex characters
+    return bool(re.match(r"^[a-f0-9]{7,40}$", version_or_commit, re.IGNORECASE))
+
+
+def clean_version_for_tag(version: str) -> str:
+    """Clean version string for tag lookup (remove dev/nightly suffixes)."""
+    import re
+
+    # Remove common development suffixes
+    patterns = [
+        r"\.dev\d*.*",  # .dev0, .dev123+gabc
+        r"\+.*",  # +gabc123d, +123.gabc123d
+        r"\.post\d*.*",  # .post1
+        r"[ab]\d*.*",  # a1, b2, alpha1, beta2
+        r"rc\d*.*",  # rc1, rc2
+        r"\.dirty.*",  # .dirty
+    ]
+
+    clean_version = version
+    for pattern in patterns:
+        clean_version = re.sub(pattern, "", clean_version)
+
+    return clean_version
+
+
+def generate_package_diff_link(
+    package_name: str,
+    old_version: str,
+    new_version: str,
+    old_git_info: dict | None = None,
+    new_git_info: dict | None = None,
+) -> str | None:
     """Generate a GitHub diff link for package version changes."""
     if package_name not in PACKAGE_METADATA:
         return None
 
     metadata = PACKAGE_METADATA[package_name]
     repo = metadata["github"]
+    tag_format = metadata["tag_format"]
 
-    if metadata["type"] == "releases":
-        # Try different tag formats common in Python packages
-        tag_formats = [
-            f"v{old_version}...v{new_version}",  # v1.0.0...v1.1.0
-            f"{old_version}...{new_version}",  # 1.0.0...1.1.0
-            f"release-{old_version}...release-{new_version}",  # release-1.0.0...release-1.1.0
-        ]
+    # Extract git commits if available
+    old_commit = None
+    new_commit = None
 
-        # Return the first format (most common)
-        return f"https://github.com/{repo}/compare/{tag_formats[0]}"
+    if old_git_info and "git_revision" in old_git_info:
+        old_commit = old_git_info["git_revision"]
+    if new_git_info and "git_revision" in new_git_info:
+        new_commit = new_git_info["git_revision"]
 
-    return None
+    # Case 1: Both have git commits - use commit comparison
+    if old_commit and new_commit and old_commit != new_commit:
+        return f"https://github.com/{repo}/compare/{old_commit}...{new_commit}"
+
+    # Case 2: Only one has git commit - can't create meaningful diff
+    if (old_commit and not new_commit) or (new_commit and not old_commit):
+        return None
+
+    # Case 3: No git commits, use version tags
+    # Clean versions for tag comparison
+    clean_old = clean_version_for_tag(old_version)
+    clean_new = clean_version_for_tag(new_version)
+
+    # Skip if versions are the same after cleaning (likely just different git commits)
+    if clean_old == clean_new:
+        return None
+
+    # Generate tags using the package's tag format
+    old_tag = tag_format.format(version=clean_old)
+    new_tag = tag_format.format(version=clean_new)
+
+    return f"https://github.com/{repo}/compare/{old_tag}...{new_tag}"
 
 
 def get_all_installed_packages() -> dict[str, str | None]:
@@ -493,6 +551,13 @@ def extract_version_string(package_info: dict | str | None) -> str | None:
     return None
 
 
+def extract_git_revision_dict(package_info: dict | str | None) -> dict | None:
+    """Extract git info dict from package info if available."""
+    if isinstance(package_info, dict) and "git_info" in package_info:
+        return package_info["git_info"]
+    return None
+
+
 def extract_git_revision(package_info: dict | str | None) -> str | None:
     """Extract git revision from package info if available."""
     if isinstance(package_info, dict) and "git_info" in package_info:
@@ -544,16 +609,34 @@ def get_package_changes(current_packages: dict, previous_packages: dict) -> list
 
             # Try to generate a GitHub diff link for version changes
             if current_version != previous_version:
-                diff_link = generate_package_diff_link(package, previous_version, current_version)
+                # Extract git info for link generation
+                old_git_info = extract_git_revision_dict(previous_info)
+                new_git_info = extract_git_revision_dict(current_info)
+
+                diff_link = generate_package_diff_link(
+                    package, previous_version, current_version, old_git_info, new_git_info
+                )
                 if diff_link:
                     changes.append(f"- [{package}: {prev_display} → {curr_display}]({diff_link})")
                 else:
                     changes.append(f"- {package}: {prev_display} → {curr_display}")
             else:
                 # Only git revision changed (nightly build case)
-                changes.append(
-                    f"- {package}: {prev_display} → {curr_display} (git revision changed)"
+                # Try to generate commit comparison link
+                old_git_info = extract_git_revision_dict(previous_info)
+                new_git_info = extract_git_revision_dict(current_info)
+
+                diff_link = generate_package_diff_link(
+                    package, previous_version, current_version, old_git_info, new_git_info
                 )
+                if diff_link:
+                    changes.append(
+                        f"- [{package}: {prev_display} → {curr_display} (git revision changed)]({diff_link})"
+                    )
+                else:
+                    changes.append(
+                        f"- {package}: {prev_display} → {curr_display} (git revision changed)"
+                    )
 
     return changes
 

From 98427d30c8d6942b2e27db82d109b96cadc5e2ad Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Mon, 29 Sep 2025 15:38:00 -0400
Subject: [PATCH 12/15] Clean up repository structure by removing old files
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Remove old Python files that were moved into the package structure:
- generate_bisect_comparison.py → src/issue_from_pytest_log_action/simple_bisect.py
- parse_logs.py → src/issue_from_pytest_log_action/parse_logs.py
- store_bisect_data.py → merged into simple_bisect.py
- test_parse_log.py → tests/test_parse_logs.py
- test_track_packages.py → tests/test_version_string_parsing.py

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 generate_bisect_comparison.py | 109 ---------
 parse_logs.py                 | 282 ------------------------
 store_bisect_data.py          |  45 ----
 test_parse_log.py             |  93 --------
 test_track_packages.py        | 400 ----------------------------------
 5 files changed, 929 deletions(-)
 delete mode 100644 generate_bisect_comparison.py
 delete mode 100644 parse_logs.py
 delete mode 100644 store_bisect_data.py
 delete mode 100644 test_parse_log.py
 delete mode 100644 test_track_packages.py

diff --git a/generate_bisect_comparison.py b/generate_bisect_comparison.py
deleted file mode 100644
index 3116b2e..0000000
--- a/generate_bisect_comparison.py
+++ /dev/null
@@ -1,109 +0,0 @@
-#!/usr/bin/env python3
-"""
-Generate bisection comparison using GitHub API instead of Git operations.
-
-This approach uses the GitHub API to fetch previous run data from the branch,
-avoiding complex Git subprocess operations.
-"""
-
-import json
-import os
-import sys
-from pathlib import Path
-
-import track_packages
-
-
-def fetch_previous_data_via_api(repo: str, branch: str, token: str) -> dict | None:
-    """Fetch the most recent successful run data via GitHub API."""
-    import urllib.error
-    import urllib.request
-
-    try:
-        # Get branch contents
-        url = f"https://api.github.com/repos/{repo}/contents?ref={branch}"
-        req = urllib.request.Request(url)
-        req.add_header("Authorization", f"token {token}")
-        req.add_header("Accept", "application/vnd.github.v3+json")
-
-        with urllib.request.urlopen(req) as response:
-            files = json.loads(response.read().decode())
-
-        # Find JSON files
-        json_files = [f for f in files if f["name"].endswith(".json")]
-
-        if not json_files:
-            return None
-
-        # Check each file to find the most recent successful run
-        most_recent_success = None
-        most_recent_timestamp = None
-
-        for file_info in json_files:
-            try:
-                # Fetch file content
-                content_url = file_info["download_url"]
-                with urllib.request.urlopen(content_url) as response:
-                    run_data = json.loads(response.read().decode())
-
-                # Check if this was a successful run
-                if run_data.get("test_status") == "passed":
-                    timestamp = run_data.get("timestamp")
-                    if timestamp and (
-                        most_recent_timestamp is None or timestamp > most_recent_timestamp
-                    ):
-                        most_recent_timestamp = timestamp
-                        most_recent_success = run_data
-
-            except (urllib.error.URLError, json.JSONDecodeError):
-                continue
-
-        return most_recent_success
-
-    except (urllib.error.URLError, json.JSONDecodeError):
-        return None
-
-
-def main():
-    """Generate bisection comparison using GitHub API."""
-    if len(sys.argv) < 4:
-        print(
-            "Usage: generate_bisect_comparison.py <packages> <log_path> <branch> [captured_versions_file]"
-        )
-        sys.exit(1)
-
-    packages_str = sys.argv[1]
-    log_path = sys.argv[2]
-    branch = sys.argv[3]
-    captured_versions_file = sys.argv[4] if len(sys.argv) > 4 else None
-
-    packages = [pkg.strip() for pkg in packages_str.split(",") if pkg.strip()]
-
-    # Create current run data
-    current_data = track_packages.create_bisect_data(packages, log_path, captured_versions_file)
-
-    # Get repository info from environment
-    repo = os.environ.get("GITHUB_REPOSITORY")
-    token = os.environ.get("GITHUB_TOKEN")
-
-    if not repo or not token:
-        print("Error: GITHUB_REPOSITORY and GITHUB_TOKEN environment variables required")
-        sys.exit(1)
-
-    # Fetch previous successful run data
-    previous_data = fetch_previous_data_via_api(repo, branch, token)
-
-    # Generate comparison
-    comparison = track_packages.format_bisect_comparison(current_data, previous_data, branch)
-
-    # Write comparison to file
-    output_path = Path("bisect-comparison.txt")
-    if comparison:
-        output_path.write_text(comparison)
-        print(f"Bisection comparison written to {output_path.absolute()}")
-    else:
-        print("No comparison generated (no failed tests)")
-
-
-if __name__ == "__main__":
-    main()
diff --git a/parse_logs.py b/parse_logs.py
deleted file mode 100644
index 4ba3151..0000000
--- a/parse_logs.py
+++ /dev/null
@@ -1,282 +0,0 @@
-# type: ignore
-import argparse
-import functools
-import json
-import pathlib
-import re
-import sys
-import textwrap
-from dataclasses import dataclass
-
-import more_itertools
-from pytest import CollectReport, TestReport
-
-test_collection_stage = "test collection session"
-fe_bytes = "[\x40-\x5f]"
-parameter_bytes = "[\x30-\x3f]"
-intermediate_bytes = "[\x20-\x2f]"
-final_bytes = "[\x40-\x7e]"
-ansi_fe_escape_re = re.compile(
-    rf"""
-    \x1B # ESC
-    (?:
-      \[  # CSI
-      {parameter_bytes}*
-      {intermediate_bytes}*
-      {final_bytes}
-      | {fe_bytes}  # single-byte Fe
-    )
-    """,
-    re.VERBOSE,
-)
-
-
-def strip_ansi(msg):
-    """strip all ansi escape sequences"""
-    return ansi_fe_escape_re.sub("", msg)
-
-
-@dataclass
-class SessionStart:
-    pytest_version: str
-    outcome: str = "status"
-
-    @classmethod
-    def _from_json(cls, json):
-        json_ = json.copy()
-        json_.pop("$report_type")
-        return cls(**json_)
-
-
-@dataclass
-class SessionFinish:
-    exitstatus: str
-    outcome: str = "status"
-
-    @classmethod
-    def _from_json(cls, json):
-        json_ = json.copy()
-        json_.pop("$report_type")
-        return cls(**json_)
-
-
-@dataclass
-class PreformattedReport:
-    filepath: str
-    name: str
-    variant: str | None
-    message: str
-
-    def __post_init__(self):
-        self.message = strip_ansi(self.message)
-
-
-@dataclass
-class CollectionError:
-    name: str
-    repr_: str
-
-
-def parse_record(record):
-    report_types = {
-        "TestReport": TestReport,
-        "CollectReport": CollectReport,
-        "SessionStart": SessionStart,
-        "SessionFinish": SessionFinish,
-    }
-    cls = report_types.get(record["$report_type"])
-    if cls is None:
-        raise ValueError(f"unknown report type: {record['$report_type']}")
-
-    return cls._from_json(record)
-
-
-nodeid_re = re.compile(r"(?P<filepath>.+?)::(?P<name>.+?)(?:\[(?P<variant>.+)\])?")
-
-
-def parse_nodeid(nodeid):
-    match = nodeid_re.fullmatch(nodeid)
-    if match is None:
-        raise ValueError(f"unknown test id: {nodeid}")
-
-    return match.groupdict()
-
-
-@functools.singledispatch
-def preformat_report(report):
-    parsed = parse_nodeid(report.nodeid)
-    return PreformattedReport(message=str(report), **parsed)
-
-
-@preformat_report.register
-def _(report: TestReport):
-    parsed = parse_nodeid(report.nodeid)
-    if isinstance(report.longrepr, str):
-        message = report.longrepr
-    else:
-        message = report.longrepr.reprcrash.message
-    return PreformattedReport(message=message, **parsed)
-
-
-@preformat_report.register
-def _(report: CollectReport):
-    if report.nodeid == "":
-        return CollectionError(name=test_collection_stage, repr_=str(report.longrepr))
-
-    if "::" not in report.nodeid:
-        parsed = {
-            "filepath": report.nodeid,
-            "name": None,
-            "variant": None,
-        }
-    else:
-        parsed = parse_nodeid(report.nodeid)
-
-    if isinstance(report.longrepr, str):
-        message = report.longrepr.split("\n")[-1].removeprefix("E").lstrip()
-    else:
-        message = report.longrepr.reprcrash.message
-    return PreformattedReport(message=message, **parsed)
-
-
-def format_summary(report):
-    if report.variant is not None:
-        return f"{report.filepath}::{report.name}[{report.variant}]: {report.message}"
-    elif report.name is not None:
-        return f"{report.filepath}::{report.name}: {report.message}"
-    else:
-        return f"{report.filepath}: {report.message}"
-
-
-def format_report(summaries, py_version):
-    template = textwrap.dedent(
-        """\
-        <details><summary>Python {py_version} Test Summary</summary>
-
-        ```
-        {summaries}
-        ```
-
-        </details>
-        """
-    )
-    # can't use f-strings because that would format *before* the dedenting
-    message = template.format(summaries="\n".join(summaries), py_version=py_version)
-    return message
-
-
-def merge_variants(reports, max_chars, **formatter_kwargs):
-    def format_variant_group(name, group):
-        filepath, test_name, message = name
-
-        n_variants = len(group)
-        if n_variants != 1:
-            return f"{filepath}::{test_name}[{n_variants} failing variants]: {message}"
-        elif n_variants == 1 and group[0].variant is not None:
-            report = more_itertools.one(group)
-            return f"{filepath}::{test_name}[{report.variant}]: {message}"
-        else:
-            return f"{filepath}::{test_name}: {message}"
-
-    bucket = more_itertools.bucket(reports, lambda r: (r.filepath, r.name, r.message))
-
-    summaries = [format_variant_group(name, list(bucket[name])) for name in bucket]
-    formatted = format_report(summaries, **formatter_kwargs)
-
-    return formatted
-
-
-def truncate(reports, max_chars, **formatter_kwargs):
-    fractions = [0.95, 0.75, 0.5, 0.25, 0.1, 0.01]
-
-    n_reports = len(reports)
-    for fraction in fractions:
-        n_selected = int(n_reports * fraction)
-        selected_reports = reports[: int(n_reports * fraction)]
-        report_messages = [format_summary(report) for report in selected_reports]
-        summary = report_messages + [f"+ {n_reports - n_selected} failing tests"]
-        formatted = format_report(summary, **formatter_kwargs)
-        if len(formatted) <= max_chars:
-            return formatted
-
-    return None
-
-
-def summarize(reports, **formatter_kwargs):
-    summary = [f"{len(reports)} failing tests"]
-    return format_report(summary, **formatter_kwargs)
-
-
-def compressed_report(reports, max_chars, **formatter_kwargs):
-    strategies = [
-        merge_variants,
-        # merge_test_files,
-        # merge_tests,
-        truncate,
-    ]
-    summaries = [format_summary(report) for report in reports]
-    formatted = format_report(summaries, **formatter_kwargs)
-    if len(formatted) <= max_chars:
-        return formatted
-
-    for strategy in strategies:
-        formatted = strategy(reports, max_chars=max_chars, **formatter_kwargs)
-        if formatted is not None and len(formatted) <= max_chars:
-            return formatted
-
-    return summarize(reports, **formatter_kwargs)
-
-
-def format_collection_error(error, **formatter_kwargs):
-    return textwrap.dedent(
-        """\
-        <details><summary>Python {py_version} Test Summary</summary>
-
-        {name} failed:
-        ```
-        {traceback}
-        ```
-
-        </details>
-        """
-    ).format(py_version=py_version, name=error.name, traceback=error.repr_)
-
-
-def include_bisection_info(message: str, bisect_file: str = "bisect-comparison.txt") -> str:
-    """Include bisection information in the issue message if available."""
-    bisect_path = pathlib.Path(bisect_file)
-    if bisect_path.exists():
-        bisect_content = bisect_path.read_text().strip()
-        if bisect_content:
-            return f"{bisect_content}\n{message}"
-    return message
-
-
-if __name__ == "__main__":
-    parser = argparse.ArgumentParser()
-    parser.add_argument("filepath", type=pathlib.Path)
-    args = parser.parse_args()
-
-    py_version = ".".join(str(_) for _ in sys.version_info[:2])
-
-    print("Parsing logs ...")
-
-    lines = args.filepath.read_text().splitlines()
-    parsed_lines = [json.loads(line) for line in lines]
-    reports = [
-        parse_record(data) for data in parsed_lines if data["$report_type"] != "WarningMessage"
-    ]
-
-    failed = [report for report in reports if report.outcome == "failed"]
-    preformatted = [preformat_report(report) for report in failed]
-    if len(preformatted) == 1 and isinstance(preformatted[0], CollectionError):
-        message = format_collection_error(preformatted[0], py_version=py_version)
-    else:
-        message = compressed_report(preformatted, max_chars=65535, py_version=py_version)
-
-    # Include bisection information if available
-    message = include_bisection_info(message)
-
-    output_file = pathlib.Path("pytest-logs.txt")
-    print(f"Writing output file to: {output_file.absolute()}")
-    output_file.write_text(message)
diff --git a/store_bisect_data.py b/store_bisect_data.py
deleted file mode 100644
index 4c01e96..0000000
--- a/store_bisect_data.py
+++ /dev/null
@@ -1,45 +0,0 @@
-#!/usr/bin/env python3
-"""
-Store bisection data as JSON file - Git operations handled by GitHub Actions.
-
-This simplified approach creates the JSON data file and lets GitHub Actions
-handle all Git operations for better transparency and debugging.
-"""
-
-import json
-import sys
-from pathlib import Path
-
-import track_packages
-
-
-def main():
-    """Create bisection data file for GitHub Actions to commit."""
-    if len(sys.argv) < 3:
-        print("Usage: store_bisect_data.py <packages> <log_path> [captured_versions_file]")
-        sys.exit(1)
-
-    packages_str = sys.argv[1]
-    log_path = sys.argv[2]
-    captured_versions_file = sys.argv[3] if len(sys.argv) > 3 else None
-
-    packages = [pkg.strip() for pkg in packages_str.split(",") if pkg.strip()]
-
-    # Create bisection data
-    data = track_packages.create_bisect_data(packages, log_path, captured_versions_file)
-
-    # Create filename based on run ID and timestamp
-    filename = (
-        f"run_{data['workflow_run_id']}_{data['timestamp'].replace(':', '-').replace('Z', '')}.json"
-    )
-
-    # Write the data file
-    Path(filename).write_text(json.dumps(data, indent=2))
-
-    print(f"Created bisection data file: {filename}")
-    print(f"Test status: {data['test_status']}")
-    print(f"Failed tests: {len(data.get('failed_tests', []))}")
-
-
-if __name__ == "__main__":
-    main()
diff --git a/test_parse_log.py b/test_parse_log.py
deleted file mode 100644
index 9407b3f..0000000
--- a/test_parse_log.py
+++ /dev/null
@@ -1,93 +0,0 @@
-import re
-import sys
-
-import hypothesis.strategies as st
-from hypothesis import given, note
-
-import parse_logs
-
-directory_re = r"(\w|-)+"
-path_re = re.compile(rf"/?({directory_re}(/{directory_re})*/)?test_[A-Za-z0-9_]+\.py")
-filepaths = st.from_regex(path_re, fullmatch=True)
-
-group_re = r"Test[A-Za-z0-9_]+"
-name_re = re.compile(rf"({group_re}::)*test_[A-Za-z0-9_]+")
-names = st.from_regex(name_re, fullmatch=True)
-
-variants = st.from_regex(re.compile(r"(\w+-)*\w+"), fullmatch=True)
-
-messages = st.text()
-
-
-def ansi_csi_escapes():
-    parameter_bytes = st.lists(st.characters(min_codepoint=0x30, max_codepoint=0x3F))
-    intermediate_bytes = st.lists(st.characters(min_codepoint=0x20, max_codepoint=0x2F))
-    final_bytes = st.characters(min_codepoint=0x40, max_codepoint=0x7E)
-
-    return st.builds(
-        lambda *args: "".join(["\x1b[", *args]),
-        parameter_bytes.map("".join),
-        intermediate_bytes.map("".join),
-        final_bytes,
-    )
-
-
-def ansi_c1_escapes():
-    byte_ = st.characters(
-        codec="ascii", min_codepoint=0x40, max_codepoint=0x5F, exclude_characters=["["]
-    )
-    return st.builds(lambda b: f"\x1b{b}", byte_)
-
-
-def ansi_fe_escapes():
-    return ansi_csi_escapes() | ansi_c1_escapes()
-
-
-def preformatted_reports():
-    return st.tuples(filepaths, names, variants | st.none(), messages).map(
-        lambda x: parse_logs.PreformattedReport(*x)
-    )
-
-
-@given(filepaths, names, variants)
-def test_parse_nodeid(path, name, variant):
-    if variant is not None:
-        nodeid = f"{path}::{name}[{variant}]"
-    else:
-        nodeid = f"{path}::{name}"
-
-    note(f"nodeid: {nodeid}")
-
-    expected = {"filepath": path, "name": name, "variant": variant}
-    actual = parse_logs.parse_nodeid(nodeid)
-
-    assert actual == expected
-
-
-@given(st.lists(preformatted_reports()), st.integers(min_value=0))
-def test_truncate(reports, max_chars):
-    py_version = ".".join(str(part) for part in sys.version_info[:3])
-
-    formatted = parse_logs.truncate(reports, max_chars=max_chars, py_version=py_version)
-
-    assert formatted is None or len(formatted) <= max_chars
-
-
-@given(st.lists(ansi_fe_escapes()).map("".join))
-def test_strip_ansi_multiple(escapes):
-    assert parse_logs.strip_ansi(escapes) == ""
-
-
-@given(ansi_fe_escapes())
-def test_strip_ansi(escape):
-    message = f"some {escape}text"
-
-    assert parse_logs.strip_ansi(message) == "some text"
-
-
-@given(ansi_fe_escapes())
-def test_preformatted_report_ansi(escape):
-    actual = parse_logs.PreformattedReport(
-        filepath="a", name="b", variant=None, message=f"{escape}text"
-    )
-    assert actual.message == "text"
diff --git a/test_track_packages.py b/test_track_packages.py
deleted file mode 100644
index 1d10a13..0000000
--- a/test_track_packages.py
+++ /dev/null
@@ -1,400 +0,0 @@
-import json
-import os
-import sys
-import tempfile
-from datetime import datetime
-from unittest.mock import Mock, patch
-
-import hypothesis.strategies as st
-from hypothesis import given
-
-import track_packages
-
-
-def test_get_package_version_existing():
-    """Test getting version of an existing package."""
-    with patch("subprocess.run") as mock_run:
-        mock_run.return_value.stdout = "Name: pytest\nVersion: 7.4.0\nSummary: ..."
-        mock_run.return_value.check = True
-
-        version = track_packages.get_package_version("pytest")
-        assert version == "7.4.0"
-
-
-def test_get_package_version_nonexistent():
-    """Test getting version of a non-existent package."""
-    with patch("subprocess.run") as mock_run:
-        mock_run.side_effect = track_packages.subprocess.CalledProcessError(1, "pip")
-
-        version = track_packages.get_package_version("nonexistent-package")
-        assert version is None
-
-
-def test_get_all_installed_packages():
-    """Test getting all installed packages."""
-    mock_packages = [
-        {"name": "pytest", "version": "7.4.0"},
-        {"name": "hypothesis", "version": "6.82.0"},
-        {"name": "more-itertools", "version": "10.1.0"},
-    ]
-
-    with patch("subprocess.run") as mock_run:
-        mock_run.return_value.stdout = json.dumps(mock_packages)
-        mock_run.return_value.check = True
-
-        packages = track_packages.get_all_installed_packages()
-        expected = {
-            "pytest": "7.4.0",
-            "hypothesis": "6.82.0",
-            "more-itertools": "10.1.0",
-        }
-        assert packages == expected
-
-
-def test_get_current_package_versions_specific():
-    """Test getting versions of specific packages."""
-    with patch("track_packages.get_package_version") as mock_get_version:
-        mock_get_version.side_effect = lambda pkg: {
-            "pytest": "7.4.0",
-            "hypothesis": "6.82.0",
-            "nonexistent": None,
-        }.get(pkg)
-
-        versions = track_packages.get_current_package_versions(
-            ["pytest", "hypothesis", "nonexistent"]
-        )
-        expected = {
-            "pytest": "7.4.0",
-            "hypothesis": "6.82.0",
-            "nonexistent": None,
-        }
-        assert versions == expected
-
-
-def test_get_current_package_versions_from_captured_file():
-    """Test getting versions from a captured JSON file."""
-    with tempfile.NamedTemporaryFile(mode="w", suffix=".json", delete=False) as f:
-        captured_data = {
-            "python_version": "3.11.0",
-            "packages": {"pytest": "7.4.0", "numpy": "1.24.0", "requests": "2.31.0"},
-            "capture_method": "importlib.metadata",
-        }
-        json.dump(captured_data, f)
-        captured_file = f.name
-
-    try:
-        # Test specific packages
-        versions = track_packages.get_current_package_versions(
-            ["pytest", "numpy", "missing"], captured_file
-        )
-        expected = {"pytest": "7.4.0", "numpy": "1.24.0", "missing": None}
-        assert versions == expected
-
-        # Test "all" packages
-        all_versions = track_packages.get_current_package_versions(["all"], captured_file)
-        expected_all = {"pytest": "7.4.0", "numpy": "1.24.0", "requests": "2.31.0"}
-        assert all_versions == expected_all
-    finally:
-        os.unlink(captured_file)
-
-
-def test_get_current_package_versions_fallback_on_bad_file():
-    """Test fallback when captured file is invalid."""
-    with tempfile.NamedTemporaryFile(mode="w", suffix=".json", delete=False) as f:
-        f.write("invalid json content")
-        bad_file = f.name
-
-    try:
-        with patch("track_packages.get_package_version") as mock_get_version:
-            mock_get_version.return_value = "fallback-version"
-
-            versions = track_packages.get_current_package_versions(["pytest"], bad_file)
-            expected = {"pytest": "fallback-version"}
-            assert versions == expected
-    finally:
-        os.unlink(bad_file)
-
-
-def test_get_current_package_versions_all():
-    """Test getting versions when 'all' is specified."""
-    with patch("track_packages.get_all_installed_packages") as mock_get_all:
-        mock_get_all.return_value = {"pytest": "7.4.0", "hypothesis": "6.82.0"}
-
-        versions = track_packages.get_current_package_versions(["all"])
-        assert versions == {"pytest": "7.4.0", "hypothesis": "6.82.0"}
-
-
-def test_get_git_info():
-    """Test getting Git information."""
-    with patch("subprocess.run") as mock_run:
-        # Mock the sequence of git commands
-        mock_run.side_effect = [
-            Mock(stdout="abc123def456789\n", check=True),  # git rev-parse HEAD
-            Mock(stdout="Fix test regression\n", check=True),  # git log -1 --pretty=format:%s
-            Mock(
-                stdout="John Doe <john@example.com>\n", check=True
-            ),  # git log -1 --pretty=format:%an <%ae>
-            Mock(
-                stdout="2024-01-15 10:30:00 +0000\n", check=True
-            ),  # git log -1 --pretty=format:%ci
-        ]
-
-        git_info = track_packages.get_git_info()
-
-        expected = {
-            "commit_hash": "abc123def456789",
-            "commit_hash_short": "abc123de",
-            "commit_message": "Fix test regression",
-            "commit_author": "John Doe <john@example.com>",
-            "commit_date": "2024-01-15 10:30:00 +0000",
-        }
-        assert git_info == expected
-
-
-def test_extract_failed_tests_from_log():
-    """Test extracting failed tests from pytest log file."""
-    with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as f:
-        # Write sample pytest log entries
-        f.write(
-            '{"$report_type": "TestReport", "nodeid": "test_file.py::test_pass", "outcome": "passed"}\n'
-        )
-        f.write(
-            '{"$report_type": "TestReport", "nodeid": "test_file.py::test_fail1", "outcome": "failed"}\n'
-        )
-        f.write(
-            '{"$report_type": "CollectReport", "nodeid": "test_file.py::test_fail2", "outcome": "failed"}\n'
-        )
-        f.write(
-            '{"$report_type": "TestReport", "nodeid": "test_file.py::test_skip", "outcome": "skipped"}\n'
-        )
-        f.write('{"$report_type": "WarningMessage", "outcome": "failed"}\n')  # Should be ignored
-        log_path = f.name
-
-    try:
-        failed_tests = track_packages.extract_failed_tests_from_log(log_path)
-        expected = ["test_file.py::test_fail1", "test_file.py::test_fail2"]
-        assert failed_tests == expected
-    finally:
-        os.unlink(log_path)
-
-
-def test_extract_failed_tests_from_log_missing_file():
-    """Test extracting failed tests when log file doesn't exist."""
-    failed_tests = track_packages.extract_failed_tests_from_log("nonexistent.jsonl")
-    assert failed_tests == []
-
-
-def test_get_git_info_failure():
-    """Test getting Git information when git commands fail."""
-    with patch("subprocess.run") as mock_run:
-        mock_run.side_effect = track_packages.subprocess.CalledProcessError(1, "git")
-
-        git_info = track_packages.get_git_info()
-
-        expected = {
-            "commit_hash": "unknown",
-            "commit_hash_short": "unknown",
-            "commit_message": "unknown",
-            "commit_author": "unknown",
-            "commit_date": "unknown",
-        }
-        assert git_info == expected
-
-
-def test_create_bisect_data():
-    """Test creating bisection data."""
-    packages = ["pytest", "hypothesis"]
-
-    with (
-        patch("track_packages.get_current_package_versions") as mock_get_versions,
-        patch("track_packages.get_git_info") as mock_get_git,
-        patch("track_packages.extract_failed_tests_from_log") as mock_extract_tests,
-    ):
-        mock_get_versions.return_value = {"pytest": "7.4.0", "hypothesis": "6.82.0"}
-        mock_get_git.return_value = {
-            "commit_hash": "abc123",
-            "commit_hash_short": "abc123de",
-            "commit_message": "Test commit",
-            "commit_author": "Test Author",
-            "commit_date": "2024-01-01",
-        }
-        mock_extract_tests.return_value = []
-
-        with patch.dict("os.environ", {"GITHUB_RUN_ID": "12345"}):
-            data = track_packages.create_bisect_data(packages)
-
-            assert data["workflow_run_id"] == "12345"
-            assert data["python_version"] == ".".join(str(v) for v in sys.version_info[:3])
-            assert data["packages"] == {"pytest": "7.4.0", "hypothesis": "6.82.0"}
-            assert data["failed_tests"] == []
-            assert data["test_status"] == "passed"
-            assert data["git"]["commit_hash"] == "abc123"
-            assert "timestamp" in data
-            # Check timestamp format
-            datetime.fromisoformat(data["timestamp"].replace("Z", "+00:00"))
-
-
-def test_create_bisect_data_with_captured_versions():
-    """Test creating bisection data with captured versions file."""
-    packages = ["pytest", "numpy"]
-
-    # Create a captured versions file
-    with tempfile.NamedTemporaryFile(mode="w", suffix=".json", delete=False) as f:
-        captured_data = {
-            "python_version": "3.11.5",
-            "packages": {"pytest": "7.4.2", "numpy": "1.25.1"},
-        }
-        json.dump(captured_data, f)
-        captured_file = f.name
-
-    try:
-        with (
-            patch("track_packages.get_git_info") as mock_get_git,
-            patch("track_packages.extract_failed_tests_from_log") as mock_extract_tests,
-        ):
-            mock_get_git.return_value = {
-                "commit_hash": "def456",
-                "commit_hash_short": "def456gh",
-                "commit_message": "Test commit with captured versions",
-                "commit_author": "Test Author",
-                "commit_date": "2024-01-01",
-            }
-            mock_extract_tests.return_value = ["test_fail.py::test_example"]
-
-            with patch.dict("os.environ", {"GITHUB_RUN_ID": "67890"}):
-                data = track_packages.create_bisect_data(
-                    packages, captured_versions_file=captured_file
-                )
-
-                assert data["workflow_run_id"] == "67890"
-                assert data["python_version"] == "3.11.5"  # From captured file
-                assert data["packages"] == {
-                    "pytest": "7.4.2",
-                    "numpy": "1.25.1",
-                }  # From captured file
-                assert data["failed_tests"] == ["test_fail.py::test_example"]
-                assert data["test_status"] == "failed"
-                assert data["git"]["commit_hash"] == "def456"
-                assert "timestamp" in data
-    finally:
-        os.unlink(captured_file)
-
-
-def test_format_bisect_comparison_no_previous():
-    """Test formatting comparison when no previous data exists."""
-    current_data = {
-        "workflow_run_id": "456",
-        "packages": {"pytest": "7.4.0", "hypothesis": "6.82.0"},
-    }
-
-    result = track_packages.format_bisect_comparison(current_data, None)
-    assert result is None
-
-
-def test_format_bisect_comparison_with_changes():
-    """Test formatting comparison with package changes."""
-    previous_data = {
-        "workflow_run_id": "123",
-        "packages": {"pytest": "7.3.0", "hypothesis": "6.82.0", "removed-pkg": "1.0.0"},
-    }
-    current_data = {
-        "workflow_run_id": "456",
-        "packages": {"pytest": "7.4.0", "hypothesis": "6.82.0", "new-pkg": "2.0.0"},
-    }
-
-    result = track_packages.format_bisect_comparison(current_data, previous_data)
-
-    assert "Package Version Changes" in result
-    assert "Last Successful Run #123 → Current Failed Run #456" in result
-    assert "pytest: 7.3.0 → 7.4.0" in result
-    assert "hypothesis: 6.82.0 (unchanged)" in result
-    assert "removed-pkg: 1.0.0 → (not installed)" in result
-    assert "new-pkg: (not installed) → 2.0.0" in result
-
-
-def test_format_bisect_comparison_no_changes():
-    """Test formatting comparison when no packages changed."""
-    data = {
-        "workflow_run_id": "456",
-        "packages": {"pytest": "7.4.0", "hypothesis": "6.82.0"},
-    }
-
-    result = track_packages.format_bisect_comparison(data, data)
-
-    assert "Package Version Changes" in result
-    assert "pytest: 7.4.0 (unchanged)" in result
-    assert "hypothesis: 6.82.0 (unchanged)" in result
-
-
-@given(st.lists(st.text(min_size=1), min_size=1, max_size=5))
-def test_get_current_package_versions_property(package_names):
-    """Property test for get_current_package_versions."""
-    with patch("track_packages.get_package_version") as mock_get_version:
-        mock_get_version.return_value = "1.0.0"
-
-        versions = track_packages.get_current_package_versions(package_names)
-
-        assert len(versions) == len(package_names)
-        for pkg in package_names:
-            assert pkg in versions
-
-
-def test_retrieve_bisect_data_from_branch_no_branch():
-    """Test retrieving data when branch doesn't exist."""
-    with patch("subprocess.run") as mock_run:
-        # Simulate no branch found
-        mock_run.return_value.stdout = ""
-        mock_run.return_value.check = True
-
-        result = track_packages.retrieve_bisect_data_from_branch("nonexistent-branch")
-        assert result is None
-
-
-def test_retrieve_bisect_data_from_branch_success():
-    """Test successfully retrieving data from branch."""
-    mock_data = {
-        "workflow_run_id": "123",
-        "packages": {"pytest": "7.3.0"},
-    }
-
-    with patch("subprocess.run") as mock_run:
-        # Mock the sequence of git commands
-        mock_run.side_effect = [
-            Mock(stdout="abc123\trefs/heads/bisect-data\n", check=True),  # ls-remote
-            Mock(check=True),  # fetch
-            Mock(stdout=json.dumps(mock_data), check=True),  # show
-        ]
-
-        result = track_packages.retrieve_bisect_data_from_branch("bisect-data")
-        assert result == mock_data
-
-
-def test_generate_package_diff_link():
-    """Test generating GitHub diff links for package changes."""
-    # Test known package
-    link = track_packages.generate_package_diff_link("numpy", "1.24.0", "1.25.0")
-    assert link == "https://github.com/numpy/numpy/compare/v1.24.0...v1.25.0"
-
-    # Test unknown package
-    link = track_packages.generate_package_diff_link("unknown-package", "1.0.0", "2.0.0")
-    assert link is None
-
-
-def test_get_package_changes_with_github_links():
-    """Test package changes include GitHub links when available."""
-    previous_packages = {"numpy": "1.24.0", "unknown-pkg": "1.0.0"}
-    current_packages = {"numpy": "1.25.0", "unknown-pkg": "2.0.0"}
-
-    changes = track_packages.get_package_changes(current_packages, previous_packages)
-
-    # Should have GitHub link for numpy
-    numpy_change = next((c for c in changes if "numpy" in c), None)
-    assert numpy_change is not None
-    assert "https://github.com/numpy/numpy/compare/v1.24.0...v1.25.0" in numpy_change
-    assert "[numpy: 1.24.0 → 1.25.0]" in numpy_change
-
-    # Should not have GitHub link for unknown package
-    unknown_change = next((c for c in changes if "unknown-pkg" in c), None)
-    assert unknown_change is not None
-    assert "unknown-pkg: 1.0.0 → 2.0.0" in unknown_change
-    assert "https://" not in unknown_change

From a1e0c184cd69beb31c1a6a7f56ec47c3387cd7b2 Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Mon, 29 Sep 2025 15:41:47 -0400
Subject: [PATCH 13/15] Replace complex shell one-liners with Python command
 for run metadata extraction
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Create new extract_run_metadata.py module with proper CLI interface
- Add extract-run-metadata console script to pyproject.toml
- Replace complex Python one-liners in action.yaml with clean command calls
- Fix shell syntax error with multi-line commit message quotes
- Add comprehensive tests for the new functionality
- Ensure action uses the package consistently throughout

The action now uses:
- python -m issue_from_pytest_log_action.extract_run_metadata test_status
- python -m issue_from_pytest_log_action.extract_run_metadata failed_count

Instead of complex inline Python expressions.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 action.yaml                                   |   7 +-
 pyproject.toml                                |   1 +
 .../extract_run_metadata.py                   |  84 +++++++++
 tests/test_extract_run_metadata.py            | 163 ++++++++++++++++++
 4 files changed, 252 insertions(+), 3 deletions(-)
 create mode 100644 src/issue_from_pytest_log_action/extract_run_metadata.py
 create mode 100644 tests/test_extract_run_metadata.py

diff --git a/action.yaml b/action.yaml
index 007366a..36e2d03 100644
--- a/action.yaml
+++ b/action.yaml
@@ -127,11 +127,12 @@ runs:
         if git diff --staged --quiet; then
           echo "No changes to commit"
         else
+          TEST_STATUS=$(python -m issue_from_pytest_log_action.extract_run_metadata test_status)
+          FAILED_COUNT=$(python -m issue_from_pytest_log_action.extract_run_metadata failed_count)
           git commit -m "Add bisection data for run ${{ github.run_id }}
 
-          Test status: $(python -c "import json; data=json.load(open([f for f in __import__('pathlib').Path('.').glob('run_*.json')][-1])); print(data['test_status'])")
-          Failed tests: $(python -c "import json; data=json.load(open([f for f in __import__('pathlib').Path('.').glob('run_*.json')][-1])); print(len(data.get('failed_tests', [])))")
-          "
+          Test status: ${TEST_STATUS}
+          Failed tests: ${FAILED_COUNT}"
 
           # Push to remote
           git push origin "${{ inputs.bisect-branch }}"
diff --git a/pyproject.toml b/pyproject.toml
index 379fd04..33a57b3 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -41,6 +41,7 @@ dev = [
 [project.scripts]
 capture-versions = "issue_from_pytest_log_action.capture_versions:main"
 simple-bisect = "issue_from_pytest_log_action.simple_bisect:main"
+extract-run-metadata = "issue_from_pytest_log_action.extract_run_metadata:main"
 
 [tool.setuptools.packages.find]
 where = ["src"]
diff --git a/src/issue_from_pytest_log_action/extract_run_metadata.py b/src/issue_from_pytest_log_action/extract_run_metadata.py
new file mode 100644
index 0000000..fed74d1
--- /dev/null
+++ b/src/issue_from_pytest_log_action/extract_run_metadata.py
@@ -0,0 +1,84 @@
+#!/usr/bin/env python3
+"""Extract metadata from bisection run JSON files for commit messages."""
+
+import argparse
+import json
+import pathlib
+import sys
+from typing import Any
+
+
+def find_latest_run_file() -> pathlib.Path:
+    """Find the most recent run_*.json file in the current directory."""
+    current_dir = pathlib.Path(".")
+    run_files = list(current_dir.glob("run_*.json"))
+
+    if not run_files:
+        raise FileNotFoundError("No run_*.json files found in current directory")
+
+    # Sort by modification time and return the most recent
+    return max(run_files, key=lambda f: f.stat().st_mtime)
+
+
+def load_run_data(file_path: pathlib.Path) -> dict[str, Any]:
+    """Load and parse the run JSON data."""
+    try:
+        with file_path.open() as f:
+            return json.load(f)
+    except (json.JSONDecodeError, OSError) as e:
+        raise ValueError(f"Failed to load run data from {file_path}: {e}")
+
+
+def extract_test_status(data: dict[str, Any]) -> str:
+    """Extract the test status from run data."""
+    return data.get("test_status", "unknown")
+
+
+def extract_failed_test_count(data: dict[str, Any]) -> int:
+    """Extract the count of failed tests from run data."""
+    failed_tests = data.get("failed_tests", [])
+    return len(failed_tests)
+
+
+def main(argv=None):
+    """Main entry point for extract_run_metadata command."""
+    if argv is None:
+        argv = sys.argv[1:]
+
+    parser = argparse.ArgumentParser(description="Extract metadata from bisection run JSON files")
+    parser.add_argument(
+        "field", choices=["test_status", "failed_count"], help="Field to extract from the run data"
+    )
+    parser.add_argument(
+        "--file",
+        type=pathlib.Path,
+        help="Specific run file to read (default: find latest run_*.json)",
+    )
+
+    args = parser.parse_args(argv)
+
+    try:
+        # Find the run file
+        if args.file:
+            run_file = args.file
+        else:
+            run_file = find_latest_run_file()
+
+        # Load the data
+        data = load_run_data(run_file)
+
+        # Extract the requested field
+        if args.field == "test_status":
+            result = extract_test_status(data)
+        elif args.field == "failed_count":
+            result = extract_failed_test_count(data)
+
+        print(result)
+
+    except (FileNotFoundError, ValueError) as e:
+        print(f"Error: {e}", file=sys.stderr)
+        sys.exit(1)
+
+
+if __name__ == "__main__":
+    main()
diff --git a/tests/test_extract_run_metadata.py b/tests/test_extract_run_metadata.py
new file mode 100644
index 0000000..5776496
--- /dev/null
+++ b/tests/test_extract_run_metadata.py
@@ -0,0 +1,163 @@
+"""Tests for extract_run_metadata module."""
+
+import json
+import pathlib
+import tempfile
+
+import pytest
+
+from issue_from_pytest_log_action.extract_run_metadata import (
+    extract_failed_test_count,
+    extract_test_status,
+    find_latest_run_file,
+    load_run_data,
+    main,
+)
+
+
+@pytest.fixture
+def sample_run_data():
+    """Sample run data for testing."""
+    return {
+        "test_status": "failed",
+        "failed_tests": ["test1", "test2", "test3"],
+        "packages": {"numpy": "1.21.0"},
+        "timestamp": "2024-01-01T10:00:00Z",
+    }
+
+
+@pytest.fixture
+def temp_run_file(sample_run_data):
+    """Create a temporary run file for testing."""
+    with tempfile.NamedTemporaryFile(mode="w", suffix=".json", prefix="run_", delete=False) as f:
+        json.dump(sample_run_data, f)
+        temp_file = pathlib.Path(f.name)
+
+    yield temp_file
+
+    # Cleanup
+    if temp_file.exists():
+        temp_file.unlink()
+
+
+def test_load_run_data(temp_run_file, sample_run_data):
+    """Test loading run data from a JSON file."""
+    data = load_run_data(temp_run_file)
+    assert data == sample_run_data
+
+
+def test_load_run_data_invalid_file():
+    """Test loading run data from a non-existent file."""
+    with pytest.raises(ValueError, match="Failed to load run data"):
+        load_run_data(pathlib.Path("nonexistent.json"))
+
+
+def test_extract_test_status(sample_run_data):
+    """Test extracting test status."""
+    assert extract_test_status(sample_run_data) == "failed"
+    assert extract_test_status({}) == "unknown"
+
+
+def test_extract_failed_test_count(sample_run_data):
+    """Test extracting failed test count."""
+    assert extract_failed_test_count(sample_run_data) == 3
+    assert extract_failed_test_count({}) == 0
+    assert extract_failed_test_count({"failed_tests": []}) == 0
+
+
+def test_find_latest_run_file():
+    """Test finding the latest run file."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        temp_path = pathlib.Path(temp_dir)
+
+        # Create some run files with different timestamps
+        run_file1 = temp_path / "run_123.json"
+        run_file2 = temp_path / "run_456.json"
+
+        run_file1.write_text('{"test_status": "passed"}')
+        run_file2.write_text('{"test_status": "failed"}')
+
+        # Make run_file2 newer by touching it
+        import time
+
+        time.sleep(0.01)  # Small delay to ensure different timestamps
+        run_file2.touch()
+
+        # Change to the temp directory
+        import os
+
+        original_cwd = os.getcwd()
+        try:
+            os.chdir(temp_dir)
+            latest = find_latest_run_file()
+            assert latest.name == "run_456.json"
+        finally:
+            os.chdir(original_cwd)
+
+
+def test_find_latest_run_file_no_files():
+    """Test finding run files when none exist."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        import os
+
+        original_cwd = os.getcwd()
+        try:
+            os.chdir(temp_dir)
+            with pytest.raises(FileNotFoundError, match="No run_.*json files found"):
+                find_latest_run_file()
+        finally:
+            os.chdir(original_cwd)
+
+
+def test_main_test_status(temp_run_file, capsys):
+    """Test main function extracting test status."""
+    main(["test_status", "--file", str(temp_run_file)])
+    captured = capsys.readouterr()
+    assert captured.out.strip() == "failed"
+
+
+def test_main_failed_count(temp_run_file, capsys):
+    """Test main function extracting failed test count."""
+    main(["failed_count", "--file", str(temp_run_file)])
+    captured = capsys.readouterr()
+    assert captured.out.strip() == "3"
+
+
+def test_main_invalid_file(capsys):
+    """Test main function with invalid file."""
+    with pytest.raises(SystemExit):
+        main(["test_status", "--file", "nonexistent.json"])
+
+    captured = capsys.readouterr()
+    assert "Error:" in captured.err
+
+
+def test_main_find_latest():
+    """Test main function finding latest file automatically."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        temp_path = pathlib.Path(temp_dir)
+        run_file = temp_path / "run_123.json"
+        run_file.write_text('{"test_status": "passed", "failed_tests": ["test1"]}')
+
+        import os
+
+        original_cwd = os.getcwd()
+        try:
+            os.chdir(temp_dir)
+
+            # Test with capsys
+            import sys
+            from io import StringIO
+
+            old_stdout = sys.stdout
+            sys.stdout = captured_output = StringIO()
+
+            try:
+                main(["test_status"])
+                output = captured_output.getvalue()
+                assert output.strip() == "passed"
+            finally:
+                sys.stdout = old_stdout
+
+        finally:
+            os.chdir(original_cwd)

From cdc0cbbd524f52f32fec63b47d72ab8a5efa1237 Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Mon, 29 Sep 2025 16:33:20 -0400
Subject: [PATCH 14/15] Fix pre-commit issues and add comprehensive end-to-end
 testing
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Fix all ruff import errors and mypy type issues across modules
- Add comprehensive end-to-end testing framework with 11 test scenarios
- Add specialized tests for scientific packages (numpy, pandas, xarray, zarr)
- Increase test coverage from 29% to 69% with 170 total tests
- Add integration markers and performance benchmarks for large log files
- Fix PreformattedReport type annotations and JSON parsing issues

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 pyproject.toml                                |  21 +
 .../capture_versions.py                       |  11 +-
 .../extract_run_metadata.py                   |   3 +
 .../parse_logs.py                             |  13 +-
 .../simple_bisect.py                          |   4 +-
 .../track_packages.py                         |  31 +-
 tests/test_end_to_end.py                      | 507 ++++++++++++++++++
 tests/test_parse_logs.py                      | 482 +++++++++++++++++
 tests/test_scientific_packages.py             | 263 +++++++++
 tests/test_simple_bisect.py                   | 309 +++++++++++
 tests/test_track_packages.py                  | 503 +++++++++++++++++
 tests/test_version_extraction.py              |   4 +-
 12 files changed, 2127 insertions(+), 24 deletions(-)
 create mode 100644 tests/test_end_to_end.py
 create mode 100644 tests/test_parse_logs.py
 create mode 100644 tests/test_scientific_packages.py
 create mode 100644 tests/test_simple_bisect.py
 create mode 100644 tests/test_track_packages.py

diff --git a/pyproject.toml b/pyproject.toml
index 33a57b3..84ec621 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -25,6 +25,8 @@ classifiers = [
 
 dependencies = [
   "setuptools; python_version >= '3.12'", # For pkg_resources fallback
+  "more-itertools",
+  "pytest",
 ]
 
 [project.optional-dependencies]
@@ -51,6 +53,9 @@ include = ["issue_from_pytest_log_action*"]
 testpaths = ["tests"]
 python_files = ["test_*.py"]
 addopts = "-v --tb=short"
+markers = [
+  "integration: marks tests as integration tests (deselect with '-m \"not integration\"')",
+]
 
 [tool.ruff]
 target-version = "py310"
@@ -96,3 +101,19 @@ branch = true
 [tool.coverage.report]
 show_missing = true
 exclude_lines = ["pragma: no cover", "if TYPE_CHECKING"]
+
+[tool.mypy]
+python_version = "3.10"
+packages = ["src/issue_from_pytest_log_action", "tests"]
+check_untyped_defs = true
+disallow_untyped_defs = false
+ignore_missing_imports = false
+
+[[tool.mypy.overrides]]
+module = ["pytest.*", "more_itertools.*"]
+ignore_missing_imports = true
+
+[dependency-groups]
+dev = [
+  "mypy>=1.14.1",
+]
diff --git a/src/issue_from_pytest_log_action/capture_versions.py b/src/issue_from_pytest_log_action/capture_versions.py
index f82c58e..cbaaca8 100644
--- a/src/issue_from_pytest_log_action/capture_versions.py
+++ b/src/issue_from_pytest_log_action/capture_versions.py
@@ -9,6 +9,7 @@
 import json
 import os
 import sys
+from typing import Any
 
 
 def extract_git_hash_from_version(version_string: str) -> str | None:
@@ -109,7 +110,7 @@ def main():
         return
 
     packages = [pkg.strip() for pkg in packages_input.split(",")]
-    versions = {}
+    versions: dict[str, dict[str, Any] | None | str] = {}
 
     # Try importlib.metadata first (Python 3.8+)
     try:
@@ -146,12 +147,12 @@ def main():
 
             if len(packages) == 1 and packages[0].lower() == "all":
                 print("Capturing all installed packages...")
-                for dist in pkg_resources.working_set:
+                for dist in pkg_resources.working_set:  # type: ignore[attr-defined]
                     pkg_info = {
                         "version": dist.version,
-                        "git_info": extract_git_info(dist.project_name),
+                        "git_info": extract_git_info(dist.project_name),  # type: ignore[attr-defined]
                     }
-                    versions[dist.project_name] = pkg_info
+                    versions[dist.project_name] = pkg_info  # type: ignore[attr-defined]
             else:
                 print(f"Capturing specific packages: {packages}")
                 for pkg in packages:
@@ -172,7 +173,7 @@ def main():
                             print(f"  {pkg}: not found ({e})")
         except ImportError:
             print("ERROR: No package detection method available")
-            versions = {"error": "No package detection method available"}
+            versions["error"] = "No package detection method available"
 
     # Save captured versions
     capture_data = {
diff --git a/src/issue_from_pytest_log_action/extract_run_metadata.py b/src/issue_from_pytest_log_action/extract_run_metadata.py
index fed74d1..f9859ff 100644
--- a/src/issue_from_pytest_log_action/extract_run_metadata.py
+++ b/src/issue_from_pytest_log_action/extract_run_metadata.py
@@ -68,10 +68,13 @@ def main(argv=None):
         data = load_run_data(run_file)
 
         # Extract the requested field
+        result: str | int
         if args.field == "test_status":
             result = extract_test_status(data)
         elif args.field == "failed_count":
             result = extract_failed_test_count(data)
+        else:
+            raise ValueError(f"Unknown field: {args.field}")
 
         print(result)
 
diff --git a/src/issue_from_pytest_log_action/parse_logs.py b/src/issue_from_pytest_log_action/parse_logs.py
index 156901f..3d65daa 100644
--- a/src/issue_from_pytest_log_action/parse_logs.py
+++ b/src/issue_from_pytest_log_action/parse_logs.py
@@ -1,4 +1,3 @@
-# type: ignore
 import argparse
 import functools
 import json
@@ -63,7 +62,7 @@ def _from_json(cls, json):
 @dataclass
 class PreformattedReport:
     filepath: str
-    name: str
+    name: str | None
     variant: str | None
     message: str
 
@@ -88,7 +87,7 @@ def parse_record(record):
     if cls is None:
         raise ValueError(f"unknown report type: {record['$report_type']}")
 
-    return cls._from_json(record)
+    return cls._from_json(record)  # type: ignore[attr-defined]
 
 
 nodeid_re = re.compile(r"(?P<filepath>.+?)::(?P<name>.+?)(?:\[(?P<variant>.+)\])?")
@@ -114,8 +113,8 @@ def _(report: TestReport):
     if isinstance(report.longrepr, str):
         message = report.longrepr
     else:
-        message = report.longrepr.reprcrash.message
-    return PreformattedReport(message=message, **parsed)
+        message = report.longrepr.reprcrash.message  # type: ignore[union-attr]
+    return PreformattedReport(message=message, **parsed)  # type: ignore[arg-type]
 
 
 @preformat_report.register
@@ -135,8 +134,8 @@ def _(report: CollectReport):
     if isinstance(report.longrepr, str):
         message = report.longrepr.split("\n")[-1].removeprefix("E").lstrip()
     else:
-        message = report.longrepr.reprcrash.message
-    return PreformattedReport(message=message, **parsed)
+        message = report.longrepr.reprcrash.message  # type: ignore[union-attr]
+    return PreformattedReport(message=message, **parsed)  # type: ignore[arg-type]
 
 
 def format_summary(report):
diff --git a/src/issue_from_pytest_log_action/simple_bisect.py b/src/issue_from_pytest_log_action/simple_bisect.py
index a180acc..d17aa5b 100644
--- a/src/issue_from_pytest_log_action/simple_bisect.py
+++ b/src/issue_from_pytest_log_action/simple_bisect.py
@@ -85,7 +85,7 @@ def generate_comparison(
         print("No comparison generated (no failed tests)")
 
 
-def main():
+def main(argv=None):
     """Main entry point."""
     parser = argparse.ArgumentParser(description="Handle bisection data")
     parser.add_argument("--packages", required=True, help="Comma-separated list of packages")
@@ -99,7 +99,7 @@ def main():
         "--generate-comparison", action="store_true", help="Generate bisection comparison"
     )
 
-    args = parser.parse_args()
+    args = parser.parse_args(argv)
 
     packages = [pkg.strip() for pkg in args.packages.split(",") if pkg.strip()]
 
diff --git a/src/issue_from_pytest_log_action/track_packages.py b/src/issue_from_pytest_log_action/track_packages.py
index 5111712..d2c5e42 100644
--- a/src/issue_from_pytest_log_action/track_packages.py
+++ b/src/issue_from_pytest_log_action/track_packages.py
@@ -11,7 +11,7 @@
 import pathlib
 import subprocess
 import sys
-from datetime import datetime
+from datetime import datetime, timezone
 from typing import Any
 
 # Package metadata for generating GitHub links
@@ -30,6 +30,7 @@
         "tag_format": "hypothesis-python-{version}",
     },
     "xarray": {"github": "pydata/xarray", "tag_format": "v{version}"},
+    "zarr": {"github": "zarr-developers/zarr-python", "tag_format": "v{version}"},
     "dask": {"github": "dask/dask", "tag_format": "{version}"},
     "jupyterlab": {"github": "jupyterlab/jupyterlab", "tag_format": "v{version}"},
     "notebook": {"github": "jupyter/notebook", "tag_format": "v{version}"},
@@ -54,23 +55,31 @@ def is_git_commit(version_or_commit: str) -> bool:
 
 
 def clean_version_for_tag(version: str) -> str:
-    """Clean version string for tag lookup (remove dev/nightly suffixes)."""
+    """Clean version string for tag lookup (remove dev/nightly suffixes but preserve rc/alpha)."""
     import re
 
-    # Remove common development suffixes
+    # First preserve rc/alpha parts by marking them
+    # Replace rc and alpha with placeholder markers to preserve them
+    preserved_version = version
+    preserved_version = re.sub(r"(rc\d+)", r"__RC__\1__RC__", preserved_version)
+    preserved_version = re.sub(r"([ab]\d+)", r"__ALPHA__\1__ALPHA__", preserved_version)
+
+    # Remove development suffixes (but not rc/alpha which are now marked)
     patterns = [
         r"\.dev\d*.*",  # .dev0, .dev123+gabc
         r"\+.*",  # +gabc123d, +123.gabc123d
         r"\.post\d*.*",  # .post1
-        r"[ab]\d*.*",  # a1, b2, alpha1, beta2
-        r"rc\d*.*",  # rc1, rc2
         r"\.dirty.*",  # .dirty
     ]
 
-    clean_version = version
+    clean_version = preserved_version
     for pattern in patterns:
         clean_version = re.sub(pattern, "", clean_version)
 
+    # Restore the preserved rc/alpha parts
+    clean_version = re.sub(r"__RC__(rc\d+)__RC__", r"\1", clean_version)
+    clean_version = re.sub(r"__ALPHA__([ab]\d+)__ALPHA__", r"\1", clean_version)
+
     return clean_version
 
 
@@ -116,6 +125,11 @@ def generate_package_diff_link(
         return None
 
     # Generate tags using the package's tag format
+    # Special handling for packages that use underscores instead of dots
+    if package_name == "sqlalchemy":
+        clean_old = clean_old.replace(".", "_")
+        clean_new = clean_new.replace(".", "_")
+
     old_tag = tag_format.format(version=clean_old)
     new_tag = tag_format.format(version=clean_new)
 
@@ -293,7 +307,7 @@ def create_bisect_data(
 
     return {
         "workflow_run_id": workflow_run_id,
-        "timestamp": datetime.utcnow().isoformat() + "Z",
+        "timestamp": datetime.now(timezone.utc).isoformat().replace("+00:00", "Z"),
         "python_version": python_version,
         "packages": package_versions,
         "failed_tests": failed_tests,
@@ -562,7 +576,8 @@ def extract_git_revision(package_info: dict | str | None) -> str | None:
     """Extract git revision from package info if available."""
     if isinstance(package_info, dict) and "git_info" in package_info:
         git_info = package_info["git_info"]
-        return git_info.get("git_revision")
+        if git_info is not None:
+            return git_info.get("git_revision")
     return None
 
 
diff --git a/tests/test_end_to_end.py b/tests/test_end_to_end.py
new file mode 100644
index 0000000..63bfdb0
--- /dev/null
+++ b/tests/test_end_to_end.py
@@ -0,0 +1,507 @@
+"""End-to-end integration tests for the GitHub Action workflow.
+
+These tests verify that the complete action workflow functions correctly
+with realistic test scenarios and data.
+"""
+
+import json
+import os
+import subprocess
+import sys
+import tempfile
+import time
+from pathlib import Path
+from unittest import mock
+
+import pytest
+
+
+class TestActionWorkflow:
+    """Test the complete GitHub Action workflow end-to-end."""
+
+    def create_realistic_pytest_log(self, temp_dir: Path, scenario: str) -> Path:
+        """Create realistic pytest log files for different test scenarios."""
+        scenarios = {
+            "numpy_import_failure": [
+                {"$report_type": "SessionStart", "pytest_version": "7.4.0"},
+                {
+                    "$report_type": "CollectReport",
+                    "nodeid": "",
+                    "outcome": "failed",
+                    "result": [],
+                    "longrepr": "ModuleNotFoundError: No module named 'numpy'",
+                },
+            ],
+            "mixed_failures": [
+                {"$report_type": "SessionStart", "pytest_version": "7.4.0"},
+                {
+                    "$report_type": "TestReport",
+                    "nodeid": "tests/test_data_processing.py::test_numpy_operations",
+                    "outcome": "failed",
+                    "location": ("tests/test_data_processing.py", 45, "test_numpy_operations"),
+                    "keywords": {"parametrize": True},
+                    "when": "call",
+                    "longrepr": "AssertionError: Arrays are not equal\\nExpected: [1, 2, 3]\\nActual: [1, 2, 4]",
+                },
+                {
+                    "$report_type": "TestReport",
+                    "nodeid": "tests/test_analysis.py::test_pandas_groupby[method-mean]",
+                    "outcome": "failed",
+                    "location": ("tests/test_analysis.py", 23, "test_pandas_groupby"),
+                    "keywords": {"parametrize": True},
+                    "when": "call",
+                    "longrepr": "KeyError: 'column_name'",
+                },
+                {
+                    "$report_type": "TestReport",
+                    "nodeid": "tests/test_plotting.py::test_visualization",
+                    "outcome": "passed",
+                    "location": ("tests/test_plotting.py", 67, "test_visualization"),
+                    "keywords": {},
+                    "when": "call",
+                    "longrepr": None,
+                },
+                {"$report_type": "SessionFinish", "exitstatus": "1"},
+            ],
+            "all_pass": [
+                {"$report_type": "SessionStart", "pytest_version": "7.4.0"},
+                {
+                    "$report_type": "TestReport",
+                    "nodeid": "tests/test_basic.py::test_simple",
+                    "outcome": "passed",
+                    "location": ("tests/test_basic.py", 10, "test_simple"),
+                    "keywords": {},
+                    "when": "call",
+                    "longrepr": None,
+                },
+                {"$report_type": "SessionFinish", "exitstatus": "0"},
+            ],
+        }
+
+        log_file = temp_dir / "pytest-log.jsonl"
+        with log_file.open("w") as f:
+            for record in scenarios[scenario]:
+                json.dump(record, f)
+                f.write("\n")
+
+        return log_file
+
+    def create_realistic_package_versions(self, temp_dir: Path, scenario: str) -> Path:
+        """Create realistic package version files for different scenarios."""
+        scenarios = {
+            "scientific_stack_update": {
+                "python_version": "3.11.0",
+                "python_executable": "/opt/miniconda3/bin/python",
+                "packages": {
+                    "numpy": {
+                        "version": "1.26.0.dev0+1234.g5678abc",
+                        "git_info": {"git_revision": "5678abc", "source": "version_string"}
+                    },
+                    "pandas": {
+                        "version": "2.2.0rc1",
+                        "git_info": None
+                    },
+                    "xarray": {
+                        "version": "2024.1.0",
+                        "git_info": None
+                    },
+                    "zarr": {
+                        "version": "2.16.0.dev0+123.gdef456",
+                        "git_info": {"git_revision": "def456", "source": "version_string"}
+                    },
+                },
+                "capture_method": "importlib.metadata"
+            },
+            "stable_versions": {
+                "python_version": "3.11.0",
+                "python_executable": "/usr/bin/python3",
+                "packages": {
+                    "numpy": {"version": "1.25.0", "git_info": None},
+                    "pandas": {"version": "2.1.0", "git_info": None},
+                    "xarray": {"version": "2023.8.0", "git_info": None},
+                },
+                "capture_method": "importlib.metadata"
+            },
+        }
+
+        versions_file = temp_dir / "captured-package-versions.json"
+        with versions_file.open("w") as f:
+            json.dump(scenarios[scenario], f, indent=2)
+
+        return versions_file
+
+    def test_complete_failure_workflow(self):
+        """Test the complete workflow when tests fail with package tracking."""
+        with tempfile.TemporaryDirectory() as temp_dir:
+            temp_path = Path(temp_dir)
+
+            # Create realistic test scenario files
+            log_file = self.create_realistic_pytest_log(temp_path, "mixed_failures")
+            versions_file = self.create_realistic_package_versions(temp_path, "scientific_stack_update")
+
+            # Simulate running the main workflow commands
+            env = os.environ.copy()
+            env.update({
+                "TRACK_PACKAGES": "numpy,pandas,xarray,zarr",
+                "GITHUB_WORKSPACE": str(temp_path),
+            })
+
+            # Change to temp directory for the test
+            original_cwd = os.getcwd()
+            try:
+                os.chdir(temp_path)
+
+                # Test log parsing step
+                result = subprocess.run([
+                    sys.executable, "-m", "issue_from_pytest_log_action.parse_logs",
+                    str(log_file)
+                ], env=env, capture_output=True, text=True)
+
+                assert result.returncode == 0
+                assert Path("pytest-logs.txt").exists()
+
+                # Verify log parsing output
+                log_content = Path("pytest-logs.txt").read_text()
+                assert "test_numpy_operations" in log_content
+                assert "test_pandas_groupby" in log_content
+                assert "AssertionError" in log_content
+
+                # Test bisection data creation
+                result = subprocess.run([
+                    sys.executable, "-m", "issue_from_pytest_log_action.simple_bisect",
+                    "--packages", "numpy,pandas,xarray,zarr",
+                    "--log-path", str(log_file),
+                    "--captured-versions", str(versions_file),
+                    "--branch", "test-bisect-branch",
+                    "--store-run"
+                ], env=env, capture_output=True, text=True)
+
+                assert result.returncode == 0
+
+                # Check that run file was created
+                run_files = list(Path(".").glob("run_*.json"))
+                assert len(run_files) == 1
+
+                # Verify run file content
+                run_data = json.loads(run_files[0].read_text())
+                assert run_data["test_status"] == "failed"
+                assert len(run_data["failed_tests"]) == 2
+                assert "tests/test_data_processing.py::test_numpy_operations" in run_data["failed_tests"]
+                assert "tests/test_analysis.py::test_pandas_groupby[method-mean]" in run_data["failed_tests"]
+                assert "numpy" in run_data["packages"]
+                assert "pandas" in run_data["packages"]
+
+            finally:
+                os.chdir(original_cwd)
+
+    def test_package_tracking_integration(self):
+        """Test package version tracking integration."""
+        with tempfile.TemporaryDirectory() as temp_dir:
+            env = os.environ.copy()
+            env["TRACK_PACKAGES"] = "pytest,setuptools"  # Use packages we know exist
+
+            # Test package capture
+            result = subprocess.run([
+                sys.executable, "-m", "issue_from_pytest_log_action.capture_versions"
+            ], env=env, cwd=temp_dir, capture_output=True, text=True)
+
+            assert result.returncode == 0
+
+            # Verify output file
+            output_file = Path(temp_dir) / "captured-package-versions.json"
+            assert output_file.exists()
+
+            data = json.loads(output_file.read_text())
+            assert "packages" in data
+            assert "python_version" in data
+            assert "pytest" in data["packages"]
+            assert "setuptools" in data["packages"]
+
+    def test_run_metadata_extraction(self):
+        """Test the run metadata extraction CLI."""
+        with tempfile.TemporaryDirectory() as temp_dir:
+            temp_path = Path(temp_dir)
+
+            # Create a test run file
+            run_data = {
+                "test_status": "failed",
+                "failed_tests": ["test_a.py::test_1", "test_b.py::test_2"],
+                "timestamp": "2024-01-01T10:00:00Z",
+                "packages": {"numpy": {"version": "1.25.0"}}
+            }
+
+            run_file = temp_path / "run_12345.json"
+            with run_file.open("w") as f:
+                json.dump(run_data, f)
+
+            original_cwd = os.getcwd()
+            try:
+                os.chdir(temp_path)
+
+                # Test status extraction
+                result = subprocess.run([
+                    sys.executable, "-m", "issue_from_pytest_log_action.extract_run_metadata",
+                    "test_status"
+                ], capture_output=True, text=True)
+
+                assert result.returncode == 0
+                assert result.stdout.strip() == "failed"
+
+                # Test failed count extraction
+                result = subprocess.run([
+                    sys.executable, "-m", "issue_from_pytest_log_action.extract_run_metadata",
+                    "failed_count"
+                ], capture_output=True, text=True)
+
+                assert result.returncode == 0
+                assert result.stdout.strip() == "2"
+
+            finally:
+                os.chdir(original_cwd)
+
+    def test_successful_run_workflow(self):
+        """Test workflow when all tests pass."""
+        with tempfile.TemporaryDirectory() as temp_dir:
+            temp_path = Path(temp_dir)
+
+            # Create passing test scenario
+            log_file = self.create_realistic_pytest_log(temp_path, "all_pass")
+            versions_file = self.create_realistic_package_versions(temp_path, "stable_versions")
+
+            original_cwd = os.getcwd()
+            try:
+                os.chdir(temp_path)
+
+                # Test log parsing
+                result = subprocess.run([
+                    sys.executable, "-m", "issue_from_pytest_log_action.parse_logs",
+                    str(log_file)
+                ], capture_output=True, text=True)
+
+                assert result.returncode == 0
+
+                # For passing tests, the action should still work but produce different output
+                log_content = Path("pytest-logs.txt").read_text()
+                # The exact content will depend on implementation, but it should not crash
+
+            finally:
+                os.chdir(original_cwd)
+
+    def test_error_handling(self):
+        """Test error handling for various failure modes."""
+        with tempfile.TemporaryDirectory() as temp_dir:
+            original_cwd = os.getcwd()
+            try:
+                os.chdir(temp_dir)
+
+                # Test with missing log file
+                result = subprocess.run([
+                    sys.executable, "-m", "issue_from_pytest_log_action.parse_logs",
+                    "nonexistent.jsonl"
+                ], capture_output=True, text=True)
+
+                # Should handle missing files gracefully
+                assert result.returncode != 0  # Expected to fail
+
+                # Test with invalid JSON
+                bad_log = Path("bad.jsonl")
+                bad_log.write_text("invalid json content")
+
+                result = subprocess.run([
+                    sys.executable, "-m", "issue_from_pytest_log_action.parse_logs",
+                    str(bad_log)
+                ], capture_output=True, text=True)
+
+                # Should handle invalid JSON gracefully
+                assert result.returncode != 0  # Expected to fail
+
+            finally:
+                os.chdir(original_cwd)
+
+
+class TestRealisticScenarios:
+    """Test realistic scientific computing CI/CD scenarios."""
+
+    def test_nightly_wheel_scenario(self):
+        """Test scenario with nightly wheels causing failures."""
+        with tempfile.TemporaryDirectory() as temp_dir:
+            temp_path = Path(temp_dir)
+
+            # Create scenario: numpy nightly introduced breaking change
+            test_data = [
+                {"$report_type": "SessionStart", "pytest_version": "7.4.0"},
+                {
+                    "$report_type": "TestReport",
+                    "nodeid": "tests/test_numerical.py::test_array_ops",
+                    "outcome": "failed",
+                    "location": ("tests/test_numerical.py", 15, "test_array_ops"),
+                    "keywords": {},
+                    "when": "call",
+                    "longrepr": "AttributeError: module 'numpy' has no attribute 'array_function_like'",
+                },
+                {"$report_type": "SessionFinish", "exitstatus": "1"},
+            ]
+
+            log_file = temp_path / "pytest-log.jsonl"
+            with log_file.open("w") as f:
+                for record in test_data:
+                    json.dump(record, f)
+                    f.write("\n")
+
+            # Package versions showing nightly numpy
+            package_data = {
+                "python_version": "3.11.0",
+                "packages": {
+                    "numpy": {
+                        "version": "1.26.0.dev0+1598.g1234abc",
+                        "git_info": {"git_revision": "1234abc", "source": "version_string"}
+                    },
+                    "pandas": {"version": "2.1.0", "git_info": None},
+                },
+                "capture_method": "importlib.metadata"
+            }
+
+            versions_file = temp_path / "versions.json"
+            with versions_file.open("w") as f:
+                json.dump(package_data, f)
+
+            original_cwd = os.getcwd()
+            try:
+                os.chdir(temp_path)
+
+                # Test the complete pipeline
+                result = subprocess.run([
+                    sys.executable, "-m", "issue_from_pytest_log_action.simple_bisect",
+                    "--packages", "numpy,pandas",
+                    "--log-path", str(log_file),
+                    "--captured-versions", str(versions_file),
+                    "--branch", "test-nightly-scenario",
+                    "--store-run"
+                ], capture_output=True, text=True)
+
+                assert result.returncode == 0
+
+                # Verify the run data captures the nightly version correctly
+                run_files = list(Path(".").glob("run_*.json"))
+                assert len(run_files) == 1
+
+                run_data = json.loads(run_files[0].read_text())
+                assert run_data["test_status"] == "failed"
+                numpy_info = run_data["packages"]["numpy"]
+                assert "1.26.0.dev0" in numpy_info["version"]
+                assert numpy_info["git_info"]["git_revision"] == "1234abc"
+
+            finally:
+                os.chdir(original_cwd)
+
+    def test_version_pinning_scenario(self):
+        """Test scenario where version pinning resolves issues."""
+        # This would be useful for testing the bisection feature
+        # when we have historical data showing when a test last passed
+        pass
+
+
+class TestPerformance:
+    """Test performance with large datasets."""
+
+    def test_large_log_file_handling(self):
+        """Test handling of large pytest log files."""
+        with tempfile.TemporaryDirectory() as temp_dir:
+            temp_path = Path(temp_dir)
+
+            # Create a large log file (simulate 1000 tests)
+            log_file = temp_path / "large-pytest-log.jsonl"
+
+            with log_file.open("w") as f:
+                # Session start
+                json.dump({"$report_type": "SessionStart", "pytest_version": "7.4.0"}, f)
+                f.write("\n")
+
+                # Generate many test results
+                for i in range(1000):
+                    test_result = {
+                        "$report_type": "TestReport",
+                        "nodeid": f"tests/test_module_{i % 10}.py::test_function_{i}",
+                        "outcome": "failed" if i % 50 == 0 else "passed",  # 2% failure rate
+                        "location": (f"tests/test_module_{i % 10}.py", 10 + i % 100, f"test_function_{i}"),
+                        "keywords": {},
+                        "when": "call",
+                        "longrepr": f"AssertionError: Test {i} failed" if i % 50 == 0 else None,
+                    }
+
+                    json.dump(test_result, f)
+                    f.write("\n")
+
+                # Session finish
+                json.dump({"$report_type": "SessionFinish", "exitstatus": "1"}, f)
+                f.write("\n")
+
+            start_time = time.time()
+
+            # Test parsing performance
+            result = subprocess.run([
+                sys.executable, "-m", "issue_from_pytest_log_action.parse_logs",
+                str(log_file)
+            ], cwd=temp_path, capture_output=True, text=True)
+
+            processing_time = time.time() - start_time
+
+            assert result.returncode == 0
+            assert processing_time < 5.0  # Should process 1000 tests in under 5 seconds
+
+            # Verify output
+            assert Path(temp_path / "pytest-logs.txt").exists()
+            log_content = Path(temp_path / "pytest-logs.txt").read_text()
+
+            # Should contain information about the failed tests
+            assert "test_function_" in log_content
+
+    def test_many_packages_performance(self):
+        """Test performance with many tracked packages."""
+        # Test with a scenario tracking many packages
+        env = os.environ.copy()
+        env["TRACK_PACKAGES"] = "all"  # Track all installed packages
+
+        start_time = time.time()
+
+        with tempfile.TemporaryDirectory() as temp_dir:
+            result = subprocess.run([
+                sys.executable, "-m", "issue_from_pytest_log_action.capture_versions"
+            ], env=env, cwd=temp_dir, capture_output=True, text=True)
+
+            processing_time = time.time() - start_time
+
+            assert result.returncode == 0
+            assert processing_time < 10.0  # Should complete in reasonable time
+
+            # Check that many packages were captured
+            output_file = Path(temp_dir) / "captured-package-versions.json"
+            data = json.loads(output_file.read_text())
+
+            # Should have captured multiple packages
+            assert len(data["packages"]) >= 5  # At least a few packages should be installed
+
+
+@pytest.mark.integration
+class TestGitHubActionEnvironment:
+    """Test components that simulate GitHub Actions environment."""
+
+    def test_environment_variable_handling(self):
+        """Test handling of GitHub Actions environment variables."""
+        env_vars = {
+            "GITHUB_WORKSPACE": "/github/workspace",
+            "GITHUB_REPOSITORY": "owner/repo",
+            "GITHUB_RUN_ID": "123456789",
+            "GITHUB_SHA": "abc123def456",
+        }
+
+        # These tests would verify that the action handles GitHub environment
+        # variables correctly, but we can't easily test this without actual
+        # GitHub Actions infrastructure
+        pass
+
+    def test_github_api_integration(self):
+        """Test GitHub API integration (would require mocking)."""
+        # This would test the JavaScript portion that creates issues
+        # For now, we can at least verify the data format is correct
+        pass
\ No newline at end of file
diff --git a/tests/test_parse_logs.py b/tests/test_parse_logs.py
new file mode 100644
index 0000000..f34fc3d
--- /dev/null
+++ b/tests/test_parse_logs.py
@@ -0,0 +1,482 @@
+"""Tests for parse_logs module."""
+
+import json
+import pathlib
+import tempfile
+import textwrap
+
+import pytest
+
+from issue_from_pytest_log_action.parse_logs import (
+    CollectionError,
+    PreformattedReport,
+    SessionFinish,
+    SessionStart,
+    compressed_report,
+    format_collection_error,
+    format_report,
+    format_summary,
+    include_bisection_info,
+    main,
+    merge_variants,
+    parse_nodeid,
+    parse_record,
+    strip_ansi,
+    summarize,
+    truncate,
+)
+
+
+class TestStripAnsi:
+    """Test ANSI escape sequence stripping."""
+
+    def test_strip_ansi_no_sequences(self):
+        """Test text without ANSI sequences."""
+        text = "Normal text"
+        assert strip_ansi(text) == "Normal text"
+
+    def test_strip_ansi_with_color_sequences(self):
+        """Test stripping color sequences."""
+        text = "\x1b[31mRed text\x1b[0m"
+        assert strip_ansi(text) == "Red text"
+
+    def test_strip_ansi_with_cursor_sequences(self):
+        """Test stripping cursor movement sequences."""
+        text = "\x1b[2J\x1b[HClear screen"
+        assert strip_ansi(text) == "Clear screen"
+
+    def test_strip_ansi_complex_sequences(self):
+        """Test stripping complex ANSI sequences."""
+        text = "\x1b[1;31;40mBold red on black\x1b[0m"
+        assert strip_ansi(text) == "Bold red on black"
+
+
+class TestSessionStart:
+    """Test SessionStart dataclass."""
+
+    def test_session_start_creation(self):
+        """Test creating SessionStart from JSON."""
+        data = {"$report_type": "SessionStart", "pytest_version": "7.4.0"}
+        session = SessionStart._from_json(data)
+        assert session.pytest_version == "7.4.0"
+        assert session.outcome == "status"
+
+    def test_session_start_with_custom_outcome(self):
+        """Test SessionStart with custom outcome."""
+        data = {"$report_type": "SessionStart", "pytest_version": "7.4.0", "outcome": "custom"}
+        session = SessionStart._from_json(data)
+        assert session.pytest_version == "7.4.0"
+        assert session.outcome == "custom"
+
+
+class TestSessionFinish:
+    """Test SessionFinish dataclass."""
+
+    def test_session_finish_creation(self):
+        """Test creating SessionFinish from JSON."""
+        data = {"$report_type": "SessionFinish", "exitstatus": "0"}
+        session = SessionFinish._from_json(data)
+        assert session.exitstatus == "0"
+        assert session.outcome == "status"
+
+
+class TestPreformattedReport:
+    """Test PreformattedReport dataclass."""
+
+    def test_preformatted_report_creation(self):
+        """Test creating PreformattedReport."""
+        report = PreformattedReport(
+            filepath="test.py", name="test_func", variant="param1", message="Test failed"
+        )
+        assert report.filepath == "test.py"
+        assert report.name == "test_func"
+        assert report.variant == "param1"
+        assert report.message == "Test failed"
+
+    def test_preformatted_report_strips_ansi(self):
+        """Test that PreformattedReport strips ANSI sequences."""
+        report = PreformattedReport(
+            filepath="test.py",
+            name="test_func",
+            variant=None,
+            message="\x1b[31mRed error message\x1b[0m",
+        )
+        assert report.message == "Red error message"
+
+
+class TestParseNodeid:
+    """Test nodeid parsing."""
+
+    def test_parse_nodeid_simple(self):
+        """Test parsing simple nodeid."""
+        result = parse_nodeid("test_file.py::test_function")
+        assert result == {"filepath": "test_file.py", "name": "test_function", "variant": None}
+
+    def test_parse_nodeid_with_variant(self):
+        """Test parsing nodeid with variant."""
+        result = parse_nodeid("test_file.py::test_function[param1]")
+        assert result == {"filepath": "test_file.py", "name": "test_function", "variant": "param1"}
+
+    def test_parse_nodeid_complex_variant(self):
+        """Test parsing nodeid with complex variant."""
+        result = parse_nodeid("test_file.py::test_function[param1-value2]")
+        assert result == {
+            "filepath": "test_file.py",
+            "name": "test_function",
+            "variant": "param1-value2",
+        }
+
+    def test_parse_nodeid_invalid(self):
+        """Test parsing invalid nodeid."""
+        with pytest.raises(ValueError, match="unknown test id"):
+            parse_nodeid("invalid_nodeid")
+
+
+class TestParseRecord:
+    """Test record parsing."""
+
+    def test_parse_record_session_start(self):
+        """Test parsing SessionStart record."""
+        record = {"$report_type": "SessionStart", "pytest_version": "7.4.0"}
+        result = parse_record(record)
+        assert isinstance(result, SessionStart)
+        assert result.pytest_version == "7.4.0"
+
+    def test_parse_record_session_finish(self):
+        """Test parsing SessionFinish record."""
+        record = {"$report_type": "SessionFinish", "exitstatus": "0"}
+        result = parse_record(record)
+        assert isinstance(result, SessionFinish)
+        assert result.exitstatus == "0"
+
+    def test_parse_record_unknown_type(self):
+        """Test parsing unknown record type."""
+        record = {"$report_type": "UnknownType", "data": "value"}
+        with pytest.raises(ValueError, match="unknown report type"):
+            parse_record(record)
+
+
+class TestFormatSummary:
+    """Test summary formatting."""
+
+    def test_format_summary_with_variant(self):
+        """Test formatting summary with variant."""
+        report = PreformattedReport(
+            filepath="test.py", name="test_func", variant="param1", message="Failed"
+        )
+        result = format_summary(report)
+        assert result == "test.py::test_func[param1]: Failed"
+
+    def test_format_summary_without_variant(self):
+        """Test formatting summary without variant."""
+        report = PreformattedReport(
+            filepath="test.py", name="test_func", variant=None, message="Failed"
+        )
+        result = format_summary(report)
+        assert result == "test.py::test_func: Failed"
+
+    def test_format_summary_no_name(self):
+        """Test formatting summary without function name."""
+        report = PreformattedReport(filepath="test.py", name=None, variant=None, message="Failed")
+        result = format_summary(report)
+        assert result == "test.py: Failed"
+
+
+class TestFormatReport:
+    """Test report formatting."""
+
+    def test_format_report_basic(self):
+        """Test basic report formatting."""
+        summaries = ["test1.py::test_func: Failed", "test2.py::test_other: Error"]
+        result = format_report(summaries, "3.9")
+
+        expected = textwrap.dedent("""\
+        <details><summary>Python 3.9 Test Summary</summary>
+
+        ```
+        test1.py::test_func: Failed
+        test2.py::test_other: Error
+        ```
+
+        </details>
+        """)
+        assert result == expected
+
+    def test_format_report_empty(self):
+        """Test report formatting with no summaries."""
+        result = format_report([], "3.9")
+        expected = textwrap.dedent("""\
+        <details><summary>Python 3.9 Test Summary</summary>
+
+        ```
+
+        ```
+
+        </details>
+        """)
+        assert result == expected
+
+
+class TestMergeVariants:
+    """Test variant merging functionality."""
+
+    def test_merge_variants_single_variant(self):
+        """Test merging with single variant."""
+        reports = [
+            PreformattedReport(
+                filepath="test.py", name="test_func", variant="param1", message="Failed"
+            )
+        ]
+        result = merge_variants(reports, max_chars=1000, py_version="3.9")
+        assert "test.py::test_func[param1]: Failed" in result
+
+    def test_merge_variants_multiple_variants(self):
+        """Test merging multiple variants of same test."""
+        reports = [
+            PreformattedReport(
+                filepath="test.py", name="test_func", variant="param1", message="Failed"
+            ),
+            PreformattedReport(
+                filepath="test.py", name="test_func", variant="param2", message="Failed"
+            ),
+        ]
+        result = merge_variants(reports, max_chars=1000, py_version="3.9")
+        assert "test.py::test_func[2 failing variants]: Failed" in result
+
+    def test_merge_variants_no_variant(self):
+        """Test merging with no variants."""
+        reports = [
+            PreformattedReport(filepath="test.py", name="test_func", variant=None, message="Failed")
+        ]
+        result = merge_variants(reports, max_chars=1000, py_version="3.9")
+        assert "test.py::test_func: Failed" in result
+
+
+class TestTruncate:
+    """Test truncation functionality."""
+
+    def test_truncate_fits_all(self):
+        """Test truncation when all reports fit."""
+        reports = [
+            PreformattedReport(
+                filepath="test.py", name="test_func1", variant=None, message="Failed"
+            ),
+            PreformattedReport(
+                filepath="test.py", name="test_func2", variant=None, message="Failed"
+            ),
+        ]
+        result = truncate(reports, max_chars=10000, py_version="3.9")
+        assert result is not None
+        # truncate function always tries fractions, so check for the actual behavior
+        # With 2 reports and 95% fraction, we get 1 report + summary
+        assert "test.py::test_func1: Failed" in result
+        assert "+ 1 failing tests" in result
+
+    def test_truncate_needs_truncation(self):
+        """Test truncation when reports need to be truncated."""
+        reports = [
+            PreformattedReport(
+                filepath="test.py", name=f"test_func{i}", variant=None, message="Failed"
+            )
+            for i in range(100)
+        ]
+        result = truncate(reports, max_chars=500, py_version="3.9")
+        assert result is not None
+        assert "failing tests" in result
+
+    def test_truncate_too_large(self):
+        """Test truncation when even smallest result is too large."""
+        reports = [
+            PreformattedReport(
+                filepath="very_long_filename_that_exceeds_limits.py",
+                name="very_long_function_name_that_also_exceeds_limits",
+                variant=None,
+                message="Very long error message that makes everything too large for limits",
+            )
+            for i in range(10)
+        ]
+        result = truncate(reports, max_chars=50, py_version="3.9")
+        assert result is None
+
+
+class TestSummarize:
+    """Test summarize functionality."""
+
+    def test_summarize_multiple_reports(self):
+        """Test summarizing multiple reports."""
+        reports = [
+            PreformattedReport(
+                filepath="test.py", name="test_func1", variant=None, message="Failed"
+            ),
+            PreformattedReport(
+                filepath="test.py", name="test_func2", variant=None, message="Failed"
+            ),
+            PreformattedReport(
+                filepath="test.py", name="test_func3", variant=None, message="Failed"
+            ),
+        ]
+        result = summarize(reports, py_version="3.9")
+        assert "3 failing tests" in result
+
+    def test_summarize_single_report(self):
+        """Test summarizing single report."""
+        reports = [
+            PreformattedReport(filepath="test.py", name="test_func", variant=None, message="Failed")
+        ]
+        result = summarize(reports, py_version="3.9")
+        assert "1 failing tests" in result
+
+
+class TestCompressedReport:
+    """Test compressed report functionality."""
+
+    def test_compressed_report_fits_all(self):
+        """Test compressed report when all fits."""
+        reports = [
+            PreformattedReport(filepath="test.py", name="test_func", variant=None, message="Failed")
+        ]
+        result = compressed_report(reports, max_chars=10000, py_version="3.9")
+        assert "test.py::test_func: Failed" in result
+
+    def test_compressed_report_needs_compression(self):
+        """Test compressed report with compression needed."""
+        reports = [
+            PreformattedReport(
+                filepath="test.py", name=f"test_func{i}", variant=None, message="Failed"
+            )
+            for i in range(100)
+        ]
+        result = compressed_report(reports, max_chars=500, py_version="3.9")
+        assert result is not None
+        assert "failing tests" in result
+
+
+class TestFormatCollectionError:
+    """Test collection error formatting."""
+
+    def test_format_collection_error(self):
+        """Test formatting collection error."""
+        error = CollectionError(
+            name="test collection session", repr_="ImportError: No module named 'missing'"
+        )
+        result = format_collection_error(error, py_version="3.9")
+
+        assert "Python 3.9 Test Summary" in result
+        assert "test collection session failed:" in result
+        assert "ImportError: No module named 'missing'" in result
+
+
+class TestIncludeBisectionInfo:
+    """Test bisection info inclusion."""
+
+    def test_include_bisection_info_no_file(self):
+        """Test when bisection file doesn't exist."""
+        message = "Original message"
+        result = include_bisection_info(message, bisect_file="nonexistent.txt")
+        assert result == "Original message"
+
+    def test_include_bisection_info_with_file(self):
+        """Test when bisection file exists."""
+        with tempfile.NamedTemporaryFile(mode="w", suffix=".txt", delete=False) as f:
+            f.write("Bisection info: Package X changed from v1.0 to v2.0")
+            bisect_file = f.name
+
+        try:
+            message = "Original message"
+            result = include_bisection_info(message, bisect_file=bisect_file)
+            expected = "Bisection info: Package X changed from v1.0 to v2.0\nOriginal message"
+            assert result == expected
+        finally:
+            pathlib.Path(bisect_file).unlink()
+
+    def test_include_bisection_info_empty_file(self):
+        """Test when bisection file is empty."""
+        with tempfile.NamedTemporaryFile(mode="w", suffix=".txt", delete=False) as f:
+            f.write("")
+            bisect_file = f.name
+
+        try:
+            message = "Original message"
+            result = include_bisection_info(message, bisect_file=bisect_file)
+            assert result == "Original message"
+        finally:
+            pathlib.Path(bisect_file).unlink()
+
+
+class TestMain:
+    """Test main function."""
+
+    def test_main_with_test_data(self):
+        """Test main function with test data."""
+        # Create test log data with proper TestReport fields
+        test_data = [
+            {"$report_type": "SessionStart", "pytest_version": "7.4.0"},
+            {
+                "$report_type": "TestReport",
+                "nodeid": "test_example.py::test_failing",
+                "outcome": "failed",
+                "location": ("test_example.py", 10, "test_failing"),
+                "keywords": {},
+                "when": "call",
+                "longrepr": "AssertionError: Expected True",
+            },
+            {"$report_type": "SessionFinish", "exitstatus": "1"},
+        ]
+
+        with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as f:
+            for item in test_data:
+                json.dump(item, f)
+                f.write("\n")
+            log_file = f.name
+
+        try:
+            # Test main function
+            main([log_file])
+
+            # Check output file was created
+            output_file = pathlib.Path("pytest-logs.txt")
+            assert output_file.exists()
+
+            content = output_file.read_text()
+            assert "test_example.py::test_failing" in content
+            assert "AssertionError: Expected True" in content
+
+        finally:
+            pathlib.Path(log_file).unlink()
+            output_file = pathlib.Path("pytest-logs.txt")
+            if output_file.exists():
+                output_file.unlink()
+
+    def test_main_with_collection_error(self):
+        """Test main function with collection error."""
+        test_data = [
+            {
+                "$report_type": "CollectReport",
+                "nodeid": "",
+                "outcome": "failed",
+                "result": [],  # Required field for CollectReport
+                "longrepr": "ImportError: No module named 'missing_module'",
+            }
+        ]
+
+        with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as f:
+            for item in test_data:
+                json.dump(item, f)
+                f.write("\n")
+            log_file = f.name
+
+        try:
+            main([log_file])
+
+            output_file = pathlib.Path("pytest-logs.txt")
+            assert output_file.exists()
+
+            content = output_file.read_text()
+            assert "test collection session failed:" in content
+            assert "ImportError: No module named 'missing_module'" in content
+
+        finally:
+            pathlib.Path(log_file).unlink()
+            output_file = pathlib.Path("pytest-logs.txt")
+            if output_file.exists():
+                output_file.unlink()
diff --git a/tests/test_scientific_packages.py b/tests/test_scientific_packages.py
new file mode 100644
index 0000000..3920a55
--- /dev/null
+++ b/tests/test_scientific_packages.py
@@ -0,0 +1,263 @@
+"""Tests focused on key scientific packages: pandas, zarr, numpy, and xarray.
+
+These tests focus on real-world scenarios with the main scientific computing packages
+that users are most likely to encounter in their CI/CD pipelines.
+"""
+
+import json
+import tempfile
+from pathlib import Path
+from unittest import mock
+
+import pytest
+
+from issue_from_pytest_log_action.capture_versions import extract_git_info
+from issue_from_pytest_log_action.track_packages import (
+    clean_version_for_tag,
+    format_version_with_git,
+    generate_package_diff_link,
+    get_package_changes,
+)
+
+
+class TestScientificPackageMetadata:
+    """Test metadata for core scientific packages."""
+
+    def test_numpy_metadata(self):
+        """Test numpy package diff link generation."""
+        link = generate_package_diff_link("numpy", "1.24.0", "1.25.0")
+        assert link is not None
+        assert "github.com/numpy/numpy/compare" in link
+        assert "v1.24.0...v1.25.0" in link
+
+    def test_pandas_metadata(self):
+        """Test pandas package diff link generation."""
+        link = generate_package_diff_link("pandas", "2.0.0", "2.1.0")
+        assert link is not None
+        assert "github.com/pandas-dev/pandas/compare" in link
+        assert "v2.0.0...v2.1.0" in link
+
+    def test_xarray_metadata(self):
+        """Test xarray package diff link generation."""
+        link = generate_package_diff_link("xarray", "2023.1.0", "2023.2.0")
+        assert link is not None
+        assert "github.com/pydata/xarray/compare" in link
+        assert "v2023.1.0...v2023.2.0" in link
+
+    def test_zarr_metadata(self):
+        """Test zarr package diff link generation."""
+        link = generate_package_diff_link("zarr", "2.14.0", "2.15.0")
+        assert link is not None
+        assert "github.com/zarr-developers/zarr-python/compare" in link
+        assert "v2.14.0...v2.15.0" in link
+
+
+class TestScientificPackageVersionCleaning:
+    """Test version cleaning for scientific packages with realistic versions."""
+
+    def test_numpy_nightly_versions(self):
+        """Test cleaning numpy nightly versions."""
+        # NumPy nightly format: 1.26.0.dev0+1234.g5678abc
+        assert clean_version_for_tag("1.26.0.dev0+1234.g5678abc") == "1.26.0"
+        assert clean_version_for_tag("2.0.0.dev0+456.gabc123d") == "2.0.0"
+
+    def test_pandas_rc_versions(self):
+        """Test cleaning pandas release candidate versions."""
+        assert clean_version_for_tag("2.1.0rc1") == "2.1.0rc1"
+        assert clean_version_for_tag("2.2.0rc2.dev0+123.gabc") == "2.2.0rc2"
+
+    def test_xarray_alpha_versions(self):
+        """Test cleaning xarray alpha versions."""
+        assert clean_version_for_tag("2024.1.0a1") == "2024.1.0a1"
+        assert clean_version_for_tag("2024.2.0a2.dev0+git.abc123") == "2024.2.0a2"
+
+    def test_zarr_dev_versions(self):
+        """Test cleaning zarr development versions."""
+        assert clean_version_for_tag("2.16.0.dev0") == "2.16.0"
+        assert clean_version_for_tag("3.0.0.dev123+g456def") == "3.0.0"
+
+
+class TestScientificPackageChanges:
+    """Test package change detection for scientific computing stacks."""
+
+    def test_scientific_stack_upgrade(self):
+        """Test detecting changes in a typical scientific computing stack."""
+        current = {
+            "numpy": {"version": "1.25.0", "git_info": {"git_revision": "abc123"}},
+            "pandas": {"version": "2.1.0", "git_info": None},
+            "xarray": {"version": "2023.8.0", "git_info": None},
+            "zarr": {"version": "2.15.0", "git_info": {"git_revision": "def456"}},
+        }
+
+        previous = {
+            "numpy": {"version": "1.24.0", "git_info": {"git_revision": "xyz789"}},
+            "pandas": {"version": "2.0.0", "git_info": None},
+            "xarray": {"version": "2023.7.0", "git_info": None},
+            "zarr": {"version": "2.14.0", "git_info": {"git_revision": "uvw012"}},
+        }
+
+        changes = get_package_changes(current, previous)
+
+        # Should detect all 4 package changes
+        assert len(changes) == 4
+
+        # Check that all packages are mentioned
+        change_text = " ".join(changes)
+        assert "numpy" in change_text
+        assert "pandas" in change_text
+        assert "xarray" in change_text
+        assert "zarr" in change_text
+
+        # Check version changes
+        assert "1.24.0" in change_text and "1.25.0" in change_text
+        assert "2.0.0" in change_text and "2.1.0" in change_text
+
+    def test_nightly_wheel_installation(self):
+        """Test tracking nightly wheel installations."""
+        current = {
+            "numpy": {
+                "version": "1.26.0.dev0+1234.g5678abc",
+                "git_info": {"git_revision": "5678abc", "source": "version_string"}
+            },
+            "pandas": {
+                "version": "2.2.0.dev0+567.gdef123",
+                "git_info": {"git_revision": "def123", "source": "version_string"}
+            },
+        }
+
+        previous = {
+            "numpy": {"version": "1.25.0", "git_info": None},
+            "pandas": {"version": "2.1.0", "git_info": None},
+        }
+
+        changes = get_package_changes(current, previous)
+
+        assert len(changes) == 2
+        change_text = " ".join(changes)
+
+        # Should show git hashes for nightly versions
+        assert "(5678abc)" in change_text
+        assert "(def123)" in change_text
+
+    def test_new_scientific_dependency(self):
+        """Test detecting new scientific package additions."""
+        current = {
+            "numpy": {"version": "1.25.0", "git_info": None},
+            "pandas": {"version": "2.1.0", "git_info": None},
+            "xarray": {"version": "2023.8.0", "git_info": None},  # New dependency
+        }
+
+        previous = {
+            "numpy": {"version": "1.25.0", "git_info": None},
+            "pandas": {"version": "2.1.0", "git_info": None},
+        }
+
+        changes = get_package_changes(current, previous)
+
+        assert len(changes) == 1
+        assert "xarray" in changes[0]
+        assert "(new)" in changes[0]
+        assert "2023.8.0" in changes[0]
+
+
+class TestScientificPackageGitInfo:
+    """Test git info extraction for scientific packages."""
+
+    def test_format_numpy_with_git_info(self):
+        """Test formatting numpy with git revision."""
+        package_info = {
+            "version": "1.26.0.dev0+1234.g5678abc",
+            "git_info": {"git_revision": "5678abcdef123456789"}
+        }
+
+        result = format_version_with_git(package_info)
+        assert result == "1.26.0.dev0+1234.g5678abc (5678abcd)"
+
+    def test_format_pandas_without_git_info(self):
+        """Test formatting pandas without git revision."""
+        package_info = {"version": "2.1.0", "git_info": None}
+
+        result = format_version_with_git(package_info)
+        assert result == "2.1.0"
+
+    def test_extract_git_from_nightly_versions(self):
+        """Test extracting git info from nightly package versions."""
+        # Test various nightly version formats
+        test_cases = [
+            ("numpy", "1.26.0.dev0+1234.g5678abc", "5678abc"),
+            ("pandas", "2.2.0.dev0+567.gdef123", "def123"),
+            ("xarray", "2024.1.0.dev0+89.gabc456", "abc456"),
+        ]
+
+        for package, version, expected_hash in test_cases:
+            with mock.patch("issue_from_pytest_log_action.capture_versions.extract_git_info") as mock_extract:
+                mock_extract.return_value = {"git_revision": expected_hash, "source": "version_string"}
+
+                git_info = extract_git_info(package)
+
+                if git_info:
+                    assert git_info["git_revision"] == expected_hash
+                    assert git_info["source"] == "version_string"
+
+
+class TestScientificPackageIntegration:
+    """Integration tests for scientific package tracking."""
+
+    def test_capture_scientific_packages(self):
+        """Test capturing versions of key scientific packages."""
+        import os
+        import subprocess
+        import sys
+
+        # Test with packages that are commonly available
+        test_packages = "pytest,setuptools"  # Use packages we know exist
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            env = os.environ.copy()
+            env["TRACK_PACKAGES"] = test_packages
+
+            result = subprocess.run(
+                [sys.executable, "-m", "issue_from_pytest_log_action.capture_versions"],
+                env=env,
+                cwd=tmpdir,
+                capture_output=True,
+                text=True,
+            )
+
+            assert result.returncode == 0
+
+            # Check that output file was created
+            output_file = Path(tmpdir) / "captured-package-versions.json"
+            assert output_file.exists()
+
+            # Check content
+            data = json.loads(output_file.read_text())
+            assert "packages" in data
+            assert "python_version" in data
+
+            # Should have captured the test packages
+            packages = data["packages"]
+            assert "pytest" in packages
+            assert "setuptools" in packages
+
+    def test_diff_links_for_scientific_packages(self):
+        """Test that diff links work for all key scientific packages."""
+        scientific_packages = ["numpy", "pandas", "xarray", "zarr"]
+
+        for package in scientific_packages:
+            # Test basic version diff
+            link = generate_package_diff_link(package, "1.0.0", "1.1.0")
+            assert link is not None, f"Failed to generate diff link for {package}"
+            assert f"github.com" in link
+            assert package in link or package.replace("-", "") in link
+
+            # Test with git commit info
+            old_git_info = {"git_revision": "abc123"}
+            new_git_info = {"git_revision": "def456"}
+
+            link_with_git = generate_package_diff_link(
+                package, "1.0.0", "1.1.0", old_git_info, new_git_info
+            )
+            assert link_with_git is not None
+            assert "abc123" in link_with_git
+            assert "def456" in link_with_git
\ No newline at end of file
diff --git a/tests/test_simple_bisect.py b/tests/test_simple_bisect.py
new file mode 100644
index 0000000..3d1575a
--- /dev/null
+++ b/tests/test_simple_bisect.py
@@ -0,0 +1,309 @@
+"""Tests for simple_bisect module."""
+
+import json
+import tempfile
+from pathlib import Path
+from unittest import mock
+
+import pytest
+
+from issue_from_pytest_log_action.simple_bisect import main
+
+
+class TestSimpleBisectMain:
+    """Test simple_bisect main function."""
+
+    def test_main_store_run_success(self):
+        """Test storing a run successfully."""
+        # Create test log file
+        test_log_data = [
+            {"$report_type": "SessionStart", "pytest_version": "7.4.0"},
+            {
+                "$report_type": "TestReport",
+                "nodeid": "test_example.py::test_failing",
+                "outcome": "failed",
+                "location": ("test_example.py", 10, "test_failing"),
+                "keywords": {},
+                "when": "call",
+                "longrepr": "Test failed",
+            },
+            {"$report_type": "SessionFinish", "exitstatus": "1"},
+        ]
+
+        # Create test captured versions file
+        test_versions = {
+            "python_version": "3.9.0",
+            "packages": {
+                "numpy": {"version": "1.21.0", "git_info": {"revision": "abc123"}},
+                "pandas": {"version": "1.3.0", "git_info": None},
+            },
+        }
+
+        with tempfile.TemporaryDirectory() as temp_dir:
+            temp_path = Path(temp_dir)
+
+            # Write test files
+            log_file = temp_path / "test.jsonl"
+            versions_file = temp_path / "versions.json"
+
+            with log_file.open("w") as f:
+                for item in test_log_data:
+                    json.dump(item, f)
+                    f.write("\n")
+
+            with versions_file.open("w") as f:
+                json.dump(test_versions, f)
+
+            # Test storing run
+            args = [
+                "--packages",
+                "numpy,pandas",
+                "--log-path",
+                str(log_file),
+                "--captured-versions",
+                str(versions_file),
+                "--branch",
+                "test-branch",
+                "--store-run",
+            ]
+
+            # Change to temp directory to capture output files
+            import os
+
+            original_cwd = os.getcwd()
+            try:
+                os.chdir(temp_dir)
+                main(args)
+
+                # Check that a run file was created
+                run_files = list(Path(".").glob("run_*.json"))
+                assert len(run_files) == 1
+
+                # Verify run file content
+                run_data = json.loads(run_files[0].read_text())
+                assert run_data["test_status"] == "failed"
+                assert len(run_data["failed_tests"]) == 1
+                assert run_data["failed_tests"][0] == "test_example.py::test_failing"
+                assert "numpy" in run_data["packages"]
+                assert "pandas" in run_data["packages"]
+
+            finally:
+                os.chdir(original_cwd)
+
+    def test_main_store_run_passed_tests(self):
+        """Test storing a run with passed tests."""
+        test_log_data = [
+            {"$report_type": "SessionStart", "pytest_version": "7.4.0"},
+            {
+                "$report_type": "TestReport",
+                "nodeid": "test_example.py::test_passing",
+                "outcome": "passed",
+            },
+            {"$report_type": "SessionFinish", "exitstatus": "0"},
+        ]
+
+        test_versions = {
+            "python_version": "3.9.0",
+            "packages": {"numpy": {"version": "1.21.0", "git_info": None}},
+        }
+
+        with tempfile.TemporaryDirectory() as temp_dir:
+            temp_path = Path(temp_dir)
+            log_file = temp_path / "test.jsonl"
+            versions_file = temp_path / "versions.json"
+
+            with log_file.open("w") as f:
+                for item in test_log_data:
+                    json.dump(item, f)
+                    f.write("\n")
+
+            with versions_file.open("w") as f:
+                json.dump(test_versions, f)
+
+            import os
+
+            original_cwd = os.getcwd()
+            try:
+                os.chdir(temp_dir)
+                main(
+                    [
+                        "--packages",
+                        "numpy",
+                        "--log-path",
+                        str(log_file),
+                        "--captured-versions",
+                        str(versions_file),
+                        "--branch",
+                        "test-branch",
+                        "--store-run",
+                    ]
+                )
+
+                run_files = list(Path(".").glob("run_*.json"))
+                assert len(run_files) == 1
+
+                run_data = json.loads(run_files[0].read_text())
+                assert run_data["test_status"] == "passed"
+                assert len(run_data["failed_tests"]) == 0
+
+            finally:
+                os.chdir(original_cwd)
+
+    def test_main_generate_comparison_no_data(self):
+        """Test generating comparison with no historical data."""
+        test_log_data = [{"$report_type": "SessionFinish", "exitstatus": "1"}]
+        test_versions = {"python_version": "3.9.0", "packages": {}}
+
+        with tempfile.TemporaryDirectory() as temp_dir:
+            temp_path = Path(temp_dir)
+            log_file = temp_path / "test.jsonl"
+            versions_file = temp_path / "versions.json"
+
+            with log_file.open("w") as f:
+                for item in test_log_data:
+                    json.dump(item, f)
+                    f.write("\n")
+
+            with versions_file.open("w") as f:
+                json.dump(test_versions, f)
+
+            import os
+
+            original_cwd = os.getcwd()
+            try:
+                os.chdir(temp_dir)
+                main(
+                    [
+                        "--packages",
+                        "numpy",
+                        "--log-path",
+                        str(log_file),
+                        "--captured-versions",
+                        str(versions_file),
+                        "--branch",
+                        "test-branch",
+                        "--generate-comparison",
+                    ]
+                )
+
+                # Check that bisect-comparison.txt was NOT created (no failed tests)
+                comparison_file = Path("bisect-comparison.txt")
+                assert not comparison_file.exists()
+
+            finally:
+                os.chdir(original_cwd)
+
+    @mock.patch("subprocess.run")
+    def test_main_generate_comparison_with_data(self, mock_subprocess):
+        """Test generating comparison with historical data."""
+        # Mock git log to return fake historical data
+        mock_result = mock.Mock()
+        mock_result.stdout = json.dumps(
+            {
+                "timestamp": "2024-01-01T10:00:00Z",
+                "test_status": "passed",
+                "packages": {"numpy": {"version": "1.20.0", "git_info": None}},
+                "failed_tests": [],
+            }
+        )
+        mock_result.returncode = 0
+        mock_subprocess.return_value = mock_result
+
+        test_log_data = [
+            {
+                "$report_type": "TestReport",
+                "nodeid": "test_example.py::test_failing",
+                "outcome": "failed",
+                "location": ("test_example.py", 10, "test_failing"),
+                "keywords": {},
+                "when": "call",
+                "longrepr": "Test failed",
+            },
+            {"$report_type": "SessionFinish", "exitstatus": "1"},
+        ]
+        test_versions = {
+            "python_version": "3.9.0",
+            "packages": {"numpy": {"version": "1.21.0", "git_info": None}},
+        }
+
+        with tempfile.TemporaryDirectory() as temp_dir:
+            temp_path = Path(temp_dir)
+            log_file = temp_path / "test.jsonl"
+            versions_file = temp_path / "versions.json"
+
+            with log_file.open("w") as f:
+                for item in test_log_data:
+                    json.dump(item, f)
+                    f.write("\n")
+
+            with versions_file.open("w") as f:
+                json.dump(test_versions, f)
+
+            import os
+
+            original_cwd = os.getcwd()
+            try:
+                os.chdir(temp_dir)
+                main(
+                    [
+                        "--packages",
+                        "numpy",
+                        "--log-path",
+                        str(log_file),
+                        "--captured-versions",
+                        str(versions_file),
+                        "--branch",
+                        "test-branch",
+                        "--generate-comparison",
+                    ]
+                )
+
+                comparison_file = Path("bisect-comparison.txt")
+                assert comparison_file.exists()
+
+                content = comparison_file.read_text()
+                # Should contain comparison information
+                assert content.strip() != ""
+
+            finally:
+                os.chdir(original_cwd)
+
+    def test_main_invalid_args(self):
+        """Test main with invalid arguments."""
+        with pytest.raises(SystemExit):
+            main(["--invalid-arg"])
+
+    def test_main_missing_required_args(self):
+        """Test main with missing required arguments."""
+        with pytest.raises(SystemExit):
+            main(["--store-run"])
+
+    def test_main_missing_files(self):
+        """Test main with missing input files."""
+        with tempfile.TemporaryDirectory() as temp_dir:
+            import os
+
+            original_cwd = os.getcwd()
+            try:
+                os.chdir(temp_dir)
+                # This should fail gracefully - the specific behavior depends on implementation
+                # At minimum it shouldn't crash with unhandled exceptions
+                try:
+                    main(
+                        [
+                            "--packages",
+                            "numpy",
+                            "--log-path",
+                            "nonexistent.jsonl",
+                            "--captured-versions",
+                            "nonexistent.json",
+                            "--branch",
+                            "test-branch",
+                            "--store-run",
+                        ]
+                    )
+                except (FileNotFoundError, SystemExit):
+                    # Expected behavior when files don't exist
+                    pass
+            finally:
+                os.chdir(original_cwd)
diff --git a/tests/test_track_packages.py b/tests/test_track_packages.py
new file mode 100644
index 0000000..d470ab6
--- /dev/null
+++ b/tests/test_track_packages.py
@@ -0,0 +1,503 @@
+"""Tests for track_packages module."""
+
+import json
+import subprocess
+import tempfile
+from pathlib import Path
+from unittest import mock
+
+from issue_from_pytest_log_action.track_packages import (
+    PACKAGE_METADATA,
+    clean_version_for_tag,
+    create_bisect_data,
+    extract_failed_tests_from_log,
+    find_last_successful_run_for_tests,
+    format_bisect_comparison,
+    generate_package_diff_link,
+    get_git_info,
+    get_package_changes,
+    retrieve_last_successful_run,
+)
+
+
+class TestPackageMetadata:
+    """Test package metadata constants."""
+
+    def test_package_metadata_structure(self):
+        """Test that package metadata has expected structure."""
+        assert isinstance(PACKAGE_METADATA, dict)
+        assert "numpy" in PACKAGE_METADATA
+        assert "github" in PACKAGE_METADATA["numpy"]
+        assert "tag_format" in PACKAGE_METADATA["numpy"]
+
+    def test_tag_formats(self):
+        """Test that tag formats are reasonable."""
+        for pkg, meta in PACKAGE_METADATA.items():
+            tag_format = meta["tag_format"]
+            assert "{version}" in tag_format
+            # Tag format should produce a valid tag
+            test_version = "1.0.0"
+            tag = tag_format.format(version=test_version)
+            assert test_version in tag
+
+
+class TestCleanVersionForTag:
+    """Test version cleaning for tag generation."""
+
+    def test_clean_stable_version(self):
+        """Test cleaning stable version."""
+        assert clean_version_for_tag("1.2.3") == "1.2.3"
+        assert clean_version_for_tag("2.0.0") == "2.0.0"
+
+    def test_clean_dev_version(self):
+        """Test cleaning dev version."""
+        assert clean_version_for_tag("1.2.3.dev0") == "1.2.3"
+        assert clean_version_for_tag("2.0.0.dev123") == "2.0.0"
+
+    def test_clean_nightly_version(self):
+        """Test cleaning nightly version."""
+        assert clean_version_for_tag("1.2.3.dev0+123.gabc123d") == "1.2.3"
+        assert clean_version_for_tag("2.1.0.dev0+456.gdef456a") == "2.1.0"
+
+    def test_clean_rc_version(self):
+        """Test cleaning release candidate version."""
+        assert clean_version_for_tag("1.2.3rc1") == "1.2.3rc1"
+        assert clean_version_for_tag("2.0.0a1") == "2.0.0a1"
+
+    def test_clean_post_version(self):
+        """Test cleaning post-release version."""
+        assert clean_version_for_tag("1.2.3.post1") == "1.2.3"
+        assert clean_version_for_tag("2.0.0.post123") == "2.0.0"
+
+    def test_clean_complex_version(self):
+        """Test cleaning complex version with multiple suffixes."""
+        assert clean_version_for_tag("1.2.3a1.dev0+abc.g123456") == "1.2.3a1"
+        assert clean_version_for_tag("2.0.0rc1.post1.dev0") == "2.0.0rc1"
+
+
+class TestGeneratePackageDiffLink:
+    """Test package diff link generation."""
+
+    def test_generate_diff_link_numpy(self):
+        """Test diff link for numpy."""
+        link = generate_package_diff_link("numpy", "1.21.0", "1.22.0")
+        assert link is not None
+        assert "github.com/numpy/numpy/compare" in link
+        assert "v1.21.0" in link
+        assert "v1.22.0" in link
+
+    def test_generate_diff_link_with_git_commit(self):
+        """Test diff link with git commit info."""
+        old_git_info = {"git_revision": "abc123"}
+        new_git_info = {"git_revision": "def456"}
+
+        link = generate_package_diff_link("numpy", "1.21.0", "1.22.0", old_git_info, new_git_info)
+        assert link is not None
+        assert "github.com/numpy/numpy/compare" in link
+        assert "abc123" in link
+        assert "def456" in link
+
+    def test_generate_diff_link_sqlalchemy_prefix(self):
+        """Test diff link for SQLAlchemy with rel_ prefix."""
+        link = generate_package_diff_link("sqlalchemy", "1.4.0", "1.4.1")
+        assert link is not None
+        assert "github.com/sqlalchemy/sqlalchemy/compare" in link
+        assert "rel_1_4_0" in link
+        assert "rel_1_4_1" in link
+
+    def test_generate_diff_link_unknown_package(self):
+        """Test diff link for unknown package."""
+        link = generate_package_diff_link("unknown_package", "1.0.0", "2.0.0")
+        assert link is None
+
+
+class TestGetPackageChanges:
+    """Test package change detection."""
+
+    def test_get_package_changes_version_change(self):
+        """Test detecting version changes."""
+        old_packages = {"numpy": "1.21.0", "pandas": "1.3.0"}
+        new_packages = {"numpy": "1.22.0", "pandas": "1.3.0"}
+
+        changes = get_package_changes(new_packages, old_packages)
+        assert len(changes) == 1
+        assert "numpy: 1.21.0 → 1.22.0" in changes[0]
+
+    def test_get_package_changes_new_package(self):
+        """Test detecting new packages."""
+        old_packages = {"numpy": "1.21.0"}
+        new_packages = {"numpy": "1.21.0", "pandas": "1.3.0"}
+
+        changes = get_package_changes(new_packages, old_packages)
+        assert len(changes) == 1
+        assert "pandas: (new) → 1.3.0" in changes[0]
+
+    def test_get_package_changes_removed_package(self):
+        """Test detecting removed packages."""
+        old_packages = {"numpy": "1.21.0", "pandas": "1.3.0"}
+        new_packages = {"numpy": "1.21.0"}
+
+        changes = get_package_changes(new_packages, old_packages)
+        assert len(changes) == 1
+        assert "pandas: 1.3.0 → (removed)" in changes[0]
+
+    def test_get_package_changes_no_changes(self):
+        """Test when there are no changes."""
+        packages = {"numpy": "1.21.0", "pandas": "1.3.0"}
+
+        changes = get_package_changes(packages, packages)
+        assert len(changes) == 0
+
+    def test_get_package_changes_multiple_changes(self):
+        """Test multiple package changes."""
+        old_packages = {"numpy": "1.21.0", "pandas": "1.3.0", "scipy": "1.7.0"}
+        new_packages = {"numpy": "1.22.0", "pandas": "1.3.0", "matplotlib": "3.5.0"}
+
+        changes = get_package_changes(new_packages, old_packages)
+        assert len(changes) == 3  # numpy changed, scipy removed, matplotlib added
+
+
+# Note: format_package_changes function doesn't exist in the module
+# Removed tests for non-existent function
+
+
+class TestExtractFailedTestsFromLog:
+    """Test failed test extraction from log files."""
+
+    def test_extract_failed_tests_basic(self):
+        """Test extracting failed tests from log."""
+        test_data = [
+            {"$report_type": "TestReport", "nodeid": "test1.py::test_func1", "outcome": "failed"},
+            {"$report_type": "TestReport", "nodeid": "test2.py::test_func2", "outcome": "passed"},
+            {"$report_type": "TestReport", "nodeid": "test3.py::test_func3", "outcome": "failed"},
+        ]
+
+        with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as f:
+            for item in test_data:
+                json.dump(item, f)
+                f.write("\n")
+            log_file = f.name
+
+        try:
+            failed_tests = extract_failed_tests_from_log(log_file)
+            assert len(failed_tests) == 2
+            assert "test1.py::test_func1" in failed_tests
+            assert "test3.py::test_func3" in failed_tests
+            assert "test2.py::test_func2" not in failed_tests
+        finally:
+            Path(log_file).unlink()
+
+    def test_extract_failed_tests_no_failures(self):
+        """Test extracting when no tests failed."""
+        test_data = [
+            {"$report_type": "TestReport", "nodeid": "test1.py::test_func1", "outcome": "passed"},
+            {"$report_type": "SessionFinish", "exitstatus": "0"},
+        ]
+
+        with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as f:
+            for item in test_data:
+                json.dump(item, f)
+                f.write("\n")
+            log_file = f.name
+
+        try:
+            failed_tests = extract_failed_tests_from_log(log_file)
+            assert len(failed_tests) == 0
+        finally:
+            Path(log_file).unlink()
+
+    def test_extract_failed_tests_nonexistent_file(self):
+        """Test extracting from non-existent file."""
+        failed_tests = extract_failed_tests_from_log("nonexistent.jsonl")
+        assert failed_tests == []
+
+    def test_extract_failed_tests_invalid_json(self):
+        """Test extracting from file with invalid JSON."""
+        with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as f:
+            f.write("invalid json line\n")
+            f.write(
+                '{"$report_type": "TestReport", "outcome": "failed", "nodeid": "test.py::test"}\n'
+            )
+            log_file = f.name
+
+        try:
+            failed_tests = extract_failed_tests_from_log(log_file)
+            assert len(failed_tests) == 1
+            assert "test.py::test" in failed_tests
+        finally:
+            Path(log_file).unlink()
+
+
+class TestGetGitInfo:
+    """Test git information extraction."""
+
+    @mock.patch("subprocess.run")
+    def test_get_git_info_success(self, mock_subprocess):
+        """Test successful git info extraction."""
+
+        # Mock git commands
+        def mock_run(cmd, *args, **kwargs):
+            result = mock.Mock()
+            result.returncode = 0
+            cmd_str = " ".join(cmd) if isinstance(cmd, list) else cmd
+            if "rev-parse HEAD" in cmd_str:
+                result.stdout = "abc123def456789\n"
+            elif "rev-parse --short HEAD" in cmd_str:
+                result.stdout = "abc123d\n"
+            elif "log -1 --pretty=format:%s" in cmd_str:
+                result.stdout = "Fix critical bug\n"
+            elif "log -1 --pretty=format:%an <%ae>" in cmd_str:
+                result.stdout = "John Doe <john@example.com>\n"
+            elif "log -1 --pretty=format:%ci" in cmd_str:
+                result.stdout = "2024-01-01 10:00:00 +0000\n"
+            return result
+
+        mock_subprocess.side_effect = mock_run
+
+        git_info = get_git_info()
+
+        assert git_info["commit_hash"] == "abc123def456789"
+        assert git_info["commit_hash_short"] == "abc123de"
+        assert git_info["commit_message"] == "Fix critical bug"
+        assert git_info["commit_author"] == "John Doe <john@example.com>"
+        assert git_info["commit_date"] == "2024-01-01 10:00:00 +0000"
+
+    @mock.patch("subprocess.run")
+    def test_get_git_info_failure(self, mock_subprocess):
+        """Test git info extraction when git fails."""
+        mock_subprocess.side_effect = subprocess.CalledProcessError(1, "git")
+
+        git_info = get_git_info()
+
+        assert git_info["commit_hash"] == "unknown"
+        assert git_info["commit_hash_short"] == "unknown"
+        assert git_info["commit_message"] == "unknown"
+        assert git_info["commit_author"] == "unknown"
+        assert git_info["commit_date"] == "unknown"
+
+
+class TestCreateBisectData:
+    """Test bisect data creation."""
+
+    def test_create_bisect_data_with_failed_tests(self):
+        """Test creating bisect data with failed tests."""
+        packages = ["numpy", "pandas"]
+
+        # Create test log file with failed tests
+        test_log_data = [
+            {"$report_type": "TestReport", "nodeid": "test1.py::test_func", "outcome": "failed"},
+        ]
+
+        # Create test captured versions
+        test_versions = {
+            "python_version": "3.9.0",
+            "packages": {
+                "numpy": {"version": "1.21.0", "git_info": None},
+                "pandas": {"version": "1.3.0", "git_info": None},
+            },
+        }
+
+        with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as log_f:
+            for item in test_log_data:
+                json.dump(item, log_f)
+                log_f.write("\n")
+            log_path = log_f.name
+
+        with tempfile.NamedTemporaryFile(mode="w", suffix=".json", delete=False) as ver_f:
+            json.dump(test_versions, ver_f)
+            versions_path = ver_f.name
+
+        try:
+            bisect_data = create_bisect_data(packages, log_path, versions_path)
+
+            assert bisect_data["test_status"] == "failed"
+            assert len(bisect_data["failed_tests"]) == 1
+            assert "test1.py::test_func" in bisect_data["failed_tests"]
+            assert "numpy" in bisect_data["packages"]
+            assert "pandas" in bisect_data["packages"]
+            assert bisect_data["python_version"] == "3.9.0"
+            assert "timestamp" in bisect_data
+            assert "git" in bisect_data
+
+        finally:
+            Path(log_path).unlink()
+            Path(versions_path).unlink()
+
+    def test_create_bisect_data_no_failed_tests(self):
+        """Test creating bisect data with no failed tests."""
+        packages = ["numpy"]
+
+        test_log_data = [
+            {"$report_type": "TestReport", "nodeid": "test1.py::test_func", "outcome": "passed"},
+        ]
+
+        test_versions = {
+            "python_version": "3.9.0",
+            "packages": {"numpy": {"version": "1.21.0", "git_info": None}},
+        }
+
+        with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as log_f:
+            for item in test_log_data:
+                json.dump(item, log_f)
+                log_f.write("\n")
+            log_path = log_f.name
+
+        with tempfile.NamedTemporaryFile(mode="w", suffix=".json", delete=False) as ver_f:
+            json.dump(test_versions, ver_f)
+            versions_path = ver_f.name
+
+        try:
+            bisect_data = create_bisect_data(packages, log_path, versions_path)
+
+            assert bisect_data["test_status"] == "passed"
+            assert len(bisect_data["failed_tests"]) == 0
+
+        finally:
+            Path(log_path).unlink()
+            Path(versions_path).unlink()
+
+
+class TestRetrieveLastSuccessfulRun:
+    """Test retrieving last successful run."""
+
+    def test_retrieve_last_successful_run_no_files(self):
+        """Test when no run files exist."""
+        with tempfile.TemporaryDirectory() as temp_dir:
+            import os
+
+            original_cwd = os.getcwd()
+            try:
+                os.chdir(temp_dir)
+                result = retrieve_last_successful_run("test-branch")
+                assert result is None
+            finally:
+                os.chdir(original_cwd)
+
+    @mock.patch("subprocess.run")
+    def test_retrieve_last_successful_run_with_files(self, mock_subprocess):
+        """Test finding last successful run with existing files."""
+        # Mock git operations to succeed
+        def mock_run(cmd, *args, **kwargs):
+            result = mock.Mock()
+            result.returncode = 0
+            cmd_str = " ".join(cmd) if isinstance(cmd, list) else cmd
+            if "ls-remote --heads origin" in cmd_str:
+                # Return branch reference to indicate it exists
+                result.stdout = "abc123\trefs/heads/test-branch\n"
+            elif "fetch origin" in cmd_str:
+                result.stdout = ""
+            elif "ls-tree -r --name-only" in cmd_str:
+                # Return list of JSON files in the branch
+                result.stdout = "run_0.json\nrun_1.json\n"
+            elif "show test-branch:run_0.json" in cmd_str:
+                # Return failed run data
+                result.stdout = json.dumps({
+                    "timestamp": "2024-01-01T10:00:00Z",
+                    "test_status": "failed",
+                    "packages": {"numpy": {"version": "1.21.0"}},
+                })
+            elif "show test-branch:run_1.json" in cmd_str:
+                # Return passed run data
+                result.stdout = json.dumps({
+                    "timestamp": "2024-01-01T09:00:00Z",
+                    "test_status": "passed",
+                    "packages": {"numpy": {"version": "1.20.0"}},
+                })
+            else:
+                result.stdout = ""
+            return result
+
+        mock_subprocess.side_effect = mock_run
+        test_runs = [
+            {
+                "timestamp": "2024-01-01T10:00:00Z",
+                "test_status": "failed",
+                "packages": {"numpy": {"version": "1.21.0"}},
+            },
+            {
+                "timestamp": "2024-01-01T09:00:00Z",
+                "test_status": "passed",
+                "packages": {"numpy": {"version": "1.20.0"}},
+            },
+        ]
+
+        with tempfile.TemporaryDirectory() as temp_dir:
+            temp_path = Path(temp_dir)
+
+            # Create run files
+            for i, run_data in enumerate(test_runs):
+                run_file = temp_path / f"run_{i}.json"
+                run_file.write_text(json.dumps(run_data))
+
+            import os
+
+            original_cwd = os.getcwd()
+            try:
+                os.chdir(temp_dir)
+                result = retrieve_last_successful_run("test-branch")
+                # Should find the passed run
+                assert result is not None
+                assert result["test_status"] == "passed"
+                assert result["packages"]["numpy"]["version"] == "1.20.0"
+            finally:
+                os.chdir(original_cwd)
+
+
+class TestFormatBisectComparison:
+    """Test bisection comparison formatting."""
+
+    def test_format_bisect_comparison_no_failed_tests(self):
+        """Test formatting when there are no failed tests."""
+        current_data = {
+            "failed_tests": [],
+            "test_status": "passed",
+            "packages": {"numpy": {"version": "1.21.0"}},
+        }
+
+        result = format_bisect_comparison(current_data, None, "test-branch")
+        assert result is None
+
+    def test_format_bisect_comparison_no_previous_data(self):
+        """Test formatting when there's no previous data."""
+        current_data = {
+            "failed_tests": ["test1.py::test_func"],
+            "test_status": "failed",
+            "packages": {"numpy": {"version": "1.21.0"}},
+            "git": {"commit_hash": "abc123"},
+        }
+
+        result = format_bisect_comparison(current_data, None, "test-branch")
+        assert result is not None
+        assert "No recent successful run found for this test" in result
+        assert "test1.py::test_func" in result
+
+    @mock.patch("issue_from_pytest_log_action.track_packages.find_last_successful_run_for_tests")
+    def test_format_bisect_comparison_with_changes(self, mock_find_success):
+        """Test formatting comparison with package changes."""
+        mock_find_success.return_value = {
+            "test1.py::test_func": {
+                "packages": {"numpy": {"version": "1.20.0", "git_info": None}},
+                "git": {"commit_hash": "def456"},
+                "workflow_run_id": "12345",
+                "timestamp": "2024-01-01T10:00:00Z",
+            }
+        }
+
+        current_data = {
+            "failed_tests": ["test1.py::test_func"],
+            "test_status": "failed",
+            "packages": {"numpy": {"version": "1.21.0", "git_info": None}},
+            "git": {"commit_hash": "abc123"},
+        }
+
+        previous_data = {
+            "test_status": "passed",
+            "packages": {"numpy": {"version": "1.20.0"}},
+        }
+
+        result = format_bisect_comparison(current_data, previous_data, "test-branch")
+        assert result is not None
+        assert "test1.py::test_func" in result
+        assert "1.20.0" in result
+        assert "1.21.0" in result
+
diff --git a/tests/test_version_extraction.py b/tests/test_version_extraction.py
index 4d305a8..d3816bc 100644
--- a/tests/test_version_extraction.py
+++ b/tests/test_version_extraction.py
@@ -201,7 +201,7 @@ def test_package_changes_mixed_formats(self):
     def test_package_changes_new_package(self):
         """Test detecting new packages."""
         current = {"pandas": "1.5.0"}
-        previous = {}
+        previous: dict[str, str] = {}
 
         changes = get_package_changes(current, previous)
 
@@ -210,7 +210,7 @@ def test_package_changes_new_package(self):
 
     def test_package_changes_removed_package(self):
         """Test detecting removed packages."""
-        current = {}
+        current: dict[str, str] = {}
         previous = {"pandas": "1.4.0"}
 
         changes = get_package_changes(current, previous)

From af97e5ca90a36747640a41266dfa59c46c4175d6 Mon Sep 17 00:00:00 2001
From: Ian Hunt-Isaak <ianhuntisaak@gmail.com>
Date: Mon, 29 Sep 2025 16:34:16 -0400
Subject: [PATCH 15/15] Apply pre-commit formatting fixes
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Fix import organization and code formatting from pre-commit hooks

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
---
 tests/test_end_to_end.py          | 234 +++++++++++++++++++-----------
 tests/test_scientific_packages.py |  21 +--
 tests/test_track_packages.py      |  27 ++--
 3 files changed, 177 insertions(+), 105 deletions(-)

diff --git a/tests/test_end_to_end.py b/tests/test_end_to_end.py
index 63bfdb0..2ecc2e6 100644
--- a/tests/test_end_to_end.py
+++ b/tests/test_end_to_end.py
@@ -11,7 +11,6 @@
 import tempfile
 import time
 from pathlib import Path
-from unittest import mock
 
 import pytest
 
@@ -95,22 +94,16 @@ def create_realistic_package_versions(self, temp_dir: Path, scenario: str) -> Pa
                 "packages": {
                     "numpy": {
                         "version": "1.26.0.dev0+1234.g5678abc",
-                        "git_info": {"git_revision": "5678abc", "source": "version_string"}
-                    },
-                    "pandas": {
-                        "version": "2.2.0rc1",
-                        "git_info": None
-                    },
-                    "xarray": {
-                        "version": "2024.1.0",
-                        "git_info": None
+                        "git_info": {"git_revision": "5678abc", "source": "version_string"},
                     },
+                    "pandas": {"version": "2.2.0rc1", "git_info": None},
+                    "xarray": {"version": "2024.1.0", "git_info": None},
                     "zarr": {
                         "version": "2.16.0.dev0+123.gdef456",
-                        "git_info": {"git_revision": "def456", "source": "version_string"}
+                        "git_info": {"git_revision": "def456", "source": "version_string"},
                     },
                 },
-                "capture_method": "importlib.metadata"
+                "capture_method": "importlib.metadata",
             },
             "stable_versions": {
                 "python_version": "3.11.0",
@@ -120,7 +113,7 @@ def create_realistic_package_versions(self, temp_dir: Path, scenario: str) -> Pa
                     "pandas": {"version": "2.1.0", "git_info": None},
                     "xarray": {"version": "2023.8.0", "git_info": None},
                 },
-                "capture_method": "importlib.metadata"
+                "capture_method": "importlib.metadata",
             },
         }
 
@@ -137,14 +130,18 @@ def test_complete_failure_workflow(self):
 
             # Create realistic test scenario files
             log_file = self.create_realistic_pytest_log(temp_path, "mixed_failures")
-            versions_file = self.create_realistic_package_versions(temp_path, "scientific_stack_update")
+            versions_file = self.create_realistic_package_versions(
+                temp_path, "scientific_stack_update"
+            )
 
             # Simulate running the main workflow commands
             env = os.environ.copy()
-            env.update({
-                "TRACK_PACKAGES": "numpy,pandas,xarray,zarr",
-                "GITHUB_WORKSPACE": str(temp_path),
-            })
+            env.update(
+                {
+                    "TRACK_PACKAGES": "numpy,pandas,xarray,zarr",
+                    "GITHUB_WORKSPACE": str(temp_path),
+                }
+            )
 
             # Change to temp directory for the test
             original_cwd = os.getcwd()
@@ -152,10 +149,17 @@ def test_complete_failure_workflow(self):
                 os.chdir(temp_path)
 
                 # Test log parsing step
-                result = subprocess.run([
-                    sys.executable, "-m", "issue_from_pytest_log_action.parse_logs",
-                    str(log_file)
-                ], env=env, capture_output=True, text=True)
+                result = subprocess.run(
+                    [
+                        sys.executable,
+                        "-m",
+                        "issue_from_pytest_log_action.parse_logs",
+                        str(log_file),
+                    ],
+                    env=env,
+                    capture_output=True,
+                    text=True,
+                )
 
                 assert result.returncode == 0
                 assert Path("pytest-logs.txt").exists()
@@ -167,14 +171,25 @@ def test_complete_failure_workflow(self):
                 assert "AssertionError" in log_content
 
                 # Test bisection data creation
-                result = subprocess.run([
-                    sys.executable, "-m", "issue_from_pytest_log_action.simple_bisect",
-                    "--packages", "numpy,pandas,xarray,zarr",
-                    "--log-path", str(log_file),
-                    "--captured-versions", str(versions_file),
-                    "--branch", "test-bisect-branch",
-                    "--store-run"
-                ], env=env, capture_output=True, text=True)
+                result = subprocess.run(
+                    [
+                        sys.executable,
+                        "-m",
+                        "issue_from_pytest_log_action.simple_bisect",
+                        "--packages",
+                        "numpy,pandas,xarray,zarr",
+                        "--log-path",
+                        str(log_file),
+                        "--captured-versions",
+                        str(versions_file),
+                        "--branch",
+                        "test-bisect-branch",
+                        "--store-run",
+                    ],
+                    env=env,
+                    capture_output=True,
+                    text=True,
+                )
 
                 assert result.returncode == 0
 
@@ -186,8 +201,14 @@ def test_complete_failure_workflow(self):
                 run_data = json.loads(run_files[0].read_text())
                 assert run_data["test_status"] == "failed"
                 assert len(run_data["failed_tests"]) == 2
-                assert "tests/test_data_processing.py::test_numpy_operations" in run_data["failed_tests"]
-                assert "tests/test_analysis.py::test_pandas_groupby[method-mean]" in run_data["failed_tests"]
+                assert (
+                    "tests/test_data_processing.py::test_numpy_operations"
+                    in run_data["failed_tests"]
+                )
+                assert (
+                    "tests/test_analysis.py::test_pandas_groupby[method-mean]"
+                    in run_data["failed_tests"]
+                )
                 assert "numpy" in run_data["packages"]
                 assert "pandas" in run_data["packages"]
 
@@ -201,9 +222,13 @@ def test_package_tracking_integration(self):
             env["TRACK_PACKAGES"] = "pytest,setuptools"  # Use packages we know exist
 
             # Test package capture
-            result = subprocess.run([
-                sys.executable, "-m", "issue_from_pytest_log_action.capture_versions"
-            ], env=env, cwd=temp_dir, capture_output=True, text=True)
+            result = subprocess.run(
+                [sys.executable, "-m", "issue_from_pytest_log_action.capture_versions"],
+                env=env,
+                cwd=temp_dir,
+                capture_output=True,
+                text=True,
+            )
 
             assert result.returncode == 0
 
@@ -227,7 +252,7 @@ def test_run_metadata_extraction(self):
                 "test_status": "failed",
                 "failed_tests": ["test_a.py::test_1", "test_b.py::test_2"],
                 "timestamp": "2024-01-01T10:00:00Z",
-                "packages": {"numpy": {"version": "1.25.0"}}
+                "packages": {"numpy": {"version": "1.25.0"}},
             }
 
             run_file = temp_path / "run_12345.json"
@@ -239,19 +264,31 @@ def test_run_metadata_extraction(self):
                 os.chdir(temp_path)
 
                 # Test status extraction
-                result = subprocess.run([
-                    sys.executable, "-m", "issue_from_pytest_log_action.extract_run_metadata",
-                    "test_status"
-                ], capture_output=True, text=True)
+                result = subprocess.run(
+                    [
+                        sys.executable,
+                        "-m",
+                        "issue_from_pytest_log_action.extract_run_metadata",
+                        "test_status",
+                    ],
+                    capture_output=True,
+                    text=True,
+                )
 
                 assert result.returncode == 0
                 assert result.stdout.strip() == "failed"
 
                 # Test failed count extraction
-                result = subprocess.run([
-                    sys.executable, "-m", "issue_from_pytest_log_action.extract_run_metadata",
-                    "failed_count"
-                ], capture_output=True, text=True)
+                result = subprocess.run(
+                    [
+                        sys.executable,
+                        "-m",
+                        "issue_from_pytest_log_action.extract_run_metadata",
+                        "failed_count",
+                    ],
+                    capture_output=True,
+                    text=True,
+                )
 
                 assert result.returncode == 0
                 assert result.stdout.strip() == "2"
@@ -266,22 +303,28 @@ def test_successful_run_workflow(self):
 
             # Create passing test scenario
             log_file = self.create_realistic_pytest_log(temp_path, "all_pass")
-            versions_file = self.create_realistic_package_versions(temp_path, "stable_versions")
+            self.create_realistic_package_versions(temp_path, "stable_versions")
 
             original_cwd = os.getcwd()
             try:
                 os.chdir(temp_path)
 
                 # Test log parsing
-                result = subprocess.run([
-                    sys.executable, "-m", "issue_from_pytest_log_action.parse_logs",
-                    str(log_file)
-                ], capture_output=True, text=True)
+                result = subprocess.run(
+                    [
+                        sys.executable,
+                        "-m",
+                        "issue_from_pytest_log_action.parse_logs",
+                        str(log_file),
+                    ],
+                    capture_output=True,
+                    text=True,
+                )
 
                 assert result.returncode == 0
 
                 # For passing tests, the action should still work but produce different output
-                log_content = Path("pytest-logs.txt").read_text()
+                Path("pytest-logs.txt").read_text()
                 # The exact content will depend on implementation, but it should not crash
 
             finally:
@@ -295,10 +338,16 @@ def test_error_handling(self):
                 os.chdir(temp_dir)
 
                 # Test with missing log file
-                result = subprocess.run([
-                    sys.executable, "-m", "issue_from_pytest_log_action.parse_logs",
-                    "nonexistent.jsonl"
-                ], capture_output=True, text=True)
+                result = subprocess.run(
+                    [
+                        sys.executable,
+                        "-m",
+                        "issue_from_pytest_log_action.parse_logs",
+                        "nonexistent.jsonl",
+                    ],
+                    capture_output=True,
+                    text=True,
+                )
 
                 # Should handle missing files gracefully
                 assert result.returncode != 0  # Expected to fail
@@ -307,10 +356,11 @@ def test_error_handling(self):
                 bad_log = Path("bad.jsonl")
                 bad_log.write_text("invalid json content")
 
-                result = subprocess.run([
-                    sys.executable, "-m", "issue_from_pytest_log_action.parse_logs",
-                    str(bad_log)
-                ], capture_output=True, text=True)
+                result = subprocess.run(
+                    [sys.executable, "-m", "issue_from_pytest_log_action.parse_logs", str(bad_log)],
+                    capture_output=True,
+                    text=True,
+                )
 
                 # Should handle invalid JSON gracefully
                 assert result.returncode != 0  # Expected to fail
@@ -354,11 +404,11 @@ def test_nightly_wheel_scenario(self):
                 "packages": {
                     "numpy": {
                         "version": "1.26.0.dev0+1598.g1234abc",
-                        "git_info": {"git_revision": "1234abc", "source": "version_string"}
+                        "git_info": {"git_revision": "1234abc", "source": "version_string"},
                     },
                     "pandas": {"version": "2.1.0", "git_info": None},
                 },
-                "capture_method": "importlib.metadata"
+                "capture_method": "importlib.metadata",
             }
 
             versions_file = temp_path / "versions.json"
@@ -370,14 +420,24 @@ def test_nightly_wheel_scenario(self):
                 os.chdir(temp_path)
 
                 # Test the complete pipeline
-                result = subprocess.run([
-                    sys.executable, "-m", "issue_from_pytest_log_action.simple_bisect",
-                    "--packages", "numpy,pandas",
-                    "--log-path", str(log_file),
-                    "--captured-versions", str(versions_file),
-                    "--branch", "test-nightly-scenario",
-                    "--store-run"
-                ], capture_output=True, text=True)
+                result = subprocess.run(
+                    [
+                        sys.executable,
+                        "-m",
+                        "issue_from_pytest_log_action.simple_bisect",
+                        "--packages",
+                        "numpy,pandas",
+                        "--log-path",
+                        str(log_file),
+                        "--captured-versions",
+                        str(versions_file),
+                        "--branch",
+                        "test-nightly-scenario",
+                        "--store-run",
+                    ],
+                    capture_output=True,
+                    text=True,
+                )
 
                 assert result.returncode == 0
 
@@ -419,11 +479,15 @@ def test_large_log_file_handling(self):
 
                 # Generate many test results
                 for i in range(1000):
-                    test_result = {
+                    test_result: dict = {
                         "$report_type": "TestReport",
                         "nodeid": f"tests/test_module_{i % 10}.py::test_function_{i}",
                         "outcome": "failed" if i % 50 == 0 else "passed",  # 2% failure rate
-                        "location": (f"tests/test_module_{i % 10}.py", 10 + i % 100, f"test_function_{i}"),
+                        "location": (
+                            f"tests/test_module_{i % 10}.py",
+                            10 + i % 100,
+                            f"test_function_{i}",
+                        ),
                         "keywords": {},
                         "when": "call",
                         "longrepr": f"AssertionError: Test {i} failed" if i % 50 == 0 else None,
@@ -439,10 +503,12 @@ def test_large_log_file_handling(self):
             start_time = time.time()
 
             # Test parsing performance
-            result = subprocess.run([
-                sys.executable, "-m", "issue_from_pytest_log_action.parse_logs",
-                str(log_file)
-            ], cwd=temp_path, capture_output=True, text=True)
+            result = subprocess.run(
+                [sys.executable, "-m", "issue_from_pytest_log_action.parse_logs", str(log_file)],
+                cwd=temp_path,
+                capture_output=True,
+                text=True,
+            )
 
             processing_time = time.time() - start_time
 
@@ -465,9 +531,13 @@ def test_many_packages_performance(self):
         start_time = time.time()
 
         with tempfile.TemporaryDirectory() as temp_dir:
-            result = subprocess.run([
-                sys.executable, "-m", "issue_from_pytest_log_action.capture_versions"
-            ], env=env, cwd=temp_dir, capture_output=True, text=True)
+            result = subprocess.run(
+                [sys.executable, "-m", "issue_from_pytest_log_action.capture_versions"],
+                env=env,
+                cwd=temp_dir,
+                capture_output=True,
+                text=True,
+            )
 
             processing_time = time.time() - start_time
 
@@ -488,12 +558,8 @@ class TestGitHubActionEnvironment:
 
     def test_environment_variable_handling(self):
         """Test handling of GitHub Actions environment variables."""
-        env_vars = {
-            "GITHUB_WORKSPACE": "/github/workspace",
-            "GITHUB_REPOSITORY": "owner/repo",
-            "GITHUB_RUN_ID": "123456789",
-            "GITHUB_SHA": "abc123def456",
-        }
+        # Test environment variable scenarios
+        # In real usage, these would come from GitHub Actions environment
 
         # These tests would verify that the action handles GitHub environment
         # variables correctly, but we can't easily test this without actual
@@ -504,4 +570,4 @@ def test_github_api_integration(self):
         """Test GitHub API integration (would require mocking)."""
         # This would test the JavaScript portion that creates issues
         # For now, we can at least verify the data format is correct
-        pass
\ No newline at end of file
+        pass
diff --git a/tests/test_scientific_packages.py b/tests/test_scientific_packages.py
index 3920a55..fbd6dc2 100644
--- a/tests/test_scientific_packages.py
+++ b/tests/test_scientific_packages.py
@@ -9,8 +9,6 @@
 from pathlib import Path
 from unittest import mock
 
-import pytest
-
 from issue_from_pytest_log_action.capture_versions import extract_git_info
 from issue_from_pytest_log_action.track_packages import (
     clean_version_for_tag,
@@ -117,11 +115,11 @@ def test_nightly_wheel_installation(self):
         current = {
             "numpy": {
                 "version": "1.26.0.dev0+1234.g5678abc",
-                "git_info": {"git_revision": "5678abc", "source": "version_string"}
+                "git_info": {"git_revision": "5678abc", "source": "version_string"},
             },
             "pandas": {
                 "version": "2.2.0.dev0+567.gdef123",
-                "git_info": {"git_revision": "def123", "source": "version_string"}
+                "git_info": {"git_revision": "def123", "source": "version_string"},
             },
         }
 
@@ -167,7 +165,7 @@ def test_format_numpy_with_git_info(self):
         """Test formatting numpy with git revision."""
         package_info = {
             "version": "1.26.0.dev0+1234.g5678abc",
-            "git_info": {"git_revision": "5678abcdef123456789"}
+            "git_info": {"git_revision": "5678abcdef123456789"},
         }
 
         result = format_version_with_git(package_info)
@@ -190,8 +188,13 @@ def test_extract_git_from_nightly_versions(self):
         ]
 
         for package, version, expected_hash in test_cases:
-            with mock.patch("issue_from_pytest_log_action.capture_versions.extract_git_info") as mock_extract:
-                mock_extract.return_value = {"git_revision": expected_hash, "source": "version_string"}
+            with mock.patch(
+                "issue_from_pytest_log_action.capture_versions.extract_git_info"
+            ) as mock_extract:
+                mock_extract.return_value = {
+                    "git_revision": expected_hash,
+                    "source": "version_string",
+                }
 
                 git_info = extract_git_info(package)
 
@@ -248,7 +251,7 @@ def test_diff_links_for_scientific_packages(self):
             # Test basic version diff
             link = generate_package_diff_link(package, "1.0.0", "1.1.0")
             assert link is not None, f"Failed to generate diff link for {package}"
-            assert f"github.com" in link
+            assert "github.com" in link
             assert package in link or package.replace("-", "") in link
 
             # Test with git commit info
@@ -260,4 +263,4 @@ def test_diff_links_for_scientific_packages(self):
             )
             assert link_with_git is not None
             assert "abc123" in link_with_git
-            assert "def456" in link_with_git
\ No newline at end of file
+            assert "def456" in link_with_git
diff --git a/tests/test_track_packages.py b/tests/test_track_packages.py
index d470ab6..7a997ed 100644
--- a/tests/test_track_packages.py
+++ b/tests/test_track_packages.py
@@ -11,7 +11,6 @@
     clean_version_for_tag,
     create_bisect_data,
     extract_failed_tests_from_log,
-    find_last_successful_run_for_tests,
     format_bisect_comparison,
     generate_package_diff_link,
     get_git_info,
@@ -376,6 +375,7 @@ def test_retrieve_last_successful_run_no_files(self):
     @mock.patch("subprocess.run")
     def test_retrieve_last_successful_run_with_files(self, mock_subprocess):
         """Test finding last successful run with existing files."""
+
         # Mock git operations to succeed
         def mock_run(cmd, *args, **kwargs):
             result = mock.Mock()
@@ -391,18 +391,22 @@ def mock_run(cmd, *args, **kwargs):
                 result.stdout = "run_0.json\nrun_1.json\n"
             elif "show test-branch:run_0.json" in cmd_str:
                 # Return failed run data
-                result.stdout = json.dumps({
-                    "timestamp": "2024-01-01T10:00:00Z",
-                    "test_status": "failed",
-                    "packages": {"numpy": {"version": "1.21.0"}},
-                })
+                result.stdout = json.dumps(
+                    {
+                        "timestamp": "2024-01-01T10:00:00Z",
+                        "test_status": "failed",
+                        "packages": {"numpy": {"version": "1.21.0"}},
+                    }
+                )
             elif "show test-branch:run_1.json" in cmd_str:
                 # Return passed run data
-                result.stdout = json.dumps({
-                    "timestamp": "2024-01-01T09:00:00Z",
-                    "test_status": "passed",
-                    "packages": {"numpy": {"version": "1.20.0"}},
-                })
+                result.stdout = json.dumps(
+                    {
+                        "timestamp": "2024-01-01T09:00:00Z",
+                        "test_status": "passed",
+                        "packages": {"numpy": {"version": "1.20.0"}},
+                    }
+                )
             else:
                 result.stdout = ""
             return result
@@ -500,4 +504,3 @@ def test_format_bisect_comparison_with_changes(self, mock_find_success):
         assert "test1.py::test_func" in result
         assert "1.20.0" in result
         assert "1.21.0" in result
-