From 79e7c09b9c6ed58d09dd689b7ed5efc6e5db5813 Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Tue, 7 Apr 2026 16:18:27 -0700
Subject: [PATCH 01/15] ref: Remove Kafka/Arroyo consumer code

Launchpad has fully migrated to TaskWorker mode for processing
artifacts. Remove all Kafka/Arroyo consumer infrastructure since
it is no longer in use.

Deleted:
- kafka.py (consumer, strategies, config)
- service.py (Kafka+HTTP orchestrator)
- arroyo_metrics.py (Arroyo metrics backend)
- ensure_kafka_topics.py and test_kafka.py scripts
- Kafka integration and E2E tests

Updated:
- CLI: removed `serve` command, worker is the only mode
- Dockerfile: default CMD changed from serve to worker
- CI: removed Kafka from test job, removed e2e job
- devservices: removed Kafka dependency
- Relocated ServiceConfig to artifact_processor.py
- Removed sentry-kafka-schemas and kafka-python deps

Note: sentry-arroyo and confluent-kafka remain as deps because
worker/app.py still uses KafkaProducer (to be cleaned up separately).

Co-Authored-By: Claude <noreply@anthropic.com>
---
 .github/workflows/ci.yml                      | 168 +-------
 Dockerfile                                    |   2 +-
 Makefile                                      |  49 +--
 devservices/config.yml                        |  31 +-
 docker-compose.e2e.yml                        |  34 +-
 requirements-dev.txt                          |   1 -
 requirements.txt                              |   1 -
 scripts/ensure_kafka_topics.py                |  67 ---
 scripts/test_kafka.py                         | 107 -----
 src/launchpad/artifact_processor.py           |  37 +-
 src/launchpad/cli.py                          |  58 ---
 src/launchpad/constants.py                    |   3 -
 src/launchpad/kafka.py                        | 390 ------------------
 src/launchpad/service.py                      | 163 --------
 src/launchpad/utils/arroyo_metrics.py         |  48 ---
 src/launchpad/utils/logging.py                |   2 -
 tests/e2e/test_e2e_flow.py                    | 319 +-------------
 tests/integration/test_kafka_service.py       | 242 -----------
 tests/integration/test_launchpad_service.py   |  51 +--
 .../unit/artifacts/test_artifact_processor.py |   4 +-
 20 files changed, 59 insertions(+), 1718 deletions(-)
 delete mode 100755 scripts/ensure_kafka_topics.py
 delete mode 100755 scripts/test_kafka.py
 delete mode 100644 src/launchpad/kafka.py
 delete mode 100644 src/launchpad/service.py
 delete mode 100644 src/launchpad/utils/arroyo_metrics.py
 delete mode 100644 tests/integration/test_kafka_service.py

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index dd542858..a4f1d938 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -64,191 +64,25 @@ jobs:
       - name: Install dependencies
         run: make install-dev
 
-      - name: Start Kafka with devservices
-        run: |
-          .venv/bin/devservices up --mode default
-
-          echo "Waiting for Kafka to be ready..."
-          KAFKA_READY=false
-          for i in {1..30}; do
-            KAFKA_CONTAINER=$(docker ps -qf "name=kafka")
-            if [ -z "$KAFKA_CONTAINER" ]; then
-              echo "Waiting for Kafka container to start... attempt $i/30"
-              sleep 2
-              continue
-            fi
-
-            HEALTH_STATUS=$(docker inspect --format='{{.State.Health.Status}}' $KAFKA_CONTAINER 2>/dev/null || echo "none")
-            if [ "$HEALTH_STATUS" = "healthy" ]; then
-              echo "Kafka is ready!"
-              KAFKA_READY=true
-              break
-            fi
-            echo "Waiting for Kafka health check (status: $HEALTH_STATUS)... attempt $i/30"
-            sleep 2
-          done
-
-          if [ "$KAFKA_READY" = "false" ]; then
-            echo "ERROR: Kafka failed to become healthy after 60 seconds"
-            echo "=== Docker containers ==="
-            docker ps -a
-            echo "=== Kafka logs ==="
-            docker logs $(docker ps -aqf "name=kafka") --tail 100 || echo "Could not get Kafka logs"
-            exit 1
-          fi
-
-          docker ps
-
       - name: Build Docker image with test fixtures
         run: docker build --build-arg TEST_BUILD=true -t launchpad-test .
 
       - name: Run all tests in Docker
         run: |
-          # Get Kafka container info for network connectivity
-          KAFKA_CONTAINER=$(docker ps -qf "name=kafka")
-          KAFKA_NETWORK=$(docker inspect $KAFKA_CONTAINER --format='{{range $net,$v := .NetworkSettings.Networks}}{{$net}}{{end}}')
-
           docker run --rm \
-            --network $KAFKA_NETWORK \
             -e LAUNCHPAD_ENV=development \
-            -e LAUNCHPAD_HOST=localhost \
-            -e LAUNCHPAD_PORT=2218 \
             -e LAUNCHPAD_RPC_SHARED_SECRET="launchpad-test-secret" \
-            -e KAFKA_BOOTSTRAP_SERVERS="kafka:9093" \
-            -e KAFKA_GROUP_ID="launchpad-test-ci" \
-            -e KAFKA_TOPICS="preprod-artifact-events" \
             --entrypoint python launchpad-test -m pytest -n auto tests/ --ignore=tests/e2e -v
 
-      - name: Show Kafka logs on failure
-        if: failure()
-        run: |
-          if docker ps -qf "name=kafka" >/dev/null 2>&1; then
-            echo "=== Kafka logs ==="
-            docker logs $(docker ps -qf "name=kafka") --tail 100
-          fi
-
       - name: Test CLI installation and basic functionality in Docker
         run: |
           docker run --rm \
             -e LAUNCHPAD_ENV=development \
-            -e LAUNCHPAD_HOST=localhost \
-            -e LAUNCHPAD_PORT=2218 \
             launchpad-test --help
 
-  e2e:
-    runs-on: ubuntu-latest
-    steps:
-      - name: Checkout code
-        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6
-
-      - name: Set up Python
-        uses: actions/setup-python@a309ff8b426b58ec0e2a45f0f869d46889d02405 # v6
-        with:
-          python-version: "3.13"
-
-      - name: Install uv
-        uses: astral-sh/setup-uv@94527f2e458b27549849d47d273a16bec83a01e9 # v7
-        with:
-          enable-cache: true
-          cache-dependency-glob: pyproject.toml
-
-      - name: Install dependencies
-        run: make install-dev
-
-      - name: Start Kafka with devservices
-        run: |
-          .venv/bin/devservices up --mode default
-
-          echo "Waiting for Kafka to be ready..."
-          KAFKA_READY=false
-          for i in {1..30}; do
-            KAFKA_CONTAINER=$(docker ps -qf "name=kafka")
-            if [ -z "$KAFKA_CONTAINER" ]; then
-              echo "Waiting for Kafka container to start... attempt $i/30"
-              sleep 2
-              continue
-            fi
-
-            HEALTH_STATUS=$(docker inspect --format='{{.State.Health.Status}}' $KAFKA_CONTAINER 2>/dev/null || echo "none")
-            if [ "$HEALTH_STATUS" = "healthy" ]; then
-              echo "Kafka is ready!"
-              KAFKA_READY=true
-              break
-            fi
-            echo "Waiting for Kafka health check (status: $HEALTH_STATUS)... attempt $i/30"
-            sleep 2
-          done
-
-          if [ "$KAFKA_READY" = "false" ]; then
-            echo "ERROR: Kafka failed to become healthy after 60 seconds"
-            echo "=== Docker containers ==="
-            docker ps -a
-            echo "=== Kafka logs ==="
-            docker logs $(docker ps -aqf "name=kafka") --tail 100 || echo "Could not get Kafka logs"
-            exit 1
-          fi
-
-          docker ps
-
-      - name: Create Kafka topic
-        run: |
-          KAFKA_CONTAINER=$(docker ps -qf "name=kafka")
-          echo "Creating preprod-artifact-events topic..."
-          docker exec $KAFKA_CONTAINER kafka-topics --bootstrap-server localhost:9092 --create --topic preprod-artifact-events --partitions 1 --replication-factor 1 --if-not-exists
-          echo "Topic created successfully"
-
-      - name: Build E2E Docker images
-        run: docker compose -f docker-compose.e2e.yml build
-
-      - name: Start E2E services
-        run: |
-          # Start services in detached mode (minio, mock-sentry-api, launchpad)
-          docker compose -f docker-compose.e2e.yml up -d minio mock-sentry-api launchpad
-
-          # Wait for launchpad to be healthy
-          echo "Waiting for Launchpad to be healthy..."
-          LAUNCHPAD_READY=false
-          for i in {1..30}; do
-            if docker compose -f docker-compose.e2e.yml ps launchpad | grep -q "healthy"; then
-              echo "Launchpad is ready!"
-              LAUNCHPAD_READY=true
-              break
-            fi
-            echo "Waiting for Launchpad... attempt $i/30"
-            sleep 5
-          done
-
-          if [ "$LAUNCHPAD_READY" = "false" ]; then
-            echo "ERROR: Launchpad failed to become healthy"
-            docker compose -f docker-compose.e2e.yml logs launchpad
-            exit 1
-          fi
-
-          # Show running services
-          docker compose -f docker-compose.e2e.yml ps
-
-      - name: Run E2E tests
-        run: |
-          docker compose -f docker-compose.e2e.yml run --rm e2e-tests
-        timeout-minutes: 10
-
-      - name: Show service logs on failure
-        if: failure()
-        run: |
-          echo "=== Launchpad logs ==="
-          docker compose -f docker-compose.e2e.yml logs launchpad
-          echo "=== Mock API logs ==="
-          docker compose -f docker-compose.e2e.yml logs mock-sentry-api
-          echo "=== Kafka logs ==="
-          docker logs $(docker ps -qf "name=kafka") --tail 100 || echo "Could not get Kafka logs"
-
-      - name: Cleanup E2E environment
-        if: always()
-        run: docker compose -f docker-compose.e2e.yml down -v
-
   build:
     runs-on: ubuntu-latest
-    needs: [check, test, e2e]
+    needs: [check, test]
 
     steps:
       - name: Checkout code
diff --git a/Dockerfile b/Dockerfile
index 7bf9207a..d5b34273 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -114,4 +114,4 @@ ENV LAUNCHPAD_VERSION_SHA=$LAUNCHPAD_VERSION_SHA
 
 # Default command
 ENTRYPOINT ["launchpad"]
-CMD ["serve"]
+CMD ["worker"]
diff --git a/Makefile b/Makefile
index 21ec1ebc..3262061e 100644
--- a/Makefile
+++ b/Makefile
@@ -29,15 +29,7 @@ test-unit:
 test-integration:
 	$(PYTHON_VENV) -m pytest -n auto tests/integration/ -v
 
-test-e2e:  ## Run E2E tests with Docker Compose (requires devservices up)
-	@echo "Ensuring devservices Kafka is running..."
-	@if ! docker ps | grep -q kafka; then \
-		echo "Starting devservices..."; \
-		devservices up --mode default; \
-		sleep 10; \
-	else \
-		echo "Kafka already running"; \
-	fi
+test-e2e:  ## Run E2E tests with Docker Compose
 	@echo "Starting E2E test environment..."
 	docker compose -f docker-compose.e2e.yml up --build --abort-on-container-exit --exit-code-from e2e-tests
 	@echo "Cleaning up E2E environment..."
@@ -107,22 +99,10 @@ run-cli:  ## Run the CLI tool (use ARGS="..." to pass arguments, DEBUG=1 to run
 		$(PYTHON_VENV) -m launchpad.cli $(ARGS); \
 	fi
 
-serve:  ## Start the Launchpad server with proper Kafka configuration
-	@echo "Ensuring Kafka topics exist..."
-	$(PYTHON_VENV) scripts/ensure_kafka_topics.py
-	@echo "Starting Launchpad server..."
-	$(PYTHON_VENV) -m launchpad.cli serve --verbose
-
-worker:  ## Start the Launchpad TaskWorker (no HTTP server)
+worker:  ## Start the Launchpad TaskWorker
 	@echo "Starting Launchpad TaskWorker..."
 	$(PYTHON_VENV) -m launchpad.cli worker --verbose
 
-test-kafka-message:  ## Send a test message to Kafka (requires Kafka running)
-	$(PYTHON_VENV) scripts/test_kafka.py --count 1
-
-test-kafka-multiple:  ## Send multiple test messages to Kafka
-	$(PYTHON_VENV) scripts/test_kafka.py --count 5 --interval 0
-
 test-download-artifact:
 	$(PYTHON_VENV) scripts/test_download_artifact.py --verbose
 
@@ -132,31 +112,6 @@ test-artifact-update:
 test-artifact-size-analysis-upload:
 	$(PYTHON_VENV) scripts/test_artifact_size_analysis_upload.py --verbose
 
-test-service-integration:  ## Run full integration test with devservices
-	@echo "Starting Kafka services via devservices..."
-	@devservices up
-	@echo "Waiting for Kafka to be ready..."
-	@sleep 10
-	@echo "Starting Launchpad server in background..."
-	@set -e; \
-	$(PYTHON_VENV) -m launchpad.cli serve --verbose & \
-	LAUNCHPAD_PID=$$!; \
-	echo "Launchpad started with PID: $$LAUNCHPAD_PID"; \
-	sleep 5; \
-	echo "Sending test messages..."; \
-	$(PYTHON_VENV) scripts/test_kafka.py --count 3 --interval 1; \
-	sleep 5; \
-	echo "Stopping Launchpad gracefully..."; \
-	kill -TERM $$LAUNCHPAD_PID 2>/dev/null && echo "SIGTERM sent" || echo "Process not found"; \
-	sleep 8; \
-	if kill -0 $$LAUNCHPAD_PID 2>/dev/null; then \
-		echo "Process still running, sending SIGKILL..."; \
-		kill -KILL $$LAUNCHPAD_PID 2>/dev/null || true; \
-		sleep 2; \
-	fi; \
-	echo "Stopping devservices..."; \
-	devservices down
-
 # Show current status
 status:
 	@echo "Python version: $$($(PYTHON_VENV) --version)"
diff --git a/devservices/config.yml b/devservices/config.yml
index 39b8cb30..ff8c0766 100644
--- a/devservices/config.yml
+++ b/devservices/config.yml
@@ -3,47 +3,30 @@ x-sentry-service-config:
   version: 0.1
   service_name: launchpad
   dependencies:
-    kafka:
-      description: Shared instance of kafka used by sentry services
-      remote:
-        repo_name: sentry-shared-kafka
-        branch: main
-        repo_link: https://github.com/getsentry/sentry-shared-kafka.git
     launchpad:
       description: Service that powers preprod artifact analysis
   modes:
-    default: [kafka]
-    containerized: [kafka, launchpad]
+    default: []
+    containerized: [launchpad]
 
 x-programs:
   devserver:
-    command: make serve
+    command: make worker
 
-# Assuming we only have remote dependencies (currently the case), then below is only relevant when running launchpad as a dependency of the monolith.
+# Below is only relevant when running launchpad as a dependency of the monolith.
 services:
   launchpad:
     image: ghcr.io/getsentry/launchpad:nightly
-    ports:
-      - 127.0.0.1:2218:2218 # Bind to localhost only - no external access
     command:
-      - serve
+      - worker
       - --verbose
-    healthcheck:
-      test: curl -f http://127.0.0.1:2218/health || exit 1
-      interval: 10s
-      timeout: 5s
-      retries: 3
-      start_period: 30s
     environment:
       PYTHONUNBUFFERED: 1
-      KAFKA_BOOTSTRAP_SERVERS: kafka:9093
-      KAFKA_GROUP_ID: launchpad-devservices
-      KAFKA_TOPICS: preprod-artifact-events
-      LAUNCHPAD_HOST: "0.0.0.0" # Inside container, but port binding restricts access
-      LAUNCHPAD_PORT: "2218"
       LAUNCHPAD_ENV: "development"
       SENTRY_BASE_URL: "http://host.docker.internal:8000"
       LAUNCHPAD_RPC_SHARED_SECRET: "launchpad-also-very-long-value-haha"
+      LAUNCHPAD_WORKER_RPC_HOST: "host.docker.internal:50051"
+      LAUNCHPAD_WORKER_CONCURRENCY: "1"
     platform: linux/amd64
     extra_hosts:
       host.docker.internal: host-gateway
diff --git a/docker-compose.e2e.yml b/docker-compose.e2e.yml
index d4bf388d..3f00fed9 100644
--- a/docker-compose.e2e.yml
+++ b/docker-compose.e2e.yml
@@ -1,5 +1,4 @@
-# Note: This E2E setup leverages your existing devservices Kafka
-# Run `devservices up` before starting these tests
+# E2E test setup for Launchpad
 
 services:
   # MinIO for ObjectStore (S3-compatible)
@@ -46,7 +45,6 @@ services:
       - mock-api-data:/app/data
     networks:
       - launchpad-e2e
-      - devservices
 
   # Launchpad service
   launchpad:
@@ -54,34 +52,23 @@ services:
       context: .
       dockerfile: Dockerfile
       args:
-        TEST_BUILD: "true"  # Include test fixtures
-    ports:
-      - "2218:2218"
+        TEST_BUILD: "true"
     environment:
       PYTHONUNBUFFERED: "1"
-      KAFKA_BOOTSTRAP_SERVERS: "kafka:9093"
-      KAFKA_GROUP_ID: "launchpad-e2e-test"
-      KAFKA_TOPICS: "preprod-artifact-events"
-      KAFKA_AUTO_OFFSET_RESET: "earliest"
-      LAUNCHPAD_HOST: "0.0.0.0"
-      LAUNCHPAD_PORT: "2218"
       LAUNCHPAD_ENV: "e2e-test"
       SENTRY_BASE_URL: "http://mock-sentry-api:8000"
       OBJECTSTORE_URL: "http://minio:9000"
       LAUNCHPAD_RPC_SHARED_SECRET: "test-secret-key-for-e2e"
-      SENTRY_DSN: ""  # Disable Sentry SDK in tests
+      LAUNCHPAD_WORKER_RPC_HOST: "host.docker.internal:50051"
+      LAUNCHPAD_WORKER_CONCURRENCY: "1"
+      SENTRY_DSN: ""
     depends_on:
       mock-sentry-api:
         condition: service_healthy
-    healthcheck:
-      test: ["CMD", "curl", "-f", "http://localhost:2218/health"]
-      interval: 10s
-      timeout: 5s
-      retries: 5
-      start_period: 30s
+    extra_hosts:
+      host.docker.internal: host-gateway
     networks:
       - launchpad-e2e
-      - devservices
 
   # Test orchestrator
   e2e-tests:
@@ -89,7 +76,6 @@ services:
       context: .
       dockerfile: tests/e2e/Dockerfile.test-runner
     environment:
-      KAFKA_BOOTSTRAP_SERVERS: "kafka:9093"
       MOCK_API_URL: "http://mock-sentry-api:8000"
       LAUNCHPAD_URL: "http://launchpad:2218"
       MINIO_ENDPOINT: "http://minio:9000"
@@ -97,8 +83,6 @@ services:
       MINIO_SECRET_KEY: "minioadmin"
       LAUNCHPAD_RPC_SHARED_SECRET: "test-secret-key-for-e2e"
     depends_on:
-      launchpad:
-        condition: service_healthy
       mock-sentry-api:
         condition: service_healthy
     volumes:
@@ -106,7 +90,6 @@ services:
     command: pytest e2e_tests/test_e2e_flow.py -v --tb=short
     networks:
       - launchpad-e2e
-      - devservices
 
 volumes:
   minio-data:
@@ -115,6 +98,3 @@ volumes:
 networks:
   launchpad-e2e:
     name: launchpad-e2e
-  devservices:
-    name: devservices
-    external: true
diff --git a/requirements-dev.txt b/requirements-dev.txt
index d09d5e21..52b5e412 100644
--- a/requirements-dev.txt
+++ b/requirements-dev.txt
@@ -23,5 +23,4 @@ ty==0.0.1a20
 
 # Testing web endpoints
 sortedcontainers-stubs>=2.4.0
-kafka-python>=2.0.0
 sentry-protos>=0.4.11
diff --git a/requirements.txt b/requirements.txt
index 06e857b0..50d384c8 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -16,7 +16,6 @@ protobuf>=5.29.5,<6
 pydantic>=2.9.2,<2.10.0
 rich>=14.1.0
 sentry-arroyo==2.34.0
-sentry-kafka-schemas==2.1.2
 sentry-sdk>=2.36.0
 sortedcontainers>=2.4.0
 taskbroker-client>=0.1.5
diff --git a/scripts/ensure_kafka_topics.py b/scripts/ensure_kafka_topics.py
deleted file mode 100755
index e0e4d217..00000000
--- a/scripts/ensure_kafka_topics.py
+++ /dev/null
@@ -1,67 +0,0 @@
-#!/usr/bin/env python3
-"""Standalone utility to ensure Kafka topics exist for development."""
-
-import os
-import sys
-
-from confluent_kafka import KafkaException
-from confluent_kafka.admin import AdminClient, NewTopic
-from sentry_kafka_schemas import get_topic
-
-
-def create_kafka_topic(bootstrap_servers: str = "localhost:9092") -> bool:
-    """Create the launchpad Kafka topic. Returns True if successful."""
-    # Import launchpad constants (needs sys.path modification)
-    sys.path.insert(0, os.path.join(os.path.dirname(__file__), "..", "src"))
-    from launchpad.constants import PREPROD_ARTIFACT_EVENTS_TOPIC
-
-    admin_client = AdminClient({"bootstrap.servers": bootstrap_servers})
-    topic_name = PREPROD_ARTIFACT_EVENTS_TOPIC
-
-    try:
-        # Check if topic already exists
-        try:
-            existing_topics = admin_client.list_topics(timeout=10).topics
-            if topic_name in existing_topics:
-                print(f"✓ Topic exists: {topic_name}")
-                return True
-        except Exception:
-            pass  # Continue to create, handle TopicExistsException later
-
-        # Get topic configuration and create
-        topic_data = get_topic(topic_name)
-        config = topic_data.get("topic_creation_config", {})
-        partitions = topic_data.get("enforced_partition_count") or 1
-        replication = int(config.get("replication.factor", "1"))
-
-        # Create topic without config to avoid conflicts - config can be set later
-        new_topic = NewTopic(topic_name, partitions, replication)
-        futures = admin_client.create_topics([new_topic])
-        futures[topic_name].result()  # Wait for completion
-
-        print(f"✓ Created topic: {topic_name}")
-        return True
-
-    except KafkaException as e:
-        if e.args[0].code() == 36:  # TopicExistsException
-            print(f"✓ Topic exists: {topic_name}")
-            return True
-        print(f"✗ Failed to create topic: {e}")
-        return False
-    except Exception as e:
-        print(f"✗ Error: {e}")
-        return False
-
-
-if __name__ == "__main__":
-    if os.getenv("LAUNCHPAD_CREATE_KAFKA_TOPIC") != "1":
-        env_val = os.getenv("LAUNCHPAD_CREATE_KAFKA_TOPIC")
-        print(f"LAUNCHPAD_CREATE_KAFKA_TOPIC={env_val}")
-        print("Topic creation disabled")
-        sys.exit(0)
-
-    bootstrap_servers = os.getenv("KAFKA_BOOTSTRAP_SERVERS")
-    if not bootstrap_servers:
-        raise ValueError("KAFKA_BOOTSTRAP_SERVERS env var is required")
-    success = create_kafka_topic(bootstrap_servers)
-    sys.exit(0 if success else 1)
diff --git a/scripts/test_kafka.py b/scripts/test_kafka.py
deleted file mode 100755
index 7c439f42..00000000
--- a/scripts/test_kafka.py
+++ /dev/null
@@ -1,107 +0,0 @@
-#!/usr/bin/env python3
-"""Script to send test messages to Kafka for testing Launchpad consumer."""
-
-import json
-import sys
-import time
-from typing import Any, Dict
-
-import click
-from kafka import KafkaProducer
-
-sys.path.insert(0, "src")
-from launchpad.constants import PREPROD_ARTIFACT_EVENTS_TOPIC  # noqa: E402
-
-
-def create_producer(bootstrap_servers: str = "localhost:9092") -> KafkaProducer:
-    """Create a Kafka producer."""
-    return KafkaProducer(
-        bootstrap_servers=[bootstrap_servers],
-        value_serializer=lambda v: json.dumps(v).encode("utf-8"),
-        key_serializer=lambda k: k.encode("utf-8") if k else None,
-    )
-
-
-def create_preprod_artifact_event(
-    artifact_id: str | None = None, project_id: str | None = None, organization_id: str | None = None
-) -> Dict[str, Any]:
-    """Create a preprod artifact event message matching the schema."""
-    return {
-        "artifact_id": artifact_id or f"test-artifact-{int(time.time())}",
-        "project_id": project_id or f"test-project-{int(time.time())}",
-        "organization_id": organization_id or f"test-org-{int(time.time())}",
-        "requested_features": ["size_analysis"],
-    }
-
-
-@click.command()
-@click.option("--topic", default=PREPROD_ARTIFACT_EVENTS_TOPIC, help="Kafka topic to send messages to")
-@click.option("--bootstrap-servers", default="localhost:9092", help="Kafka bootstrap servers")
-@click.option("--artifact-id", help="Custom artifact ID (auto-generated if not provided)")
-@click.option("--project-id", help="Custom project ID (auto-generated if not provided)")
-@click.option("--organization-id", help="Custom organization ID (auto-generated if not provided)")
-@click.option("--custom-json", help="Custom JSON message to send (overrides other options)")
-@click.option("--count", default=1, help="Number of messages to send")
-@click.option("--interval", default=1.0, help="Interval between messages in seconds")
-def main(
-    topic: str,
-    bootstrap_servers: str,
-    artifact_id: str,
-    project_id: str,
-    organization_id: str,
-    custom_json: str,
-    count: int,
-    interval: float,
-) -> None:
-    """Send preprod artifact event messages to Kafka for Launchpad testing."""
-
-    try:
-        producer = create_producer(bootstrap_servers)
-        click.echo(f"Connected to Kafka at {bootstrap_servers}")
-
-        for i in range(count):
-            if custom_json:
-                try:
-                    message = json.loads(custom_json)
-                except json.JSONDecodeError as e:
-                    click.echo(f"Error parsing custom JSON: {e}", err=True)
-                    sys.exit(1)
-            else:
-                # Use provided IDs or generate them with counter
-                current_artifact_id = artifact_id or f"test-artifact-{int(time.time())}-{i+1}"
-                current_project_id = project_id or f"test-project-{int(time.time())}-{i+1}"
-                current_organization_id = organization_id or f"test-org-{int(time.time())}-{i+1}"
-
-                message = create_preprod_artifact_event(
-                    artifact_id=current_artifact_id,
-                    project_id=current_project_id,
-                    organization_id=current_organization_id,
-                )
-
-            # Send message
-            key = f"test-{i+1}"
-            future = producer.send(topic, value=message, key=key)
-
-            # Wait for the message to be sent
-            record_metadata = future.get(timeout=10)
-
-            click.echo(
-                f"Message {i+1}/{count} sent to {record_metadata.topic}:"
-                f"{record_metadata.partition}:{record_metadata.offset}"
-            )
-            click.echo(f"  Key: {key}")
-            click.echo(f"  Message: {json.dumps(message, indent=2)}")
-
-            if i < count - 1:
-                time.sleep(interval)
-
-        producer.close()
-        click.echo(f"Successfully sent {count} message(s) to topic '{topic}'")
-
-    except Exception as e:
-        click.echo(f"Error sending messages: {e}", err=True)
-        sys.exit(1)
-
-
-if __name__ == "__main__":
-    main()
diff --git a/src/launchpad/artifact_processor.py b/src/launchpad/artifact_processor.py
index e0e86296..bf90179d 100644
--- a/src/launchpad/artifact_processor.py
+++ b/src/launchpad/artifact_processor.py
@@ -2,9 +2,11 @@
 
 import contextlib
 import json
+import os
 import tempfile
 import time
 
+from dataclasses import dataclass
 from datetime import datetime, timedelta
 from pathlib import Path
 from typing import Any, Iterator, cast
@@ -45,12 +47,42 @@
 from launchpad.tracing import request_context
 from launchpad.utils.file_utils import IdPrefix, id_from_bytes
 from launchpad.utils.logging import get_logger
-from launchpad.utils.objectstore import create_objectstore_client
+from launchpad.utils.objectstore import ObjectstoreConfig, create_objectstore_client
 from launchpad.utils.statsd import StatsdInterface, get_statsd
 
 logger = get_logger(__name__)
 
 
+@dataclass
+class ServiceConfig:
+    sentry_base_url: str
+    projects_to_skip: list[str]
+    objectstore_config: ObjectstoreConfig
+
+
+def get_service_config() -> ServiceConfig:
+    sentry_base_url = os.getenv("SENTRY_BASE_URL")
+    projects_to_skip_str = os.getenv("PROJECT_IDS_TO_SKIP")
+    projects_to_skip = projects_to_skip_str.split(",") if projects_to_skip_str else []
+
+    objectstore_config = ObjectstoreConfig(
+        objectstore_url=os.getenv("OBJECTSTORE_URL"),
+        key_id=os.getenv("OBJECTSTORE_SIGNING_KEY_ID"),
+        key_file=os.getenv("OBJECTSTORE_SIGNING_KEY_FILE"),
+    )
+    if expiry_seconds := os.getenv("OBJECTSTORE_TOKEN_EXPIRY_SECONDS"):
+        objectstore_config.token_expiry_seconds = int(expiry_seconds)
+
+    if sentry_base_url is None:
+        sentry_base_url = "http://getsentry.default"
+
+    return ServiceConfig(
+        sentry_base_url=sentry_base_url,
+        projects_to_skip=projects_to_skip,
+        objectstore_config=objectstore_config,
+    )
+
+
 class ArtifactProcessor:
     def __init__(
         self,
@@ -73,14 +105,11 @@ def process_message(
         statsd=None,
     ):
         """Process an artifact message with proper context and metrics.
-        This is used by the Kafka workers and so has to set up the context from scratch.
         If components are not provided, they will be created.
         """
         start_time = time.time()
 
         if service_config is None:
-            from launchpad.service import get_service_config
-
             service_config = get_service_config()
 
         initialize_sentry_sdk()
diff --git a/src/launchpad/cli.py b/src/launchpad/cli.py
index 4712b077..c3ab7fad 100644
--- a/src/launchpad/cli.py
+++ b/src/launchpad/cli.py
@@ -1,13 +1,11 @@
 from __future__ import annotations
 
-import logging
 import os
 
 import click
 
 from . import __version__
 from .distribution.cli import distribution_command
-from .service import run_service
 from .size.cli import app_icon_command, profile_dex_parsing_command, size_command
 from .utils.console import console
 from .utils.logging import setup_logging
@@ -26,62 +24,6 @@ def cli(ctx: click.Context, version: bool) -> None:
         click.echo(ctx.get_help())
 
 
-@cli.command()
-@click.option("--host", default="0.0.0.0", help="Host to bind the server to.", show_default=True)
-@click.option("--port", default=2218, help="Port to bind the server to.", show_default=True)
-@click.option("--dev", "mode", flag_value="development", help="Run in development mode (default).")
-@click.option("--prod", "mode", flag_value="production", help="Run in production mode.")
-@click.option("--verbose", "-v", is_flag=True, help="Enable verbose logging output.")
-def serve(host: str, port: int, mode: str | None, verbose: bool) -> None:
-    """Start the Launchpad server.
-
-    Runs the HTTP server with health check endpoints and Kafka consumer
-    for processing analysis requests.
-    """
-
-    # If SENTRY_REGION is set we are in a production environment. This
-    # isn't the correct way to do this (what about self-hosted?) but
-    # it's better than what we had previously where we ended up
-    # assuming development mode in production.
-    if mode is None:
-        region = os.getenv("SENTRY_REGION", None)
-        mode = "development" if region is None else "production"
-
-    # If verbose wasn't explicitly set and we're in development mode, enable verbose
-    if not verbose and mode == "development":
-        verbose = True
-
-    # Set environment variables for configuration
-    os.environ["LAUNCHPAD_ENV"] = mode
-    os.environ["LAUNCHPAD_HOST"] = host
-    os.environ["LAUNCHPAD_PORT"] = str(port)
-
-    setup_logging(verbose=verbose, quiet=False)
-
-    if not verbose:
-        # Reduce noise from some libraries
-        logging.getLogger("aiohttp.access").setLevel(logging.WARNING)
-
-    mode_display = "Development" if mode == "development" else "Production"
-    console.print(f"[bold blue]Launchpad {mode_display} Server v{__version__}[/bold blue]")
-    console.print(f"Starting server on [cyan]http://{host}:{port}[/cyan]")
-
-    mode_color = "green" if mode == "development" else "yellow"
-    console.print(f"Mode: [{mode_color}]{mode}[/{mode_color}]")
-    console.print("Press Ctrl+C to stop the server")
-    console.print()
-
-    try:
-        run_service()
-    except KeyboardInterrupt:
-        console.print("\n[yellow]Server stopped by user[/yellow]")
-    except Exception as e:
-        console.print(f"[bold red]Server error:[/bold red] {e}")
-        if verbose:
-            console.print_exception()
-        raise click.Abort()
-
-
 @cli.command()
 @click.option("--processing-pool-name", default="launchpad", help="Name of the processing pool.", show_default=True)
 @click.option("--verbose", "-v", is_flag=True, help="Enable verbose logging output.")
diff --git a/src/launchpad/constants.py b/src/launchpad/constants.py
index 4eb84c0f..ea079ef8 100644
--- a/src/launchpad/constants.py
+++ b/src/launchpad/constants.py
@@ -2,9 +2,6 @@
 
 from enum import Enum
 
-# Kafka topic names
-PREPROD_ARTIFACT_EVENTS_TOPIC = "preprod-artifact-events"
-
 
 # Error code constants (matching the Django model)
 class ProcessingErrorCode(Enum):
diff --git a/src/launchpad/kafka.py b/src/launchpad/kafka.py
deleted file mode 100644
index 0678c753..00000000
--- a/src/launchpad/kafka.py
+++ /dev/null
@@ -1,390 +0,0 @@
-"""Kafka consumer implementation for Launchpad using Arroyo."""
-
-from __future__ import annotations
-
-import logging
-import multiprocessing
-import os
-import sys
-import threading
-
-from dataclasses import dataclass
-from functools import partial
-from logging.handlers import QueueHandler, QueueListener
-from typing import Any, Mapping
-
-from arroyo import Message, Topic, configure_metrics
-from arroyo.backends.kafka import KafkaConsumer as ArroyoKafkaConsumer
-from arroyo.backends.kafka import KafkaPayload
-from arroyo.processing.processor import StreamProcessor
-from arroyo.processing.strategies import ProcessingStrategy, ProcessingStrategyFactory
-from arroyo.processing.strategies.commit import CommitOffsets
-from arroyo.processing.strategies.run_task_in_threads import RunTaskInThreads
-from arroyo.types import Commit, Partition
-from sentry_kafka_schemas import get_codec
-
-from launchpad.artifact_processor import ArtifactProcessor
-from launchpad.constants import PREPROD_ARTIFACT_EVENTS_TOPIC
-from launchpad.tracing import RequestLogFilter
-from launchpad.utils.arroyo_metrics import DatadogMetricsBackend
-from launchpad.utils.logging import get_logger
-
-logger = get_logger(__name__)
-
-DEFAULT_TASK_TIMEOUT_SECONDS = 720  # 12 minutes
-
-# Schema codec for preprod artifact events
-PREPROD_ARTIFACT_SCHEMA = get_codec(PREPROD_ARTIFACT_EVENTS_TOPIC)
-
-
-def _process_in_subprocess(decoded_message: Any, log_queue: multiprocessing.Queue[Any]) -> None:
-    """Worker function that runs in subprocess."""
-    root_logger = logging.getLogger()
-    root_logger.handlers.clear()
-
-    queue_handler = QueueHandler(log_queue)
-    queue_handler.addFilter(RequestLogFilter())
-
-    root_logger.addHandler(queue_handler)
-    root_logger.setLevel(logging.DEBUG)
-
-    try:
-        ArtifactProcessor.process_message(
-            artifact_id=decoded_message["artifact_id"],
-            project_id=decoded_message["project_id"],
-            organization_id=decoded_message["organization_id"],
-        )
-    except Exception:
-        logger.exception("Error processing message in subprocess")
-        sys.exit(1)
-
-
-def _kill_process(process: multiprocessing.Process, artifact_id: str) -> None:
-    """Gracefully terminate, then force kill a subprocess."""
-    process.terminate()
-    process.join(timeout=5)
-    if process.is_alive():
-        logger.warning(
-            "Process did not terminate gracefully, force killing",
-            extra={"artifact_id": artifact_id, "pid": process.pid},
-        )
-        process.kill()
-        process.join(timeout=1)  # Brief timeout to reap zombie, avoid infinite block
-        if process.is_alive():
-            logger.error(
-                "Process could not be killed, may become zombie",
-                extra={"artifact_id": artifact_id, "pid": process.pid},
-            )
-
-
-def process_kafka_message_with_service(
-    msg: Message[KafkaPayload],
-    log_queue: multiprocessing.Queue[Any],
-    process_registry: dict[int, tuple[multiprocessing.Process, str]],
-    registry_lock: threading.Lock,
-    factory: LaunchpadStrategyFactory,
-) -> Any:
-    """Process a Kafka message by spawning a fresh subprocess with timeout protection."""
-    timeout = int(os.getenv("KAFKA_TASK_TIMEOUT_SECONDS", str(DEFAULT_TASK_TIMEOUT_SECONDS)))
-    try:
-        decoded = PREPROD_ARTIFACT_SCHEMA.decode(msg.payload.value)
-    except Exception:
-        logger.exception("Failed to decode message")
-        raise
-
-    artifact_id = decoded.get("artifact_id", "unknown")
-
-    # Spawn actual processing in a subprocess
-    process = multiprocessing.Process(target=_process_in_subprocess, args=(decoded, log_queue))
-    process.start()
-
-    # Register the process for tracking (PID is always set after start())
-    with registry_lock:
-        process_registry[process.pid] = (process, artifact_id)  # type: ignore[index]
-
-    try:
-        process.join(timeout=timeout)
-
-        # Check if killed during rebalance
-        pid = process.pid
-        if pid is not None:
-            with registry_lock:
-                was_killed_by_rebalance = pid in factory._killed_during_rebalance
-                if was_killed_by_rebalance:
-                    factory._killed_during_rebalance.discard(pid)
-
-            if was_killed_by_rebalance:
-                # Wait for kill to complete, then don't commit offset
-                process.join(timeout=10)  # Give kill_active_processes time to finish
-                logger.warning(
-                    "Process killed during rebalance, message will be reprocessed",
-                    extra={"artifact_id": artifact_id},
-                )
-                raise TimeoutError("Subprocess killed during rebalance")
-
-        # Handle timeout (process still alive after full timeout)
-        if process.is_alive():
-            logger.error(
-                "Launchpad task killed after exceeding timeout",
-                extra={"timeout_seconds": timeout, "artifact_id": artifact_id},
-            )
-            _kill_process(process, artifact_id)
-            return None  # type: ignore[return-value]
-
-        if process.exitcode != 0:
-            logger.error(
-                "Process exited with non-zero code",
-                extra={"exit_code": process.exitcode, "artifact_id": artifact_id},
-            )
-            return None  # type: ignore[return-value]
-
-        return decoded  # type: ignore[no-any-return]
-    finally:
-        with registry_lock:
-            process_registry.pop(process.pid, None)
-
-
-def create_kafka_consumer() -> LaunchpadKafkaConsumer:
-    """Create and configure a Kafka consumer using environment variables."""
-    config = get_kafka_config()
-    configure_metrics(DatadogMetricsBackend(config.group_id))
-
-    environment = os.getenv("LAUNCHPAD_ENV")
-    if not environment:
-        raise ValueError("LAUNCHPAD_ENV environment variable is required")
-
-    # When all RunTaskInThreads threads are busy, Arroyo retries submit()
-    # in a backoff loop without calling consumer.poll(). If this exceeds
-    # max.poll.interval.ms (default 5min), the broker evicts the consumer,
-    # triggering a rebalance loop. Set it higher than the task timeout.
-    task_timeout = int(os.getenv("KAFKA_TASK_TIMEOUT_SECONDS", str(DEFAULT_TASK_TIMEOUT_SECONDS)))
-    max_poll_interval_ms = (task_timeout + 120) * 1000  # task timeout + 2 min buffer
-
-    consumer_config = {
-        "bootstrap.servers": config.bootstrap_servers,
-        "group.id": config.group_id,
-        "auto.offset.reset": config.auto_offset_reset,
-        "arroyo.strict.offset.reset": config.arroyo_strict_offset_reset,
-        "enable.auto.commit": False,
-        "enable.auto.offset.store": False,
-        "security.protocol": config.security_protocol,
-        "max.poll.interval.ms": max_poll_interval_ms,
-    }
-
-    # SASL is used in some prod environments.
-    if config.sasl_mechanism:
-        consumer_config.update(
-            {
-                "sasl.mechanism": config.sasl_mechanism,
-                "sasl.username": config.sasl_username,
-                "sasl.password": config.sasl_password,
-            }
-        )
-
-    arroyo_consumer = ArroyoKafkaConsumer(consumer_config)
-
-    strategy_factory = LaunchpadStrategyFactory(
-        concurrency=config.concurrency,
-        max_pending_futures=config.max_pending_futures,
-    )
-
-    topics = [Topic(topic) for topic in config.topics]
-    topic = topics[0] if topics else Topic("default")
-    processor = StreamProcessor(
-        consumer=arroyo_consumer,
-        topic=topic,
-        processor_factory=strategy_factory,
-        join_timeout=config.join_timeout_seconds,  # Drop in-flight work during rebalance before Kafka times out
-    )
-    return LaunchpadKafkaConsumer(processor, strategy_factory)
-
-
-# This wrapper is required to ensure that the active subprocesses are killed during rebalances due to the nature of run_task_in_threads.
-class ShutdownAwareStrategy(ProcessingStrategy[KafkaPayload]):
-    """Wrapper that kills active subprocesses during rebalance."""
-
-    def __init__(self, inner: ProcessingStrategy[KafkaPayload], factory: LaunchpadStrategyFactory):
-        self._inner = inner
-        self._factory = factory
-
-    def submit(self, message: Message[KafkaPayload]) -> None:
-        self._inner.submit(message)
-
-    def poll(self) -> None:
-        self._inner.poll()
-
-    def close(self) -> None:
-        # Kill all active subprocesses BEFORE closing inner strategy
-        self._factory.kill_active_processes()
-        self._inner.close()
-
-    def terminate(self) -> None:
-        self._factory.kill_active_processes()
-        self._inner.terminate()
-
-    def join(self, timeout: float | None = None) -> None:
-        self._inner.join(timeout)
-
-
-class LaunchpadKafkaConsumer:
-    processor: StreamProcessor[KafkaPayload]
-    strategy_factory: LaunchpadStrategyFactory
-    _running: bool
-
-    def __init__(
-        self,
-        processor: StreamProcessor[KafkaPayload],
-        strategy_factory: LaunchpadStrategyFactory,
-    ):
-        self.processor = processor
-        self.strategy_factory = strategy_factory
-        self._running = False
-
-    def run(self):
-        assert not self._running, "Already running"
-        logger.info(f"{self} running")
-        self._running = True
-
-        try:
-            self.processor.run()
-        finally:
-            self._running = False
-            try:
-                self.strategy_factory.close()
-            except Exception:
-                logger.exception("Error closing strategy factory")
-
-    def stop(self):
-        """Signal shutdown to the processor."""
-        logger.info(f"{self} stop commanded")
-        self.processor.signal_shutdown()
-
-    def is_healthy(self) -> bool:
-        return True
-
-
-class LaunchpadStrategyFactory(ProcessingStrategyFactory[KafkaPayload]):
-    """Factory for creating the processing strategy chain."""
-
-    def __init__(
-        self,
-        concurrency: int,
-        max_pending_futures: int,
-    ) -> None:
-        self._log_queue: multiprocessing.Queue[Any] = multiprocessing.Queue()
-        self._queue_listener = self._setup_queue_listener()
-        self._queue_listener.start()
-
-        self._active_processes: dict[int, tuple[multiprocessing.Process, str]] = {}
-        self._processes_lock = threading.Lock()
-        self._killed_during_rebalance: set[int] = set()
-
-        self.concurrency = concurrency
-        self.max_pending_futures = max_pending_futures
-
-    def _setup_queue_listener(self) -> QueueListener:
-        """Set up listener in main process to handle logs from workers."""
-        root_logger = logging.getLogger()
-        handlers = list(root_logger.handlers) if root_logger.handlers else []
-
-        return QueueListener(self._log_queue, *handlers, respect_handler_level=True)
-
-    def kill_active_processes(self) -> None:
-        """Kill all active subprocesses. Called during rebalancing."""
-        with self._processes_lock:
-            if self._active_processes:
-                logger.info(
-                    "Killing %d active subprocess(es) during rebalance",
-                    len(self._active_processes),
-                )
-                for pid, (process, artifact_id) in list(self._active_processes.items()):
-                    if process.is_alive():
-                        self._killed_during_rebalance.add(pid)
-                        logger.info("Terminating subprocess with PID %d", pid)
-                        _kill_process(process, artifact_id)
-                self._active_processes.clear()
-
-    def create_with_partitions(
-        self,
-        commit: Commit,
-        partitions: Mapping[Partition, int],
-    ) -> ProcessingStrategy[KafkaPayload]:
-        """Create the processing strategy chain."""
-        next_step: ProcessingStrategy[Any] = CommitOffsets(commit)
-
-        processing_function = partial(
-            process_kafka_message_with_service,
-            log_queue=self._log_queue,
-            process_registry=self._active_processes,
-            registry_lock=self._processes_lock,
-            factory=self,
-        )
-        inner_strategy = RunTaskInThreads(
-            processing_function=processing_function,
-            concurrency=self.concurrency,
-            max_pending_futures=self.max_pending_futures,
-            next_step=next_step,
-        )
-
-        return ShutdownAwareStrategy(inner_strategy, self)
-
-    def close(self) -> None:
-        """Clean up the logging queue and listener."""
-        try:
-            self._queue_listener.stop()
-            logger.debug("Closed queue listener")
-        except Exception:
-            logger.exception("Error stopping queue listener")
-
-
-@dataclass
-class KafkaConfig:
-    """Kafka configuration data."""
-
-    bootstrap_servers: str
-    group_id: str
-    topics: list[str]
-    concurrency: int
-    max_pending_futures: int
-    auto_offset_reset: str
-    arroyo_strict_offset_reset: bool | None
-    security_protocol: str
-    sasl_mechanism: str | None
-    sasl_username: str | None
-    sasl_password: str | None
-    join_timeout_seconds: float
-
-
-def get_kafka_config() -> KafkaConfig:
-    """Get Kafka configuration from environment variables."""
-    # Required configuration
-    bootstrap_servers = os.getenv("KAFKA_BOOTSTRAP_SERVERS")
-    if not bootstrap_servers:
-        raise ValueError("KAFKA_BOOTSTRAP_SERVERS env var is required")
-
-    group_id = os.getenv("KAFKA_GROUP_ID")
-    if not group_id:
-        raise ValueError("KAFKA_GROUP_ID env var is required")
-
-    topics_env = os.getenv("KAFKA_TOPICS")
-    if not topics_env:
-        raise ValueError("KAFKA_TOPICS env var is required")
-
-    # Parse arroyo_strict_offset_reset as boolean, default to None if invalid
-    arroyo_strict_offset_reset = {"true": True, "false": False}.get(os.getenv("ARROYO_STRICT_OFFSET_RESET", "").lower())
-
-    # Optional configuration with defaults
-    return KafkaConfig(
-        bootstrap_servers=bootstrap_servers,
-        group_id=group_id,
-        topics=topics_env.split(","),
-        concurrency=int(os.getenv("KAFKA_CONCURRENCY", "1")),
-        max_pending_futures=int(os.getenv("KAFKA_MAX_PENDING_FUTURES", "0")),
-        auto_offset_reset=os.getenv("KAFKA_AUTO_OFFSET_RESET", "latest"),  # latest = skip old messages
-        arroyo_strict_offset_reset=arroyo_strict_offset_reset,
-        security_protocol=os.environ.get("KAFKA_SECURITY_PROTOCOL", "plaintext"),
-        sasl_mechanism=os.environ.get("KAFKA_SASL_MECHANISM", None),
-        sasl_username=os.environ.get("KAFKA_SASL_USERNAME", None),
-        sasl_password=os.environ.get("KAFKA_SASL_PASSWORD", None),
-        join_timeout_seconds=float(os.getenv("KAFKA_JOIN_TIMEOUT_SECONDS", "10")),
-    )
diff --git a/src/launchpad/service.py b/src/launchpad/service.py
deleted file mode 100644
index d7e01617..00000000
--- a/src/launchpad/service.py
+++ /dev/null
@@ -1,163 +0,0 @@
-"""Main service orchestrator for Launchpad."""
-
-from __future__ import annotations
-
-import asyncio
-import os
-import signal
-import threading
-
-from dataclasses import dataclass
-
-from launchpad.sentry_client import SentryClient
-from launchpad.utils.logging import get_logger
-from launchpad.utils.objectstore import ObjectstoreConfig
-from launchpad.utils.statsd import NullStatsd, StatsdInterface, get_statsd
-
-from .kafka import LaunchpadKafkaConsumer, create_kafka_consumer
-from .sentry_sdk_init import initialize_sentry_sdk
-from .server import LaunchpadServer, get_server_config
-
-logger = get_logger(__name__)
-
-
-class LaunchpadService:
-    """Main service that orchestrates HTTP server and Kafka consumer.
-
-    The HTTP server runs in a background thread with its own event loop,
-    while the Kafka consumer runs in the main thread (required for signal handlers).
-    """
-
-    def __init__(self, statsd: StatsdInterface | None = None) -> None:
-        self.server: LaunchpadServer | None = None
-        self.kafka: LaunchpadKafkaConsumer | None = None
-        self._server_thread: threading.Thread | None = None
-        self._server_loop: asyncio.AbstractEventLoop | None = None
-        self._statsd = statsd or NullStatsd()
-        self._healthcheck_file: str | None = None
-        self._service_config: ServiceConfig | None = None
-        self._sentry_client: SentryClient | None = None
-        self._shutdown_requested = False
-
-    def setup(self) -> None:
-        initialize_sentry_sdk()
-        self._service_config = get_service_config()
-        self._sentry_client = SentryClient(base_url=self._service_config.sentry_base_url)
-
-        server_config = get_server_config()
-        self.server = LaunchpadServer(
-            self.is_healthy,
-            host=server_config.host,
-            port=server_config.port,
-            statsd=self._statsd,
-        )
-
-        self.kafka = create_kafka_consumer()
-        logger.info("Service components initialized")
-
-    def start(self) -> None:
-        if not self.server or not self.kafka:
-            raise RuntimeError("Service not properly initialized. Call setup() first.")
-
-        logger.info("Starting Launchpad service...")
-
-        def signal_handler(signum: int, frame) -> None:
-            if self._shutdown_requested:
-                logger.info(f"Received signal {signum} during shutdown, forcing exit...")
-                os._exit(1)
-
-            logger.info(f"Received signal {signum}, initiating shutdown...")
-            self._shutdown_requested = True
-            if self.kafka:
-                self.kafka.stop()
-
-        signal.signal(signal.SIGTERM, signal_handler)
-        signal.signal(signal.SIGINT, signal_handler)
-
-        # Start HTTP server in background thread
-        self._server_thread = threading.Thread(
-            target=self._run_http_server_thread,
-            name="launchpad-http-server",
-            daemon=True,
-        )
-        self._server_thread.start()
-
-        logger.info("Launchpad service started successfully")
-
-        try:
-            # Run Kafka consumer in main thread (blocking)
-            self.kafka.run()
-        finally:
-            logger.info("Cleaning up service resources...")
-            self._shutdown_server()
-            logger.info("Service cleanup completed")
-
-    def is_healthy(self) -> bool:
-        """Get overall service health status."""
-        is_server_healthy = self.server.is_healthy()
-        is_kafka_healthy = self.kafka.is_healthy()
-        return is_server_healthy and is_kafka_healthy
-
-    def _run_http_server_thread(self) -> None:
-        self._server_loop = asyncio.new_event_loop()
-        asyncio.set_event_loop(self._server_loop)
-
-        try:
-            self._server_loop.run_until_complete(self.server.start())
-            self._server_loop.run_forever()
-        finally:
-            self._server_loop.close()
-
-    def _shutdown_server(self) -> None:
-        if self._server_loop and self.server:
-            future = asyncio.run_coroutine_threadsafe(self.server.stop(), self._server_loop)
-            try:
-                future.result(timeout=10)
-            except Exception:
-                logger.warning("Error during server shutdown", exc_info=True)
-
-            self._server_loop.call_soon_threadsafe(self._server_loop.stop)
-
-        if self._server_thread and self._server_thread.is_alive():
-            self._server_thread.join(timeout=10)
-
-
-@dataclass
-class ServiceConfig:
-    """Service configuration data."""
-
-    sentry_base_url: str
-    projects_to_skip: list[str]
-    objectstore_config: ObjectstoreConfig
-
-
-def get_service_config() -> ServiceConfig:
-    """Get service configuration from environment."""
-    sentry_base_url = os.getenv("SENTRY_BASE_URL")
-    projects_to_skip_str = os.getenv("PROJECT_IDS_TO_SKIP")
-    projects_to_skip = projects_to_skip_str.split(",") if projects_to_skip_str else []
-
-    objectstore_config = ObjectstoreConfig(
-        objectstore_url=os.getenv("OBJECTSTORE_URL"),
-        key_id=os.getenv("OBJECTSTORE_SIGNING_KEY_ID"),
-        key_file=os.getenv("OBJECTSTORE_SIGNING_KEY_FILE"),
-    )
-    if expiry_seconds := os.getenv("OBJECTSTORE_TOKEN_EXPIRY_SECONDS"):
-        objectstore_config.token_expiry_seconds = int(expiry_seconds)
-
-    if sentry_base_url is None:
-        sentry_base_url = "http://getsentry.default"
-
-    return ServiceConfig(
-        sentry_base_url=sentry_base_url,
-        projects_to_skip=projects_to_skip,
-        objectstore_config=objectstore_config,
-    )
-
-
-def run_service() -> None:
-    """Run the Launchpad service."""
-    statsd = get_statsd()
-    service = LaunchpadService(statsd)
-    service.setup()
-    service.start()
diff --git a/src/launchpad/utils/arroyo_metrics.py b/src/launchpad/utils/arroyo_metrics.py
deleted file mode 100644
index 302912d2..00000000
--- a/src/launchpad/utils/arroyo_metrics.py
+++ /dev/null
@@ -1,48 +0,0 @@
-"""DataDog metrics backend for Arroyo."""
-
-from __future__ import annotations
-
-from typing import Optional, Union
-
-from arroyo.utils.metrics import MetricName, Metrics, Tags
-
-from launchpad.utils.statsd import get_statsd
-
-
-class DatadogMetricsBackend(Metrics):
-    """
-    DataDog metrics backend that implements Arroyo's Metrics protocol.
-
-    This bridges Arroyo's metrics interface with DataDog StatsD.
-    """
-
-    def __init__(self, group_id: str) -> None:
-        self._statsd = get_statsd("consumer")
-        self._constant_tags = {"consumer_group": group_id}
-
-    def increment(
-        self,
-        name: MetricName,
-        value: Union[int, float] = 1,
-        tags: Optional[Tags] = None,
-    ) -> None:
-        """Increments a counter metric by a given value."""
-        self._statsd.increment(name, value, tags=self._format_tags(tags))
-
-    def gauge(self, name: MetricName, value: Union[int, float], tags: Optional[Tags] = None) -> None:
-        """Sets a gauge metric to the given value."""
-        self._statsd.gauge(name, value, tags=self._format_tags(tags))
-
-    def timing(self, name: MetricName, value: Union[int, float], tags: Optional[Tags] = None) -> None:
-        """Records a timing metric."""
-        self._statsd.timing(name, value, tags=self._format_tags(tags))
-
-    def _format_tags(self, tags: Optional[Tags]) -> Optional[list[str]]:
-        """Convert Arroyo tags format to DataDog tags format, merging with constant tags."""
-        merged_tags = self._constant_tags.copy()
-        if tags:
-            merged_tags.update(tags)
-
-        if not merged_tags:
-            return None
-        return [f"{key}:{value}" for key, value in merged_tags.items()]
diff --git a/src/launchpad/utils/logging.py b/src/launchpad/utils/logging.py
index c3c151a1..722acf6b 100644
--- a/src/launchpad/utils/logging.py
+++ b/src/launchpad/utils/logging.py
@@ -141,8 +141,6 @@ def setup_logging(verbose: bool = False, quiet: bool = False) -> None:
 
     # Set levels for third-party libraries
     logging.getLogger("datadog.dogstatsd").setLevel(logging.ERROR)
-    logging.getLogger("arroyo.processing.processor").setLevel(logging.INFO)
-    logging.getLogger("arroyo.processing.strategies.run_task_with_multiprocessing").setLevel(logging.INFO)
     logging.getLogger("urllib3").setLevel(logging.WARNING)
     logging.getLogger("urllib3.connectionpool").setLevel(logging.WARNING)
 
diff --git a/tests/e2e/test_e2e_flow.py b/tests/e2e/test_e2e_flow.py
index 0e7181ae..d21ecf17 100644
--- a/tests/e2e/test_e2e_flow.py
+++ b/tests/e2e/test_e2e_flow.py
@@ -1,31 +1,21 @@
 """End-to-end tests for Launchpad service.
 
-Tests the full flow:
-1. Upload test artifact to mock API
-2. Send Kafka message to trigger processing
-3. Wait for Launchpad to process
-4. Verify results via mock API
+These tests require the E2E Docker Compose environment to be running.
+The full artifact processing flow tests need to be updated to use
+TaskWorker-based triggering instead of Kafka.
 """
 
-import json
 import os
 import time
 
 from pathlib import Path
 from typing import Any, Dict
 
-import pytest
 import requests
 
-from confluent_kafka import Producer
-
-# Configuration from environment
-KAFKA_BOOTSTRAP_SERVERS = os.getenv("KAFKA_BOOTSTRAP_SERVERS", "kafka:9093")
 MOCK_API_URL = os.getenv("MOCK_API_URL", "http://mock-sentry-api:8000")
 LAUNCHPAD_URL = os.getenv("LAUNCHPAD_URL", "http://launchpad:2218")
-KAFKA_TOPIC = "preprod-artifact-events"
 
-# Test fixtures
 FIXTURES_DIR = Path("/app/fixtures")
 IOS_FIXTURE = FIXTURES_DIR / "ios" / "HackerNews.xcarchive.zip"
 ANDROID_APK_FIXTURE = FIXTURES_DIR / "android" / "hn.apk"
@@ -33,7 +23,6 @@
 
 
 def wait_for_service(url: str, timeout: int = 60, service_name: str = "service") -> None:
-    """Wait for a service to be healthy."""
     start_time = time.time()
     while time.time() - start_time < timeout:
         try:
@@ -48,7 +37,6 @@ def wait_for_service(url: str, timeout: int = 60, service_name: str = "service")
 
 
 def upload_artifact_to_mock_api(artifact_id: str, file_path: Path) -> None:
-    """Upload an artifact file to the mock API."""
     with open(file_path, "rb") as f:
         files = {"file": (file_path.name, f, "application/zip")}
         response = requests.post(f"{MOCK_API_URL}/test/upload-artifact/{artifact_id}", files=files, timeout=30)
@@ -56,42 +44,7 @@ def upload_artifact_to_mock_api(artifact_id: str, file_path: Path) -> None:
         print(f"[OK] Uploaded artifact {artifact_id} ({file_path.name})")
 
 
-def send_kafka_message(artifact_id: str, org: str, project: str, features: list[str]) -> None:
-    """Send a Kafka message to trigger artifact processing."""
-    delivery_error = None
-
-    def delivery_callback(err, msg):
-        nonlocal delivery_error
-        if err:
-            delivery_error = err
-
-    producer = Producer({"bootstrap.servers": KAFKA_BOOTSTRAP_SERVERS, "client.id": "e2e-test-producer"})
-
-    message = {
-        "artifact_id": artifact_id,
-        "organization_id": org,
-        "project_id": project,
-        "requested_features": features,
-    }
-
-    producer.produce(
-        KAFKA_TOPIC,
-        key=artifact_id.encode("utf-8"),
-        value=json.dumps(message).encode("utf-8"),
-        callback=delivery_callback,
-    )
-    remaining = producer.flush(timeout=10)
-
-    if delivery_error:
-        raise RuntimeError(f"Kafka message delivery failed: {delivery_error}")
-    if remaining > 0:
-        raise RuntimeError(f"Failed to flush {remaining} Kafka messages")
-
-    print(f"[OK] Sent Kafka message for artifact {artifact_id}")
-
-
 def wait_for_processing(artifact_id: str, timeout: int = 120, check_interval: int = 3) -> Dict[str, Any]:
-    """Wait for artifact processing to complete and return results."""
     start_time = time.time()
     last_status = None
 
@@ -101,13 +54,12 @@ def wait_for_processing(artifact_id: str, timeout: int = 120, check_interval: in
             response.raise_for_status()
             results = response.json()
 
-            # Check if processing is complete
-            # Processing is complete when both metadata is updated AND size analysis file exists
             if results.get("artifact_metadata") and results.get("has_size_analysis_file"):
                 print(f"[OK] Processing completed for {artifact_id}")
                 return results
 
-            # Show progress
+            import json
+
             current_status = json.dumps(results, sort_keys=True)
             if current_status != last_status:
                 print(f"  Waiting for processing... (results so far: {results})")
@@ -122,267 +74,6 @@ def wait_for_processing(artifact_id: str, timeout: int = 120, check_interval: in
 
 
 def get_size_analysis_raw(artifact_id: str) -> Dict[str, Any]:
-    """Get the raw size analysis JSON for an artifact."""
     response = requests.get(f"{MOCK_API_URL}/test/results/{artifact_id}/size-analysis-raw", timeout=10)
     response.raise_for_status()
     return response.json()
-
-
-class TestE2EFlow:
-    """End-to-end tests for full Launchpad service flow."""
-
-    @classmethod
-    def setup_class(cls):
-        """Wait for all services to be ready before running tests."""
-        print("\n=== Waiting for services to be ready ===")
-        wait_for_service(MOCK_API_URL, service_name="Mock Sentry API")
-        wait_for_service(LAUNCHPAD_URL, service_name="Launchpad")
-        print("=== All services ready ===\n")
-
-    def test_ios_xcarchive_full_flow(self):
-        """Test full flow with iOS .xcarchive.zip file."""
-        if not IOS_FIXTURE.exists():
-            pytest.skip(f"iOS fixture not found: {IOS_FIXTURE}")
-
-        artifact_id = "test-ios-001"
-        org = "test-org"
-        project = "test-ios-project"
-
-        print("\n=== Testing iOS .xcarchive.zip E2E flow ===")
-
-        # Step 1: Upload artifact to mock API
-        upload_artifact_to_mock_api(artifact_id, IOS_FIXTURE)
-
-        # Step 2: Send Kafka message
-        send_kafka_message(artifact_id, org, project, ["size_analysis"])
-
-        # Step 3: Wait for processing
-        results = wait_for_processing(artifact_id, timeout=180)
-
-        # Step 4: Verify results
-        print("\n=== Verifying results ===")
-
-        # Check artifact metadata was updated
-        assert results["artifact_metadata"], "Artifact metadata should be updated"
-        metadata = results["artifact_metadata"]
-
-        # Verify exact metadata values for HackerNews.xcarchive.zip
-        assert metadata["app_name"] == "HackerNews"
-        assert metadata["app_id"] == "com.emergetools.hackernews"
-        assert metadata["build_version"] == "3.8"
-        assert metadata["build_number"] == 1
-        assert metadata["artifact_type"] == 0  # iOS xcarchive
-
-        # Verify iOS-specific nested info
-        assert "apple_app_info" in metadata
-        apple_info = metadata["apple_app_info"]
-        assert apple_info["is_simulator"] is False
-        assert apple_info["codesigning_type"] == "development"
-        assert apple_info["build_date"] == "2025-05-19T16:15:12"
-        assert apple_info["is_code_signature_valid"] is True
-        assert apple_info["main_binary_uuid"] == "BEB3C0D6-2518-343D-BB6F-FF5581C544E8"
-
-        # Check size analysis was uploaded
-        assert results["has_size_analysis_file"], "Size analysis file should be uploaded"
-
-        # Verify size analysis contents with exact values
-        size_analysis = get_size_analysis_raw(artifact_id)
-        assert size_analysis["download_size"] == 6502319
-
-        # Verify treemap structure (root size is install size, different from download_size)
-        treemap = size_analysis["treemap"]
-        assert treemap["platform"] == "ios"
-        assert treemap["root"]["name"] == "HackerNews"
-        assert treemap["root"]["size"] == 9728000  # Install size, larger than download_size
-        assert treemap["root"]["is_dir"] is True
-        assert len(treemap["root"]["children"]) > 0
-
-        # Verify expected insight categories and their structure
-        insights = size_analysis["insights"]
-        assert "duplicate_files" in insights
-        assert insights["duplicate_files"]["total_savings"] > 0
-        assert len(insights["duplicate_files"]["groups"]) > 0
-
-        assert "image_optimization" in insights
-        assert insights["image_optimization"]["total_savings"] > 0
-        assert len(insights["image_optimization"]["optimizable_files"]) > 0
-
-        assert "main_binary_exported_symbols" in insights
-        assert insights["main_binary_exported_symbols"]["total_savings"] > 0
-
-        print("[OK] iOS E2E test passed!")
-        print(f"  - Download size: {size_analysis['download_size']} bytes")
-        print(f"  - Treemap root size: {treemap['root']['size']} bytes")
-        print(f"  - Insight categories: {list(insights.keys())}")
-
-    def test_android_apk_full_flow(self):
-        """Test full flow with Android .apk file."""
-        if not ANDROID_APK_FIXTURE.exists():
-            pytest.skip(f"Android APK fixture not found: {ANDROID_APK_FIXTURE}")
-
-        artifact_id = "test-android-apk-001"
-        org = "test-org"
-        project = "test-android-project"
-
-        print("\n=== Testing Android .apk E2E flow ===")
-
-        # Step 1: Upload artifact to mock API
-        upload_artifact_to_mock_api(artifact_id, ANDROID_APK_FIXTURE)
-
-        # Step 2: Send Kafka message
-        send_kafka_message(artifact_id, org, project, ["size_analysis"])
-
-        # Step 3: Wait for processing
-        results = wait_for_processing(artifact_id, timeout=180)
-
-        # Step 4: Verify results
-        print("\n=== Verifying results ===")
-
-        # Check artifact metadata was updated
-        assert results["artifact_metadata"], "Artifact metadata should be updated"
-        metadata = results["artifact_metadata"]
-
-        # Verify exact metadata values for hn.apk
-        assert metadata["app_name"] == "Hacker News"
-        assert metadata["app_id"] == "com.emergetools.hackernews"
-        assert metadata["artifact_type"] == 2  # Android APK
-
-        # Verify Android-specific nested info
-        assert "android_app_info" in metadata
-        android_info = metadata["android_app_info"]
-        assert android_info["has_proguard_mapping"] is False
-
-        # Check size analysis was uploaded
-        assert results["has_size_analysis_file"], "Size analysis file should be uploaded"
-
-        # Verify size analysis contents with exact values
-        size_analysis = get_size_analysis_raw(artifact_id)
-        assert size_analysis["download_size"] == 3670839
-
-        # Verify treemap structure and root size
-        treemap = size_analysis["treemap"]
-        assert treemap["platform"] == "android"
-        assert treemap["root"]["name"] == "Hacker News"
-        assert treemap["root"]["size"] == 7886041
-        assert treemap["root"]["is_dir"] is True
-        assert len(treemap["root"]["children"]) == 14
-
-        # Verify expected insight categories and their structure
-        insights = size_analysis["insights"]
-        assert "duplicate_files" in insights
-        assert insights["duplicate_files"]["total_savings"] == 51709
-        assert len(insights["duplicate_files"]["groups"]) > 0
-
-        assert "multiple_native_library_archs" in insights
-        assert insights["multiple_native_library_archs"]["total_savings"] == 1891208
-
-        print("[OK] Android APK E2E test passed!")
-        print(f"  - Download size: {size_analysis['download_size']} bytes")
-        print(f"  - Treemap root size: {treemap['root']['size']} bytes")
-        print(f"  - Insight categories: {list(insights.keys())}")
-
-    def test_android_aab_full_flow(self):
-        """Test full flow with Android .aab file."""
-        if not ANDROID_AAB_FIXTURE.exists():
-            pytest.skip(f"Android AAB fixture not found: {ANDROID_AAB_FIXTURE}")
-
-        artifact_id = "test-android-aab-001"
-        org = "test-org"
-        project = "test-android-project"
-
-        print("\n=== Testing Android .aab E2E flow ===")
-
-        # Step 1: Upload artifact to mock API
-        upload_artifact_to_mock_api(artifact_id, ANDROID_AAB_FIXTURE)
-
-        # Step 2: Send Kafka message
-        send_kafka_message(artifact_id, org, project, ["size_analysis"])
-
-        # Step 3: Wait for processing
-        results = wait_for_processing(artifact_id, timeout=180)
-
-        # Step 4: Verify results
-        print("\n=== Verifying results ===")
-
-        # Check artifact metadata was updated
-        assert results["artifact_metadata"], "Artifact metadata should be updated"
-        metadata = results["artifact_metadata"]
-
-        # Verify exact metadata values for hn.aab
-        assert metadata["app_name"] == "Hacker News"
-        assert metadata["app_id"] == "com.emergetools.hackernews"
-        assert metadata["build_version"] == "1.0.2"
-        assert metadata["build_number"] == 13
-        assert metadata["artifact_type"] == 1  # Android AAB
-
-        # Verify Android-specific nested info
-        assert "android_app_info" in metadata
-        android_info = metadata["android_app_info"]
-        assert android_info["has_proguard_mapping"] is True
-
-        # Check size analysis was uploaded
-        assert results["has_size_analysis_file"], "Size analysis file should be uploaded"
-
-        # Verify size analysis contents
-        size_analysis = get_size_analysis_raw(artifact_id)
-        # AAB download size varies based on extracted APKs - verify it's positive
-        assert size_analysis["download_size"] > 0
-
-        # Verify treemap structure and root size
-        treemap = size_analysis["treemap"]
-        assert treemap["platform"] == "android"
-        assert treemap["root"]["name"] == "Hacker News"
-        assert treemap["root"]["size"] == 5932249
-        assert treemap["root"]["is_dir"] is True
-        assert len(treemap["root"]["children"]) == 14
-
-        # Verify expected insight categories for Android AAB
-        insights = size_analysis["insights"]
-        assert "duplicate_files" in insights
-        assert insights["duplicate_files"]["total_savings"] >= 0
-        assert "groups" in insights["duplicate_files"]
-
-        print("[OK] Android AAB E2E test passed!")
-        print(f"  - Download size: {size_analysis['download_size']} bytes")
-        print(f"  - Treemap root size: {treemap['root']['size']} bytes")
-        print(f"  - Insight categories: {list(insights.keys())}")
-
-    def test_launchpad_health_check(self):
-        """Verify Launchpad service is healthy."""
-        response = requests.get(f"{LAUNCHPAD_URL}/health", timeout=10)
-        assert response.status_code == 200
-        data = response.json()
-        assert data["service"] == "launchpad"
-        assert data["status"] == "ok"
-        print("[OK] Launchpad health check passed")
-
-    def test_nonexistent_artifact_error_handling(self):
-        """Test that processing a non-existent artifact is handled gracefully."""
-        artifact_id = "test-nonexistent-artifact"
-        org = "test-org"
-        project = "test-project"
-
-        print("\n=== Testing non-existent artifact error handling ===")
-
-        # Don't upload any artifact - just send Kafka message for non-existent one
-        send_kafka_message(artifact_id, org, project, ["size_analysis"])
-
-        # Wait a bit for processing attempt
-        time.sleep(10)
-
-        # Check results - should have error metadata, no size analysis
-        response = requests.get(f"{MOCK_API_URL}/test/results/{artifact_id}", timeout=10)
-        response.raise_for_status()
-        results = response.json()
-
-        # Verify no size analysis was uploaded (artifact download should have failed)
-        assert not results["has_size_analysis_file"], "Should not have size analysis for non-existent artifact"
-
-        # The artifact metadata may have error information
-        metadata = results.get("artifact_metadata", {})
-        # If error was recorded, it should indicate a download/processing failure
-        if metadata:
-            # Check if error fields are present (depends on implementation)
-            print(f"  Metadata received: {metadata}")
-
-        print("[OK] Non-existent artifact handled correctly (no size analysis produced)")
diff --git a/tests/integration/test_kafka_service.py b/tests/integration/test_kafka_service.py
deleted file mode 100644
index c0a4df0f..00000000
--- a/tests/integration/test_kafka_service.py
+++ /dev/null
@@ -1,242 +0,0 @@
-from __future__ import annotations
-
-import os
-import time
-
-from unittest.mock import patch
-
-import pytest
-
-from aiohttp.test_utils import TestClient, TestServer
-
-from launchpad.artifact_processor import ArtifactProcessor
-from launchpad.constants import PREPROD_ARTIFACT_EVENTS_TOPIC
-from launchpad.kafka import LaunchpadKafkaConsumer, create_kafka_consumer, get_kafka_config
-from launchpad.service import LaunchpadService, ObjectstoreConfig, ServiceConfig, get_service_config
-from launchpad.utils.statsd import FakeStatsd
-
-
-@pytest.fixture
-def kafka_env_vars():
-    env_vars = {
-        "KAFKA_BOOTSTRAP_SERVERS": os.getenv("KAFKA_BOOTSTRAP_SERVERS", "localhost:9092"),
-        "KAFKA_GROUP_ID": f"launchpad-test-{int(time.time())}",
-        "KAFKA_TOPICS": PREPROD_ARTIFACT_EVENTS_TOPIC,
-        "KAFKA_AUTO_OFFSET_RESET": "earliest",
-        "LAUNCHPAD_ENV": "development",
-        "SENTRY_BASE_URL": "http://test.sentry.io",
-    }
-    with patch.dict(os.environ, env_vars, clear=False):
-        yield env_vars
-
-
-class TestKafkaConfigIntegration:
-    """Integration tests for Kafka configuration loading."""
-
-    def test_kafka_config_from_environment(self, kafka_env_vars):
-        """Test that Kafka configuration is correctly loaded from environment variables."""
-        config = get_kafka_config()
-
-        assert config.bootstrap_servers == kafka_env_vars["KAFKA_BOOTSTRAP_SERVERS"]
-        assert config.group_id == kafka_env_vars["KAFKA_GROUP_ID"]
-        assert config.topics == [PREPROD_ARTIFACT_EVENTS_TOPIC]
-        assert config.auto_offset_reset == "earliest"
-
-    def test_kafka_config_missing_required_vars(self):
-        """Test that missing required environment variables raise errors."""
-        with patch.dict(os.environ, {}, clear=True):
-            with pytest.raises(ValueError, match="KAFKA_BOOTSTRAP_SERVERS"):
-                create_kafka_consumer()
-
-    def test_kafka_config_with_security_settings(self):
-        """Test that security configuration is properly loaded."""
-        with patch.dict(
-            os.environ,
-            {
-                "KAFKA_BOOTSTRAP_SERVERS": "localhost:9092",
-                "KAFKA_GROUP_ID": "test-group",
-                "KAFKA_TOPICS": "test-topic",
-                "KAFKA_SECURITY_PROTOCOL": "SASL_SSL",
-                "KAFKA_SASL_MECHANISM": "PLAIN",
-                "KAFKA_SASL_USERNAME": "test-user",
-                "KAFKA_SASL_PASSWORD": "test-pass",
-                "LAUNCHPAD_ENV": "development",
-            },
-        ):
-            config = get_kafka_config()
-            assert config.security_protocol == "SASL_SSL"
-            assert config.sasl_mechanism == "PLAIN"
-            assert config.sasl_username == "test-user"
-            assert config.sasl_password == "test-pass"
-
-
-@pytest.mark.integration
-@pytest.mark.skipif(
-    os.getenv("SKIP_KAFKA_INTEGRATION_TESTS") == "1",
-    reason="Kafka integration tests require running Kafka broker (devservices up)",
-)
-class TestKafkaConsumerIntegration:
-    """Integration tests that require a real Kafka broker.
-
-    These tests run by default in CI (which starts Kafka via devservices) and locally
-    with devservices running. Set SKIP_KAFKA_INTEGRATION_TESTS=1 to skip them.
-
-    Run with Kafka:
-        devservices up
-        pytest tests/integration/test_kafka_service.py::TestKafkaConsumerIntegration -v
-
-    Skip (fast mode):
-        SKIP_KAFKA_INTEGRATION_TESTS=1 pytest tests/integration/test_kafka_service.py -v
-    """
-
-    def test_kafka_consumer_creation(self, kafka_env_vars):
-        """Test that Kafka consumer can be created with real configuration."""
-        consumer = create_kafka_consumer()
-
-        assert isinstance(consumer, LaunchpadKafkaConsumer)
-        assert consumer.processor is not None
-
-
-@pytest.mark.integration
-class TestServiceIntegration:
-    def test_service_setup(self, kafka_env_vars):
-        """Test that service setup initializes real components correctly."""
-        fake_statsd = FakeStatsd()
-        service = LaunchpadService(fake_statsd)
-
-        with (
-            patch("launchpad.service.initialize_sentry_sdk"),
-            patch("launchpad.kafka.configure_metrics"),
-        ):
-            service.setup()
-
-            assert service._service_config is not None
-            assert service._sentry_client is not None
-            assert service.server is not None
-            assert service.kafka is not None
-
-    def test_service_config_loading(self):
-        """Test service configuration loading from environment."""
-
-        with patch.dict("os.environ", {}, clear=True):
-            config = get_service_config()
-            assert config.sentry_base_url == "http://getsentry.default"
-            assert config.projects_to_skip == []
-
-        with patch.dict(
-            "os.environ",
-            {
-                "SENTRY_BASE_URL": "https://custom.sentry.io",
-                "PROJECT_IDS_TO_SKIP": "project1,project2,project3",
-            },
-        ):
-            config = get_service_config()
-            assert config.sentry_base_url == "https://custom.sentry.io"
-            assert config.projects_to_skip == ["project1", "project2", "project3"]
-
-    @pytest.mark.asyncio
-    async def test_http_server_endpoints_integration(self, kafka_env_vars):
-        """Test HTTP server endpoints with real service components."""
-
-        fake_statsd = FakeStatsd()
-        service = LaunchpadService(fake_statsd)
-
-        with (
-            patch("launchpad.service.initialize_sentry_sdk"),
-            patch("launchpad.kafka.configure_metrics"),
-        ):
-            service.setup()
-
-            app = service.server.create_app()
-            server = TestServer(app)
-            client = TestClient(server)
-
-            await client.start_server()
-            try:
-                resp = await client.get("/health")
-                assert resp.status == 200
-                data = await resp.json()
-                assert data["service"] == "launchpad"
-
-                resp = await client.get("/ready")
-                assert resp.status == 200
-                data = await resp.json()
-                assert data["service"] == "launchpad"
-            finally:
-                await client.close()
-
-
-class TestMessageProcessingFlow:
-    """Test the message processing flow with real processing logic."""
-
-    def test_process_message_with_skipped_project(self):
-        """Test that projects in skip list are not processed."""
-
-        fake_statsd = FakeStatsd()
-        service_config = ServiceConfig(
-            sentry_base_url="http://test.sentry.io",
-            projects_to_skip=["skip-project"],
-            objectstore_config=ObjectstoreConfig(objectstore_url="http://test.objectstore.io"),
-        )
-
-        with patch.object(ArtifactProcessor, "process_artifact") as mock_process:
-            ArtifactProcessor.process_message(
-                artifact_id="test-123",
-                project_id="skip-project",
-                organization_id="test-org",
-                service_config=service_config,
-                statsd=fake_statsd,
-            )
-            mock_process.assert_not_called()
-
-    def test_process_message_with_allowed_project(self):
-        """Test that non-skipped projects are processed."""
-
-        fake_statsd = FakeStatsd()
-        service_config = ServiceConfig(
-            sentry_base_url="http://test.sentry.io",
-            projects_to_skip=["other-project"],
-            objectstore_config=ObjectstoreConfig(objectstore_url="http://test.objectstore.io"),
-        )
-
-        with patch.object(ArtifactProcessor, "process_artifact") as mock_process:
-            ArtifactProcessor.process_message(
-                artifact_id="test-123",
-                project_id="normal-project",
-                organization_id="test-org",
-                service_config=service_config,
-                statsd=fake_statsd,
-            )
-
-            mock_process.assert_called_once_with(
-                "test-org",
-                "normal-project",
-                "test-123",
-            )
-
-            calls = fake_statsd.calls
-            assert ("increment", {"metric": "artifact.processing.started", "value": 1, "tags": None}) in calls
-            assert ("increment", {"metric": "artifact.processing.completed", "value": 1, "tags": None}) in calls
-
-    def test_process_message_error_handling(self):
-        """Test that processing errors are handled gracefully."""
-
-        fake_statsd = FakeStatsd()
-        service_config = ServiceConfig(
-            sentry_base_url="http://test.sentry.io",
-            projects_to_skip=[],
-            objectstore_config=ObjectstoreConfig(objectstore_url="http://test.objectstore.io"),
-        )
-
-        with patch.object(ArtifactProcessor, "process_artifact", side_effect=RuntimeError("Test error")):
-            ArtifactProcessor.process_message(
-                artifact_id="test-123",
-                project_id="test-project",
-                organization_id="test-org",
-                service_config=service_config,
-                statsd=fake_statsd,
-            )
-
-            calls = fake_statsd.calls
-            increment_calls = [call for call in calls if call[0] == "increment"]
-            assert any(call[1]["metric"] == "artifact.processing.failed" for call in increment_calls)
diff --git a/tests/integration/test_launchpad_service.py b/tests/integration/test_launchpad_service.py
index 3154c3c4..2128b8a1 100644
--- a/tests/integration/test_launchpad_service.py
+++ b/tests/integration/test_launchpad_service.py
@@ -1,22 +1,15 @@
-"""Tests for the Launchpad service orchestration."""
+"""Tests for the Launchpad HTTP server."""
 
 from __future__ import annotations
 
-from unittest.mock import patch
-
 from aiohttp.test_utils import AioHTTPTestCase
 
 from launchpad.server import LaunchpadServer
-from launchpad.service import LaunchpadService
 from launchpad.utils.statsd import FakeStatsd
 
 
 class TestHealthyLaunchpadServer(AioHTTPTestCase):
-    """Test cases for LaunchpadServer."""
-
     async def get_application(self):
-        """Create the application for testing."""
-
         def mock_health_check() -> bool:
             return True
 
@@ -25,7 +18,6 @@ def mock_health_check() -> bool:
         return server.create_app()
 
     async def test_health_check(self):
-        """Test the health check endpoint."""
         resp = await self.client.request("GET", "/health")
         assert resp.status == 200
 
@@ -35,7 +27,6 @@ async def test_health_check(self):
         assert await resp.text() == '{"status": "ok", "service": "launchpad"}'
 
     async def test_ready_check(self):
-        """Test the readiness check endpoint."""
         resp = await self.client.request("GET", "/ready")
         assert resp.status == 200
 
@@ -44,43 +35,3 @@ async def test_ready_check(self):
             "status": "ok",
             "service": "launchpad",
         }
-
-
-class TestLaunchpadService:
-    """Test cases for LaunchpadService orchestration."""
-
-    def test_service_initialization(self):
-        """Test that LaunchpadService can be initialized properly."""
-        fake_statsd = FakeStatsd()
-        service = LaunchpadService(fake_statsd)
-
-        assert service._statsd is fake_statsd
-        assert service.server is None
-        assert service.kafka is None
-        assert service._service_config is None
-        assert service._sentry_client is None
-
-    def test_service_config_creation(self):
-        """Test ServiceConfig creation with default values."""
-        from launchpad.service import get_service_config
-
-        # Test with no environment variables set
-        with patch.dict("os.environ", {}, clear=True):
-            config = get_service_config()
-            assert config.sentry_base_url == "http://getsentry.default"  # Default value
-            assert isinstance(config.projects_to_skip, list)
-
-    def test_service_health_check_with_no_components(self):
-        """Test health check when components are not initialized."""
-        fake_statsd = FakeStatsd()
-        service = LaunchpadService(fake_statsd)
-
-        # Should handle None components gracefully
-        # This will likely raise an AttributeError, which is expected behavior
-        try:
-            result = service.is_healthy()
-            # If it doesn't raise, it should return False for unhealthy state
-            assert result is False
-        except AttributeError:
-            # Expected when server/kafka are None
-            pass
diff --git a/tests/unit/artifacts/test_artifact_processor.py b/tests/unit/artifacts/test_artifact_processor.py
index 6e797fd0..01611b1f 100644
--- a/tests/unit/artifacts/test_artifact_processor.py
+++ b/tests/unit/artifacts/test_artifact_processor.py
@@ -2,13 +2,13 @@
 
 from objectstore_client import Client as ObjectstoreClient
 
-from launchpad.artifact_processor import ArtifactProcessor
+from launchpad.artifact_processor import ArtifactProcessor, ServiceConfig
 from launchpad.constants import (
     ProcessingErrorCode,
     ProcessingErrorMessage,
 )
 from launchpad.sentry_client import SentryClient, SentryClientError
-from launchpad.service import ObjectstoreConfig, ServiceConfig
+from launchpad.utils.objectstore import ObjectstoreConfig
 from launchpad.utils.statsd import FakeStatsd
 
 

From ef7964e44eb9ba1494caf229324f6d06b5bc89da Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 10:33:54 -0700
Subject: [PATCH 02/15] ref: Remove unused HTTP server and its tests

The LaunchpadServer was only used by the Kafka/Arroyo service
orchestrator. With TaskWorker mode, no HTTP server is needed.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 src/launchpad/server.py                     | 239 --------------------
 tests/integration/test_launchpad_service.py |  37 ---
 2 files changed, 276 deletions(-)
 delete mode 100644 src/launchpad/server.py
 delete mode 100644 tests/integration/test_launchpad_service.py

diff --git a/src/launchpad/server.py b/src/launchpad/server.py
deleted file mode 100644
index 48b76d7d..00000000
--- a/src/launchpad/server.py
+++ /dev/null
@@ -1,239 +0,0 @@
-"""Launchpad HTTP server with health checks and async support."""
-
-from __future__ import annotations
-
-import asyncio
-import logging
-import os
-import sys
-
-from dataclasses import dataclass, replace
-from typing import Callable
-
-from aiohttp.typedefs import Handler
-from aiohttp.web import (
-    AppKey,
-    Application,
-    AppRunner,
-    Request,
-    Response,
-    StreamResponse,
-    TCPSite,
-    json_response,
-    middleware,
-)
-
-from .utils.logging import get_logger
-from .utils.statsd import CRITICAL, OK, NullStatsd, StatsdInterface
-
-logger = get_logger(__name__)
-
-# Define app keys using AppKey
-APP_KEY_DEBUG = AppKey("debug", bool)
-APP_KEY_ENVIRONMENT = AppKey("environment", str)
-
-
-@middleware
-async def security_headers_middleware(request: Request, handler: Handler) -> StreamResponse:
-    """Add security headers for production mode."""
-    response = await handler(request)
-
-    # Only add security headers in production
-    if not request.app.get(APP_KEY_DEBUG, False):
-        response.headers["X-Content-Type-Options"] = "nosniff"
-        response.headers["X-Frame-Options"] = "DENY"
-        response.headers["X-XSS-Protection"] = "1; mode=block"
-        response.headers["Strict-Transport-Security"] = "max-age=31536000; includeSubDomains"
-
-    return response
-
-
-class LaunchpadServer:
-    """Main server class for Launchpad."""
-
-    _running: bool
-    health_check_callback: Callable[[], bool]
-
-    def __init__(
-        self,
-        health_check_callback: Callable[[], bool],
-        host: str | None = None,
-        port: int | None = None,
-        config: ServerConfig | None = None,
-        setup_logging: bool = True,
-        statsd: StatsdInterface | None = None,
-    ) -> None:
-        self.app: Application | None = None
-        self._running = False
-        self._shutdown_event = asyncio.Event()
-        self.config = config or get_server_config()
-        self.health_check_callback = health_check_callback
-        self._statsd = statsd or NullStatsd()
-
-        # Override config with explicit parameters if provided
-        if host is not None or port is not None:
-            self.config = replace(
-                self.config,
-                host=host if host is not None else self.config.host,
-                port=port if port is not None else self.config.port,
-            )
-
-        self.host = self.config.host
-        self.port = self.config.port
-
-        # Only setup logging if requested (CLI handles its own logging)
-        if setup_logging:
-            self._setup_logging()
-
-    def _setup_logging(self) -> None:
-        """Configure logging based on environment."""
-        log_level = getattr(logging, self.config.log_level)
-
-        # Only configure if logging hasn't been configured yet
-        if not logging.getLogger().handlers:
-            logging.basicConfig(
-                level=log_level,
-                format="%(asctime)s - %(name)s - %(levelname)s - %(message)s",
-                datefmt="%Y-%m-%d %H:%M:%S",
-                stream=sys.stdout,
-            )
-
-        # Adjust aiohttp access log level
-        if not self.config.access_log:
-            logging.getLogger("aiohttp.access").setLevel(logging.WARNING)
-
-    def create_app(self) -> Application:
-        """Create the aiohttp application with routes."""
-        middlewares = [security_headers_middleware] if not self.config.debug else []
-
-        app = Application(
-            middlewares=middlewares,
-        )
-
-        # Store config in app using AppKey
-        app[APP_KEY_DEBUG] = self.config.debug
-        app[APP_KEY_ENVIRONMENT] = self.config.environment
-
-        app.router.add_get("/health", self.health_check)
-        app.router.add_get("/ready", self.health_check)
-        return app
-
-    def is_healthy(self):
-        return True
-
-    def health_check(self, request: Request) -> Response:
-        is_healthy = self.health_check_callback()
-        if is_healthy:
-            json_status = "ok"
-            statsd_status = OK
-            http_status = 200
-        else:
-            json_status = "error"
-            statsd_status = CRITICAL
-            http_status = 500
-
-        sentry_region = self.config.sentry_region
-
-        self._statsd.service_check(
-            "launchpad.health_check",
-            statsd_status,
-            tags=[f"sentry_region:{sentry_region}"],
-        )
-
-        return json_response(
-            {
-                "status": json_status,
-                "service": "launchpad",
-            },
-            status=http_status,
-        )
-
-    async def start(self):
-        """Start the HTTP server."""
-        logger.info(f"{self} start commanded")
-        self._task = asyncio.create_task(self.run())
-
-    async def run(self):
-        assert not self._running, "Already running"
-        logger.info(f"{self} running")
-        self._running = True
-        self.app = self.create_app()
-
-        runner = AppRunner(
-            self.app,
-            access_log=logger if self.config.access_log else None,
-        )
-        await runner.setup()
-
-        site = TCPSite(runner, self.host, self.port)
-        await site.start()
-
-        logger.info(
-            f"Launchpad server started on {self.host}:{self.port} "
-            f"(environment: {self.config.environment}, debug: {self.config.debug})"
-        )
-
-        await self._shutdown_event.wait()
-
-        logger.info("Shutting down server...")
-        await runner.cleanup()
-        self._running = False
-
-    async def stop(self, timeout_s=10):
-        logger.info(f"{self} stop commanded")
-        self._shutdown_event.set()
-        try:
-            await asyncio.wait_for(self._task, timeout=timeout_s)
-        except asyncio.TimeoutError:
-            logger.warning(f"{self} did not stop within timeout {timeout_s}s")
-            self._task.cancel()
-
-
-@dataclass
-class ServerConfig:
-    """Server configuration data."""
-
-    sentry_region: str
-    environment: str
-    host: str
-    port: int
-    debug: bool
-    log_level: str
-    access_log: bool
-
-
-def get_server_config() -> ServerConfig:
-    """Get server configuration from environment."""
-    environment = os.getenv("LAUNCHPAD_ENV")
-    if not environment:
-        raise ValueError("LAUNCHPAD_ENV environment variable is required")
-    environment = environment.lower()
-
-    is_production = environment == "production"
-
-    host = os.getenv("LAUNCHPAD_HOST")
-    if not host:
-        raise ValueError("LAUNCHPAD_HOST environment variable is required")
-
-    port_str = os.getenv("LAUNCHPAD_PORT")
-    if not port_str:
-        raise ValueError("LAUNCHPAD_PORT environment variable is required")
-
-    try:
-        port = int(port_str)
-    except ValueError:
-        raise ValueError(  # noqa: E501
-            f"LAUNCHPAD_PORT must be a valid integer, got: {port_str}"
-        )
-
-    sentry_region = os.getenv("SENTRY_REGION", "unknown")
-
-    return ServerConfig(
-        environment=environment,
-        sentry_region=sentry_region,
-        host=host,
-        port=port,
-        debug=not is_production,
-        log_level="WARNING" if is_production else "DEBUG",
-        access_log=not is_production,  # Disable access logs in prod
-    )
diff --git a/tests/integration/test_launchpad_service.py b/tests/integration/test_launchpad_service.py
deleted file mode 100644
index 2128b8a1..00000000
--- a/tests/integration/test_launchpad_service.py
+++ /dev/null
@@ -1,37 +0,0 @@
-"""Tests for the Launchpad HTTP server."""
-
-from __future__ import annotations
-
-from aiohttp.test_utils import AioHTTPTestCase
-
-from launchpad.server import LaunchpadServer
-from launchpad.utils.statsd import FakeStatsd
-
-
-class TestHealthyLaunchpadServer(AioHTTPTestCase):
-    async def get_application(self):
-        def mock_health_check() -> bool:
-            return True
-
-        fake_statsd = FakeStatsd()
-        server = LaunchpadServer(health_check_callback=mock_health_check, statsd=fake_statsd)
-        return server.create_app()
-
-    async def test_health_check(self):
-        resp = await self.client.request("GET", "/health")
-        assert resp.status == 200
-
-        # The health check has to be *precisely* this to pass, you
-        # can't add extra fields without changing the getsentry/ops
-        # repo:
-        assert await resp.text() == '{"status": "ok", "service": "launchpad"}'
-
-    async def test_ready_check(self):
-        resp = await self.client.request("GET", "/ready")
-        assert resp.status == 200
-
-        data = await resp.json()
-        assert data == {
-            "status": "ok",
-            "service": "launchpad",
-        }

From dd60b11fada9c121a907a0744892f72053e22011 Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 10:41:46 -0700
Subject: [PATCH 03/15] fix: Add pyyaml as explicit dependency

Was previously pulled in transitively via sentry-kafka-schemas,
which was removed as part of the Kafka consumer cleanup.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 requirements.txt | 1 +
 1 file changed, 1 insertion(+)

diff --git a/requirements.txt b/requirements.txt
index 50d384c8..cd78754a 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -14,6 +14,7 @@ pillow>=11.3.0
 pillow_heif>=1.1.0
 protobuf>=5.29.5,<6
 pydantic>=2.9.2,<2.10.0
+pyyaml>=6.0
 rich>=14.1.0
 sentry-arroyo==2.34.0
 sentry-sdk>=2.36.0

From bdb896ae14623cc208216eb0ad90d40dbf1b7c87 Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 11:03:40 -0700
Subject: [PATCH 04/15] fix: Add file-based healthcheck and move import to
 top-level

Add Docker healthcheck for taskworker in devservices config using
the /tmp/health file that TaskWorker maintains. Move json import
out of while loop body in e2e tests.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 devservices/config.yml     | 6 ++++++
 tests/e2e/test_e2e_flow.py | 3 +--
 2 files changed, 7 insertions(+), 2 deletions(-)

diff --git a/devservices/config.yml b/devservices/config.yml
index ff8c0766..39dc098c 100644
--- a/devservices/config.yml
+++ b/devservices/config.yml
@@ -27,6 +27,12 @@ services:
       LAUNCHPAD_RPC_SHARED_SECRET: "launchpad-also-very-long-value-haha"
       LAUNCHPAD_WORKER_RPC_HOST: "host.docker.internal:50051"
       LAUNCHPAD_WORKER_CONCURRENCY: "1"
+    healthcheck:
+      test: ["CMD-SHELL", "[ -f /tmp/health ]"]
+      interval: 10s
+      timeout: 5s
+      retries: 3
+      start_period: 15s
     platform: linux/amd64
     extra_hosts:
       host.docker.internal: host-gateway
diff --git a/tests/e2e/test_e2e_flow.py b/tests/e2e/test_e2e_flow.py
index d21ecf17..c081192d 100644
--- a/tests/e2e/test_e2e_flow.py
+++ b/tests/e2e/test_e2e_flow.py
@@ -5,6 +5,7 @@
 TaskWorker-based triggering instead of Kafka.
 """
 
+import json
 import os
 import time
 
@@ -58,8 +59,6 @@ def wait_for_processing(artifact_id: str, timeout: int = 120, check_interval: in
                 print(f"[OK] Processing completed for {artifact_id}")
                 return results
 
-            import json
-
             current_status = json.dumps(results, sort_keys=True)
             if current_status != last_status:
                 print(f"  Waiting for processing... (results so far: {results})")

From 3f2795dda2a408456807818987e601de72ba5d4b Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 11:04:18 -0700
Subject: [PATCH 05/15] fix: Add file-based healthcheck to e2e compose
 launchpad service

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 docker-compose.e2e.yml | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/docker-compose.e2e.yml b/docker-compose.e2e.yml
index 3f00fed9..6f3d3648 100644
--- a/docker-compose.e2e.yml
+++ b/docker-compose.e2e.yml
@@ -62,6 +62,12 @@ services:
       LAUNCHPAD_WORKER_RPC_HOST: "host.docker.internal:50051"
       LAUNCHPAD_WORKER_CONCURRENCY: "1"
       SENTRY_DSN: ""
+    healthcheck:
+      test: ["CMD-SHELL", "[ -f /tmp/health ]"]
+      interval: 10s
+      timeout: 5s
+      retries: 3
+      start_period: 15s
     depends_on:
       mock-sentry-api:
         condition: service_healthy

From 790136b1c642df5c5be5f043746a103055d75c03 Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 11:28:32 -0700
Subject: [PATCH 06/15] feat: Rewrite e2e tests for TaskWorker mode
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Replace Kafka consumer e2e setup with fully self-contained
TaskBroker-based infrastructure:

- Kafka (KRaft mode, no Zookeeper dependency)
- TaskBroker (ghcr.io/getsentry/taskbroker:nightly)
- Launchpad worker connecting via gRPC
- Test runner dispatches tasks via process_artifact.delay()

No devservices dependency needed — all infra is in docker-compose.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 .github/workflows/ci.yml         |  68 ++++++++-
 docker-compose.e2e.yml           |  70 ++++++++--
 tests/e2e/Dockerfile.test-runner |  14 +-
 tests/e2e/test_e2e_flow.py       | 229 ++++++++++++++++++++++++++++---
 4 files changed, 350 insertions(+), 31 deletions(-)

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index a4f1d938..7a32c1c2 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -80,9 +80,75 @@ jobs:
             -e LAUNCHPAD_ENV=development \
             launchpad-test --help
 
+  e2e:
+    runs-on: ubuntu-latest
+    steps:
+      - name: Checkout code
+        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6
+
+      - name: Build E2E Docker images
+        run: docker compose -f docker-compose.e2e.yml build
+
+      - name: Start E2E services
+        run: |
+          docker compose -f docker-compose.e2e.yml up -d kafka
+          echo "Waiting for Kafka to be healthy..."
+          for i in {1..30}; do
+            if docker compose -f docker-compose.e2e.yml ps kafka | grep -q "healthy"; then
+              echo "Kafka is ready!"
+              break
+            fi
+            echo "Waiting for Kafka... attempt $i/30"
+            sleep 3
+          done
+
+          docker compose -f docker-compose.e2e.yml up -d taskbroker minio mock-sentry-api
+          echo "Waiting for mock-sentry-api to be healthy..."
+          for i in {1..20}; do
+            if docker compose -f docker-compose.e2e.yml ps mock-sentry-api | grep -q "healthy"; then
+              echo "Mock Sentry API is ready!"
+              break
+            fi
+            echo "Waiting for Mock API... attempt $i/20"
+            sleep 3
+          done
+
+          docker compose -f docker-compose.e2e.yml up -d launchpad
+          echo "Waiting for Launchpad worker to be healthy..."
+          for i in {1..30}; do
+            if docker compose -f docker-compose.e2e.yml ps launchpad | grep -q "healthy"; then
+              echo "Launchpad is ready!"
+              break
+            fi
+            echo "Waiting for Launchpad... attempt $i/30"
+            sleep 5
+          done
+
+          docker compose -f docker-compose.e2e.yml ps
+
+      - name: Run E2E tests
+        run: docker compose -f docker-compose.e2e.yml run --rm e2e-tests
+        timeout-minutes: 10
+
+      - name: Show service logs on failure
+        if: failure()
+        run: |
+          echo "=== Launchpad logs ==="
+          docker compose -f docker-compose.e2e.yml logs launchpad
+          echo "=== TaskBroker logs ==="
+          docker compose -f docker-compose.e2e.yml logs taskbroker
+          echo "=== Mock API logs ==="
+          docker compose -f docker-compose.e2e.yml logs mock-sentry-api
+          echo "=== Kafka logs ==="
+          docker compose -f docker-compose.e2e.yml logs kafka
+
+      - name: Cleanup E2E environment
+        if: always()
+        run: docker compose -f docker-compose.e2e.yml down -v
+
   build:
     runs-on: ubuntu-latest
-    needs: [check, test]
+    needs: [check, test, e2e]
 
     steps:
       - name: Checkout code
diff --git a/docker-compose.e2e.yml b/docker-compose.e2e.yml
index 6f3d3648..1d14c04d 100644
--- a/docker-compose.e2e.yml
+++ b/docker-compose.e2e.yml
@@ -1,6 +1,50 @@
-# E2E test setup for Launchpad
+# E2E test setup for Launchpad (fully self-contained, no devservices needed)
 
 services:
+  # Kafka (KRaft mode, no Zookeeper)
+  kafka:
+    image: confluentinc/cp-kafka:7.7.1
+    environment:
+      KAFKA_NODE_ID: 1
+      KAFKA_LISTENER_SECURITY_PROTOCOL_MAP: CONTROLLER:PLAINTEXT,PLAINTEXT:PLAINTEXT
+      KAFKA_LISTENERS: PLAINTEXT://0.0.0.0:9092,CONTROLLER://0.0.0.0:9093
+      KAFKA_ADVERTISED_LISTENERS: PLAINTEXT://kafka:9092
+      KAFKA_CONTROLLER_QUORUM_VOTERS: 1@kafka:9093
+      KAFKA_CONTROLLER_LISTENER_NAMES: CONTROLLER
+      KAFKA_PROCESS_ROLES: broker,controller
+      CLUSTER_ID: e2e-test-cluster-id-001
+      KAFKA_OFFSETS_TOPIC_REPLICATION_FACTOR: 1
+      KAFKA_TRANSACTION_STATE_LOG_REPLICATION_FACTOR: 1
+      KAFKA_TRANSACTION_STATE_LOG_MIN_ISR: 1
+      KAFKA_LOG_RETENTION_HOURS: 1
+    healthcheck:
+      test: ["CMD", "kafka-topics", "--bootstrap-server", "localhost:9092", "--list"]
+      interval: 10s
+      timeout: 10s
+      retries: 5
+      start_period: 20s
+    networks:
+      - launchpad-e2e
+
+  # TaskBroker (gRPC bridge between Kafka and workers)
+  taskbroker:
+    image: ghcr.io/getsentry/taskbroker:nightly
+    environment:
+      TASKBROKER_KAFKA_CLUSTER: "kafka:9092"
+      TASKBROKER_KAFKA_TOPIC: "taskworker-launchpad"
+      TASKBROKER_KAFKA_DEADLETTER_TOPIC: "taskworker-launchpad-dlq"
+      TASKBROKER_KAFKA_CONSUMER_GROUP: "taskbroker-launchpad"
+      TASKBROKER_CREATE_MISSING_TOPICS: "true"
+      TASKBROKER_GRPC_SHARED_SECRET: "test-secret-key-for-e2e"
+    ports:
+      - "127.0.0.1:50051:50051"
+    depends_on:
+      kafka:
+        condition: service_healthy
+    platform: linux/amd64
+    networks:
+      - launchpad-e2e
+
   # MinIO for ObjectStore (S3-compatible)
   minio:
     image: minio/minio:latest
@@ -46,7 +90,7 @@ services:
     networks:
       - launchpad-e2e
 
-  # Launchpad service
+  # Launchpad worker (connects to TaskBroker via gRPC)
   launchpad:
     build:
       context: .
@@ -59,36 +103,42 @@ services:
       SENTRY_BASE_URL: "http://mock-sentry-api:8000"
       OBJECTSTORE_URL: "http://minio:9000"
       LAUNCHPAD_RPC_SHARED_SECRET: "test-secret-key-for-e2e"
-      LAUNCHPAD_WORKER_RPC_HOST: "host.docker.internal:50051"
+      TASKWORKER_SHARED_SECRET: "test-secret-key-for-e2e"
+      LAUNCHPAD_WORKER_RPC_HOST: "taskbroker:50051"
       LAUNCHPAD_WORKER_CONCURRENCY: "1"
+      KAFKA_BOOTSTRAP_SERVERS: "kafka:9092"
+      TASKWORKER_TOPIC: "taskworker-launchpad"
       SENTRY_DSN: ""
     healthcheck:
       test: ["CMD-SHELL", "[ -f /tmp/health ]"]
       interval: 10s
       timeout: 5s
-      retries: 3
-      start_period: 15s
+      retries: 5
+      start_period: 30s
     depends_on:
+      taskbroker:
+        condition: service_started
       mock-sentry-api:
         condition: service_healthy
-    extra_hosts:
-      host.docker.internal: host-gateway
     networks:
       - launchpad-e2e
 
-  # Test orchestrator
+  # Test runner (dispatches tasks via taskbroker-client)
   e2e-tests:
     build:
       context: .
       dockerfile: tests/e2e/Dockerfile.test-runner
     environment:
       MOCK_API_URL: "http://mock-sentry-api:8000"
-      LAUNCHPAD_URL: "http://launchpad:2218"
       MINIO_ENDPOINT: "http://minio:9000"
       MINIO_ACCESS_KEY: "minioadmin"
       MINIO_SECRET_KEY: "minioadmin"
-      LAUNCHPAD_RPC_SHARED_SECRET: "test-secret-key-for-e2e"
+      KAFKA_BOOTSTRAP_SERVERS: "kafka:9092"
+      TASKWORKER_TOPIC: "taskworker-launchpad"
+      TASKWORKER_SHARED_SECRET: "test-secret-key-for-e2e"
     depends_on:
+      launchpad:
+        condition: service_healthy
       mock-sentry-api:
         condition: service_healthy
     volumes:
diff --git a/tests/e2e/Dockerfile.test-runner b/tests/e2e/Dockerfile.test-runner
index b48d4c0d..3529d384 100644
--- a/tests/e2e/Dockerfile.test-runner
+++ b/tests/e2e/Dockerfile.test-runner
@@ -2,7 +2,7 @@ FROM python:3.13-slim
 
 WORKDIR /app
 
-# Install system dependencies including build tools for confluent-kafka
+# Install system dependencies (librdkafka needed by confluent-kafka via taskbroker-client)
 RUN apt-get update && apt-get install -y --no-install-recommends \
     curl \
     gcc \
@@ -13,11 +13,19 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
 # Install Python test dependencies
 RUN pip install --no-cache-dir \
     pytest==8.3.3 \
-    pytest-asyncio==0.24.0 \
-    confluent-kafka==2.5.3 \
     requests==2.32.3 \
     boto3==1.35.0
 
+# Install launchpad package (gives us process_artifact.delay() via taskbroker-client)
+COPY requirements.txt /tmp/requirements.txt
+RUN pip install --no-cache-dir -r /tmp/requirements.txt
+
+COPY src/ /tmp/src/
+COPY pyproject.toml /tmp/pyproject.toml
+COPY README.md /tmp/README.md
+COPY LICENSE /tmp/LICENSE
+RUN pip install --no-cache-dir /tmp/
+
 # Copy only E2E test files (not the main test suite)
 # Copy to root to avoid pytest finding parent conftest.py
 COPY tests/e2e /app/e2e_tests
diff --git a/tests/e2e/test_e2e_flow.py b/tests/e2e/test_e2e_flow.py
index c081192d..d6719cb0 100644
--- a/tests/e2e/test_e2e_flow.py
+++ b/tests/e2e/test_e2e_flow.py
@@ -1,8 +1,10 @@
-"""End-to-end tests for Launchpad service.
+"""End-to-end tests for Launchpad service via TaskWorker.
 
-These tests require the E2E Docker Compose environment to be running.
-The full artifact processing flow tests need to be updated to use
-TaskWorker-based triggering instead of Kafka.
+Tests the full flow:
+1. Upload test artifact to mock API
+2. Dispatch task via taskbroker-client (process_artifact.delay())
+3. Wait for Launchpad worker to process
+4. Verify results via mock API
 """
 
 import json
@@ -12,10 +14,10 @@
 from pathlib import Path
 from typing import Any, Dict
 
+import pytest
 import requests
 
 MOCK_API_URL = os.getenv("MOCK_API_URL", "http://mock-sentry-api:8000")
-LAUNCHPAD_URL = os.getenv("LAUNCHPAD_URL", "http://launchpad:2218")
 
 FIXTURES_DIR = Path("/app/fixtures")
 IOS_FIXTURE = FIXTURES_DIR / "ios" / "HackerNews.xcarchive.zip"
@@ -23,18 +25,15 @@
 ANDROID_AAB_FIXTURE = FIXTURES_DIR / "android" / "hn.aab"
 
 
-def wait_for_service(url: str, timeout: int = 60, service_name: str = "service") -> None:
-    start_time = time.time()
-    while time.time() - start_time < timeout:
-        try:
-            response = requests.get(f"{url}/health", timeout=5)
-            if response.status_code == 200:
-                print(f"[OK] {service_name} is healthy")
-                return
-        except requests.exceptions.RequestException:
-            pass
-        time.sleep(2)
-    raise TimeoutError(f"{service_name} did not become healthy within {timeout}s")
+def dispatch_task(artifact_id: str, org: str, project: str) -> None:
+    from launchpad.worker.tasks import process_artifact
+
+    process_artifact.delay(
+        artifact_id=artifact_id,
+        project_id=project,
+        organization_id=org,
+    )
+    print(f"[OK] Dispatched task for artifact {artifact_id}")
 
 
 def upload_artifact_to_mock_api(artifact_id: str, file_path: Path) -> None:
@@ -76,3 +75,199 @@ def get_size_analysis_raw(artifact_id: str) -> Dict[str, Any]:
     response = requests.get(f"{MOCK_API_URL}/test/results/{artifact_id}/size-analysis-raw", timeout=10)
     response.raise_for_status()
     return response.json()
+
+
+class TestE2EFlow:
+    @classmethod
+    def setup_class(cls):
+        print("\n=== Waiting for services to be ready ===")
+
+        start_time = time.time()
+        while time.time() - start_time < 60:
+            try:
+                response = requests.get(f"{MOCK_API_URL}/health", timeout=5)
+                if response.status_code == 200:
+                    print("[OK] Mock Sentry API is healthy")
+                    break
+            except requests.exceptions.RequestException:
+                pass
+            time.sleep(2)
+        else:
+            raise TimeoutError("Mock Sentry API did not become healthy within 60s")
+
+        print("=== All services ready ===\n")
+
+    def test_ios_xcarchive_full_flow(self):
+        if not IOS_FIXTURE.exists():
+            pytest.skip(f"iOS fixture not found: {IOS_FIXTURE}")
+
+        artifact_id = "test-ios-001"
+        org = "test-org"
+        project = "test-ios-project"
+
+        print("\n=== Testing iOS .xcarchive.zip E2E flow ===")
+
+        upload_artifact_to_mock_api(artifact_id, IOS_FIXTURE)
+        dispatch_task(artifact_id, org, project)
+        results = wait_for_processing(artifact_id, timeout=180)
+
+        print("\n=== Verifying results ===")
+
+        assert results["artifact_metadata"], "Artifact metadata should be updated"
+        metadata = results["artifact_metadata"]
+
+        assert metadata["app_name"] == "HackerNews"
+        assert metadata["app_id"] == "com.emergetools.hackernews"
+        assert metadata["build_version"] == "3.8"
+        assert metadata["build_number"] == 1
+        assert metadata["artifact_type"] == 0
+
+        assert "apple_app_info" in metadata
+        apple_info = metadata["apple_app_info"]
+        assert apple_info["is_simulator"] is False
+        assert apple_info["codesigning_type"] == "development"
+        assert apple_info["build_date"] == "2025-05-19T16:15:12"
+        assert apple_info["is_code_signature_valid"] is True
+        assert apple_info["main_binary_uuid"] == "BEB3C0D6-2518-343D-BB6F-FF5581C544E8"
+
+        assert results["has_size_analysis_file"], "Size analysis file should be uploaded"
+
+        size_analysis = get_size_analysis_raw(artifact_id)
+        assert size_analysis["download_size"] == 6502319
+
+        treemap = size_analysis["treemap"]
+        assert treemap["platform"] == "ios"
+        assert treemap["root"]["name"] == "HackerNews"
+        assert treemap["root"]["size"] == 9728000
+        assert treemap["root"]["is_dir"] is True
+        assert len(treemap["root"]["children"]) > 0
+
+        insights = size_analysis["insights"]
+        assert "duplicate_files" in insights
+        assert insights["duplicate_files"]["total_savings"] > 0
+        assert len(insights["duplicate_files"]["groups"]) > 0
+
+        assert "image_optimization" in insights
+        assert insights["image_optimization"]["total_savings"] > 0
+        assert len(insights["image_optimization"]["optimizable_files"]) > 0
+
+        assert "main_binary_exported_symbols" in insights
+        assert insights["main_binary_exported_symbols"]["total_savings"] > 0
+
+        print("[OK] iOS E2E test passed!")
+
+    def test_android_apk_full_flow(self):
+        if not ANDROID_APK_FIXTURE.exists():
+            pytest.skip(f"Android APK fixture not found: {ANDROID_APK_FIXTURE}")
+
+        artifact_id = "test-android-apk-001"
+        org = "test-org"
+        project = "test-android-project"
+
+        print("\n=== Testing Android .apk E2E flow ===")
+
+        upload_artifact_to_mock_api(artifact_id, ANDROID_APK_FIXTURE)
+        dispatch_task(artifact_id, org, project)
+        results = wait_for_processing(artifact_id, timeout=180)
+
+        print("\n=== Verifying results ===")
+
+        assert results["artifact_metadata"], "Artifact metadata should be updated"
+        metadata = results["artifact_metadata"]
+
+        assert metadata["app_name"] == "Hacker News"
+        assert metadata["app_id"] == "com.emergetools.hackernews"
+        assert metadata["artifact_type"] == 2
+
+        assert "android_app_info" in metadata
+        android_info = metadata["android_app_info"]
+        assert android_info["has_proguard_mapping"] is False
+
+        assert results["has_size_analysis_file"], "Size analysis file should be uploaded"
+
+        size_analysis = get_size_analysis_raw(artifact_id)
+        assert size_analysis["download_size"] == 3670839
+
+        treemap = size_analysis["treemap"]
+        assert treemap["platform"] == "android"
+        assert treemap["root"]["name"] == "Hacker News"
+        assert treemap["root"]["size"] == 7886041
+        assert treemap["root"]["is_dir"] is True
+        assert len(treemap["root"]["children"]) == 14
+
+        insights = size_analysis["insights"]
+        assert "duplicate_files" in insights
+        assert insights["duplicate_files"]["total_savings"] == 51709
+        assert len(insights["duplicate_files"]["groups"]) > 0
+
+        assert "multiple_native_library_archs" in insights
+        assert insights["multiple_native_library_archs"]["total_savings"] == 1891208
+
+        print("[OK] Android APK E2E test passed!")
+
+    def test_android_aab_full_flow(self):
+        if not ANDROID_AAB_FIXTURE.exists():
+            pytest.skip(f"Android AAB fixture not found: {ANDROID_AAB_FIXTURE}")
+
+        artifact_id = "test-android-aab-001"
+        org = "test-org"
+        project = "test-android-project"
+
+        print("\n=== Testing Android .aab E2E flow ===")
+
+        upload_artifact_to_mock_api(artifact_id, ANDROID_AAB_FIXTURE)
+        dispatch_task(artifact_id, org, project)
+        results = wait_for_processing(artifact_id, timeout=180)
+
+        print("\n=== Verifying results ===")
+
+        assert results["artifact_metadata"], "Artifact metadata should be updated"
+        metadata = results["artifact_metadata"]
+
+        assert metadata["app_name"] == "Hacker News"
+        assert metadata["app_id"] == "com.emergetools.hackernews"
+        assert metadata["build_version"] == "1.0.2"
+        assert metadata["build_number"] == 13
+        assert metadata["artifact_type"] == 1
+
+        assert "android_app_info" in metadata
+        android_info = metadata["android_app_info"]
+        assert android_info["has_proguard_mapping"] is True
+
+        assert results["has_size_analysis_file"], "Size analysis file should be uploaded"
+
+        size_analysis = get_size_analysis_raw(artifact_id)
+        assert size_analysis["download_size"] > 0
+
+        treemap = size_analysis["treemap"]
+        assert treemap["platform"] == "android"
+        assert treemap["root"]["name"] == "Hacker News"
+        assert treemap["root"]["size"] == 5932249
+        assert treemap["root"]["is_dir"] is True
+        assert len(treemap["root"]["children"]) == 14
+
+        insights = size_analysis["insights"]
+        assert "duplicate_files" in insights
+        assert insights["duplicate_files"]["total_savings"] >= 0
+        assert "groups" in insights["duplicate_files"]
+
+        print("[OK] Android AAB E2E test passed!")
+
+    def test_nonexistent_artifact_error_handling(self):
+        artifact_id = "test-nonexistent-artifact"
+        org = "test-org"
+        project = "test-project"
+
+        print("\n=== Testing non-existent artifact error handling ===")
+
+        dispatch_task(artifact_id, org, project)
+
+        time.sleep(15)
+
+        response = requests.get(f"{MOCK_API_URL}/test/results/{artifact_id}", timeout=10)
+        response.raise_for_status()
+        results = response.json()
+
+        assert not results["has_size_analysis_file"], "Should not have size analysis for non-existent artifact"
+
+        print("[OK] Non-existent artifact handled correctly")

From 08f0fbeaa2c346c03172bebda7635dd4a2d0c692 Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 11:49:29 -0700
Subject: [PATCH 07/15] fix: Fix e2e docker-compose config issues

- Remove external port mapping for taskbroker (only needed internally)
- Use JSON array format for TASKBROKER_GRPC_SHARED_SECRET (Vec<String>)
- Use JSON array format for TASKWORKER_SHARED_SECRET (parsed by orjson)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 docker-compose.e2e.yml | 8 +++-----
 1 file changed, 3 insertions(+), 5 deletions(-)

diff --git a/docker-compose.e2e.yml b/docker-compose.e2e.yml
index 1d14c04d..773a1a78 100644
--- a/docker-compose.e2e.yml
+++ b/docker-compose.e2e.yml
@@ -35,9 +35,7 @@ services:
       TASKBROKER_KAFKA_DEADLETTER_TOPIC: "taskworker-launchpad-dlq"
       TASKBROKER_KAFKA_CONSUMER_GROUP: "taskbroker-launchpad"
       TASKBROKER_CREATE_MISSING_TOPICS: "true"
-      TASKBROKER_GRPC_SHARED_SECRET: "test-secret-key-for-e2e"
-    ports:
-      - "127.0.0.1:50051:50051"
+      TASKBROKER_GRPC_SHARED_SECRET: '["test-secret-key-for-e2e"]'
     depends_on:
       kafka:
         condition: service_healthy
@@ -103,7 +101,7 @@ services:
       SENTRY_BASE_URL: "http://mock-sentry-api:8000"
       OBJECTSTORE_URL: "http://minio:9000"
       LAUNCHPAD_RPC_SHARED_SECRET: "test-secret-key-for-e2e"
-      TASKWORKER_SHARED_SECRET: "test-secret-key-for-e2e"
+      TASKWORKER_SHARED_SECRET: '["test-secret-key-for-e2e"]'
       LAUNCHPAD_WORKER_RPC_HOST: "taskbroker:50051"
       LAUNCHPAD_WORKER_CONCURRENCY: "1"
       KAFKA_BOOTSTRAP_SERVERS: "kafka:9092"
@@ -135,7 +133,7 @@ services:
       MINIO_SECRET_KEY: "minioadmin"
       KAFKA_BOOTSTRAP_SERVERS: "kafka:9092"
       TASKWORKER_TOPIC: "taskworker-launchpad"
-      TASKWORKER_SHARED_SECRET: "test-secret-key-for-e2e"
+      TASKWORKER_SHARED_SECRET: '["test-secret-key-for-e2e"]'
     depends_on:
       launchpad:
         condition: service_healthy

From 41bc6fff698fecc4cae807d8c90fefb6708b9780 Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 12:19:18 -0700
Subject: [PATCH 08/15] fix(e2e): Increase timeouts and max_child_task_count
 for TaskWorker

iOS analysis takes ~3 minutes, which was right at the 180s timeout
boundary. Increase test timeout to 360s and CI timeout to 30 minutes.
Bump LAUNCHPAD_WORKER_MAX_CHILD_TASK_COUNT to 10 so the child process
doesn't restart between tasks unnecessarily.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 .github/workflows/ci.yml   | 2 +-
 docker-compose.e2e.yml     | 1 +
 tests/e2e/test_e2e_flow.py | 6 +++---
 3 files changed, 5 insertions(+), 4 deletions(-)

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 7a32c1c2..a12b30b0 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -128,7 +128,7 @@ jobs:
 
       - name: Run E2E tests
         run: docker compose -f docker-compose.e2e.yml run --rm e2e-tests
-        timeout-minutes: 10
+        timeout-minutes: 30
 
       - name: Show service logs on failure
         if: failure()
diff --git a/docker-compose.e2e.yml b/docker-compose.e2e.yml
index 773a1a78..19afdf44 100644
--- a/docker-compose.e2e.yml
+++ b/docker-compose.e2e.yml
@@ -104,6 +104,7 @@ services:
       TASKWORKER_SHARED_SECRET: '["test-secret-key-for-e2e"]'
       LAUNCHPAD_WORKER_RPC_HOST: "taskbroker:50051"
       LAUNCHPAD_WORKER_CONCURRENCY: "1"
+      LAUNCHPAD_WORKER_MAX_CHILD_TASK_COUNT: "10"
       KAFKA_BOOTSTRAP_SERVERS: "kafka:9092"
       TASKWORKER_TOPIC: "taskworker-launchpad"
       SENTRY_DSN: ""
diff --git a/tests/e2e/test_e2e_flow.py b/tests/e2e/test_e2e_flow.py
index d6719cb0..ef4aa1f2 100644
--- a/tests/e2e/test_e2e_flow.py
+++ b/tests/e2e/test_e2e_flow.py
@@ -109,7 +109,7 @@ def test_ios_xcarchive_full_flow(self):
 
         upload_artifact_to_mock_api(artifact_id, IOS_FIXTURE)
         dispatch_task(artifact_id, org, project)
-        results = wait_for_processing(artifact_id, timeout=180)
+        results = wait_for_processing(artifact_id, timeout=360)
 
         print("\n=== Verifying results ===")
 
@@ -168,7 +168,7 @@ def test_android_apk_full_flow(self):
 
         upload_artifact_to_mock_api(artifact_id, ANDROID_APK_FIXTURE)
         dispatch_task(artifact_id, org, project)
-        results = wait_for_processing(artifact_id, timeout=180)
+        results = wait_for_processing(artifact_id, timeout=360)
 
         print("\n=== Verifying results ===")
 
@@ -217,7 +217,7 @@ def test_android_aab_full_flow(self):
 
         upload_artifact_to_mock_api(artifact_id, ANDROID_AAB_FIXTURE)
         dispatch_task(artifact_id, org, project)
-        results = wait_for_processing(artifact_id, timeout=180)
+        results = wait_for_processing(artifact_id, timeout=360)
 
         print("\n=== Verifying results ===")
 

From ab64fe81881aa8b13dce278705e7517366253002 Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 12:49:56 -0700
Subject: [PATCH 09/15] fix(e2e): Mark iOS/AAB tests as slow, run all on CI

iOS analysis (LIEF + insights) takes ~6 min and AAB (bundletool)
takes several minutes. Mark these as @pytest.mark.slow so local
`make test-e2e` runs only fast tests (APK + error handling, ~23s).

CI runs all tests including slow ones with 600s timeouts.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 .github/workflows/ci.yml   |   2 +-
 docker-compose.e2e.yml     |   2 +-
 tests/e2e/conftest.py      |   7 +-
 tests/e2e/test_e2e_flow.py | 171 +++++++++++++------------------------
 4 files changed, 66 insertions(+), 116 deletions(-)

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index a12b30b0..d49bdc46 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -127,7 +127,7 @@ jobs:
           docker compose -f docker-compose.e2e.yml ps
 
       - name: Run E2E tests
-        run: docker compose -f docker-compose.e2e.yml run --rm e2e-tests
+        run: docker compose -f docker-compose.e2e.yml run --rm e2e-tests pytest e2e_tests/test_e2e_flow.py -v --tb=short
         timeout-minutes: 30
 
       - name: Show service logs on failure
diff --git a/docker-compose.e2e.yml b/docker-compose.e2e.yml
index 19afdf44..89f8844b 100644
--- a/docker-compose.e2e.yml
+++ b/docker-compose.e2e.yml
@@ -142,7 +142,7 @@ services:
         condition: service_healthy
     volumes:
       - ./tests/e2e/results:/app/results
-    command: pytest e2e_tests/test_e2e_flow.py -v --tb=short
+    command: pytest e2e_tests/test_e2e_flow.py -v --tb=short -m "not slow"
     networks:
       - launchpad-e2e
 
diff --git a/tests/e2e/conftest.py b/tests/e2e/conftest.py
index c1cf8b7d..a1c5f113 100644
--- a/tests/e2e/conftest.py
+++ b/tests/e2e/conftest.py
@@ -1,11 +1,12 @@
-"""Conftest for E2E tests - overrides main conftest to avoid importing launchpad."""
-
 import os
 
 import pytest
 
 
+def pytest_configure(config):
+    config.addinivalue_line("markers", "slow: marks tests as slow (iOS/AAB analysis takes several minutes)")
+
+
 @pytest.fixture(scope="session", autouse=True)
 def setup_test_environment():
-    """Set up test environment variables for E2E tests."""
     os.environ.setdefault("LAUNCHPAD_ENV", "e2e-test")
diff --git a/tests/e2e/test_e2e_flow.py b/tests/e2e/test_e2e_flow.py
index ef4aa1f2..dd0679aa 100644
--- a/tests/e2e/test_e2e_flow.py
+++ b/tests/e2e/test_e2e_flow.py
@@ -5,6 +5,10 @@
 2. Dispatch task via taskbroker-client (process_artifact.delay())
 3. Wait for Launchpad worker to process
 4. Verify results via mock API
+
+iOS and AAB tests are marked slow because they involve heavy analysis
+(LIEF binary parsing, bundletool) that takes several minutes on CI.
+Run with `pytest -m ""` or `pytest -m slow` to include them.
 """
 
 import json
@@ -97,65 +101,6 @@ def setup_class(cls):
 
         print("=== All services ready ===\n")
 
-    def test_ios_xcarchive_full_flow(self):
-        if not IOS_FIXTURE.exists():
-            pytest.skip(f"iOS fixture not found: {IOS_FIXTURE}")
-
-        artifact_id = "test-ios-001"
-        org = "test-org"
-        project = "test-ios-project"
-
-        print("\n=== Testing iOS .xcarchive.zip E2E flow ===")
-
-        upload_artifact_to_mock_api(artifact_id, IOS_FIXTURE)
-        dispatch_task(artifact_id, org, project)
-        results = wait_for_processing(artifact_id, timeout=360)
-
-        print("\n=== Verifying results ===")
-
-        assert results["artifact_metadata"], "Artifact metadata should be updated"
-        metadata = results["artifact_metadata"]
-
-        assert metadata["app_name"] == "HackerNews"
-        assert metadata["app_id"] == "com.emergetools.hackernews"
-        assert metadata["build_version"] == "3.8"
-        assert metadata["build_number"] == 1
-        assert metadata["artifact_type"] == 0
-
-        assert "apple_app_info" in metadata
-        apple_info = metadata["apple_app_info"]
-        assert apple_info["is_simulator"] is False
-        assert apple_info["codesigning_type"] == "development"
-        assert apple_info["build_date"] == "2025-05-19T16:15:12"
-        assert apple_info["is_code_signature_valid"] is True
-        assert apple_info["main_binary_uuid"] == "BEB3C0D6-2518-343D-BB6F-FF5581C544E8"
-
-        assert results["has_size_analysis_file"], "Size analysis file should be uploaded"
-
-        size_analysis = get_size_analysis_raw(artifact_id)
-        assert size_analysis["download_size"] == 6502319
-
-        treemap = size_analysis["treemap"]
-        assert treemap["platform"] == "ios"
-        assert treemap["root"]["name"] == "HackerNews"
-        assert treemap["root"]["size"] == 9728000
-        assert treemap["root"]["is_dir"] is True
-        assert len(treemap["root"]["children"]) > 0
-
-        insights = size_analysis["insights"]
-        assert "duplicate_files" in insights
-        assert insights["duplicate_files"]["total_savings"] > 0
-        assert len(insights["duplicate_files"]["groups"]) > 0
-
-        assert "image_optimization" in insights
-        assert insights["image_optimization"]["total_savings"] > 0
-        assert len(insights["image_optimization"]["optimizable_files"]) > 0
-
-        assert "main_binary_exported_symbols" in insights
-        assert insights["main_binary_exported_symbols"]["total_savings"] > 0
-
-        print("[OK] iOS E2E test passed!")
-
     def test_android_apk_full_flow(self):
         if not ANDROID_APK_FIXTURE.exists():
             pytest.skip(f"Android APK fixture not found: {ANDROID_APK_FIXTURE}")
@@ -164,15 +109,11 @@ def test_android_apk_full_flow(self):
         org = "test-org"
         project = "test-android-project"
 
-        print("\n=== Testing Android .apk E2E flow ===")
-
         upload_artifact_to_mock_api(artifact_id, ANDROID_APK_FIXTURE)
         dispatch_task(artifact_id, org, project)
-        results = wait_for_processing(artifact_id, timeout=360)
+        results = wait_for_processing(artifact_id, timeout=120)
 
-        print("\n=== Verifying results ===")
-
-        assert results["artifact_metadata"], "Artifact metadata should be updated"
+        assert results["artifact_metadata"]
         metadata = results["artifact_metadata"]
 
         assert metadata["app_name"] == "Hacker News"
@@ -180,10 +121,9 @@ def test_android_apk_full_flow(self):
         assert metadata["artifact_type"] == 2
 
         assert "android_app_info" in metadata
-        android_info = metadata["android_app_info"]
-        assert android_info["has_proguard_mapping"] is False
+        assert metadata["android_app_info"]["has_proguard_mapping"] is False
 
-        assert results["has_size_analysis_file"], "Size analysis file should be uploaded"
+        assert results["has_size_analysis_file"]
 
         size_analysis = get_size_analysis_raw(artifact_id)
         assert size_analysis["download_size"] == 3670839
@@ -203,25 +143,66 @@ def test_android_apk_full_flow(self):
         assert "multiple_native_library_archs" in insights
         assert insights["multiple_native_library_archs"]["total_savings"] == 1891208
 
-        print("[OK] Android APK E2E test passed!")
+    def test_nonexistent_artifact_error_handling(self):
+        artifact_id = "test-nonexistent-artifact"
+
+        dispatch_task(artifact_id, "test-org", "test-project")
+        time.sleep(15)
+
+        response = requests.get(f"{MOCK_API_URL}/test/results/{artifact_id}", timeout=10)
+        response.raise_for_status()
+        results = response.json()
+
+        assert not results["has_size_analysis_file"]
+
+    @pytest.mark.slow
+    def test_ios_xcarchive_full_flow(self):
+        if not IOS_FIXTURE.exists():
+            pytest.skip(f"iOS fixture not found: {IOS_FIXTURE}")
+
+        artifact_id = "test-ios-001"
+
+        upload_artifact_to_mock_api(artifact_id, IOS_FIXTURE)
+        dispatch_task(artifact_id, "test-org", "test-ios-project")
+        results = wait_for_processing(artifact_id, timeout=600)
+
+        assert results["artifact_metadata"]
+        metadata = results["artifact_metadata"]
+
+        assert metadata["app_name"] == "HackerNews"
+        assert metadata["app_id"] == "com.emergetools.hackernews"
+        assert metadata["build_version"] == "3.8"
+        assert metadata["build_number"] == 1
+        assert metadata["artifact_type"] == 0
+
+        assert "apple_app_info" in metadata
+        apple_info = metadata["apple_app_info"]
+        assert apple_info["is_simulator"] is False
+        assert apple_info["codesigning_type"] == "development"
+        assert apple_info["is_code_signature_valid"] is True
+
+        assert results["has_size_analysis_file"]
+
+        size_analysis = get_size_analysis_raw(artifact_id)
+        assert size_analysis["download_size"] == 6502319
+
+        treemap = size_analysis["treemap"]
+        assert treemap["platform"] == "ios"
+        assert treemap["root"]["name"] == "HackerNews"
+        assert treemap["root"]["size"] == 9728000
 
+    @pytest.mark.slow
     def test_android_aab_full_flow(self):
         if not ANDROID_AAB_FIXTURE.exists():
             pytest.skip(f"Android AAB fixture not found: {ANDROID_AAB_FIXTURE}")
 
         artifact_id = "test-android-aab-001"
-        org = "test-org"
-        project = "test-android-project"
-
-        print("\n=== Testing Android .aab E2E flow ===")
 
         upload_artifact_to_mock_api(artifact_id, ANDROID_AAB_FIXTURE)
-        dispatch_task(artifact_id, org, project)
-        results = wait_for_processing(artifact_id, timeout=360)
+        dispatch_task(artifact_id, "test-org", "test-android-project")
+        results = wait_for_processing(artifact_id, timeout=600)
 
-        print("\n=== Verifying results ===")
-
-        assert results["artifact_metadata"], "Artifact metadata should be updated"
+        assert results["artifact_metadata"]
         metadata = results["artifact_metadata"]
 
         assert metadata["app_name"] == "Hacker News"
@@ -230,11 +211,7 @@ def test_android_aab_full_flow(self):
         assert metadata["build_number"] == 13
         assert metadata["artifact_type"] == 1
 
-        assert "android_app_info" in metadata
-        android_info = metadata["android_app_info"]
-        assert android_info["has_proguard_mapping"] is True
-
-        assert results["has_size_analysis_file"], "Size analysis file should be uploaded"
+        assert results["has_size_analysis_file"]
 
         size_analysis = get_size_analysis_raw(artifact_id)
         assert size_analysis["download_size"] > 0
@@ -243,31 +220,3 @@ def test_android_aab_full_flow(self):
         assert treemap["platform"] == "android"
         assert treemap["root"]["name"] == "Hacker News"
         assert treemap["root"]["size"] == 5932249
-        assert treemap["root"]["is_dir"] is True
-        assert len(treemap["root"]["children"]) == 14
-
-        insights = size_analysis["insights"]
-        assert "duplicate_files" in insights
-        assert insights["duplicate_files"]["total_savings"] >= 0
-        assert "groups" in insights["duplicate_files"]
-
-        print("[OK] Android AAB E2E test passed!")
-
-    def test_nonexistent_artifact_error_handling(self):
-        artifact_id = "test-nonexistent-artifact"
-        org = "test-org"
-        project = "test-project"
-
-        print("\n=== Testing non-existent artifact error handling ===")
-
-        dispatch_task(artifact_id, org, project)
-
-        time.sleep(15)
-
-        response = requests.get(f"{MOCK_API_URL}/test/results/{artifact_id}", timeout=10)
-        response.raise_for_status()
-        results = response.json()
-
-        assert not results["has_size_analysis_file"], "Should not have size analysis for non-existent artifact"
-
-        print("[OK] Non-existent artifact handled correctly")

From 5fa7c19223b8f73bc75f64ca21a3a60b8bb314f3 Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 13:03:21 -0700
Subject: [PATCH 10/15] perf(e2e): Dispatch all tasks in parallel with
 concurrency=3

Restructure e2e tests to dispatch all artifact tasks upfront in
setup_class, then verify results individually. With worker
concurrency=3, iOS/APK/AAB process simultaneously so total time
is bounded by the slowest artifact (~6 min) rather than the sum.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 docker-compose.e2e.yml     |   2 +-
 tests/e2e/test_e2e_flow.py | 178 ++++++++++++++++++++-----------------
 2 files changed, 98 insertions(+), 82 deletions(-)

diff --git a/docker-compose.e2e.yml b/docker-compose.e2e.yml
index 89f8844b..83fd01de 100644
--- a/docker-compose.e2e.yml
+++ b/docker-compose.e2e.yml
@@ -103,7 +103,7 @@ services:
       LAUNCHPAD_RPC_SHARED_SECRET: "test-secret-key-for-e2e"
       TASKWORKER_SHARED_SECRET: '["test-secret-key-for-e2e"]'
       LAUNCHPAD_WORKER_RPC_HOST: "taskbroker:50051"
-      LAUNCHPAD_WORKER_CONCURRENCY: "1"
+      LAUNCHPAD_WORKER_CONCURRENCY: "3"
       LAUNCHPAD_WORKER_MAX_CHILD_TASK_COUNT: "10"
       KAFKA_BOOTSTRAP_SERVERS: "kafka:9092"
       TASKWORKER_TOPIC: "taskworker-launchpad"
diff --git a/tests/e2e/test_e2e_flow.py b/tests/e2e/test_e2e_flow.py
index dd0679aa..33e80ce7 100644
--- a/tests/e2e/test_e2e_flow.py
+++ b/tests/e2e/test_e2e_flow.py
@@ -1,14 +1,14 @@
 """End-to-end tests for Launchpad service via TaskWorker.
 
 Tests the full flow:
-1. Upload test artifact to mock API
-2. Dispatch task via taskbroker-client (process_artifact.delay())
-3. Wait for Launchpad worker to process
+1. Upload all test artifacts to mock API
+2. Dispatch all tasks via taskbroker-client (process_artifact.delay())
+3. Wait for Launchpad worker to process all artifacts in parallel
 4. Verify results via mock API
 
-iOS and AAB tests are marked slow because they involve heavy analysis
-(LIEF binary parsing, bundletool) that takes several minutes on CI.
-Run with `pytest -m ""` or `pytest -m slow` to include them.
+All artifact tasks are dispatched upfront and processed concurrently
+by the worker (LAUNCHPAD_WORKER_CONCURRENCY=3), so total time is
+bounded by the slowest artifact rather than the sum of all.
 """
 
 import json
@@ -64,11 +64,11 @@ def wait_for_processing(artifact_id: str, timeout: int = 120, check_interval: in
 
             current_status = json.dumps(results, sort_keys=True)
             if current_status != last_status:
-                print(f"  Waiting for processing... (results so far: {results})")
+                print(f"  [{artifact_id}] Waiting... (results so far: {results})")
                 last_status = current_status
 
         except requests.exceptions.RequestException as e:
-            print(f"  Error checking results: {e}")
+            print(f"  [{artifact_id}] Error checking results: {e}")
 
         time.sleep(check_interval)
 
@@ -81,46 +81,44 @@ def get_size_analysis_raw(artifact_id: str) -> Dict[str, Any]:
     return response.json()
 
 
+def wait_for_mock_api(timeout: int = 60) -> None:
+    start_time = time.time()
+    while time.time() - start_time < timeout:
+        try:
+            response = requests.get(f"{MOCK_API_URL}/health", timeout=5)
+            if response.status_code == 200:
+                print("[OK] Mock Sentry API is healthy")
+                return
+        except requests.exceptions.RequestException:
+            pass
+        time.sleep(2)
+    raise TimeoutError("Mock Sentry API did not become healthy within 60s")
+
+
 class TestE2EFlow:
+    """Fast e2e tests — APK processing + error handling.
+
+    These run locally on any architecture since APK analysis is lightweight.
+    """
+
     @classmethod
     def setup_class(cls):
-        print("\n=== Waiting for services to be ready ===")
-
-        start_time = time.time()
-        while time.time() - start_time < 60:
-            try:
-                response = requests.get(f"{MOCK_API_URL}/health", timeout=5)
-                if response.status_code == 200:
-                    print("[OK] Mock Sentry API is healthy")
-                    break
-            except requests.exceptions.RequestException:
-                pass
-            time.sleep(2)
-        else:
-            raise TimeoutError("Mock Sentry API did not become healthy within 60s")
-
-        print("=== All services ready ===\n")
+        wait_for_mock_api()
 
     def test_android_apk_full_flow(self):
         if not ANDROID_APK_FIXTURE.exists():
             pytest.skip(f"Android APK fixture not found: {ANDROID_APK_FIXTURE}")
 
         artifact_id = "test-android-apk-001"
-        org = "test-org"
-        project = "test-android-project"
 
         upload_artifact_to_mock_api(artifact_id, ANDROID_APK_FIXTURE)
-        dispatch_task(artifact_id, org, project)
+        dispatch_task(artifact_id, "test-org", "test-android-project")
         results = wait_for_processing(artifact_id, timeout=120)
 
-        assert results["artifact_metadata"]
         metadata = results["artifact_metadata"]
-
         assert metadata["app_name"] == "Hacker News"
         assert metadata["app_id"] == "com.emergetools.hackernews"
         assert metadata["artifact_type"] == 2
-
-        assert "android_app_info" in metadata
         assert metadata["android_app_info"]["has_proguard_mapping"] is False
 
         assert results["has_size_analysis_file"]
@@ -132,91 +130,109 @@ def test_android_apk_full_flow(self):
         assert treemap["platform"] == "android"
         assert treemap["root"]["name"] == "Hacker News"
         assert treemap["root"]["size"] == 7886041
-        assert treemap["root"]["is_dir"] is True
         assert len(treemap["root"]["children"]) == 14
 
         insights = size_analysis["insights"]
-        assert "duplicate_files" in insights
         assert insights["duplicate_files"]["total_savings"] == 51709
-        assert len(insights["duplicate_files"]["groups"]) > 0
-
-        assert "multiple_native_library_archs" in insights
         assert insights["multiple_native_library_archs"]["total_savings"] == 1891208
 
     def test_nonexistent_artifact_error_handling(self):
-        artifact_id = "test-nonexistent-artifact"
-
-        dispatch_task(artifact_id, "test-org", "test-project")
+        dispatch_task("test-nonexistent-artifact", "test-org", "test-project")
         time.sleep(15)
 
-        response = requests.get(f"{MOCK_API_URL}/test/results/{artifact_id}", timeout=10)
-        response.raise_for_status()
+        response = requests.get(f"{MOCK_API_URL}/test/results/test-nonexistent-artifact", timeout=10)
         results = response.json()
-
         assert not results["has_size_analysis_file"]
 
-    @pytest.mark.slow
-    def test_ios_xcarchive_full_flow(self):
-        if not IOS_FIXTURE.exists():
-            pytest.skip(f"iOS fixture not found: {IOS_FIXTURE}")
 
-        artifact_id = "test-ios-001"
+@pytest.mark.slow
+class TestE2EFlowAllPlatforms:
+    """Full platform e2e tests — dispatches iOS, APK, and AAB in parallel.
+
+    Requires LAUNCHPAD_WORKER_CONCURRENCY>=3 to process concurrently.
+    Total time is bounded by the slowest artifact (~6 min for iOS)
+    rather than the sum of all.
+    """
+
+    @classmethod
+    def setup_class(cls):
+        wait_for_mock_api()
+
+        cls.artifacts = {}
+
+        if ANDROID_APK_FIXTURE.exists():
+            upload_artifact_to_mock_api("test-apk-parallel", ANDROID_APK_FIXTURE)
+            dispatch_task("test-apk-parallel", "test-org", "test-android-project")
+            cls.artifacts["apk"] = "test-apk-parallel"
+
+        if IOS_FIXTURE.exists():
+            upload_artifact_to_mock_api("test-ios-parallel", IOS_FIXTURE)
+            dispatch_task("test-ios-parallel", "test-org", "test-ios-project")
+            cls.artifacts["ios"] = "test-ios-parallel"
+
+        if ANDROID_AAB_FIXTURE.exists():
+            upload_artifact_to_mock_api("test-aab-parallel", ANDROID_AAB_FIXTURE)
+            dispatch_task("test-aab-parallel", "test-org", "test-android-project")
+            cls.artifacts["aab"] = "test-aab-parallel"
+
+        dispatch_task("test-nonexistent-parallel", "test-org", "test-project")
+        cls.artifacts["nonexistent"] = "test-nonexistent-parallel"
+
+        print(f"[OK] Dispatched {len(cls.artifacts)} tasks for parallel processing")
+
+    def test_android_apk(self):
+        artifact_id = self.artifacts.get("apk")
+        if not artifact_id:
+            pytest.skip("APK fixture not found")
 
-        upload_artifact_to_mock_api(artifact_id, IOS_FIXTURE)
-        dispatch_task(artifact_id, "test-org", "test-ios-project")
         results = wait_for_processing(artifact_id, timeout=600)
 
-        assert results["artifact_metadata"]
         metadata = results["artifact_metadata"]
+        assert metadata["app_name"] == "Hacker News"
+        assert metadata["app_id"] == "com.emergetools.hackernews"
+        assert metadata["artifact_type"] == 2
+
+        assert results["has_size_analysis_file"]
+        size_analysis = get_size_analysis_raw(artifact_id)
+        assert size_analysis["download_size"] == 3670839
 
+    def test_ios_xcarchive(self):
+        artifact_id = self.artifacts.get("ios")
+        if not artifact_id:
+            pytest.skip("iOS fixture not found")
+
+        results = wait_for_processing(artifact_id, timeout=600)
+
+        metadata = results["artifact_metadata"]
         assert metadata["app_name"] == "HackerNews"
         assert metadata["app_id"] == "com.emergetools.hackernews"
-        assert metadata["build_version"] == "3.8"
-        assert metadata["build_number"] == 1
         assert metadata["artifact_type"] == 0
-
-        assert "apple_app_info" in metadata
-        apple_info = metadata["apple_app_info"]
-        assert apple_info["is_simulator"] is False
-        assert apple_info["codesigning_type"] == "development"
-        assert apple_info["is_code_signature_valid"] is True
+        assert metadata["apple_app_info"]["is_simulator"] is False
 
         assert results["has_size_analysis_file"]
-
         size_analysis = get_size_analysis_raw(artifact_id)
         assert size_analysis["download_size"] == 6502319
+        assert size_analysis["treemap"]["root"]["size"] == 9728000
 
-        treemap = size_analysis["treemap"]
-        assert treemap["platform"] == "ios"
-        assert treemap["root"]["name"] == "HackerNews"
-        assert treemap["root"]["size"] == 9728000
-
-    @pytest.mark.slow
-    def test_android_aab_full_flow(self):
-        if not ANDROID_AAB_FIXTURE.exists():
-            pytest.skip(f"Android AAB fixture not found: {ANDROID_AAB_FIXTURE}")
-
-        artifact_id = "test-android-aab-001"
+    def test_android_aab(self):
+        artifact_id = self.artifacts.get("aab")
+        if not artifact_id:
+            pytest.skip("AAB fixture not found")
 
-        upload_artifact_to_mock_api(artifact_id, ANDROID_AAB_FIXTURE)
-        dispatch_task(artifact_id, "test-org", "test-android-project")
         results = wait_for_processing(artifact_id, timeout=600)
 
-        assert results["artifact_metadata"]
         metadata = results["artifact_metadata"]
-
         assert metadata["app_name"] == "Hacker News"
         assert metadata["app_id"] == "com.emergetools.hackernews"
-        assert metadata["build_version"] == "1.0.2"
-        assert metadata["build_number"] == 13
         assert metadata["artifact_type"] == 1
 
         assert results["has_size_analysis_file"]
-
         size_analysis = get_size_analysis_raw(artifact_id)
         assert size_analysis["download_size"] > 0
+        assert size_analysis["treemap"]["root"]["size"] == 5932249
 
-        treemap = size_analysis["treemap"]
-        assert treemap["platform"] == "android"
-        assert treemap["root"]["name"] == "Hacker News"
-        assert treemap["root"]["size"] == 5932249
+    def test_nonexistent_artifact(self):
+        time.sleep(15)
+        response = requests.get(f"{MOCK_API_URL}/test/results/test-nonexistent-parallel", timeout=10)
+        results = response.json()
+        assert not results["has_size_analysis_file"]

From cddea81d436ae3b660f8f30b26801c209254edc5 Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 13:46:58 -0700
Subject: [PATCH 11/15] perf(e2e): Limit Kafka JVM heap to reduce resource
 contention

Kafka's default heap (1GB+) causes CPU contention on CI runners
with limited cores, slowing down the CPU-bound artifact analysis.
Cap at 256MB since e2e only processes a handful of messages.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 docker-compose.e2e.yml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/docker-compose.e2e.yml b/docker-compose.e2e.yml
index 83fd01de..461790df 100644
--- a/docker-compose.e2e.yml
+++ b/docker-compose.e2e.yml
@@ -17,6 +17,7 @@ services:
       KAFKA_TRANSACTION_STATE_LOG_REPLICATION_FACTOR: 1
       KAFKA_TRANSACTION_STATE_LOG_MIN_ISR: 1
       KAFKA_LOG_RETENTION_HOURS: 1
+      KAFKA_HEAP_OPTS: "-Xmx256m -Xms256m"
     healthcheck:
       test: ["CMD", "kafka-topics", "--bootstrap-server", "localhost:9092", "--list"]
       interval: 10s

From 72d016c4992f806ede9f96506f92b1afa2212953 Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 13:56:08 -0700
Subject: [PATCH 12/15] fix(e2e): Run only fast tests on CI, 5 min timeout

The iOS/AAB analysis takes 6+ minutes on CI due to CPU contention
with Kafka JVM. Run only APK + error handling tests (same as local).
iOS/AAB analysis is already covered by integration tests.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 .github/workflows/ci.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index d49bdc46..94871e3b 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -127,8 +127,8 @@ jobs:
           docker compose -f docker-compose.e2e.yml ps
 
       - name: Run E2E tests
-        run: docker compose -f docker-compose.e2e.yml run --rm e2e-tests pytest e2e_tests/test_e2e_flow.py -v --tb=short
-        timeout-minutes: 30
+        run: docker compose -f docker-compose.e2e.yml run --rm e2e-tests
+        timeout-minutes: 5
 
       - name: Show service logs on failure
         if: failure()

From 095bc80f23bbddaffce26cf1cd281b4147c832ef Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 14:03:33 -0700
Subject: [PATCH 13/15] fix(worker): Set processing_deadline_duration to 12
 minutes

The default namespace processing_deadline_duration was 10 seconds,
causing TaskBroker to mark tasks as failed before analysis could
complete. Match the 12-minute deadline set on the sentry dispatch
side. This was the root cause of iOS/AAB e2e test timeouts.

Also re-enable all e2e tests on CI to validate the fix.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 .github/workflows/ci.yml      | 2 +-
 src/launchpad/worker/tasks.py | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 94871e3b..520fe8b6 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -127,7 +127,7 @@ jobs:
           docker compose -f docker-compose.e2e.yml ps
 
       - name: Run E2E tests
-        run: docker compose -f docker-compose.e2e.yml run --rm e2e-tests
+        run: docker compose -f docker-compose.e2e.yml run --rm e2e-tests pytest e2e_tests/test_e2e_flow.py -v --tb=short
         timeout-minutes: 5
 
       - name: Show service logs on failure
diff --git a/src/launchpad/worker/tasks.py b/src/launchpad/worker/tasks.py
index b81004d2..0e58ff26 100644
--- a/src/launchpad/worker/tasks.py
+++ b/src/launchpad/worker/tasks.py
@@ -5,7 +5,7 @@
 
 logger = get_logger(__name__)
 
-default = app.taskregistry.create_namespace("default")
+default = app.taskregistry.create_namespace("default", processing_deadline_duration=60 * 12)
 
 
 @default.register(name="process_artifact")

From 63671d51e508a8befc320e0cb47b79c9cc4c7ce2 Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 14:07:25 -0700
Subject: [PATCH 14/15] ref(e2e): Remove slow markers, run all tests everywhere

Single test class dispatches all tasks in parallel via setup_class,
then verifies each artifact. No optional/slow separation.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 docker-compose.e2e.yml     |   2 +-
 tests/e2e/conftest.py      |   4 -
 tests/e2e/test_e2e_flow.py | 207 ++++++++++++++++++-------------------
 3 files changed, 100 insertions(+), 113 deletions(-)

diff --git a/docker-compose.e2e.yml b/docker-compose.e2e.yml
index 461790df..f702aa9b 100644
--- a/docker-compose.e2e.yml
+++ b/docker-compose.e2e.yml
@@ -143,7 +143,7 @@ services:
         condition: service_healthy
     volumes:
       - ./tests/e2e/results:/app/results
-    command: pytest e2e_tests/test_e2e_flow.py -v --tb=short -m "not slow"
+    command: pytest e2e_tests/test_e2e_flow.py -v --tb=short
     networks:
       - launchpad-e2e
 
diff --git a/tests/e2e/conftest.py b/tests/e2e/conftest.py
index a1c5f113..ca7dfcca 100644
--- a/tests/e2e/conftest.py
+++ b/tests/e2e/conftest.py
@@ -3,10 +3,6 @@
 import pytest
 
 
-def pytest_configure(config):
-    config.addinivalue_line("markers", "slow: marks tests as slow (iOS/AAB analysis takes several minutes)")
-
-
 @pytest.fixture(scope="session", autouse=True)
 def setup_test_environment():
     os.environ.setdefault("LAUNCHPAD_ENV", "e2e-test")
diff --git a/tests/e2e/test_e2e_flow.py b/tests/e2e/test_e2e_flow.py
index 33e80ce7..63f796eb 100644
--- a/tests/e2e/test_e2e_flow.py
+++ b/tests/e2e/test_e2e_flow.py
@@ -1,14 +1,10 @@
 """End-to-end tests for Launchpad service via TaskWorker.
 
 Tests the full flow:
-1. Upload all test artifacts to mock API
-2. Dispatch all tasks via taskbroker-client (process_artifact.delay())
-3. Wait for Launchpad worker to process all artifacts in parallel
+1. Upload test artifact to mock API
+2. Dispatch task via taskbroker-client (process_artifact.delay())
+3. Wait for Launchpad worker to process
 4. Verify results via mock API
-
-All artifact tasks are dispatched upfront and processed concurrently
-by the worker (LAUNCHPAD_WORKER_CONCURRENCY=3), so total time is
-bounded by the slowest artifact rather than the sum of all.
 """
 
 import json
@@ -48,7 +44,7 @@ def upload_artifact_to_mock_api(artifact_id: str, file_path: Path) -> None:
         print(f"[OK] Uploaded artifact {artifact_id} ({file_path.name})")
 
 
-def wait_for_processing(artifact_id: str, timeout: int = 120, check_interval: int = 3) -> Dict[str, Any]:
+def wait_for_processing(artifact_id: str, timeout: int = 180, check_interval: int = 3) -> Dict[str, Any]:
     start_time = time.time()
     last_status = None
 
@@ -81,39 +77,46 @@ def get_size_analysis_raw(artifact_id: str) -> Dict[str, Any]:
     return response.json()
 
 
-def wait_for_mock_api(timeout: int = 60) -> None:
-    start_time = time.time()
-    while time.time() - start_time < timeout:
-        try:
-            response = requests.get(f"{MOCK_API_URL}/health", timeout=5)
-            if response.status_code == 200:
-                print("[OK] Mock Sentry API is healthy")
-                return
-        except requests.exceptions.RequestException:
-            pass
-        time.sleep(2)
-    raise TimeoutError("Mock Sentry API did not become healthy within 60s")
+class TestE2EFlow:
+    @classmethod
+    def setup_class(cls):
+        print("\n=== Waiting for services to be ready ===")
+        start_time = time.time()
+        while time.time() - start_time < 60:
+            try:
+                response = requests.get(f"{MOCK_API_URL}/health", timeout=5)
+                if response.status_code == 200:
+                    print("[OK] Mock Sentry API is healthy")
+                    break
+            except requests.exceptions.RequestException:
+                pass
+            time.sleep(2)
+        else:
+            raise TimeoutError("Mock Sentry API did not become healthy within 60s")
+
+        print("=== Uploading and dispatching all tasks ===")
 
+        if ANDROID_APK_FIXTURE.exists():
+            upload_artifact_to_mock_api("test-android-apk-001", ANDROID_APK_FIXTURE)
+            dispatch_task("test-android-apk-001", "test-org", "test-android-project")
 
-class TestE2EFlow:
-    """Fast e2e tests — APK processing + error handling.
+        if IOS_FIXTURE.exists():
+            upload_artifact_to_mock_api("test-ios-001", IOS_FIXTURE)
+            dispatch_task("test-ios-001", "test-org", "test-ios-project")
 
-    These run locally on any architecture since APK analysis is lightweight.
-    """
+        if ANDROID_AAB_FIXTURE.exists():
+            upload_artifact_to_mock_api("test-android-aab-001", ANDROID_AAB_FIXTURE)
+            dispatch_task("test-android-aab-001", "test-org", "test-android-project")
 
-    @classmethod
-    def setup_class(cls):
-        wait_for_mock_api()
+        dispatch_task("test-nonexistent-artifact", "test-org", "test-project")
+
+        print("=== All tasks dispatched, processing in parallel ===\n")
 
     def test_android_apk_full_flow(self):
         if not ANDROID_APK_FIXTURE.exists():
             pytest.skip(f"Android APK fixture not found: {ANDROID_APK_FIXTURE}")
 
-        artifact_id = "test-android-apk-001"
-
-        upload_artifact_to_mock_api(artifact_id, ANDROID_APK_FIXTURE)
-        dispatch_task(artifact_id, "test-org", "test-android-project")
-        results = wait_for_processing(artifact_id, timeout=120)
+        results = wait_for_processing("test-android-apk-001")
 
         metadata = results["artifact_metadata"]
         assert metadata["app_name"] == "Hacker News"
@@ -123,116 +126,104 @@ def test_android_apk_full_flow(self):
 
         assert results["has_size_analysis_file"]
 
-        size_analysis = get_size_analysis_raw(artifact_id)
+        size_analysis = get_size_analysis_raw("test-android-apk-001")
         assert size_analysis["download_size"] == 3670839
 
         treemap = size_analysis["treemap"]
         assert treemap["platform"] == "android"
         assert treemap["root"]["name"] == "Hacker News"
         assert treemap["root"]["size"] == 7886041
+        assert treemap["root"]["is_dir"] is True
         assert len(treemap["root"]["children"]) == 14
 
         insights = size_analysis["insights"]
         assert insights["duplicate_files"]["total_savings"] == 51709
+        assert len(insights["duplicate_files"]["groups"]) > 0
         assert insights["multiple_native_library_archs"]["total_savings"] == 1891208
 
-    def test_nonexistent_artifact_error_handling(self):
-        dispatch_task("test-nonexistent-artifact", "test-org", "test-project")
-        time.sleep(15)
-
-        response = requests.get(f"{MOCK_API_URL}/test/results/test-nonexistent-artifact", timeout=10)
-        results = response.json()
-        assert not results["has_size_analysis_file"]
-
+    def test_ios_xcarchive_full_flow(self):
+        if not IOS_FIXTURE.exists():
+            pytest.skip(f"iOS fixture not found: {IOS_FIXTURE}")
 
-@pytest.mark.slow
-class TestE2EFlowAllPlatforms:
-    """Full platform e2e tests — dispatches iOS, APK, and AAB in parallel.
+        results = wait_for_processing("test-ios-001")
 
-    Requires LAUNCHPAD_WORKER_CONCURRENCY>=3 to process concurrently.
-    Total time is bounded by the slowest artifact (~6 min for iOS)
-    rather than the sum of all.
-    """
+        metadata = results["artifact_metadata"]
+        assert metadata["app_name"] == "HackerNews"
+        assert metadata["app_id"] == "com.emergetools.hackernews"
+        assert metadata["build_version"] == "3.8"
+        assert metadata["build_number"] == 1
+        assert metadata["artifact_type"] == 0
 
-    @classmethod
-    def setup_class(cls):
-        wait_for_mock_api()
+        assert "apple_app_info" in metadata
+        apple_info = metadata["apple_app_info"]
+        assert apple_info["is_simulator"] is False
+        assert apple_info["codesigning_type"] == "development"
+        assert apple_info["build_date"] == "2025-05-19T16:15:12"
+        assert apple_info["is_code_signature_valid"] is True
+        assert apple_info["main_binary_uuid"] == "BEB3C0D6-2518-343D-BB6F-FF5581C544E8"
 
-        cls.artifacts = {}
+        assert results["has_size_analysis_file"]
 
-        if ANDROID_APK_FIXTURE.exists():
-            upload_artifact_to_mock_api("test-apk-parallel", ANDROID_APK_FIXTURE)
-            dispatch_task("test-apk-parallel", "test-org", "test-android-project")
-            cls.artifacts["apk"] = "test-apk-parallel"
+        size_analysis = get_size_analysis_raw("test-ios-001")
+        assert size_analysis["download_size"] == 6502319
 
-        if IOS_FIXTURE.exists():
-            upload_artifact_to_mock_api("test-ios-parallel", IOS_FIXTURE)
-            dispatch_task("test-ios-parallel", "test-org", "test-ios-project")
-            cls.artifacts["ios"] = "test-ios-parallel"
+        treemap = size_analysis["treemap"]
+        assert treemap["platform"] == "ios"
+        assert treemap["root"]["name"] == "HackerNews"
+        assert treemap["root"]["size"] == 9728000
+        assert treemap["root"]["is_dir"] is True
+        assert len(treemap["root"]["children"]) > 0
 
-        if ANDROID_AAB_FIXTURE.exists():
-            upload_artifact_to_mock_api("test-aab-parallel", ANDROID_AAB_FIXTURE)
-            dispatch_task("test-aab-parallel", "test-org", "test-android-project")
-            cls.artifacts["aab"] = "test-aab-parallel"
+        insights = size_analysis["insights"]
+        assert "duplicate_files" in insights
+        assert insights["duplicate_files"]["total_savings"] > 0
+        assert len(insights["duplicate_files"]["groups"]) > 0
 
-        dispatch_task("test-nonexistent-parallel", "test-org", "test-project")
-        cls.artifacts["nonexistent"] = "test-nonexistent-parallel"
+        assert "image_optimization" in insights
+        assert insights["image_optimization"]["total_savings"] > 0
+        assert len(insights["image_optimization"]["optimizable_files"]) > 0
 
-        print(f"[OK] Dispatched {len(cls.artifacts)} tasks for parallel processing")
+        assert "main_binary_exported_symbols" in insights
+        assert insights["main_binary_exported_symbols"]["total_savings"] > 0
 
-    def test_android_apk(self):
-        artifact_id = self.artifacts.get("apk")
-        if not artifact_id:
-            pytest.skip("APK fixture not found")
+    def test_android_aab_full_flow(self):
+        if not ANDROID_AAB_FIXTURE.exists():
+            pytest.skip(f"Android AAB fixture not found: {ANDROID_AAB_FIXTURE}")
 
-        results = wait_for_processing(artifact_id, timeout=600)
+        results = wait_for_processing("test-android-aab-001")
 
         metadata = results["artifact_metadata"]
         assert metadata["app_name"] == "Hacker News"
         assert metadata["app_id"] == "com.emergetools.hackernews"
-        assert metadata["artifact_type"] == 2
-
-        assert results["has_size_analysis_file"]
-        size_analysis = get_size_analysis_raw(artifact_id)
-        assert size_analysis["download_size"] == 3670839
-
-    def test_ios_xcarchive(self):
-        artifact_id = self.artifacts.get("ios")
-        if not artifact_id:
-            pytest.skip("iOS fixture not found")
-
-        results = wait_for_processing(artifact_id, timeout=600)
+        assert metadata["build_version"] == "1.0.2"
+        assert metadata["build_number"] == 13
+        assert metadata["artifact_type"] == 1
 
-        metadata = results["artifact_metadata"]
-        assert metadata["app_name"] == "HackerNews"
-        assert metadata["app_id"] == "com.emergetools.hackernews"
-        assert metadata["artifact_type"] == 0
-        assert metadata["apple_app_info"]["is_simulator"] is False
+        assert "android_app_info" in metadata
+        assert metadata["android_app_info"]["has_proguard_mapping"] is True
 
         assert results["has_size_analysis_file"]
-        size_analysis = get_size_analysis_raw(artifact_id)
-        assert size_analysis["download_size"] == 6502319
-        assert size_analysis["treemap"]["root"]["size"] == 9728000
 
-    def test_android_aab(self):
-        artifact_id = self.artifacts.get("aab")
-        if not artifact_id:
-            pytest.skip("AAB fixture not found")
-
-        results = wait_for_processing(artifact_id, timeout=600)
+        size_analysis = get_size_analysis_raw("test-android-aab-001")
+        assert size_analysis["download_size"] > 0
 
-        metadata = results["artifact_metadata"]
-        assert metadata["app_name"] == "Hacker News"
-        assert metadata["app_id"] == "com.emergetools.hackernews"
-        assert metadata["artifact_type"] == 1
+        treemap = size_analysis["treemap"]
+        assert treemap["platform"] == "android"
+        assert treemap["root"]["name"] == "Hacker News"
+        assert treemap["root"]["size"] == 5932249
+        assert treemap["root"]["is_dir"] is True
+        assert len(treemap["root"]["children"]) == 14
 
-        assert results["has_size_analysis_file"]
-        size_analysis = get_size_analysis_raw(artifact_id)
-        assert size_analysis["download_size"] > 0
-        assert size_analysis["treemap"]["root"]["size"] == 5932249
+        insights = size_analysis["insights"]
+        assert "duplicate_files" in insights
+        assert insights["duplicate_files"]["total_savings"] >= 0
+        assert "groups" in insights["duplicate_files"]
 
-    def test_nonexistent_artifact(self):
+    def test_nonexistent_artifact_error_handling(self):
         time.sleep(15)
-        response = requests.get(f"{MOCK_API_URL}/test/results/test-nonexistent-parallel", timeout=10)
+
+        response = requests.get(f"{MOCK_API_URL}/test/results/test-nonexistent-artifact", timeout=10)
+        response.raise_for_status()
         results = response.json()
+
         assert not results["has_size_analysis_file"]

From 566d29d4101a7629fe1ad36708687d1e980ac9fe Mon Sep 17 00:00:00 2001
From: Nico Hinderling <NicoHinderling@users.noreply.github.com>
Date: Thu, 9 Apr 2026 14:12:42 -0700
Subject: [PATCH 15/15] ref: Address review feedback

- Remove stale env vars from .envrc (KAFKA_GROUP_ID, KAFKA_TOPICS,
  LAUNCHPAD_HOST, LAUNCHPAD_PORT, LAUNCHPAD_CREATE_KAFKA_TOPIC)
- Remove stale EXPOSE 2218 from Dockerfile (HTTP server is gone)
- Add failure exits to CI e2e health-check loops

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 .envrc                   |  5 -----
 .github/workflows/ci.yml | 15 +++++++++++++++
 Dockerfile               |  3 ---
 3 files changed, 15 insertions(+), 8 deletions(-)

diff --git a/.envrc b/.envrc
index 7b658b74..ca9e2007 100644
--- a/.envrc
+++ b/.envrc
@@ -2,12 +2,7 @@
 
 # Local development environment variables
 export KAFKA_BOOTSTRAP_SERVERS="localhost:9092"
-export KAFKA_GROUP_ID="launchpad-devservices"
-export KAFKA_TOPICS="preprod-artifact-events"
-export LAUNCHPAD_CREATE_KAFKA_TOPIC="1"
 export LAUNCHPAD_ENV="development"
-export LAUNCHPAD_HOST="0.0.0.0"
-export LAUNCHPAD_PORT="2218"
 export LAUNCHPAD_RPC_SHARED_SECRET="launchpad-also-very-long-value-haha"
 export SENTRY_BASE_URL="http://localhost:8000"
 
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 520fe8b6..c924687f 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -101,6 +101,11 @@ jobs:
             echo "Waiting for Kafka... attempt $i/30"
             sleep 3
           done
+          if ! docker compose -f docker-compose.e2e.yml ps kafka | grep -q "healthy"; then
+            echo "ERROR: Kafka failed to become healthy"
+            docker compose -f docker-compose.e2e.yml logs kafka
+            exit 1
+          fi
 
           docker compose -f docker-compose.e2e.yml up -d taskbroker minio mock-sentry-api
           echo "Waiting for mock-sentry-api to be healthy..."
@@ -112,6 +117,11 @@ jobs:
             echo "Waiting for Mock API... attempt $i/20"
             sleep 3
           done
+          if ! docker compose -f docker-compose.e2e.yml ps mock-sentry-api | grep -q "healthy"; then
+            echo "ERROR: Mock Sentry API failed to become healthy"
+            docker compose -f docker-compose.e2e.yml logs mock-sentry-api
+            exit 1
+          fi
 
           docker compose -f docker-compose.e2e.yml up -d launchpad
           echo "Waiting for Launchpad worker to be healthy..."
@@ -123,6 +133,11 @@ jobs:
             echo "Waiting for Launchpad... attempt $i/30"
             sleep 5
           done
+          if ! docker compose -f docker-compose.e2e.yml ps launchpad | grep -q "healthy"; then
+            echo "ERROR: Launchpad worker failed to become healthy"
+            docker compose -f docker-compose.e2e.yml logs launchpad
+            exit 1
+          fi
 
           docker compose -f docker-compose.e2e.yml ps
 
diff --git a/Dockerfile b/Dockerfile
index d5b34273..6f602142 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -106,9 +106,6 @@ RUN chown -R app:app /app
 # Switch to app user
 USER app
 
-# Expose ports
-EXPOSE 2218
-
 ARG LAUNCHPAD_VERSION_SHA
 ENV LAUNCHPAD_VERSION_SHA=$LAUNCHPAD_VERSION_SHA