From 60d48162da9e6736ceedd7e038f08fe72c021f18 Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Fri, 24 Apr 2026 16:25:56 +0530
Subject: [PATCH 01/27] api deployment notification init

---
 backend/api_v2/notification.py                |  31 +-
 backend/notification_v2/enums.py              |  12 +
 .../migrations/0002_notification_notify_on.py |  30 ++
 backend/notification_v2/models.py             |  13 +-
 backend/notification_v2/serializers.py        |   7 +-
 backend/notification_v2/tests/__init__.py     |   0
 .../tests/test_notification_filter.py         | 321 ++++++++++++++++++
 backend/pipeline_v2/notification.py           |  31 +-
 .../notification-modal/CreateNotification.jsx |  13 +
 9 files changed, 448 insertions(+), 10 deletions(-)
 create mode 100644 backend/notification_v2/migrations/0002_notification_notify_on.py
 create mode 100644 backend/notification_v2/tests/__init__.py
 create mode 100644 backend/notification_v2/tests/test_notification_filter.py

diff --git a/backend/api_v2/notification.py b/backend/api_v2/notification.py
index 733084c637..a41ebc3000 100644
--- a/backend/api_v2/notification.py
+++ b/backend/api_v2/notification.py
@@ -1,8 +1,10 @@
 import logging
 
+from notification_v2.enums import NotificationTrigger
 from notification_v2.helper import NotificationHelper
 from notification_v2.models import Notification
 from pipeline_v2.dto import PipelineStatusPayload
+from workflow_manager.workflow_v2.enums import ExecutionStatus
 from workflow_manager.workflow_v2.models.execution import WorkflowExecution
 
 from api_v2.models import APIDeployment
@@ -16,11 +18,32 @@ def __init__(self, api: APIDeployment, workflow_execution: WorkflowExecution) ->
         self.api = api
         self.workflow_execution = workflow_execution
 
-    def send(self):
-        if not self.notifications.count():
-            logger.info(f"No notifications found for api {self.api}")
+    def send(self) -> None:
+        # Partition notifications by the run outcome so each row's notify_on
+        # preference is honored. STOPPED, and any status other than ERROR or
+        # COMPLETED, fires only for ALL; FAILURES_ONLY/SUCCESS_ONLY rows skip it.
+        status = self.workflow_execution.status
+        if status == ExecutionStatus.ERROR.value:
+            self.notifications = self.notifications.exclude(
+                notify_on=NotificationTrigger.SUCCESS_ONLY.value
+            )
+        elif status == ExecutionStatus.COMPLETED.value:
+            self.notifications = self.notifications.exclude(
+                notify_on=NotificationTrigger.FAILURES_ONLY.value
+            )
+        else:
+            self.notifications = self.notifications.filter(
+                notify_on=NotificationTrigger.ALL.value
+            )
+
+        if not self.notifications.exists():
+            logger.info(
+                "No notifications to dispatch for api %s (status=%s)",
+                self.api,
+                status,
+            )
             return
-        logger.info(f"Sending api status notification for api {self.api}")
+        logger.info("Sending api status notification for api %s", self.api)
 
         payload_dto = PipelineStatusPayload(
             type="API",
diff --git a/backend/notification_v2/enums.py b/backend/notification_v2/enums.py
index 991b08cac9..516b34074b 100644
--- a/backend/notification_v2/enums.py
+++ b/backend/notification_v2/enums.py
@@ -36,3 +36,15 @@ class PlatformType(Enum):
     @classmethod
     def choices(cls):
         return [(e.value, e.name.replace("_", " ").capitalize()) for e in cls]
+
+
+class NotificationTrigger(Enum):
+    """Controls which run outcomes fire a notification."""
+
+    ALL = "ALL"
+    FAILURES_ONLY = "FAILURES_ONLY"
+    SUCCESS_ONLY = "SUCCESS_ONLY"
+
+    @classmethod
+    def choices(cls):
+        return [(e.value, e.name.replace("_", " ").capitalize()) for e in cls]
diff --git a/backend/notification_v2/migrations/0002_notification_notify_on.py b/backend/notification_v2/migrations/0002_notification_notify_on.py
new file mode 100644
index 0000000000..53c1180126
--- /dev/null
+++ b/backend/notification_v2/migrations/0002_notification_notify_on.py
@@ -0,0 +1,30 @@
+from django.db import migrations, models
+
+
+class Migration(migrations.Migration):
+    dependencies = [
+        ("notification_v2", "0001_initial"),
+    ]
+
+    operations = [
+        migrations.AddField(
+            model_name="notification",
+            name="notify_on",
+            field=models.CharField(
+                max_length=50,
+                choices=[
+                    ("ALL", "All"),
+                    ("FAILURES_ONLY", "Failures only"),
+                    ("SUCCESS_ONLY", "Success only"),
+                ],
+                default="ALL",
+                db_comment=(
+                    "Controls which run outcomes trigger this notification. ALL "
+                    "(default) preserves the historical 'notify on every "
+                    "completion' behavior; FAILURES_ONLY fires only on failed "
+                    "runs (ERROR for API deployments, FAILURE for ETL "
+                    "pipelines); SUCCESS_ONLY fires only on successful runs."
+                ),
+            ),
+        ),
+    ]
diff --git a/backend/notification_v2/models.py b/backend/notification_v2/models.py
index 489a8c827e..4fe21cd6c4 100644
--- a/backend/notification_v2/models.py
+++ b/backend/notification_v2/models.py
@@ -5,7 +5,7 @@
 from pipeline_v2.models import Pipeline
 from utils.models.base_model import BaseModel
 
-from .enums import AuthorizationType, NotificationType, PlatformType
+from .enums import AuthorizationType, NotificationTrigger, NotificationType, PlatformType
 
 NOTIFICATION_NAME_MAX_LENGTH = 255
 
@@ -47,6 +47,17 @@ class Notification(BaseModel):
         default=True,
         db_comment="Flag indicating whether the notification is active or not.",
     )
+    notify_on = models.CharField(
+        max_length=50,
+        choices=NotificationTrigger.choices(),
+        default=NotificationTrigger.ALL.value,
+        db_comment=(
+            "Controls which run outcomes trigger this notification. ALL (default) "
+            "preserves the historical 'notify on every completion' behavior; "
+            "FAILURES_ONLY fires only on failed runs (ERROR for API deployments, "
+            "FAILURE for ETL pipelines); SUCCESS_ONLY fires only on successful runs."
+        ),
+    )
     # Foreign keys to specific models
     pipeline = models.ForeignKey(
         Pipeline,
diff --git a/backend/notification_v2/serializers.py b/backend/notification_v2/serializers.py
index 115487c481..784ec75413 100644
--- a/backend/notification_v2/serializers.py
+++ b/backend/notification_v2/serializers.py
@@ -1,7 +1,7 @@
 from rest_framework import serializers
 from utils.input_sanitizer import validate_name_field
 
-from .enums import AuthorizationType, NotificationType, PlatformType
+from .enums import AuthorizationType, NotificationTrigger, NotificationType, PlatformType
 from .models import Notification
 
 
@@ -12,6 +12,11 @@ class NotificationSerializer(serializers.ModelSerializer):
     max_retries = serializers.IntegerField(
         max_value=4, min_value=0, default=0, required=False
     )
+    notify_on = serializers.ChoiceField(
+        choices=NotificationTrigger.choices(),
+        default=NotificationTrigger.ALL.value,
+        required=False,
+    )
 
     class Meta:
         model = Notification
diff --git a/backend/notification_v2/tests/__init__.py b/backend/notification_v2/tests/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/backend/notification_v2/tests/test_notification_filter.py b/backend/notification_v2/tests/test_notification_filter.py
new file mode 100644
index 0000000000..7f887be500
--- /dev/null
+++ b/backend/notification_v2/tests/test_notification_filter.py
@@ -0,0 +1,321 @@
+"""Unit tests for the ``notify_on`` dispatch partition on notifications.
+
+Covers both dispatch paths that fan out to ``NotificationHelper.send_notification``:
+
+* ``APINotification.send`` — keyed on ``ExecutionStatus`` (ERROR, COMPLETED, STOPPED)
+* ``PipelineNotification.send`` — keyed on ``Pipeline.PipelineStatus``
+  (FAILURE, SUCCESS, INPROGRESS)
+
+Follows the repo convention (see ``usage_v2/tests/test_helper.py``) of stubbing
+Django-heavy modules at import time so the tests run without a live DB.
+"""
+
+from __future__ import annotations
+
+import sys
+import types
+from unittest.mock import MagicMock, patch
+
+
+# ---------------------------------------------------------------------------
+# Module-level stubs — must be installed BEFORE importing the modules under
+# test so Django's ORM imports resolve to our MagicMock-backed fakes.
+# ---------------------------------------------------------------------------
+
+
+def _ensure_mod(name: str) -> types.ModuleType:
+    """Force-install a fresh stub module in ``sys.modules``."""
+    mod = types.ModuleType(name)
+    sys.modules[name] = mod
+    return mod
+
+
+def _install_stubs() -> None:
+    # Only stub leaf modules that pull in Django ORM. Parent packages
+    # (api_v2, pipeline_v2, notification_v2, workflow_manager*) load normally.
+
+    exec_enums = _ensure_mod("workflow_manager.workflow_v2.enums")
+
+    class _ExecStatusNS:
+        class ERROR:
+            value = "ERROR"
+
+        class COMPLETED:
+            value = "COMPLETED"
+
+        class STOPPED:
+            value = "STOPPED"
+
+    exec_enums.ExecutionStatus = _ExecStatusNS  # type: ignore[attr-defined]
+
+    exec_models = _ensure_mod("workflow_manager.workflow_v2.models.execution")
+    exec_models.WorkflowExecution = MagicMock(name="WorkflowExecution")  # type: ignore[attr-defined]
+
+    api_models = _ensure_mod("api_v2.models")
+    api_models.APIDeployment = MagicMock(name="APIDeployment")  # type: ignore[attr-defined]
+
+    # notification_v2.models.Notification with a patchable ``objects``.
+    notif_models = _ensure_mod("notification_v2.models")
+
+    class _FakeNotification:
+        objects = MagicMock(name="Notification.objects")
+
+    notif_models.Notification = _FakeNotification  # type: ignore[attr-defined]
+
+    # notification_v2.helper.NotificationHelper
+    notif_helper = _ensure_mod("notification_v2.helper")
+
+    class _FakeHelper:
+        send_notification = MagicMock(name="NotificationHelper.send_notification")
+
+    notif_helper.NotificationHelper = _FakeHelper  # type: ignore[attr-defined]
+
+    # pipeline_v2.dto.PipelineStatusPayload
+    pipeline_dto = _ensure_mod("pipeline_v2.dto")
+    pipeline_dto.PipelineStatusPayload = MagicMock(name="PipelineStatusPayload")  # type: ignore[attr-defined]
+
+    # pipeline_v2.models.Pipeline with a PipelineStatus text-choices surface.
+    pipeline_models = _ensure_mod("pipeline_v2.models")
+
+    class _PipelineStatus:
+        SUCCESS = "SUCCESS"
+        FAILURE = "FAILURE"
+        INPROGRESS = "INPROGRESS"
+
+    class _FakePipeline:
+        PipelineStatus = _PipelineStatus
+
+    pipeline_models.Pipeline = _FakePipeline  # type: ignore[attr-defined]
+
+
+_install_stubs()
+
+
+# Now safe to import the modules under test.
+from api_v2 import notification as api_notification_mod  # noqa: E402
+from notification_v2.enums import NotificationTrigger  # noqa: E402
+from notification_v2.helper import NotificationHelper  # noqa: E402
+from notification_v2.models import Notification  # noqa: E402
+from pipeline_v2 import notification as pipeline_notification_mod  # noqa: E402
+from pipeline_v2.models import Pipeline  # noqa: E402
+
+
+# ---------------------------------------------------------------------------
+# Test helpers
+# ---------------------------------------------------------------------------
+
+
+def _make_queryset(notifications: list[MagicMock]) -> MagicMock:
+    """Return a MagicMock that mimics the chained QuerySet surface we use.
+
+    Supports:
+        qs.filter(notify_on=<value>)   -> qs with matching rows
+        qs.exclude(notify_on=<value>)  -> qs with non-matching rows
+        qs.exists()                    -> bool based on contents
+        iter(qs)                       -> notifications
+    """
+    qs = MagicMock(name="qs")
+    qs.__iter__ = lambda self: iter(notifications)
+
+    def _filter(**kwargs):
+        if "notify_on" in kwargs:
+            target = kwargs["notify_on"]
+            kept = [n for n in notifications if n.notify_on == target]
+            return _make_queryset(kept)
+        return _make_queryset(notifications)
+
+    def _exclude(**kwargs):
+        if "notify_on" in kwargs:
+            target = kwargs["notify_on"]
+            kept = [n for n in notifications if n.notify_on != target]
+            return _make_queryset(kept)
+        return _make_queryset(notifications)
+
+    qs.filter.side_effect = _filter
+    qs.exclude.side_effect = _exclude
+    qs.exists.return_value = bool(notifications)
+    qs.count.return_value = len(notifications)
+    return qs
+
+
+def _make_notification(*, notify_on: str) -> MagicMock:
+    n = MagicMock(name="Notification")
+    n.notify_on = notify_on
+    return n
+
+
+# ---------------------------------------------------------------------------
+# APINotification — 3 modes × 3 statuses
+# ---------------------------------------------------------------------------
+
+
+class TestAPINotificationFilter:
+    def _setup(self, *, status: str, notifications: list[MagicMock]):
+        Notification.objects.filter.reset_mock()
+        Notification.objects.filter.side_effect = None
+        Notification.objects.filter.return_value = _make_queryset(notifications)
+        NotificationHelper.send_notification.reset_mock()
+
+        api = MagicMock(name="APIDeployment")
+        api.api_name = "test-api"
+        api.id = "api-uuid"
+
+        execution = MagicMock(name="WorkflowExecution")
+        execution.status = status
+        execution.id = "exec-uuid"
+        execution.error_message = "boom" if status == "ERROR" else None
+
+        return api_notification_mod.APINotification(api=api, workflow_execution=execution)
+
+    # --- ALL: fires on every status ---
+    def test_all_fires_on_completed(self):
+        n = _make_notification(notify_on=NotificationTrigger.ALL.value)
+        self._setup(status="COMPLETED", notifications=[n]).send()
+        assert NotificationHelper.send_notification.call_count == 1
+
+    def test_all_fires_on_error(self):
+        n = _make_notification(notify_on=NotificationTrigger.ALL.value)
+        self._setup(status="ERROR", notifications=[n]).send()
+        assert NotificationHelper.send_notification.call_count == 1
+
+    def test_all_fires_on_stopped(self):
+        n = _make_notification(notify_on=NotificationTrigger.ALL.value)
+        self._setup(status="STOPPED", notifications=[n]).send()
+        assert NotificationHelper.send_notification.call_count == 1
+
+    # --- FAILURES_ONLY: fires on ERROR only ---
+    def test_failures_only_suppressed_on_completed(self):
+        n = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
+        self._setup(status="COMPLETED", notifications=[n]).send()
+        NotificationHelper.send_notification.assert_not_called()
+
+    def test_failures_only_fires_on_error(self):
+        n = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
+        self._setup(status="ERROR", notifications=[n]).send()
+        assert NotificationHelper.send_notification.call_count == 1
+
+    def test_failures_only_suppressed_on_stopped(self):
+        n = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
+        self._setup(status="STOPPED", notifications=[n]).send()
+        NotificationHelper.send_notification.assert_not_called()
+
+    # --- SUCCESS_ONLY: fires on COMPLETED only ---
+    def test_success_only_fires_on_completed(self):
+        n = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
+        self._setup(status="COMPLETED", notifications=[n]).send()
+        assert NotificationHelper.send_notification.call_count == 1
+
+    def test_success_only_suppressed_on_error(self):
+        n = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
+        self._setup(status="ERROR", notifications=[n]).send()
+        NotificationHelper.send_notification.assert_not_called()
+
+    def test_success_only_suppressed_on_stopped(self):
+        n = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
+        self._setup(status="STOPPED", notifications=[n]).send()
+        NotificationHelper.send_notification.assert_not_called()
+
+    # --- Mixed partition on a COMPLETED run: ALL + SUCCESS_ONLY fire, FAILURES_ONLY doesn't ---
+    def test_mixed_partition_on_completed(self):
+        all_mode = _make_notification(notify_on=NotificationTrigger.ALL.value)
+        failures_only = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
+        success_only = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
+        notifier = self._setup(
+            status="COMPLETED", notifications=[all_mode, failures_only, success_only]
+        )
+        with patch.object(api_notification_mod, "PipelineStatusPayload") as payload_cls:
+            payload_cls.return_value.to_dict.return_value = {}
+            notifier.send()
+
+        assert NotificationHelper.send_notification.call_count == 1
+        kwargs = NotificationHelper.send_notification.call_args.kwargs
+        dispatched = sorted(n.notify_on for n in kwargs["notifications"])
+        assert dispatched == ["ALL", "SUCCESS_ONLY"]
+
+
+# ---------------------------------------------------------------------------
+# PipelineNotification — 3 modes × 2 statuses (SUCCESS, FAILURE)
+# ---------------------------------------------------------------------------
+
+
+class TestPipelineNotificationFilter:
+    def _setup(self, *, last_run_status: str, notifications: list[MagicMock]):
+        Notification.objects.filter.reset_mock()
+        Notification.objects.filter.side_effect = None
+        Notification.objects.filter.return_value = _make_queryset(notifications)
+        NotificationHelper.send_notification.reset_mock()
+
+        pipeline = MagicMock(name="Pipeline")
+        pipeline.id = "pipeline-uuid"
+        pipeline.pipeline_name = "test-pipeline"
+        pipeline.pipeline_type = "ETL"
+        pipeline.last_run_status = last_run_status
+
+        return pipeline_notification_mod.PipelineNotification(
+            pipeline=pipeline, execution_id="exec-uuid", error_message=None
+        )
+
+    # --- ALL ---
+    def test_all_fires_on_success(self):
+        n = _make_notification(notify_on=NotificationTrigger.ALL.value)
+        self._setup(
+            last_run_status=Pipeline.PipelineStatus.SUCCESS, notifications=[n]
+        ).send()
+        assert NotificationHelper.send_notification.call_count == 1
+
+    def test_all_fires_on_failure(self):
+        n = _make_notification(notify_on=NotificationTrigger.ALL.value)
+        self._setup(
+            last_run_status=Pipeline.PipelineStatus.FAILURE, notifications=[n]
+        ).send()
+        assert NotificationHelper.send_notification.call_count == 1
+
+    # --- FAILURES_ONLY ---
+    def test_failures_only_suppressed_on_success(self):
+        n = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
+        self._setup(
+            last_run_status=Pipeline.PipelineStatus.SUCCESS, notifications=[n]
+        ).send()
+        NotificationHelper.send_notification.assert_not_called()
+
+    def test_failures_only_fires_on_failure(self):
+        n = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
+        self._setup(
+            last_run_status=Pipeline.PipelineStatus.FAILURE, notifications=[n]
+        ).send()
+        assert NotificationHelper.send_notification.call_count == 1
+
+    # --- SUCCESS_ONLY ---
+    def test_success_only_fires_on_success(self):
+        n = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
+        self._setup(
+            last_run_status=Pipeline.PipelineStatus.SUCCESS, notifications=[n]
+        ).send()
+        assert NotificationHelper.send_notification.call_count == 1
+
+    def test_success_only_suppressed_on_failure(self):
+        n = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
+        self._setup(
+            last_run_status=Pipeline.PipelineStatus.FAILURE, notifications=[n]
+        ).send()
+        NotificationHelper.send_notification.assert_not_called()
+
+    # --- Mixed partition on a SUCCESS run ---
+    def test_mixed_partition_on_success(self):
+        all_mode = _make_notification(notify_on=NotificationTrigger.ALL.value)
+        failures_only = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
+        success_only = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
+        notifier = self._setup(
+            last_run_status=Pipeline.PipelineStatus.SUCCESS,
+            notifications=[all_mode, failures_only, success_only],
+        )
+        with patch.object(
+            pipeline_notification_mod, "PipelineStatusPayload"
+        ) as payload_cls:
+            payload_cls.return_value.to_dict.return_value = {}
+            notifier.send()
+
+        assert NotificationHelper.send_notification.call_count == 1
+        kwargs = NotificationHelper.send_notification.call_args.kwargs
+        dispatched = sorted(n.notify_on for n in kwargs["notifications"])
+        assert dispatched == ["ALL", "SUCCESS_ONLY"]
diff --git a/backend/pipeline_v2/notification.py b/backend/pipeline_v2/notification.py
index dbfc0dea52..64df6f1126 100644
--- a/backend/pipeline_v2/notification.py
+++ b/backend/pipeline_v2/notification.py
@@ -1,5 +1,6 @@
 import logging
 
+from notification_v2.enums import NotificationTrigger
 from notification_v2.helper import NotificationHelper
 from notification_v2.models import Notification
 
@@ -23,11 +24,33 @@ def __init__(
         self.error_message = error_message
         self.execution_id = execution_id
 
-    def send(self):
-        if not self.notifications.count():
-            logger.info(f"No notifications found for pipeline {self.pipeline}")
+    def send(self) -> None:
+        # Partition notifications by the run outcome so each row's notify_on
+        # preference is honored. PipelineUtils.update_pipeline_status collapses
+        # both ERROR and STOPPED execution statuses into PipelineStatus.FAILURE,
+        # so FAILURES_ONLY subscribers get alerts for both on the pipeline side.
+        status = self.pipeline.last_run_status
+        if status == Pipeline.PipelineStatus.FAILURE:
+            self.notifications = self.notifications.exclude(
+                notify_on=NotificationTrigger.SUCCESS_ONLY.value
+            )
+        elif status == Pipeline.PipelineStatus.SUCCESS:
+            self.notifications = self.notifications.exclude(
+                notify_on=NotificationTrigger.FAILURES_ONLY.value
+            )
+        else:
+            self.notifications = self.notifications.filter(
+                notify_on=NotificationTrigger.ALL.value
+            )
+
+        if not self.notifications.exists():
+            logger.info(
+                "No notifications to dispatch for pipeline %s (status=%s)",
+                self.pipeline,
+                status,
+            )
             return
-        logger.info(f"Sending pipeline status notification for pipeline {self.pipeline}")
+        logger.info("Sending pipeline status notification for pipeline %s", self.pipeline)
         payload_dto = PipelineStatusPayload(
             type=self.pipeline.pipeline_type,
             pipeline_id=str(self.pipeline.id),
diff --git a/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx b/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
index 9c207bd1a9..9302f9f1dc 100644
--- a/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
+++ b/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
@@ -12,6 +12,7 @@ const DEFAULT_FORM_DETAILS = {
   authorization_key: "",
   is_active: false,
   max_retries: 0,
+  notify_on: "ALL",
   pipeline: "",
   api: "",
   url: "",
@@ -54,6 +55,12 @@ const AUTHORIZATION_TYPES = [
   },
 ];
 
+const NOTIFY_ON_OPTIONS = [
+  { value: "ALL", label: "On every completion" },
+  { value: "FAILURES_ONLY", label: "On failures only" },
+  { value: "SUCCESS_ONLY", label: "On success only" },
+];
+
 function CreateNotification({
   setIsForm,
   type,
@@ -192,6 +199,12 @@ function CreateNotification({
       tooltip:
         "Specify the maximum number of times the notification should be retried if it fails.",
     },
+    {
+      label: "Notify on",
+      name: "notify_on",
+      component: <Select options={NOTIFY_ON_OPTIONS} />,
+      tooltip: "Choose which run outcomes should trigger this webhook.",
+    },
   ];
 
   return (

From 207277e008c25f8ed3ea86c320c087086579e3a4 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M
 <117059509+chandrasekharan-zipstack@users.noreply.github.com>
Date: Fri, 24 Apr 2026 13:18:02 +0530
Subject: [PATCH 02/27] UN-3431 [FIX] Stream tool-run logs to workflow
 execution UI with markdown rendering (#1927)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* [FIX] Make tool-run logs visible in workflow execution UI

Two stacked gaps were keeping tool-level log lines (Processing prompt,
Running LLM completion, lookup calls, etc.) out of the workflow
execution logs UI and the execution_log DB table for API / workflow
runs:

1. Empty log_events_id.  structure_tool_task seeded LOG_EVENTS_ID in
   StateStore but never threaded it into pipeline_ctx / agentic_ctx.
   ExecutorToolShim.stream_log gated publishing on
   self.log_events_id, so every tool-level log was dropped before it
   ever reached the broker.

2. Wrong payload shape.  Even with the channel threaded,
   stream_log used LogPublisher.log_progress(...) whose payload omits
   execution_id / organization_id / file_execution_id.
   get_validated_log_data (log_utils.py) requires those IDs and
   LogType == LOG to persist to execution_log, so tool-level messages
   were silently filtered at the Redis->DB drain step — orchestration
   logs persisted, tool logs did not.

Fixes:
- ExecutionContext gains execution_id + file_execution_id, populated
  in structure_tool_task for both the legacy pipeline and agentic
  contexts.
- LegacyExecutor caches the three IDs on self during execute() and
  passes them into every ExecutorToolShim construction
  (~7 callsites).
- ExecutorToolShim.stream_log now dual-emits: PROGRESS (unchanged,
  drives the IDE prompt-card live progress pane) plus LOG carrying
  the workflow IDs (feeds the workflow execution logs UI and persists
  to execution_log via the existing drain). LOG emission is gated on
  execution_id + organization_id being present, so bare IDE test
  runs without a workflow still behave as before.

Rendering polish
- The LogModal and pipeline LogsModal now pipe log text through the
  existing CustomMarkdown renderer, so backticked identifiers render
  as inline-code pills and embedded newlines break lines. This lets
  multi-line structured events (e.g. the lookup pre-call trio)
  surface as a single row with readable inner formatting.
- Prompt-key mentions inside legacy_executor tool logs are wrapped
  in backticks for consistency with the rest of the log surface.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [FIX] Wrap prompt_name in backticks in remaining stream_log calls

Completes the consistency pass on tool-run log formatting: the table-
and line-item-extraction success and error paths still emitted prompt
names without backticks, so the markdown-rendered logs UI showed them
as bare text instead of inline-code pills. Matches the pattern already
applied to the other 9 stream_log calls in this file.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [FIX] Validate URL schemes in CustomMarkdown link renderer

Workflow logs rendered via CustomMarkdown can contain tool-generated or
user-derived content, so an untrusted `[text](url)` sequence could
inject a `javascript:` or `data:` scheme and become clickable through
antd `Typography.Link`. Allow-list the safe external schemes (http,
https, mailto, tel) before rendering as a link; everything else falls
back to plain text while still honouring the existing internal-path
branch used for in-app navigation.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [FIX] Thread workflow IDs into remaining shim/context callsites

Addresses CodeRabbit review gaps so the log-plumbing fix is consistent
across every pre-dispatch and plugin-dispatch path:

- `table_ctx` / `line_item_ctx` in `legacy_executor.py` now carry
  `log_events_id`, `execution_id`, `file_execution_id` from context so
  downstream table/line-item plugins that build their own
  `ExecutorToolShim` pass the `execution_id + organization_id` gate
  and emit workflow LOG payloads.
- `structure_tool_task.py` threads the same IDs into the bare
  pre-dispatch shim, so `X2Text.process()` calls during agentic
  extraction reach the workflow logs UI.
- `LogsModal.jsx` stores the raw log string in row data and lets the
  column renderer wrap it in `CustomMarkdown` — the previous map
  stored a `<CustomMarkdown />` element that was then passed back into
  `CustomMarkdown.text`, producing `[object Object]` for multi-row
  lookups.
- Dropped `getattr(context, ...)` on `execution_id` /
  `file_execution_id` now that they are dataclass fields — matches the
  direct access used for `organization_id`.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [REFACTOR] Trim overly specific comments in log-plumbing changes

Pass through the new comments added across this PR and either remove or
tighten the ones that restate what the code already shows. Keep only
the WHY lines that protect future readers from missing a non-obvious
constraint (XSS guard in CustomMarkdown, dual PROGRESS/LOG emission in
the shim, pre-dispatch shim needing workflow IDs so X2Text logs are
not silently dropped).

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [REFACTOR] Extract isSafeExternalUrl into shared helpers module

Moves the URL scheme allow-list check out of CustomMarkdown into
helpers/urlSafety.js so any future component that renders links from
user- or tool-derived content can reuse the same guard instead of
re-implementing it.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [FIX] Tighten URL guard, split publish try/excepts, and extract shim builder

Addresses the must-fix and worth-doing comments from the PR review:

Security
- CustomMarkdown: treat protocol-relative URLs (`//host/...`) as external,
  not internal, so they can no longer skip the scheme guard via the
  `startsWith("/")` branch.
- `isSafeExternalUrl`: drop the `window.location.origin` base so bare
  strings ("javascript", "../foo") fail to parse instead of silently
  resolving to `https://<origin>/...` and passing the scheme check.

Silent failure + comment accuracy
- ExecutorToolShim.stream_log: split the PROGRESS and LOG publish paths
  into separate try/except blocks so a LogDataDTO validation failure on
  the LOG payload is no longer mis-attributed to "progress publish
  failed". Corrected the inline comments — the DB drop is driven by
  LogPublisher's `payload.type == 'LOG'` check, and only
  `execution_id` + `organization_id` are strictly required.

Refactor
- New `LegacyExecutor._build_shim()` helper — all seven
  ExecutorToolShim callsites now share one construction path so the
  workflow-ID plumbing can't drift out of sync across sites again.
- Thread `execution_id` / `file_execution_id` into the seven
  self-dispatched sub-`ExecutionContext`s alongside `log_events_id`,
  matching the table/line-item sites and keeping the context
  consistent for any downstream consumer that reads the IDs from the
  context rather than from the executor instance.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [FIX] Address remaining type-design and silent-failure comments

- ExecutionContext: drop the BE-coupled inline comment, document the
  new IDs in the Attributes block, and enforce the invariant that
  execution_id implies organization_id via __post_init__.
- ExecutorToolShim: typed the three new IDs as str | None instead of
  str = "" so the signature matches the Optional semantics already
  enforced by the runtime guards.
- LegacyExecutor: move per-request state to __init__ so _log_component
  is no longer a class-level mutable default shared across instances;
  stop silently coercing None IDs to ""; add a one-shot warning when a
  tool-sourced run lands without workflow IDs so the silent-no-persist
  case is visible in GKE logs.
- structure_tool_task: emit the same warning when LOG_EVENTS_ID is
  absent from StateStore.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [FIX] Surface first publish failure per shim at WARN

Both PROGRESS and LOG publish paths previously swallowed every broker
failure at DEBUG, so a misconfigured or down Redis broker meant every
tool-level log silently vanished with no operator-visible signal.

Track a per-shim _progress_publish_failed / _log_publish_failed flag
and log the first failure at WARNING (with traceback), then downgrade
subsequent failures on the same shim back to DEBUG. Preserves the
non-fatal semantics of the publish path while making broker outages
visible in GKE logs.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .../custom-markdown/CustomMarkdown.jsx        |   8 +-
 .../components/logging/log-modal/LogModal.jsx |   2 +
 .../log-modal/LogsModal.jsx                   |   3 +-
 frontend/src/helpers/urlSafety.js             |  19 +++
 .../src/unstract/sdk1/execution/context.py    |  15 ++
 workers/executor/executor_tool_shim.py        |  90 ++++++++---
 workers/executor/executors/legacy_executor.py | 145 +++++++++++-------
 .../file_processing/structure_tool_task.py    |  26 +++-
 8 files changed, 232 insertions(+), 76 deletions(-)
 create mode 100644 frontend/src/helpers/urlSafety.js

diff --git a/frontend/src/components/helpers/custom-markdown/CustomMarkdown.jsx b/frontend/src/components/helpers/custom-markdown/CustomMarkdown.jsx
index 9e895674b5..458f319557 100644
--- a/frontend/src/components/helpers/custom-markdown/CustomMarkdown.jsx
+++ b/frontend/src/components/helpers/custom-markdown/CustomMarkdown.jsx
@@ -3,6 +3,7 @@ import PropTypes from "prop-types";
 import { useMemo } from "react";
 import { Link as RouterLink } from "react-router-dom";
 
+import { isSafeExternalUrl } from "../../../helpers/urlSafety";
 import { useSessionStore } from "../../../store/session-store";
 
 const { Text, Link, Paragraph } = Typography;
@@ -54,11 +55,16 @@ const CustomMarkdown = ({
           </Text>
         );
       case "link": {
-        const isInternal = url?.startsWith("/");
+        // Protocol-relative URLs (`//evil.com/...`) also start with `/`
+        // so exclude them from the internal-route branch.
+        const isInternal = url?.startsWith("/") && !url.startsWith("//");
         if (isInternal) {
           const resolvedUrl = orgName ? `/${orgName}${url}` : url;
           return <RouterLink to={resolvedUrl}>{content}</RouterLink>;
         }
+        if (!isSafeExternalUrl(url)) {
+          return content;
+        }
         return (
           <Link href={url} target="_blank" rel="noopener noreferrer">
             {content}
diff --git a/frontend/src/components/logging/log-modal/LogModal.jsx b/frontend/src/components/logging/log-modal/LogModal.jsx
index 2f21cb050b..d709780313 100644
--- a/frontend/src/components/logging/log-modal/LogModal.jsx
+++ b/frontend/src/components/logging/log-modal/LogModal.jsx
@@ -13,6 +13,7 @@ import { useCopyToClipboard } from "../../../hooks/useCopyToClipboard";
 import { useExceptionHandler } from "../../../hooks/useExceptionHandler";
 import useRequestUrl from "../../../hooks/useRequestUrl";
 import { useAlertStore } from "../../../store/alert-store";
+import CustomMarkdown from "../../helpers/custom-markdown/CustomMarkdown";
 import { FilterDropdown, FilterIcon } from "../filter-dropdown/FilterDropdown";
 
 function LogModal({
@@ -120,6 +121,7 @@ function LogModal({
       title: "Log",
       dataIndex: "log",
       key: "log",
+      render: (log) => <CustomMarkdown text={log || ""} />,
     },
   ];
 
diff --git a/frontend/src/components/pipelines-or-deployments/log-modal/LogsModal.jsx b/frontend/src/components/pipelines-or-deployments/log-modal/LogsModal.jsx
index 09dd7ac047..9ab7e69f3b 100644
--- a/frontend/src/components/pipelines-or-deployments/log-modal/LogsModal.jsx
+++ b/frontend/src/components/pipelines-or-deployments/log-modal/LogsModal.jsx
@@ -41,7 +41,7 @@ const LogsModal = ({
       .then((res) => {
         const logDetails = res?.data?.results?.map((item) => ({
           id: item?.id,
-          log: <CustomMarkdown text={item?.data?.log} />,
+          log: item?.data?.log,
           type: item?.data?.type,
           stage: item?.data?.stage,
           level: item?.data?.level,
@@ -111,6 +111,7 @@ const LogsModal = ({
       title: "Log",
       dataIndex: "log",
       key: "log",
+      render: (log) => <CustomMarkdown text={log || ""} />,
     },
   ];
 
diff --git a/frontend/src/helpers/urlSafety.js b/frontend/src/helpers/urlSafety.js
new file mode 100644
index 0000000000..b5ca23e795
--- /dev/null
+++ b/frontend/src/helpers/urlSafety.js
@@ -0,0 +1,19 @@
+const SAFE_URL_SCHEMES = ["http:", "https:", "mailto:", "tel:"];
+
+// Guards against unsafe schemes (e.g. `javascript:`, `data:`) when
+// rendering links built from user- or tool-derived content.
+const isSafeExternalUrl = (url) => {
+  if (typeof url !== "string" || url === "") {
+    return false;
+  }
+  // Parse without a base so bare strings (e.g. "javascript", "../foo") fail
+  // instead of silently resolving to `https://<origin>/...` and passing.
+  try {
+    const parsed = new URL(url);
+    return SAFE_URL_SCHEMES.includes(parsed.protocol);
+  } catch {
+    return false;
+  }
+};
+
+export { isSafeExternalUrl, SAFE_URL_SCHEMES };
diff --git a/unstract/sdk1/src/unstract/sdk1/execution/context.py b/unstract/sdk1/src/unstract/sdk1/execution/context.py
index a1efb4c3f8..83eb650a29 100644
--- a/unstract/sdk1/src/unstract/sdk1/execution/context.py
+++ b/unstract/sdk1/src/unstract/sdk1/execution/context.py
@@ -68,6 +68,11 @@ class ExecutionContext:
         log_events_id: Socket.IO channel ID for streaming progress
             logs to the frontend.  ``None`` when not in an IDE
             session (no logs published).
+        execution_id: Workflow execution identifier for log
+            correlation. When set, ``organization_id`` must also be
+            set (enforced in ``__post_init__``).
+        file_execution_id: Child identifier for per-file execution
+            within a workflow run. Optional.
     """
 
     executor_name: str
@@ -78,6 +83,8 @@ class ExecutionContext:
     executor_params: dict[str, Any] = field(default_factory=dict)
     request_id: str | None = None
     log_events_id: str | None = None
+    execution_id: str | None = None
+    file_execution_id: str | None = None
 
     def __post_init__(self) -> None:
         """Validate required fields after initialization."""
@@ -89,6 +96,10 @@ def __post_init__(self) -> None:
             raise ValueError("run_id is required")
         if not self.execution_source:
             raise ValueError("execution_source is required")
+        # When execution_id is set, organization_id must be too — they
+        # travel together for workflow-level log correlation.
+        if self.execution_id and not self.organization_id:
+            raise ValueError("organization_id is required when execution_id is set")
 
         # Normalize enum values to plain strings for serialization
         if isinstance(self.operation, Operation):
@@ -111,6 +122,8 @@ def to_dict(self) -> dict[str, Any]:
             "executor_params": self.executor_params,
             "request_id": self.request_id,
             "log_events_id": self.log_events_id,
+            "execution_id": self.execution_id,
+            "file_execution_id": self.file_execution_id,
         }
 
     @classmethod
@@ -125,4 +138,6 @@ def from_dict(cls, data: dict[str, Any]) -> "ExecutionContext":
             executor_params=data.get("executor_params", {}),
             request_id=data.get("request_id"),
             log_events_id=data.get("log_events_id"),
+            execution_id=data.get("execution_id"),
+            file_execution_id=data.get("file_execution_id"),
         )
diff --git a/workers/executor/executor_tool_shim.py b/workers/executor/executor_tool_shim.py
index 63f48dd253..828e641398 100644
--- a/workers/executor/executor_tool_shim.py
+++ b/workers/executor/executor_tool_shim.py
@@ -60,6 +60,9 @@ def __init__(
         platform_api_key: str = "",
         log_events_id: str = "",
         component: dict[str, str] | None = None,
+        execution_id: str | None = None,
+        organization_id: str | None = None,
+        file_execution_id: str | None = None,
     ) -> None:
         """Initialize the shim.
 
@@ -72,10 +75,24 @@ def __init__(
             component: Structured identifier dict for log correlation
                 (``tool_id``, ``run_id``, ``doc_name``, optionally
                 ``prompt_key``).
+            execution_id: Workflow execution id. When provided with
+                ``organization_id``, enables persistent log attribution
+                to the ``execution_log`` table.
+            organization_id: Tenant/org scope for log persistence.
+            file_execution_id: File execution id (child of workflow
+                execution). Optional — populated for per-file tool runs.
         """
         self.platform_api_key = platform_api_key
         self.log_events_id = log_events_id
         self.component = component or {}
+        self.execution_id = execution_id
+        self.organization_id = organization_id
+        self.file_execution_id = file_execution_id
+        # Track whether we've already surfaced a publish failure on this
+        # shim so that a down broker is flagged loudly once (at WARNING)
+        # while repeat failures on the same shim are logged at DEBUG.
+        self._progress_publish_failed = False
+        self._log_publish_failed = False
         # Initialize StreamMixin.  EXECUTION_BY_TOOL is not set in
         # the worker environment, so _exec_by_tool will be False.
         super().__init__(log_level=LogLevel.INFO)
@@ -145,24 +162,61 @@ def stream_log(
             return
 
         # Publish progress to frontend via the log consumer queue.
-        if self.log_events_id:
-            try:
-                wf_level = _SDK_TO_WF_LEVEL.get(level, "INFO")
-                payload = LogPublisher.log_progress(
-                    component=self.component,
-                    level=wf_level,
-                    state=stage,
-                    message=log,
-                )
-                LogPublisher.publish(
-                    channel_id=self.log_events_id,
-                    payload=payload,
-                )
-            except Exception:
-                logger.debug(
-                    "Failed to publish progress log (non-fatal)",
-                    exc_info=True,
-                )
+        if not self.log_events_id:
+            return
+
+        wf_level = _SDK_TO_WF_LEVEL.get(level, "INFO")
+
+        # PROGRESS payload — IDE prompt-card live updates only. Dropped at
+        # the DB persist layer because LogPublisher.publish only stores
+        # payloads whose `type == "LOG"`.
+        try:
+            progress_payload = LogPublisher.log_progress(
+                component=self.component,
+                level=wf_level,
+                state=stage,
+                message=log,
+            )
+            LogPublisher.publish(
+                channel_id=self.log_events_id,
+                payload=progress_payload,
+            )
+        except Exception:
+            first_failure = not self._progress_publish_failed
+            self._progress_publish_failed = True
+            logger.log(
+                logging.WARNING if first_failure else logging.DEBUG,
+                "Failed to publish progress log (non-fatal)",
+                exc_info=first_failure,
+            )
+
+        # LOG payload — feeds workflow logs UI and persists to execution_log.
+        # LogDataDTO validation requires `execution_id` and `organization_id`;
+        # `file_execution_id` is optional.
+        if not (self.execution_id and self.organization_id):
+            return
+
+        try:
+            log_payload = LogPublisher.log_workflow(
+                stage=stage,
+                message=log,
+                level=wf_level,
+                execution_id=self.execution_id,
+                file_execution_id=self.file_execution_id or None,
+                organization_id=self.organization_id,
+            )
+            LogPublisher.publish(
+                channel_id=self.log_events_id,
+                payload=log_payload,
+            )
+        except Exception:
+            first_failure = not self._log_publish_failed
+            self._log_publish_failed = True
+            logger.log(
+                logging.WARNING if first_failure else logging.DEBUG,
+                "Failed to publish workflow log (non-fatal)",
+                exc_info=first_failure,
+            )
 
     def stream_error_and_exit(self, message: str, err: Exception | None = None) -> None:
         """Log error and raise SdkError.
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 18e1f47749..2a7dfc160d 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -57,9 +57,13 @@ class LegacyExecutor(BaseExecutor):
         Operation.STRUCTURE_PIPELINE.value: "_handle_structure_pipeline",
     }
 
-    # Defaults for log streaming (overridden by execute()).
-    _log_events_id: str = ""
-    _log_component: dict[str, str] = {}
+    def __init__(self) -> None:
+        # Per-request state — overwritten on every ``execute()`` call.
+        self._log_events_id: str = ""
+        self._log_component: dict[str, str] = {}
+        self._execution_id: str | None = None
+        self._file_execution_id: str | None = None
+        self._organization_id: str | None = None
 
     @property
     def name(self) -> str:
@@ -77,8 +81,21 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
             NotImplementedError: From stub handlers (until 2D–2H).
         """
         # Extract log streaming info (set by tasks.py for IDE sessions).
-        self._log_events_id: str = context.log_events_id or ""
-        self._log_component: dict[str, str] = getattr(context, "_log_component", {})
+        self._log_events_id = context.log_events_id or ""
+        self._log_component = getattr(context, "_log_component", None) or {}
+        self._execution_id = context.execution_id
+        self._file_execution_id = context.file_execution_id
+        self._organization_id = context.organization_id
+        if (
+            context.execution_source == "tool"
+            and self._log_events_id
+            and not (self._execution_id and self._organization_id)
+        ):
+            logger.warning(
+                "Workflow IDs missing on tool context run_id=%s — tool-level "
+                "logs will reach the UI but won't persist to execution_log.",
+                context.run_id,
+            )
 
         handler_name = self._OPERATION_MAP.get(context.operation)
         if handler_name is None:
@@ -121,10 +138,7 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
             # Stream error to FE so the user sees the failure in real-time
             if self._log_events_id:
                 try:
-                    shim = ExecutorToolShim(
-                        log_events_id=self._log_events_id,
-                        component=self._log_component,
-                    )
+                    shim = self._build_shim()
                     shim.stream_log(
                         f"Error: {exc.message or type(exc).__name__}",
                         level=LogLevel.ERROR,
@@ -133,6 +147,26 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
                     pass  # Best-effort — don't mask the original error
             return ExecutionResult.failure(error=exc.message)
 
+    def _build_shim(
+        self,
+        *,
+        platform_api_key: str = "",
+        component: dict[str, str] | None = None,
+    ) -> ExecutorToolShim:
+        """Construct an ``ExecutorToolShim`` pre-populated with the
+        log-streaming and workflow-attribution fields captured in
+        ``execute()``. Callers override ``platform_api_key`` and
+        ``component`` as needed; everything else is shared.
+        """
+        return ExecutorToolShim(
+            platform_api_key=platform_api_key,
+            log_events_id=self._log_events_id,
+            component=self._log_component if component is None else component,
+            execution_id=self._execution_id,
+            organization_id=self._organization_id,
+            file_execution_id=self._file_execution_id,
+        )
+
     # ------------------------------------------------------------------
     # Phase 2B — Extract handler
     # ------------------------------------------------------------------
@@ -173,11 +207,7 @@ def _handle_extract(self, context: ExecutionContext) -> ExecutionResult:
         execution_data_dir: str | None = params.get(IKeys.EXECUTION_DATA_DIR)
 
         # Build adapter shim and X2Text
-        shim = ExecutorToolShim(
-            platform_api_key=platform_api_key,
-            log_events_id=self._log_events_id,
-            component=self._log_component,
-        )
+        shim = self._build_shim(platform_api_key=platform_api_key)
         x2text = X2Text(
             tool=shim,
             adapter_instance_id=x2text_instance_id,
@@ -352,6 +382,8 @@ def _run_summarize_step(
             organization_id=context.organization_id,
             request_id=context.request_id,
             log_events_id=context.log_events_id,
+            execution_id=context.execution_id,
+            file_execution_id=context.file_execution_id,
             executor_params={
                 "llm_adapter_instance_id": llm_adapter_id,
                 "summarize_prompt": summarize_prompt,
@@ -427,6 +459,8 @@ def _handle_ide_index(self, context: ExecutionContext) -> ExecutionResult:
                 executor_params=extract_params,
                 request_id=context.request_id,
                 log_events_id=context.log_events_id,
+                execution_id=context.execution_id,
+                file_execution_id=context.file_execution_id,
             )
             extract_result = self._handle_extract(extract_ctx)
             if not extract_result.success:
@@ -454,6 +488,8 @@ def _handle_ide_index(self, context: ExecutionContext) -> ExecutionResult:
             executor_params=index_params,
             request_id=context.request_id,
             log_events_id=context.log_events_id,
+            execution_id=context.execution_id,
+            file_execution_id=context.file_execution_id,
         )
         index_result = self._handle_index(index_ctx)
         if not index_result.success:
@@ -519,10 +555,8 @@ def _handle_structure_pipeline(self, context: ExecutionContext) -> ExecutionResu
         extracted_text = ""
         index_metrics: dict = {}
 
-        shim = ExecutorToolShim(
+        shim = self._build_shim(
             platform_api_key=extract_params.get("platform_api_key", ""),
-            log_events_id=self._log_events_id,
-            component=self._log_component,
         )
         step = 1
 
@@ -539,6 +573,8 @@ def _handle_structure_pipeline(self, context: ExecutionContext) -> ExecutionResu
                 executor_params=extract_params,
                 request_id=context.request_id,
                 log_events_id=context.log_events_id,
+                execution_id=context.execution_id,
+                file_execution_id=context.file_execution_id,
             )
             extract_result = self._handle_extract(extract_ctx)
             if not extract_result.success:
@@ -643,6 +679,8 @@ def _run_pipeline_answer_step(
             executor_params=answer_params,
             request_id=context.request_id,
             log_events_id=context.log_events_id,
+            execution_id=context.execution_id,
+            file_execution_id=context.file_execution_id,
         )
         if is_single_pass:
             return self._handle_single_pass_extraction(answer_ctx)
@@ -745,6 +783,8 @@ def _run_pipeline_summarize(
                 organization_id=context.organization_id,
                 request_id=context.request_id,
                 log_events_id=context.log_events_id,
+                execution_id=context.execution_id,
+                file_execution_id=context.file_execution_id,
                 executor_params={
                     "llm_adapter_instance_id": llm_adapter_id,
                     "summarize_prompt": summarize_prompt,
@@ -840,6 +880,8 @@ def _run_pipeline_index(
                     organization_id=context.organization_id,
                     request_id=context.request_id,
                     log_events_id=context.log_events_id,
+                    execution_id=context.execution_id,
+                    file_execution_id=context.file_execution_id,
                     executor_params={
                         "embedding_instance_id": embedding,
                         "vector_db_instance_id": vector_db,
@@ -954,11 +996,7 @@ def _handle_index(self, context: ExecutionContext) -> ExecutionResult:
             usage_kwargs=usage_kwargs,
         )
 
-        shim = ExecutorToolShim(
-            platform_api_key=platform_api_key,
-            log_events_id=self._log_events_id,
-            component=self._log_component,
-        )
+        shim = self._build_shim(platform_api_key=platform_api_key)
         fs_instance = FileUtils.get_fs_instance(execution_source=execution_source)
 
         logger.info(
@@ -1199,11 +1237,7 @@ def _handle_answer_prompt(self, context: ExecutionContext) -> ExecutionResult:
         process_text_fn = None
         enable_highlight = tool_settings.get(PSKeys.ENABLE_HIGHLIGHT, False)
         enable_word_confidence = tool_settings.get(PSKeys.ENABLE_WORD_CONFIDENCE, False)
-        pipeline_shim = ExecutorToolShim(
-            platform_api_key=platform_api_key,
-            log_events_id=self._log_events_id,
-            component=self._log_component,
-        )
+        pipeline_shim = self._build_shim(platform_api_key=platform_api_key)
         if enable_highlight:
             from executor.executors.plugins import ExecutorPluginLoader
 
@@ -1371,7 +1405,7 @@ def _run_challenge_if_enabled(
         challenge_llm_id = tool_settings.get(PSKeys.CHALLENGE_LLM)
         if not challenge_llm_id:
             return
-        shim.stream_log(f"Running challenge for: {prompt_name}")
+        shim.stream_log(f"Running challenge for: `{prompt_name}`")
         challenge_llm = llm_cls(
             adapter_instance_id=challenge_llm_id,
             tool=shim,
@@ -1390,7 +1424,7 @@ def _run_challenge_if_enabled(
             metadata=metadata,
         )
         challenger.run()
-        shim.stream_log(f"Challenge verification completed for: {prompt_name}")
+        shim.stream_log(f"Challenge verification completed for: `{prompt_name}`")
         logger.info("Challenge completed: prompt=%s", prompt_name)
 
     @staticmethod
@@ -1412,7 +1446,7 @@ def _run_evaluation_if_enabled(
         evaluator_cls = ExecutorPluginLoader.get("evaluation")
         if not evaluator_cls:
             return
-        shim.stream_log(f"Running evaluation for: {prompt_name}")
+        shim.stream_log(f"Running evaluation for: `{prompt_name}`")
         evaluator = evaluator_cls(
             query=output.get(PSKeys.COMBINED_PROMPT, ""),
             context="\n".join(context_list),
@@ -1476,12 +1510,11 @@ def _execute_single_prompt(
             output.get(PSKeys.TYPE, "TEXT"),
         )
 
-        shim = ExecutorToolShim(
+        shim = self._build_shim(
             platform_api_key=platform_api_key,
-            log_events_id=self._log_events_id,
             component={**self._log_component, "prompt_key": prompt_name},
         )
-        shim.stream_log(f"Processing prompt: {prompt_name}")
+        shim.stream_log(f"Processing prompt: `{prompt_name}`")
 
         if variable_replacement_svc.is_variables_present(prompt_text=prompt_text):
             prompt_text = variable_replacement_svc.replace_variables_in_prompt(
@@ -1494,7 +1527,7 @@ def _execute_single_prompt(
                 custom_data=custom_data,
                 is_ide=execution_source == "ide",
             )
-            shim.stream_log(f"Resolved template variables for: {prompt_name}")
+            shim.stream_log(f"Resolved template variables for: `{prompt_name}`")
 
         logger.info(
             "Executing prompt: tool_id=%s name=%s run_id=%s", tool_id, prompt_name, run_id
@@ -1574,7 +1607,9 @@ def _execute_single_prompt(
                     adapter_instance_id=output[PSKeys.VECTOR_DB],
                     embedding=embedding,
                 )
-            shim.stream_log(f"Initialized LLM and retrieval adapters for: {prompt_name}")
+            shim.stream_log(
+                f"Initialized LLM and retrieval adapters for: `{prompt_name}`"
+            )
         except Exception as e:
             msg = f"Couldn't fetch adapter. {e}"
             logger.error(msg)
@@ -1588,7 +1623,7 @@ def _execute_single_prompt(
             retrieval_strategy = output.get(PSKeys.RETRIEVAL_STRATEGY)
             valid_strategies = {s.value for s in RetrievalStrategy}
             if retrieval_strategy in valid_strategies:
-                shim.stream_log(f"Retrieving context for: {prompt_name}")
+                shim.stream_log(f"Retrieving context for: `{prompt_name}`")
                 logger.info(
                     "Performing retrieval: prompt=%s strategy=%s chunk_size=%d",
                     prompt_name,
@@ -1613,14 +1648,14 @@ def _execute_single_prompt(
                     )
                 metadata[PSKeys.CONTEXT][prompt_name] = context_list
                 shim.stream_log(
-                    f"Retrieved {len(context_list)} context chunks for: {prompt_name}"
+                    f"Retrieved {len(context_list)} context chunks for: `{prompt_name}`"
                 )
                 logger.debug(
                     "Retrieved %d context chunks for prompt: %s",
                     len(context_list),
                     prompt_name,
                 )
-                shim.stream_log(f"Running LLM completion for: {prompt_name}")
+                shim.stream_log(f"Running LLM completion for: `{prompt_name}`")
                 answer = answer_prompt_svc.construct_and_run_prompt(
                     tool_settings=tool_settings,
                     output=output,
@@ -1652,7 +1687,7 @@ def _execute_single_prompt(
                 tool_id=tool_id,
                 doc_name=doc_name,
             )
-            shim.stream_log(f"Applied type conversion for: {prompt_name}")
+            shim.stream_log(f"Applied type conversion for: `{prompt_name}`")
 
             self._run_challenge_if_enabled(
                 tool_settings=tool_settings,
@@ -1676,7 +1711,7 @@ def _execute_single_prompt(
                 shim=shim,
                 prompt_name=prompt_name,
             )
-            shim.stream_log(f"Completed prompt: {prompt_name}")
+            shim.stream_log(f"Completed prompt: `{prompt_name}`")
 
             val = structured_output.get(prompt_name)
             if isinstance(val, str):
@@ -1725,6 +1760,9 @@ def _run_table_extraction(
             execution_source=execution_source,
             organization_id=context.organization_id,
             request_id=context.request_id,
+            log_events_id=self._log_events_id,
+            execution_id=self._execution_id,
+            file_execution_id=self._file_execution_id,
             executor_params={
                 "llm_adapter_instance_id": output.get(PSKeys.LLM, ""),
                 "table_settings": output.get(PSKeys.TABLE_SETTINGS, {}),
@@ -1736,9 +1774,8 @@ def _run_table_extraction(
             },
         )
         table_ctx._log_component = self._log_component
-        table_ctx.log_events_id = self._log_events_id
 
-        shim.stream_log(f"Running table extraction for: {prompt_name}")
+        shim.stream_log(f"Running table extraction for: `{prompt_name}`")
         table_result = table_executor.execute(table_ctx)
 
         if table_result.success:
@@ -1747,9 +1784,9 @@ def _run_table_extraction(
             metrics.setdefault(prompt_name, {}).update(
                 {"table_extraction": table_metrics}
             )
-            shim.stream_log(f"Table extraction completed for: {prompt_name}")
+            shim.stream_log(f"Table extraction completed for: `{prompt_name}`")
             logger.info("TABLE extraction completed: prompt=%s", prompt_name)
-            shim.stream_log(f"Completed prompt: {prompt_name}")
+            shim.stream_log(f"Completed prompt: `{prompt_name}`")
         else:
             structured_output[prompt_name] = ""
             error_msg = table_result.error or "unknown error"
@@ -1759,7 +1796,7 @@ def _run_table_extraction(
                 error_msg,
             )
             shim.stream_log(
-                f"Table extraction failed for {prompt_name}: {error_msg}",
+                f"Table extraction failed for `{prompt_name}`: {error_msg}",
                 level=LogLevel.ERROR,
             )
 
@@ -1799,6 +1836,9 @@ def _run_line_item_extraction(
             execution_source=prompt_run_args["execution_source"],
             organization_id=context.organization_id,
             request_id=context.request_id,
+            log_events_id=self._log_events_id,
+            execution_id=self._execution_id,
+            file_execution_id=self._file_execution_id,
             executor_params={
                 "llm_adapter_instance_id": output.get(PSKeys.LLM, ""),
                 "tool_settings": prompt_run_args["tool_settings"],
@@ -1813,9 +1853,8 @@ def _run_line_item_extraction(
             },
         )
         line_item_ctx._log_component = self._log_component
-        line_item_ctx.log_events_id = self._log_events_id
 
-        shim.stream_log(f"Running line-item extraction for: {prompt_name}")
+        shim.stream_log(f"Running line-item extraction for: `{prompt_name}`")
         line_item_result = line_item_executor.execute(line_item_ctx)
 
         if line_item_result.success:
@@ -1828,9 +1867,9 @@ def _run_line_item_extraction(
             context_list = data.get("context")
             if context_list:
                 metadata[PSKeys.CONTEXT][prompt_name] = context_list
-            shim.stream_log(f"Line-item extraction completed for: {prompt_name}")
+            shim.stream_log(f"Line-item extraction completed for: `{prompt_name}`")
             logger.info("LINE_ITEM extraction completed: prompt=%s", prompt_name)
-            shim.stream_log(f"Completed prompt: {prompt_name}")
+            shim.stream_log(f"Completed prompt: `{prompt_name}`")
         else:
             structured_output[prompt_name] = ""
             error_msg = line_item_result.error or "unknown error"
@@ -1840,7 +1879,7 @@ def _run_line_item_extraction(
                 error_msg,
             )
             shim.stream_log(
-                f"Line-item extraction failed for {prompt_name}: {error_msg}",
+                f"Line-item extraction failed for `{prompt_name}`: {error_msg}",
                 level=LogLevel.ERROR,
             )
 
@@ -2032,11 +2071,7 @@ def _handle_summarize(self, context: ExecutionContext) -> ExecutionResult:
             f"Context:\n---------------\n{doc_context}\n-----------------\n\nSummary:"
         )
 
-        shim = ExecutorToolShim(
-            platform_api_key=platform_api_key,
-            log_events_id=self._log_events_id,
-            component=self._log_component,
-        )
+        shim = self._build_shim(platform_api_key=platform_api_key)
         usage_kwargs = {
             "run_id": context.run_id,
             PSKeys.LLM_USAGE_REASON: PSKeys.SUMMARIZE,
diff --git a/workers/file_processing/structure_tool_task.py b/workers/file_processing/structure_tool_task.py
index 8df8603855..87c9426376 100644
--- a/workers/file_processing/structure_tool_task.py
+++ b/workers/file_processing/structure_tool_task.py
@@ -24,6 +24,7 @@
 
 from file_processing.worker import app
 from shared.enums.task_enums import TaskName
+from shared.infrastructure.context import StateStore
 
 from unstract.sdk1.constants import ToolEnv, UsageKwargs
 from unstract.sdk1.execution.context import ExecutionContext
@@ -235,7 +236,22 @@ def _execute_structure_tool_impl(params: dict) -> dict:
     # ---- Step 1: Setup ----
     from executor.executor_tool_shim import ExecutorToolShim
 
-    shim = ExecutorToolShim(platform_api_key=platform_service_api_key)
+    # Workflow IDs on the pre-dispatch shim let X2Text/platform helper logs
+    # reach the workflow logs UI before the executor dispatch happens.
+    log_events_id = StateStore.get("LOG_EVENTS_ID") or ""
+    if not log_events_id:
+        logger.warning(
+            "LOG_EVENTS_ID missing from StateStore for execution_id=%s — "
+            "tool-level logs will not stream to the workflow logs UI.",
+            execution_id,
+        )
+    shim = ExecutorToolShim(
+        platform_api_key=platform_service_api_key,
+        log_events_id=log_events_id,
+        execution_id=execution_id,
+        file_execution_id=file_execution_id,
+        organization_id=organization_id,
+    )
 
     platform_helper = _create_platform_helper(shim, file_execution_id)
     dispatcher = ExecutionDispatcher(celery_app=app)
@@ -257,6 +273,7 @@ def _execute_structure_tool_impl(params: dict) -> dict:
             dispatcher=dispatcher,
             shim=shim,
             file_execution_id=file_execution_id,
+            execution_id=execution_id,
             organization_id=organization_id,
             source_file_name=source_file_name,
             fs=fs,
@@ -388,6 +405,9 @@ def _execute_structure_tool_impl(params: dict) -> dict:
         execution_source="tool",
         organization_id=organization_id,
         request_id=file_execution_id,
+        log_events_id=StateStore.get("LOG_EVENTS_ID") or "",
+        execution_id=execution_id,
+        file_execution_id=file_execution_id,
         executor_params={
             "extract_params": extract_params,
             "index_template": index_template,
@@ -533,6 +553,7 @@ def _run_agentic_extraction(
     dispatcher: ExecutionDispatcher,
     shim: Any,
     file_execution_id: str,
+    execution_id: str,
     organization_id: str,
     source_file_name: str,
     fs: Any,
@@ -587,6 +608,9 @@ def _run_agentic_extraction(
         execution_source="tool",
         organization_id=organization_id,
         request_id=file_execution_id,
+        log_events_id=StateStore.get("LOG_EVENTS_ID") or "",
+        execution_id=execution_id,
+        file_execution_id=file_execution_id,
         executor_params={
             "document_id": file_execution_id,
             "document_text": document_text,

From 29bdf64e55d46cd848ef6bc230a34040aabe901c Mon Sep 17 00:00:00 2001
From: Chandrasekharan M
 <117059509+chandrasekharan-zipstack@users.noreply.github.com>
Date: Fri, 24 Apr 2026 13:32:23 +0530
Subject: [PATCH 03/27] UN-3430 [FIX] Update modified_at field correctly for
 models (#1928)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* [FIX] Auto-bump modified_at on QuerySet.update() and bulk_update()

Django's auto_now=True only fires on Model.save(); QuerySet.update() and
bulk_update() bypass save(), so BaseModel.modified_at silently stayed at
its previous value (the creation time, or the last save() timestamp) for
every bulk-path write. Audit trail drifted.

Introduce BaseModelQuerySet that injects modified_at=timezone.now() into
both paths, and expose it via BaseModelManager. Migrate all custom
managers on BaseModel subclasses to compose BaseModelManager so their
querysets inherit the overrides. Drop the ad-hoc modified_at=now() kwarg
in FileHistoryHelper now that the queryset handles it.

* [FIX] Materialize objs in BaseModelQuerySet.bulk_update to support generators

Addresses PR review: if callers pass a non-rewindable iterable (generator,
queryset iterator), the modified_at stamping loop would exhaust it before
super().bulk_update() saw it, silently updating zero rows. list(objs) up
front keeps generator callers working.

Also drop the mock-based unit test — it needed django.setup() at module
import which isn't viable without pytest-django, and proper DB-backed
coverage is tracked separately.

* [FIX] Auto-inject modified_at into BaseModel.save(update_fields=...)

Django only runs auto_now for fields listed in update_fields, so every
save(update_fields=["foo"]) on a BaseModel subclass silently drops the
modified_at bump — same family of bug as QuerySet.update/bulk_update.

Override BaseModel.save() to add modified_at to update_fields whenever
the caller supplies a restricted list without it. Also drop two dead
manual-assignment lines (execution.modified_at = timezone.now() before
save()) that were redundant with auto_now on a full save().

* [FIX] Auto-bump modified_at on upsert bulk_create and drop workarounds

QuerySet.bulk_create(update_conflicts=True, update_fields=[...]) runs an
UPDATE on conflict with only the listed fields — same auto_now-bypass as
save(update_fields=...) and QuerySet.update(). Patch BaseModelQuerySet's
bulk_create to inject modified_at into update_fields on upsert.

With that in place, the explicit "modified_at" entries in dashboard_metrics
upsert callers are redundant. Drop them.

* [REFACTOR] Tighten BaseModel auto-bump helpers and edge cases

- Extract `_with_modified_at` helper; single source of truth for the "inject
  modified_at into a partial field list" rule across `bulk_update`,
  `bulk_create` and `BaseModel.save`.
- Preserve Django's documented `save(update_fields=[])` no-op (signals-only
  save, no column writes) instead of rewriting it to `["modified_at"]`.
  Apply the same guard to `bulk_create(update_conflicts=True, update_fields=[])`.
- Match Django's positional `save()` signature (`force_insert`, `force_update`,
  `using`, `update_fields`) so callers passing flags positionally still hit
  the auto-bump override.
- Skip the per-obj `modified_at` stamp + `objs` materialization in
  `bulk_update` when the caller already listed `modified_at` — lets the
  opt-in path stay O(1) before the `super()` delegation.
- Docstring corrections: "previous save() timestamp" (not just creation
  time); manager-level convention note; precise `auto_now` semantics
  (attribute still updates in-memory, just isn't persisted without
  `update_fields` inclusion).
---
 backend/adapter_processor_v2/models.py        |   4 +-
 backend/api_v2/models.py                      |   4 +-
 backend/connector_v2/models.py                |   4 +-
 .../management/commands/backfill_metrics.py   |   6 +-
 backend/dashboard_metrics/models.py           |   8 +-
 backend/dashboard_metrics/tasks.py            |   6 +-
 backend/pipeline_v2/models.py                 |   4 +-
 .../prompt_studio_core_v2/models.py           |   4 +-
 .../prompt_studio_registry_v2/models.py       |   4 +-
 backend/tags/models.py                        |   4 +-
 backend/tool_instance_v2/models.py            |   4 +-
 backend/usage_v2/models.py                    |   4 +-
 backend/utils/models/base_model.py            | 113 ++++++++++++++++++
 backend/utils/models/org_aware_manager.py     |   4 +-
 .../workflow_manager/endpoint_v2/models.py    |   4 +-
 .../workflow_manager/file_execution/models.py |   4 +-
 backend/workflow_manager/internal_views.py    |   2 -
 .../workflow_v2/file_history_helper.py        |   1 -
 .../workflow_v2/models/execution.py           |   4 +-
 .../workflow_v2/models/workflow.py            |   4 +-
 backend/workflow_manager/workflow_v2/views.py |   2 -
 21 files changed, 151 insertions(+), 43 deletions(-)

diff --git a/backend/adapter_processor_v2/models.py b/backend/adapter_processor_v2/models.py
index 13be07cdc0..a6fab0c1f9 100644
--- a/backend/adapter_processor_v2/models.py
+++ b/backend/adapter_processor_v2/models.py
@@ -10,7 +10,7 @@
 from django.db.models import QuerySet
 from tenant_account_v2.models import OrganizationMember
 from utils.exceptions import InvalidEncryptionKey
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 from utils.models.organization_mixin import (
     DefaultOrganizationManagerMixin,
     DefaultOrganizationMixin,
@@ -29,7 +29,7 @@
 logger = logging.getLogger(__name__)
 
 
-class AdapterInstanceModelManager(DefaultOrganizationManagerMixin, models.Manager):
+class AdapterInstanceModelManager(DefaultOrganizationManagerMixin, BaseModelManager):
     def get_queryset(self) -> QuerySet[Any]:
         return super().get_queryset()
 
diff --git a/backend/api_v2/models.py b/backend/api_v2/models.py
index 532b67d2dc..cc19902bde 100644
--- a/backend/api_v2/models.py
+++ b/backend/api_v2/models.py
@@ -7,7 +7,7 @@
 from django.db.models.signals import post_delete
 from django.dispatch import receiver
 from pipeline_v2.models import Pipeline
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 from utils.models.organization_mixin import (
     DefaultOrganizationManagerMixin,
     DefaultOrganizationMixin,
@@ -24,7 +24,7 @@
 API_ENDPOINT_MAX_LENGTH = 255
 
 
-class APIDeploymentModelManager(DefaultOrganizationManagerMixin, models.Manager):
+class APIDeploymentModelManager(DefaultOrganizationManagerMixin, BaseModelManager):
     def for_user(self, user):
         """Filter API deployments that the user can access:
         - API deployments created by the user
diff --git a/backend/connector_v2/models.py b/backend/connector_v2/models.py
index c3d0e6108b..73ea38b57c 100644
--- a/backend/connector_v2/models.py
+++ b/backend/connector_v2/models.py
@@ -8,7 +8,7 @@
 from connector_processor.constants import ConnectorKeys
 from django.db import models
 from utils.fields import EncryptedBinaryField
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 from utils.models.organization_mixin import (
     DefaultOrganizationManagerMixin,
     DefaultOrganizationMixin,
@@ -22,7 +22,7 @@
 logger = logging.getLogger(__name__)
 
 
-class ConnectorInstanceModelManager(DefaultOrganizationManagerMixin, models.Manager):
+class ConnectorInstanceModelManager(DefaultOrganizationManagerMixin, BaseModelManager):
     def get_queryset(self) -> models.QuerySet:
         return super().get_queryset()
 
diff --git a/backend/dashboard_metrics/management/commands/backfill_metrics.py b/backend/dashboard_metrics/management/commands/backfill_metrics.py
index daf0b3130e..9c4d82baca 100644
--- a/backend/dashboard_metrics/management/commands/backfill_metrics.py
+++ b/backend/dashboard_metrics/management/commands/backfill_metrics.py
@@ -424,7 +424,7 @@ def _bulk_upsert_hourly(self, aggregations: dict) -> int:
                 "project",
                 "tag",
             ],
-            update_fields=["metric_type", "metric_value", "metric_count", "modified_at"],
+            update_fields=["metric_type", "metric_value", "metric_count"],
         )
         return len(objects)
 
@@ -457,7 +457,7 @@ def _bulk_upsert_daily(self, aggregations: dict) -> int:
                 "project",
                 "tag",
             ],
-            update_fields=["metric_type", "metric_value", "metric_count", "modified_at"],
+            update_fields=["metric_type", "metric_value", "metric_count"],
         )
         return len(objects)
 
@@ -490,6 +490,6 @@ def _bulk_upsert_monthly(self, aggregations: dict) -> int:
                 "project",
                 "tag",
             ],
-            update_fields=["metric_type", "metric_value", "metric_count", "modified_at"],
+            update_fields=["metric_type", "metric_value", "metric_count"],
         )
         return len(objects)
diff --git a/backend/dashboard_metrics/models.py b/backend/dashboard_metrics/models.py
index 44fec5439a..2bc4baf6ac 100644
--- a/backend/dashboard_metrics/models.py
+++ b/backend/dashboard_metrics/models.py
@@ -3,7 +3,7 @@
 import uuid
 
 from django.db import models
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 from utils.models.organization_mixin import (
     DefaultOrganizationManagerMixin,
     DefaultOrganizationMixin,
@@ -25,19 +25,19 @@ class MetricType(models.TextChoices):
     HISTOGRAM = "histogram", "Histogram"
 
 
-class EventMetricsHourlyManager(DefaultOrganizationManagerMixin):
+class EventMetricsHourlyManager(DefaultOrganizationManagerMixin, BaseModelManager):
     """Manager for EventMetricsHourly with organization filtering."""
 
     pass
 
 
-class EventMetricsDailyManager(DefaultOrganizationManagerMixin):
+class EventMetricsDailyManager(DefaultOrganizationManagerMixin, BaseModelManager):
     """Manager for EventMetricsDaily with organization filtering."""
 
     pass
 
 
-class EventMetricsMonthlyManager(DefaultOrganizationManagerMixin):
+class EventMetricsMonthlyManager(DefaultOrganizationManagerMixin, BaseModelManager):
     """Manager for EventMetricsMonthly with organization filtering."""
 
     pass
diff --git a/backend/dashboard_metrics/tasks.py b/backend/dashboard_metrics/tasks.py
index 3246e7e46e..181c985137 100644
--- a/backend/dashboard_metrics/tasks.py
+++ b/backend/dashboard_metrics/tasks.py
@@ -121,7 +121,7 @@ def _bulk_upsert_hourly(aggregations: dict) -> int:
         objects,
         update_conflicts=True,
         unique_fields=["organization", "timestamp", "metric_name", "project", "tag"],
-        update_fields=["metric_type", "metric_value", "metric_count", "modified_at"],
+        update_fields=["metric_type", "metric_value", "metric_count"],
     )
     return len(objects)
 
@@ -160,7 +160,7 @@ def _bulk_upsert_daily(aggregations: dict) -> int:
         objects,
         update_conflicts=True,
         unique_fields=["organization", "date", "metric_name", "project", "tag"],
-        update_fields=["metric_type", "metric_value", "metric_count", "modified_at"],
+        update_fields=["metric_type", "metric_value", "metric_count"],
     )
     return len(objects)
 
@@ -199,7 +199,7 @@ def _bulk_upsert_monthly(aggregations: dict) -> int:
         objects,
         update_conflicts=True,
         unique_fields=["organization", "month", "metric_name", "project", "tag"],
-        update_fields=["metric_type", "metric_value", "metric_count", "modified_at"],
+        update_fields=["metric_type", "metric_value", "metric_count"],
     )
     return len(objects)
 
diff --git a/backend/pipeline_v2/models.py b/backend/pipeline_v2/models.py
index 00b12c8483..65fb5257a8 100644
--- a/backend/pipeline_v2/models.py
+++ b/backend/pipeline_v2/models.py
@@ -4,7 +4,7 @@
 from django.conf import settings
 from django.db import models
 from django.db.models import Q
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 from utils.models.organization_mixin import (
     DefaultOrganizationManagerMixin,
     DefaultOrganizationMixin,
@@ -18,7 +18,7 @@
 PIPELINE_NAME_LENGTH = 32
 
 
-class PipelineModelManager(DefaultOrganizationManagerMixin, models.Manager):
+class PipelineModelManager(DefaultOrganizationManagerMixin, BaseModelManager):
     def for_user(self, user):
         """Filter pipelines that the user can access:
         - Pipelines created by the user
diff --git a/backend/prompt_studio/prompt_studio_core_v2/models.py b/backend/prompt_studio/prompt_studio_core_v2/models.py
index 406c157efc..1e1802b776 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/models.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/models.py
@@ -8,7 +8,7 @@
 from django.db.models import QuerySet
 from utils.file_storage.constants import FileStorageKeys
 from utils.file_storage.helpers.prompt_studio_file_helper import PromptStudioFileHelper
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 from utils.models.organization_mixin import (
     DefaultOrganizationManagerMixin,
     DefaultOrganizationMixin,
@@ -21,7 +21,7 @@
 logger = logging.getLogger(__name__)
 
 
-class CustomToolModelManager(DefaultOrganizationManagerMixin, models.Manager):
+class CustomToolModelManager(DefaultOrganizationManagerMixin, BaseModelManager):
     def for_user(self, user: User) -> QuerySet[Any]:
         if getattr(user, "is_service_account", False):
             return self.all()
diff --git a/backend/prompt_studio/prompt_studio_registry_v2/models.py b/backend/prompt_studio/prompt_studio_registry_v2/models.py
index c4cd54cc0f..34478c8e70 100644
--- a/backend/prompt_studio/prompt_studio_registry_v2/models.py
+++ b/backend/prompt_studio/prompt_studio_registry_v2/models.py
@@ -5,7 +5,7 @@
 from account_v2.models import User
 from django.db import models
 from django.db.models import QuerySet
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 from utils.models.organization_mixin import (
     DefaultOrganizationManagerMixin,
     DefaultOrganizationMixin,
@@ -21,7 +21,7 @@
 logger = logging.getLogger(__name__)
 
 
-class PromptStudioRegistryModelManager(DefaultOrganizationManagerMixin, models.Manager):
+class PromptStudioRegistryModelManager(DefaultOrganizationManagerMixin, BaseModelManager):
     def get_queryset(self) -> QuerySet[Any]:
         return super().get_queryset()
 
diff --git a/backend/tags/models.py b/backend/tags/models.py
index 94c5c8cf54..7f366152b0 100644
--- a/backend/tags/models.py
+++ b/backend/tags/models.py
@@ -1,7 +1,7 @@
 import uuid
 
 from django.db import models
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 from utils.models.organization_mixin import (
     DefaultOrganizationManagerMixin,
     DefaultOrganizationMixin,
@@ -9,7 +9,7 @@
 from utils.user_context import UserContext
 
 
-class TagModelManager(DefaultOrganizationManagerMixin, models.Manager):
+class TagModelManager(DefaultOrganizationManagerMixin, BaseModelManager):
     def get_or_create_tags(self, tag_names: list[str]) -> list["Tag"]:
         """Retrieves or creates tags based on a list of tag names.
 
diff --git a/backend/tool_instance_v2/models.py b/backend/tool_instance_v2/models.py
index 971f1249bf..d858da2323 100644
--- a/backend/tool_instance_v2/models.py
+++ b/backend/tool_instance_v2/models.py
@@ -3,7 +3,7 @@
 from account_v2.models import User
 from django.db import models
 from django.db.models import QuerySet
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 from workflow_manager.workflow_v2.models.workflow import Workflow
 
 TOOL_ID_LENGTH = 64
@@ -11,7 +11,7 @@
 TOOL_STATUS_LENGTH = 32
 
 
-class ToolInstanceManager(models.Manager):
+class ToolInstanceManager(BaseModelManager):
     def get_instances_for_workflow(self, workflow: uuid.UUID) -> QuerySet["ToolInstance"]:
         return self.filter(workflow=workflow)
 
diff --git a/backend/usage_v2/models.py b/backend/usage_v2/models.py
index 8da3d751ba..57ae3d143d 100644
--- a/backend/usage_v2/models.py
+++ b/backend/usage_v2/models.py
@@ -1,7 +1,7 @@
 import uuid
 
 from django.db import models
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 from utils.models.organization_mixin import (
     DefaultOrganizationManagerMixin,
     DefaultOrganizationMixin,
@@ -19,7 +19,7 @@ class LLMUsageReason(models.TextChoices):
     SUMMARIZE = "summarize", "Summarize"
 
 
-class UsageModelManager(DefaultOrganizationManagerMixin, models.Manager):
+class UsageModelManager(DefaultOrganizationManagerMixin, BaseModelManager):
     pass
 
 
diff --git a/backend/utils/models/base_model.py b/backend/utils/models/base_model.py
index b26f0f67d2..c2b288b9ef 100644
--- a/backend/utils/models/base_model.py
+++ b/backend/utils/models/base_model.py
@@ -1,9 +1,122 @@
 from django.db import models
+from django.utils import timezone
+
+_AUTO_NOW_FIELD = "modified_at"
+
+
+def _with_modified_at(fields):
+    """Return a new list containing ``fields`` plus ``modified_at`` if absent.
+
+    Centralises the "inject modified_at into a partial field list" rule so
+    ``bulk_update``, ``bulk_create`` and ``BaseModel.save`` apply it the same
+    way.
+    """
+    fields = list(fields)
+    if _AUTO_NOW_FIELD not in fields:
+        fields.append(_AUTO_NOW_FIELD)
+    return fields
+
+
+class BaseModelQuerySet(models.QuerySet):
+    """QuerySet that mirrors ``auto_now`` semantics for bulk update paths.
+
+    ``modified_at = models.DateTimeField(auto_now=True)`` only fires on
+    ``Model.save()``. ``QuerySet.update()`` and ``QuerySet.bulk_update()``
+    issue raw SQL and bypass ``save()``, leaving ``modified_at`` at whatever
+    value it had before the bulk path ran (creation time for never-saved
+    rows, the previous save() timestamp for others) — silently drifting the
+    audit trail. This QuerySet patches both paths, plus upsert-mode
+    ``bulk_create()``, so callers don't have to remember.
+
+    Callers can still override by passing ``modified_at`` explicitly (or by
+    including ``modified_at`` in the ``fields`` list for ``bulk_update``).
+
+    Note: this is a manager-level convention, not a model-level guarantee.
+    Subclasses that reassign ``objects`` to a plain ``models.Manager``, raw
+    SQL, and migration-time models returned by ``apps.get_model()`` all
+    bypass these overrides.
+    """
+
+    def update(self, **kwargs):
+        kwargs.setdefault(_AUTO_NOW_FIELD, timezone.now())
+        return super().update(**kwargs)
+
+    def bulk_update(self, objs, fields, *args, **kwargs):
+        # Stamp modified_at on each obj only when the caller didn't list it;
+        # materialize objs first because we iterate the sequence twice (once
+        # to stamp, once via super()) and a generator would be exhausted.
+        if _AUTO_NOW_FIELD not in fields:
+            objs = list(objs)
+            now = timezone.now()
+            for obj in objs:
+                obj.modified_at = now
+            fields = _with_modified_at(fields)
+        return super().bulk_update(objs, fields, *args, **kwargs)
+
+    def bulk_create(
+        self, objs, *args, update_conflicts=False, update_fields=None, **kwargs
+    ):
+        # On upsert-on-conflict Django runs an UPDATE with only the listed
+        # fields, which skips auto_now the same way save(update_fields=...)
+        # does. Insert-only bulk_create already handles auto_now itself.
+        if update_conflicts and update_fields:
+            update_fields = _with_modified_at(update_fields)
+        return super().bulk_create(
+            objs,
+            *args,
+            update_conflicts=update_conflicts,
+            update_fields=update_fields,
+            **kwargs,
+        )
+
+
+BaseModelManager = models.Manager.from_queryset(BaseModelQuerySet)
 
 
 class BaseModel(models.Model):
+    """Abstract base with managed ``created_at`` / ``modified_at`` timestamps.
+
+    Subclasses inherit ``BaseModelManager`` as the default manager, which
+    auto-bumps ``modified_at`` on ``QuerySet.update()``, ``bulk_update()``
+    and upsert-mode ``bulk_create()``. The ``save()`` override below does
+    the same for partial ``save(update_fields=[...])`` calls.
+
+    Subclasses that need a custom manager should compose ``BaseModelManager``
+    (e.g. ``class FooManager(MyMixin, BaseModelManager)``) — otherwise the
+    auto-bump on bulk paths is silently lost.
+    """
+
     created_at = models.DateTimeField(auto_now_add=True)
     modified_at = models.DateTimeField(auto_now=True)
 
+    objects = BaseModelManager()
+
     class Meta:
         abstract = True
+
+    def save(
+        self,
+        force_insert=False,
+        force_update=False,
+        using=None,
+        update_fields=None,
+        **kwargs,
+    ):
+        # Django's save(update_fields=...) only writes the listed columns.
+        # auto_now still updates modified_at on the in-memory instance, but
+        # the new value is never persisted unless modified_at is in
+        # update_fields. Auto-include it so partial saves don't silently drop
+        # the bump. Preserve Django's documented no-op semantics for
+        # update_fields=[] (signals-only save, no column writes).
+        #
+        # Signature mirrors Django's positional order so callers passing
+        # force_insert/force_update positionally still hit this override.
+        if update_fields:
+            update_fields = _with_modified_at(update_fields)
+        return super().save(
+            force_insert=force_insert,
+            force_update=force_update,
+            using=using,
+            update_fields=update_fields,
+            **kwargs,
+        )
diff --git a/backend/utils/models/org_aware_manager.py b/backend/utils/models/org_aware_manager.py
index 3ec6e70bd7..ab40303dbb 100644
--- a/backend/utils/models/org_aware_manager.py
+++ b/backend/utils/models/org_aware_manager.py
@@ -3,15 +3,15 @@
 import logging
 
 from django.core.exceptions import ImproperlyConfigured
-from django.db import models
 from django.db.utils import OperationalError, ProgrammingError
+from utils.models.base_model import BaseModelManager
 from utils.models.org_path_discovery import get_org_path
 from utils.user_context import UserContext
 
 logger = logging.getLogger(__name__)
 
 
-class OrgAwareManager(models.Manager):
+class OrgAwareManager(BaseModelManager):
     """Manager that auto-discovers FK path to Organization and applies
     org filtering to all queries in request context.
 
diff --git a/backend/workflow_manager/endpoint_v2/models.py b/backend/workflow_manager/endpoint_v2/models.py
index e07737ba7a..44742dfc36 100644
--- a/backend/workflow_manager/endpoint_v2/models.py
+++ b/backend/workflow_manager/endpoint_v2/models.py
@@ -2,12 +2,12 @@
 
 from connector_v2.models import ConnectorInstance
 from django.db import models
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 from utils.user_context import UserContext
 from workflow_manager.workflow_v2.models.workflow import Workflow
 
 
-class WorkflowEndpointModelManager(models.Manager):
+class WorkflowEndpointModelManager(BaseModelManager):
     def get_queryset(self):
         # Validating organization
         organization = UserContext.get_organization()
diff --git a/backend/workflow_manager/file_execution/models.py b/backend/workflow_manager/file_execution/models.py
index d5106855e0..105b3875a9 100644
--- a/backend/workflow_manager/file_execution/models.py
+++ b/backend/workflow_manager/file_execution/models.py
@@ -4,7 +4,7 @@
 
 from django.db import models
 from utils.common_utils import CommonUtils
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 
 from workflow_manager.endpoint_v2.dto import FileHash
 from workflow_manager.workflow_v2.enums import ExecutionStatus
@@ -15,7 +15,7 @@
 MIME_TYPE_LENGTH = 128
 
 
-class WorkflowFileExecutionManager(models.Manager):
+class WorkflowFileExecutionManager(BaseModelManager):
     def get_or_create_file_execution(
         self,
         workflow_execution: Any,
diff --git a/backend/workflow_manager/internal_views.py b/backend/workflow_manager/internal_views.py
index d11ae56179..c822e5e7b5 100644
--- a/backend/workflow_manager/internal_views.py
+++ b/backend/workflow_manager/internal_views.py
@@ -7,7 +7,6 @@
 
 from django.db import transaction
 from django.shortcuts import get_object_or_404
-from django.utils import timezone
 from rest_framework import status, viewsets
 from rest_framework.decorators import action
 from rest_framework.response import Response
@@ -2009,7 +2008,6 @@ def post(self, request):
                         if update.get("execution_time") is not None:
                             execution.execution_time = update["execution_time"]
 
-                        execution.modified_at = timezone.now()
                         execution.save()
 
                         successful_updates.append(
diff --git a/backend/workflow_manager/workflow_v2/file_history_helper.py b/backend/workflow_manager/workflow_v2/file_history_helper.py
index 12b0a9c2c0..687f88dfe9 100644
--- a/backend/workflow_manager/workflow_v2/file_history_helper.py
+++ b/backend/workflow_manager/workflow_v2/file_history_helper.py
@@ -288,7 +288,6 @@ def _increment_file_history(
             result=str(result),
             metadata=FileHistoryHelper._safe_str(metadata),
             error=FileHistoryHelper._safe_str(error),
-            modified_at=timezone.now(),
         )
         # Refresh from DB to get updated values
         file_history.refresh_from_db()
diff --git a/backend/workflow_manager/workflow_v2/models/execution.py b/backend/workflow_manager/workflow_v2/models/execution.py
index 93623118d7..45886bd64e 100644
--- a/backend/workflow_manager/workflow_v2/models/execution.py
+++ b/backend/workflow_manager/workflow_v2/models/execution.py
@@ -12,7 +12,7 @@
 from usage_v2.helper import UsageHelper
 from usage_v2.models import Usage
 from utils.common_utils import CommonUtils
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 
 from workflow_manager.execution.dto import ExecutionCache
 from workflow_manager.execution.execution_cache_utils import ExecutionCacheUtils
@@ -26,7 +26,7 @@
 EXECUTION_ERROR_LENGTH = 256
 
 
-class WorkflowExecutionManager(models.Manager):
+class WorkflowExecutionManager(BaseModelManager):
     """Custom manager for WorkflowExecution model to handle user-specific filtering."""
 
     def for_user(self, user) -> QuerySet:
diff --git a/backend/workflow_manager/workflow_v2/models/workflow.py b/backend/workflow_manager/workflow_v2/models/workflow.py
index dd945fc7f9..0029f95997 100644
--- a/backend/workflow_manager/workflow_v2/models/workflow.py
+++ b/backend/workflow_manager/workflow_v2/models/workflow.py
@@ -4,7 +4,7 @@
 from django.conf import settings
 from django.core.validators import MinValueValidator
 from django.db import models
-from utils.models.base_model import BaseModel
+from utils.models.base_model import BaseModel, BaseModelManager
 from utils.models.organization_mixin import (
     DefaultOrganizationManagerMixin,
     DefaultOrganizationMixin,
@@ -15,7 +15,7 @@
 WORKFLOW_NAME_SIZE = 128
 
 
-class WorkflowModelManager(DefaultOrganizationManagerMixin, models.Manager):
+class WorkflowModelManager(DefaultOrganizationManagerMixin, BaseModelManager):
     def for_user(self, user):
         """Filter workflows that the user can access:
         - Workflows created by the user
diff --git a/backend/workflow_manager/workflow_v2/views.py b/backend/workflow_manager/workflow_v2/views.py
index dc428d948a..629b52bb22 100644
--- a/backend/workflow_manager/workflow_v2/views.py
+++ b/backend/workflow_manager/workflow_v2/views.py
@@ -6,7 +6,6 @@
 from django.db import transaction
 from django.db.models.query import QuerySet
 from django.shortcuts import get_object_or_404
-from django.utils import timezone
 from django.views.decorators.csrf import csrf_exempt
 from permissions.permission import IsOwner, IsOwnerOrSharedUserOrSharedToOrg
 from pipeline_v2.models import Pipeline
@@ -528,7 +527,6 @@ def status(self, request, id=None):
                 if validated_data.get("execution_time") is not None:
                     execution.execution_time = validated_data["execution_time"]
 
-                execution.modified_at = timezone.now()
                 execution.save()
 
                 logger.info(

From fd532bec8c1b5479fffc89494115308d09c09594 Mon Sep 17 00:00:00 2001
From: harini-venkataraman
 <115449948+harini-venkataraman@users.noreply.github.com>
Date: Tue, 28 Apr 2026 10:58:43 +0530
Subject: [PATCH 04/27] UN-3403 [FEAT] Agentic table extractor plugin with
 multi-agent LLM-powered table extraction (#1914)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* Execution backend - revamp

* async flow

* Streaming progress to FE

* Removing multi hop in Prompt studio ide and structure tool

* UN-3234 [FIX] Add beta tag to agentic prompt studio navigation item

* Added executors for agentic prompt studio

* Added executors for agentic prompt studio

* Removed redundant envs

* Removed redundant envs

* Removed redundant envs

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* Removed redundant envs

* Removed redundant envs

* Removed redundant envs

* Removed redundant envs

* Removed redundant envs

* Removed redundant envs

* Removed redundant envs

* Removed redundant envs

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* Removed redundant envs

* adding worker for callbacks

* adding worker for callbacks

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* adding worker for callbacks

* adding worker for callbacks

* adding worker for callbacks

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* Pluggable apps and plugins to fit the new async prompt execution architecture

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* Pluggable apps and plugins to fit the new async prompt execution architecture

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* Pluggable apps and plugins to fit the new async prompt execution architecture

* adding worker for callbacks

* adding worker for callbacks

* adding worker for callbacks

* adding worker for callbacks

* adding worker for callbacks

* adding worker for callbacks

* adding worker for callbacks

* adding worker for callbacks

* fix: write output files in agentic extraction pipeline

Agentic extraction returned early without writing INFILE (JSON) or
METADATA.json, causing destination connectors to read the original PDF
and fail with "Expected tool output type: TXT, got: application/pdf".

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* UN-3266 fix: replace hardcoded /tmp paths with secure temp dirs in tests (#1850)

* UN-3266 fix: replace hardcoded /tmp paths with secure temp dirs in tests

Replace hardcoded /tmp/ paths (SonarCloud S5443 security hotspots) with
pytest's tmp_path fixture or module-level tempfile.mkdtemp() constants
in all affected test files to avoid world-writable directory vulnerabilities.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

---------

Co-authored-by: Claude Sonnet 4.6 <noreply@anthropic.com>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* Update docs

* UN-3266 fix: remove dead code with undefined names in fetch_response

Remove unreachable code block after the async callback return in
fetch_response that still referenced output_count_before and response
from the old synchronous implementation, causing ruff F821 errors.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* Un 3266 fix security hotspot tmp paths (#1851)

* UN-3266 fix: replace hardcoded /tmp paths with secure temp dirs in tests

Replace hardcoded /tmp/ paths (SonarCloud S5443 security hotspots) with
pytest's tmp_path fixture or module-level tempfile.mkdtemp() constants
in all affected test files to avoid world-writable directory vulnerabilities.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* UN-3266 fix: resolve ruff linting failures across multiple files

- B026: pass url positionally in worker_celery.py to avoid star-arg after keyword
- N803: rename MockAsyncResult to mock_async_result in test_tasks.py
- E501/I001: fix long line and import sort in llm_whisperer helper
- ANN401: replace Any with object|None in dispatcher.py; add noqa in test helpers
- F841: remove unused workflow_id and result assignments

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

---------

Co-authored-by: Claude Sonnet 4.6 <noreply@anthropic.com>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>

* UN-3266 fix: resolve SonarCloud bugs S2259 and S1244 in PR #1849

- S2259: guard against None after _discover_plugins() in loader.py
  to satisfy static analysis on the dict[str,type]|None field type
- S1244: replace float equality checks with pytest.approx() in
  test_answer_prompt.py and test_phase2h.py

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* UN-3266 fix: resolve SonarCloud code smells in PR #1849

- S5799: Merge all implicit string concatenations in log messages
  (legacy_executor.py, tasks.py, dispatcher.py, orchestrator.py,
   registry.py, variable_replacement.py, structure_tool_task.py)
- S1192: Extract duplicate literal to _NO_CELERY_APP_MSG constant in
  dispatcher.py
- S1871: Merge identical elif/else branches in tasks.py and
  test_sanity_phase6j.py
- S1186: Add comment to empty stub method in test_sanity_phase6a.py
- S1481: Remove unused local variables in test_sanity_phase6d/e/f/g/h/j
  and test_phase5d.py
- S117: Rename PascalCase local variables to snake_case in
  test_sanity_phase3/5/6i.py
- S5655: Broaden tool type annotation to StreamMixin in
  IndexingUtils.generate_index_key and PlatformHelper.get_adapter_config
- docker:S7031: Merge consecutive RUN instructions in
  worker-unified.Dockerfile
- javascript:S1128: Remove unused pollForCompletion import in
  usePromptRun.js

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* UN-3266 fix: wrap long log message in dispatcher.py to fix E501

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* UN-3266 fix: resolve remaining SonarCloud S117 naming violations

Rename PascalCase local variables to snake_case to comply with S117:

- legacy_executor.py: rename tuple-unpacked _get_prompt_deps() results
  (AnswerPromptService→answer_prompt_svc, RetrievalService→retrieval_svc,
  VariableReplacementService→variable_replacement_svc, LLM→llm_cls,
  EmbeddingCompat→embedding_compat_cls, VectorDB→vector_db_cls) and
  update all downstream usages including _apply_type_conversion and
  _handle_summarize
- test_phase1_log_streaming.py: rename Mock* local variables to
  mock_* snake_case equivalents
- test_sanity_phase3.py: rename MockDispatcher→mock_dispatcher_cls
  and MockShim→mock_shim_cls across all 10 test methods
- test_sanity_phase5.py: rename MockShim→mock_shim, MockX2Text→mock_x2text
  in 6 test methods; MockDispatcher→mock_dispatcher_cls in dispatch test;
  fix LLM_cls→llm_cls, EmbeddingCompat→embedding_compat_cls,
  VectorDB→vector_db_cls in _mock_prompt_deps helper

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* UN-3266 fix: resolve remaining SonarCloud code smells in PR #1849

- test_sanity_phase2/4.py, test_answer_prompt.py: rename PascalCase
  local variables in _mock_prompt_deps/_mock_deps to snake_case
  (RetrievalService→retrieval_svc, VariableReplacementService→
  variable_replacement_svc, Index→index_cls, LLM_cls→llm_cls,
  EmbeddingCompat→embedding_compat_cls, VectorDB→vector_db_cls,
  AnswerPromptService→answer_prompt_svc_cls) — fixes S117
- test_sanity_phase3.py: remove unused local variable "result" — fixes S1481
- structure_tool_task.py: remove redundant json.JSONDecodeError from
  except clause (subclass of ValueError) — fixes S5713
- shared/workflow/execution/service.py: replace generic Exception with
  RuntimeError for structure tool failure — fixes S112
- run-worker-docker.sh: define EXECUTOR_WORKER_TYPE constant and
  replace 10 literal "executor" occurrences — fixes S1192

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* UN-3266 fix: resolve SonarCloud cognitive complexity and code smell violations

- Reduce cognitive complexity in answer_prompt.py:
  - Extract _build_grammar_notes, _run_webhook_postprocess helpers
  - _is_safe_public_url: extracted _resolve_host_addresses helper
  - handle_json: early-return pattern eliminates nesting
  - construct_prompt: delegates grammar loop to _build_grammar_notes
- Reduce cognitive complexity in legacy_executor.py:
  - Extract _execute_single_prompt, _run_table_extraction helpers
  - Extract _run_challenge_if_enabled, _run_evaluation_if_enabled
  - Extract _inject_table_settings, _finalize_pipeline_result
  - Extract _convert_number_answer, _convert_scalar_answer
  - Extract _sanitize_dict_values helper
  - _handle_answer_prompt CC reduced from 50 to ~7
- Reduce CC in structure_tool_task.py: guard-clause refactor
- Reduce CC in backend: dto.py, deployment_helper.py,
  api_deployment_views.py, prompt_studio_helper.py
- Fix S117: rename PascalCase local vars in test_answer_prompt.py
- Fix S1192: extract EXECUTOR_WORKER_TYPE constant in run-worker.sh
- Fix S1172: remove unused params from structure_tool_task.py
- Fix S5713: remove redundant JSONDecodeError in json_repair_helper.py
- Fix S112/S5727 in test_execution.py

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* UN-3266 fix: remove unused RetrievalStrategy import from _handle_answer_prompt

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* UN-3266 fix: rename UsageHelper params to lowercase (N803)

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* UN-3266 fix: resolve remaining SonarCloud issues from check run 66691002192

- Add @staticmethod to _sanitize_null_values (fixes S2325 missing self)
- Reduce _execute_single_prompt params from 25 to 11 (S107)
  by grouping services as deps tuple and extracting exec params
  from context.executor_params
- Add NOSONAR suppression for raise exc in test helper (S112)

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* UN-3266 fix: remove unused locals in _handle_answer_prompt (F841)

execution_id, file_hash, log_events_id, custom_data are now extracted
inside _execute_single_prompt from context.executor_params.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

* fix: resolve Biome linting errors in frontend source files

Auto-fixed 48 lint errors across 56 files: import ordering, block
statements, unused variable prefixing, and formatting issues.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* fix: replace dynamic import of SharePermission with static import in Workflows

Resolves vite build warning about SharePermission.jsx being both
dynamically and statically imported across the codebase.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* fix: resolve SonarCloud warnings in frontend components

- Remove unnecessary try-catch around PostHog event calls
- Flip negated condition in PromptOutput.handleTable for clarity

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* Address PR #1849 review comments: fix null guards, dead code, and test drift

- Remove redundant inline `import uuid as _uuid` in views.py (use module-level uuid)
- URL-encode DB_USER in worker_celery.py result backend connection string
- Remove misleading task_queues=[Queue("executor")] from dispatch-only Celery app
- Remove dead `if not tool:` guards after objects.get() (already raises DoesNotExist)
- Move profile_manager/default_profile null checks before first dereference
- Reorder ProfileManager.objects.get before mark_document_indexed in tasks.py
- Handle ProfileManager.DoesNotExist as warning, not hard failure
- Wrap PostHog analytics in try/catch so failures don't block prompt execution
- Handle pending-indexing 200 response in usePromptRun.js (clear RUNNING status)
- Reset formData when metadata is missing in ConfigureDs.jsx
- Fix test_should_skip_extraction tests: function now takes 1 arg (outputs only)
- Fix agentic routing tests: mock X2Text.process, remove stale platform_helper kwarg

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* Fix missing llm_usage_reason for summarize LLM usage tracking

Add PSKeys.LLM_USAGE_REASON to usage_kwargs in _handle_summarize() so
summarization costs appear under summarize_llm in API response metadata.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* UN-3266 [FIX] Fix single-pass extraction routing in LegacyExecutor

- Route _handle_structure_pipeline to _handle_single_pass_extraction when
  is_single_pass=True (was always calling _handle_answer_prompt)
- Delegate _handle_single_pass_extraction to cloud plugin via ExecutorRegistry,
  falling back to _handle_answer_prompt if plugin not installed

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* Fixing API deployment response mismatches

* Add complete_vision() method to SDK1 LLM for multimodal completions

Adds a new complete_vision() method alongside existing complete() that
accepts pre-built multimodal messages (text + image_url) in OpenAI-style
format. LiteLLM auto-translates for Anthropic/Bedrock/Vertex providers.
This enables the agentic table extractor plugin to send page images
alongside text prompts for VLM-based table detection and extraction.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* UN-3266 [FIX] Gate Run button by agentic table readiness checklist

- PromptCardItems loads AgenticTableChecklist plugin and owns the
  isAgenticTableReady state, rendering the checklist above the prompt
  text area and delegating the settings gear visibility to the plugin.
- Header and PromptOutput disable their Run buttons when
  isAgenticTableReady is false (default true for non-agentic types).

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* [FIX] Use correct primary key field in prompt count subquery (#1905)

ToolStudioPrompt uses prompt_id as its primary key, not id.
Count("id") causes FieldError on the list endpoint (500).

Co-authored-by: Chandrasekharan M <chandrasekharan@zipstack.com>
Co-authored-by: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* [FIX] Add agentic_table as valid enforce_type choice

The cloud build adds "agentic_table" to the prompt enforce_type
dropdown, but the OSS ToolStudioPrompt model rejected it as an
invalid choice. Add AGENTIC_TABLE to EnforceType and ship a
matching migration so the value can be persisted.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* UN-3266 [FIX] Wire agentic_table enforce_type to executor dispatch

The single-prompt run flow had no branch for prompts with
enforce_type=agentic_table, so clicking Run silently fell through to
the legacy prompt-service path and never invoked the agentic_table
executor. Adds an AGENTIC_TABLE constant to TSPKeys, includes it in
the OperationNotSupported guard, and dispatches to
PayloadModifier.execute_agentic_table when the plugin is available
so the result still flows through _handle_response.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* UN-3266 [FIX] Add agentic_table queue to executor worker defaults

The ExecutionDispatcher derives the queue name from the executor name
(celery_executor_{name}), so dispatches to the agentic_table executor
land on celery_executor_agentic_table. The local docker-compose default
only listed celery_executor_legacy and celery_executor_agentic, so no
worker consumed the new queue and dispatch hung for the full 1-hour
result timeout. Adds the missing queue to the docker-compose default.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* UN-3266 [FIX] Dispatch agentic_table prompts to executor on IDE Run

The IDE Run button was building a legacy answer_prompt payload for
agentic_table prompts, so the agentic table executor was never
invoked. Branch fetch_response on enforce_type so agentic_table
prompts are built via the cloud payload_modifier plugin and
dispatched directly to celery_executor_agentic_table. Add the
enforce_type to the OSS dropdown choices and the JSON-dump set in
OutputManagerHelper so the persisted output is parseable by the FE
table renderer.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* UN-3266 [FIX] Reshape agentic_table executor output in IDE callback

The agentic_table executor returns {"output": {"tables": [...],
"page_count": ..., "headers": [...], ...}}, but
OutputManagerHelper.handle_prompt_output_update reads
outputs[prompt.prompt_key] when persisting prompt output. Without a
reshape the table list never lands under the prompt key and the FE
sees an empty result.

When cb_kwargs carries is_agentic_table=True and prompt_key (set by
the cloud build_agentic_table_payload), reshape outputs to
{prompt_key: tables} before calling update_prompt_output. The
executor itself also shapes its envelope, so this is a defensive
double-keying that keeps the legacy answer_prompt path untouched.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* Fixing timeout issues

* API deployment fixes for Agentic table extractor

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

* Fixing syntax issues

* Fix agentic_table executor reading INFILE after JSON overwrite

Read from SOURCE instead of INFILE when dispatching to the
agentic_table executor. INFILE gets overwritten with JSON output
by the regular pipeline, causing PDFium parse errors when the
agentic_table executor tries to process it as a PDF.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

---------

Signed-off-by: harini-venkataraman <115449948+harini-venkataraman@users.noreply.github.com>
Co-authored-by: Ghost Jake <89829542+Deepak-Kesavan@users.noreply.github.com>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Co-authored-by: Claude Sonnet 4.6 <noreply@anthropic.com>
Co-authored-by: Ritwik G <100672805+ritwik-g@users.noreply.github.com>
Co-authored-by: Chandrasekharan M <chandrasekharan@zipstack.com>
---
 .../prompt_studio_core_v2/constants.py        |   1 +
 .../prompt_studio_helper.py                   |  40 +++--
 .../static/select_choices.json                |   1 +
 .../prompt_studio_core_v2/views.py            |  59 ++++++-
 .../output_manager_helper.py                  |   8 +-
 .../prompt_studio_registry_v2/constants.py    |   1 +
 .../prompt_studio_registry_helper.py          |   9 +
 ...014_alter_toolstudioprompt_enforce_type.py |  41 +++++
 .../prompt_studio/prompt_studio_v2/models.py  |   1 +
 docker/docker-compose.yaml                    |   2 +-
 .../custom-tools/prompt-card/Header.jsx       |   4 +
 .../prompt-card/PromptCardItems.jsx           |  24 ++-
 .../custom-tools/prompt-card/PromptOutput.jsx |  14 +-
 frontend/src/hooks/usePromptRun.js            |   6 +-
 unstract/sdk1/src/unstract/sdk1/llm.py        |  90 ++++++++++
 workers/executor/executors/legacy_executor.py |  37 ++--
 .../executor/executors/retrievers/fusion.py   |   2 +-
 .../executors/retrievers/keyword_table.py     |   2 +-
 .../file_processing/structure_tool_task.py    | 161 ++++++++++++++----
 workers/ide_callback/tasks.py                 |  10 ++
 workers/tests/test_answer_prompt.py           |  16 +-
 21 files changed, 451 insertions(+), 78 deletions(-)
 create mode 100644 backend/prompt_studio/prompt_studio_v2/migrations/0014_alter_toolstudioprompt_enforce_type.py

diff --git a/backend/prompt_studio/prompt_studio_core_v2/constants.py b/backend/prompt_studio/prompt_studio_core_v2/constants.py
index c1ab14d380..03bd68c1d8 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/constants.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/constants.py
@@ -92,6 +92,7 @@ class ToolStudioPromptKeys:
     INCLUDE_METADATA = "include_metadata"
     TXT_EXTENTION = ".txt"
     TABLE = "table"
+    AGENTIC_TABLE = "agentic_table"
     PLATFORM_POSTAMBLE = "platform_postamble"
     WORD_CONFIDENCE_POSTAMBLE = "word_confidence_postamble"
     SUMMARIZE_AS_SOURCE = "summarize_as_source"
diff --git a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
index d0ffef3114..ff2b345505 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
@@ -1540,6 +1540,7 @@ def _execute_single_prompt(
         if (
             prompt_instance.enforce_type == TSPKeys.TABLE
             or prompt_instance.enforce_type == TSPKeys.RECORD
+            or prompt_instance.enforce_type == TSPKeys.AGENTIC_TABLE
         ) and not payload_modifier_plugin:
             raise OperationNotSupported()
 
@@ -1570,17 +1571,34 @@ def _execute_single_prompt(
             "Invoking prompt service",
         )
         try:
-            response = PromptStudioHelper._fetch_response(
-                doc_path=doc_path,
-                doc_name=doc_name,
-                tool=tool,
-                prompt=prompt_instance,
-                org_id=org_id,
-                document_id=document_id,
-                run_id=run_id,
-                profile_manager_id=profile_manager_id,
-                user_id=user_id,
-            )
+            if (
+                prompt_instance.enforce_type == TSPKeys.AGENTIC_TABLE
+                and payload_modifier_plugin
+            ):
+                modifier_service = payload_modifier_plugin["service_class"]()
+                response = modifier_service.execute_agentic_table(
+                    tool_id=tool_id,
+                    prompt_id=str(prompt_instance.prompt_id),
+                    prompt_key=prompt_name,
+                    prompt=prompt_instance.prompt,
+                    doc_path=doc_path,
+                    doc_name=doc_name,
+                    org_id=org_id,
+                    user_id=user_id,
+                    run_id=run_id,
+                )
+            else:
+                response = PromptStudioHelper._fetch_response(
+                    doc_path=doc_path,
+                    doc_name=doc_name,
+                    tool=tool,
+                    prompt=prompt_instance,
+                    org_id=org_id,
+                    document_id=document_id,
+                    run_id=run_id,
+                    profile_manager_id=profile_manager_id,
+                    user_id=user_id,
+                )
             return PromptStudioHelper._handle_response(
                 response=response,
                 run_id=run_id,
diff --git a/backend/prompt_studio/prompt_studio_core_v2/static/select_choices.json b/backend/prompt_studio/prompt_studio_core_v2/static/select_choices.json
index 3d59b2bf08..ee4c218ca2 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/static/select_choices.json
+++ b/backend/prompt_studio/prompt_studio_core_v2/static/select_choices.json
@@ -15,6 +15,7 @@
         "boolean":"boolean",
         "json":"json",
         "table":"table",
+        "agentic_table":"agentic_table",
         "line-item":"line-item"
     },
     "output_processing":{
diff --git a/backend/prompt_studio/prompt_studio_core_v2/views.py b/backend/prompt_studio/prompt_studio_core_v2/views.py
index 22c1a378bb..99edefd0b4 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/views.py
@@ -50,6 +50,7 @@
 from prompt_studio.prompt_studio_core_v2.exceptions import (
     DeploymentUsageCheckError,
     MaxProfilesReachedError,
+    OperationNotSupported,
     ToolDeleteError,
 )
 from prompt_studio.prompt_studio_core_v2.migration_utils import SummarizeMigrationUtils
@@ -509,6 +510,61 @@ def fetch_response(self, request: HttpRequest, pk: Any = None) -> Response:
         document: DocumentManager = DocumentManager.objects.get(pk=document_id)
         doc_path = str(Path(doc_path) / document.document_name)
 
+        # Agentic table prompts have a separate executor worker. Build the
+        # payload via the cloud payload_modifier plugin and dispatch directly
+        # so the legacy answer_prompt path is bypassed.
+        if prompt.enforce_type == ToolStudioPromptKeys.AGENTIC_TABLE:
+            payload_modifier_plugin = get_plugin("payload_modifier")
+            if not payload_modifier_plugin:
+                raise OperationNotSupported()
+            modifier = payload_modifier_plugin["service_class"]()
+            context, cb_kwargs = modifier.build_agentic_table_payload(
+                tool=custom_tool,
+                prompt=prompt,
+                doc_path=doc_path,
+                doc_name=document.document_name,
+                org_id=org_id,
+                user_id=user_id,
+                document_id=document_id,
+                run_id=run_id,
+                profile_manager_id=profile_manager_id,
+            )
+
+            from prompt_studio.prompt_studio_output_manager_v2.models import (
+                PromptStudioOutputManager,
+            )
+
+            cb_kwargs["hubspot_user_id"] = request.user.pk
+            cb_kwargs[
+                "is_first_prompt_run"
+            ] = not PromptStudioOutputManager.objects.filter(
+                tool_id__in=CustomTool.objects.values_list("tool_id", flat=True)
+            ).exists()
+
+            dispatcher = PromptStudioHelper._get_dispatcher()
+            executor_task_id = str(uuid.uuid4())
+            cb_kwargs["executor_task_id"] = executor_task_id
+            cb_kwargs["dispatch_time"] = time.time()
+
+            task = dispatcher.dispatch_with_callback(
+                context,
+                on_success=signature(
+                    "ide_prompt_complete",
+                    kwargs={"callback_kwargs": cb_kwargs},
+                    queue="ide_callback",
+                ),
+                on_error=signature(
+                    "ide_prompt_error",
+                    kwargs={"callback_kwargs": cb_kwargs},
+                    queue="ide_callback",
+                ),
+                task_id=executor_task_id,
+            )
+            return Response(
+                {"task_id": task.id, "run_id": run_id, "status": "accepted"},
+                status=status.HTTP_202_ACCEPTED,
+            )
+
         context, cb_kwargs = PromptStudioHelper.build_fetch_response_payload(
             tool=custom_tool,
             doc_path=doc_path,
@@ -705,7 +761,7 @@ def single_pass_extraction(self, request: HttpRequest, pk: uuid) -> Response:
 
         # Fetch prompts eligible for single-pass extraction.
         # Mirrors the filtering in _execute_prompts_in_single_pass:
-        # only active, non-NOTES, non-TABLE/RECORD prompts.
+        # only active, non-NOTES, non-TABLE/RECORD/AGENTIC_TABLE prompts.
         prompts = list(
             ToolStudioPrompt.objects.filter(tool_id=custom_tool.tool_id).order_by(
                 "sequence_number"
@@ -718,6 +774,7 @@ def single_pass_extraction(self, request: HttpRequest, pk: uuid) -> Response:
             and p.active
             and p.enforce_type != ToolStudioPromptKeys.TABLE
             and p.enforce_type != ToolStudioPromptKeys.RECORD
+            and p.enforce_type != ToolStudioPromptKeys.AGENTIC_TABLE
         ]
         if not prompts:
             return Response(
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
index 405b91e00f..64932eb3f9 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
@@ -170,7 +170,13 @@ def update_or_create_prompt_output(
 
             # TODO: use enums here
             output = outputs.get(prompt.prompt_key)
-            if prompt.enforce_type in {"json", "table", "record", "line-item"}:
+            if prompt.enforce_type in {
+                "json",
+                "table",
+                "record",
+                "line-item",
+                "agentic_table",
+            }:
                 output = json.dumps(output)
             eval_metrics = outputs.get(f"{prompt.prompt_key}__evaluation", [])
             profile_manager = default_profile
diff --git a/backend/prompt_studio/prompt_studio_registry_v2/constants.py b/backend/prompt_studio/prompt_studio_registry_v2/constants.py
index 785e77484c..35d6654851 100644
--- a/backend/prompt_studio/prompt_studio_registry_v2/constants.py
+++ b/backend/prompt_studio/prompt_studio_registry_v2/constants.py
@@ -12,6 +12,7 @@ class PromptStudioRegistryKeys:
     TABLE = "table"
     RECORD = "record"
     LINE_ITEM = "line-item"
+    AGENTIC_TABLE = "agentic_table"
 
 
 class PromptStudioRegistryErrors:
diff --git a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
index 6ce1f72095..08d2c27baa 100644
--- a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
+++ b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
@@ -371,6 +371,15 @@ def frame_export_json(
                         prompt_id=prompt.prompt_id,
                         prompt=prompt.prompt,
                     )
+            elif prompt.enforce_type == PromptStudioRegistryKeys.AGENTIC_TABLE:
+                payload_modifier_plugin = get_plugin("payload_modifier")
+                if payload_modifier_plugin:
+                    modifier_service = payload_modifier_plugin["service_class"]()
+                    output = modifier_service.export_agentic_table_settings(
+                        output=output,
+                        tool_id=tool.tool_id,
+                        prompt_id=prompt.prompt_id,
+                    )
 
             outputs.append(output)
             output = {}
diff --git a/backend/prompt_studio/prompt_studio_v2/migrations/0014_alter_toolstudioprompt_enforce_type.py b/backend/prompt_studio/prompt_studio_v2/migrations/0014_alter_toolstudioprompt_enforce_type.py
new file mode 100644
index 0000000000..beae260ce2
--- /dev/null
+++ b/backend/prompt_studio/prompt_studio_v2/migrations/0014_alter_toolstudioprompt_enforce_type.py
@@ -0,0 +1,41 @@
+# Generated for agentic table enforce type
+
+from django.db import migrations, models
+
+
+class Migration(migrations.Migration):
+    dependencies = [
+        (
+            "prompt_studio_v2",
+            "0013_toolstudioprompt_enable_postprocessing_webhook_and_more",
+        ),
+    ]
+
+    operations = [
+        migrations.AlterField(
+            model_name="toolstudioprompt",
+            name="enforce_type",
+            field=models.TextField(
+                blank=True,
+                choices=[
+                    ("text", "Response sent as Text"),
+                    ("number", "Response sent as number"),
+                    ("email", "Response sent as email"),
+                    ("date", "Response sent as date"),
+                    ("boolean", "Response sent as boolean"),
+                    ("json", "Response sent as json"),
+                    (
+                        "line-item",
+                        "Response sent as line-item which is large a JSON output. If extraction stopped due to token limitation, we try to continue extraction from where it stopped",
+                    ),
+                    ("table", "Response sent as json"),
+                    (
+                        "agentic_table",
+                        "Response sent as agentic table extraction",
+                    ),
+                ],
+                db_comment="Field to store the type in             which the response to be returned.",
+                default="text",
+            ),
+        ),
+    ]
diff --git a/backend/prompt_studio/prompt_studio_v2/models.py b/backend/prompt_studio/prompt_studio_v2/models.py
index 74739bfe5a..b4c64f0912 100644
--- a/backend/prompt_studio/prompt_studio_v2/models.py
+++ b/backend/prompt_studio/prompt_studio_v2/models.py
@@ -31,6 +31,7 @@ class EnforceType(models.TextChoices):
             ),
         )
         TABLE = "table", "Response sent as json"
+        AGENTIC_TABLE = "agentic_table", "Response sent as agentic table extraction"
 
     class PromptType(models.TextChoices):
         PROMPT = "PROMPT", "Response sent as Text"
diff --git a/docker/docker-compose.yaml b/docker/docker-compose.yaml
index 4dd8c38667..bb40b324ef 100644
--- a/docker/docker-compose.yaml
+++ b/docker/docker-compose.yaml
@@ -529,7 +529,7 @@ services:
       - EXECUTOR_METRICS_PORT=8088
       - HEALTH_PORT=8088
       # Configurable Celery options
-      - CELERY_QUEUES_EXECUTOR=${CELERY_QUEUES_EXECUTOR:-celery_executor_legacy,celery_executor_agentic}
+      - CELERY_QUEUES_EXECUTOR=${CELERY_QUEUES_EXECUTOR:-celery_executor_legacy,celery_executor_agentic,celery_executor_agentic_table}
       - CELERY_POOL=${WORKER_EXECUTOR_POOL:-prefork}
       - CELERY_PREFETCH_MULTIPLIER=${WORKER_EXECUTOR_PREFETCH_MULTIPLIER:-1}
       - CELERY_CONCURRENCY=${WORKER_EXECUTOR_CONCURRENCY:-2}
diff --git a/frontend/src/components/custom-tools/prompt-card/Header.jsx b/frontend/src/components/custom-tools/prompt-card/Header.jsx
index 2b6d6b99c1..cea5e2d6d3 100644
--- a/frontend/src/components/custom-tools/prompt-card/Header.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/Header.jsx
@@ -59,6 +59,7 @@ function Header({
   spsLoading,
   handleSpsLoading,
   enforceType,
+  isAgenticTableReady = true,
 }) {
   const {
     selectedDoc,
@@ -357,6 +358,7 @@ function Header({
                   )
                 }
                 disabled={
+                  !isAgenticTableReady ||
                   (updateStatus?.promptId === promptDetails?.prompt_id &&
                     updateStatus?.status ===
                       promptStudioUpdateStatus?.isUpdating) ||
@@ -380,6 +382,7 @@ function Header({
                   )
                 }
                 disabled={
+                  !isAgenticTableReady ||
                   (updateStatus?.promptId === promptDetails?.prompt_id &&
                     updateStatus?.status ===
                       promptStudioUpdateStatus?.isUpdating) ||
@@ -436,6 +439,7 @@ Header.propTypes = {
   spsLoading: PropTypes.object,
   handleSpsLoading: PropTypes.func.isRequired,
   enforceType: PropTypes.string,
+  isAgenticTableReady: PropTypes.bool,
 };
 
 export { Header };
diff --git a/frontend/src/components/custom-tools/prompt-card/PromptCardItems.jsx b/frontend/src/components/custom-tools/prompt-card/PromptCardItems.jsx
index 90f4936a3a..6fd8b1bc6f 100644
--- a/frontend/src/components/custom-tools/prompt-card/PromptCardItems.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/PromptCardItems.jsx
@@ -15,7 +15,6 @@ import { useEffect, useRef, useState } from "react";
 import { useCustomToolStore } from "../../../store/custom-tool-store";
 import { SpinnerLoader } from "../../widgets/spinner-loader/SpinnerLoader";
 import { EditableText } from "../editable-text/EditableText";
-import { TABLE } from "./constants";
 import { Header } from "./Header";
 import { OutputForIndex } from "./OutputForIndex";
 import { PromptOutput } from "./PromptOutput";
@@ -30,6 +29,16 @@ try {
   // The component will remain null of it is not available
 }
 
+let AgenticTableChecklist;
+try {
+  const mod = await import(
+    "../../../plugins/prompt-card/AgenticTableChecklist"
+  );
+  AgenticTableChecklist = mod.AgenticTableChecklist;
+} catch {
+  // The component will remain undefined if it is not available
+}
+
 function PromptCardItems({
   promptDetails,
   enforceTypeList,
@@ -82,6 +91,7 @@ function PromptCardItems({
   const divRef = useRef(null);
   const [enforceType, setEnforceType] = useState("");
   const [tableSettings, setTableSettings] = useState({});
+  const [isAgenticTableReady, setIsAgenticTableReady] = useState(true);
   const promptId = promptDetails?.prompt_id;
 
   useEffect(() => {
@@ -212,6 +222,7 @@ function PromptCardItems({
             spsLoading={spsLoading}
             handleSpsLoading={handleSpsLoading}
             enforceType={enforceType}
+            isAgenticTableReady={isAgenticTableReady}
           />
         </Space>
       </div>
@@ -222,6 +233,14 @@ function PromptCardItems({
       >
         <Collapse.Panel key={"1"} showArrow={false}>
           <div className="prompt-card-div-body">
+            {AgenticTableChecklist && (
+              <AgenticTableChecklist
+                promptId={promptDetails?.prompt_id}
+                promptText={promptText}
+                enforceType={enforceType}
+                onReadinessChange={setIsAgenticTableReady}
+              />
+            )}
             <EditableText
               isEditing={isEditingPrompt}
               setIsEditing={setIsEditingPrompt}
@@ -278,7 +297,7 @@ function PromptCardItems({
                         )}
                     </Space>
                     <Space>
-                      {enforceType === TABLE && TableExtractionSettingsBtn && (
+                      {TableExtractionSettingsBtn && (
                         <TableExtractionSettingsBtn
                           promptId={promptDetails?.prompt_id}
                           enforceType={enforceType}
@@ -324,6 +343,7 @@ function PromptCardItems({
               isChallenge={isChallenge}
               handleSelectHighlight={handleSelectHighlight}
               progressMsg={progressMsg}
+              isAgenticTableReady={isAgenticTableReady}
             />
           </Row>
         </Collapse.Panel>
diff --git a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
index 88df329744..38f7d924a6 100644
--- a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
@@ -67,6 +67,7 @@ function PromptOutput({
   isChallenge,
   handleSelectHighlight,
   progressMsg,
+  isAgenticTableReady = true,
 }) {
   const [openExpandModal, setOpenExpandModal] = useState(false);
   const { width: windowWidth } = useWindowDimensions();
@@ -386,7 +387,11 @@ function PromptOutput({
                             selectedDoc?.document_id,
                           )
                         }
-                        disabled={isPromptLoading || isPublicSource}
+                        disabled={
+                          !isAgenticTableReady ||
+                          isPromptLoading ||
+                          isPublicSource
+                        }
                       >
                         <PlayCircleOutlined className="prompt-card-actions-head" />
                       </Button>
@@ -404,7 +409,11 @@ function PromptOutput({
                             null,
                           )
                         }
-                        disabled={isPromptLoading || isPublicSource}
+                        disabled={
+                          !isAgenticTableReady ||
+                          isPromptLoading ||
+                          isPublicSource
+                        }
                       >
                         <PlayCircleFilled className="prompt-card-actions-head" />
                       </Button>
@@ -484,6 +493,7 @@ PromptOutput.propTypes = {
   isChallenge: PropTypes.bool,
   handleSelectHighlight: PropTypes.func.isRequired,
   progressMsg: PropTypes.object,
+  isAgenticTableReady: PropTypes.bool,
 };
 
 export { PromptOutput };
diff --git a/frontend/src/hooks/usePromptRun.js b/frontend/src/hooks/usePromptRun.js
index 44df3811c5..34fb42e7d7 100644
--- a/frontend/src/hooks/usePromptRun.js
+++ b/frontend/src/hooks/usePromptRun.js
@@ -16,7 +16,11 @@ import usePromptOutput from "./usePromptOutput";
 // Tracks the latest run nonce per (promptId, statusKey) so stale timeouts
 // from a previous run don't falsely cancel a newer run of the same combo.
 const runNonceMap = new Map();
-const SOCKET_TIMEOUT_MS = 5 * 60 * 1000; // 5 minutes
+// Safety-net timeout for the fire-and-forget prompt run flow. Must trail the
+// server-side LLM adapter timeout (default 900s in
+// unstract/sdk1/src/unstract/sdk1/adapters/llm1/static/openai.json) so the UI
+// never gives up before the backend does. 16 minutes leaves a 1-minute buffer.
+const SOCKET_TIMEOUT_MS = 16 * 60 * 1000; // 16 minutes
 
 const usePromptRun = () => {
   const { pushPromptRunApi, freeActiveApi } = usePromptRunQueueStore();
diff --git a/unstract/sdk1/src/unstract/sdk1/llm.py b/unstract/sdk1/src/unstract/sdk1/llm.py
index c1730e6613..4588e6946c 100644
--- a/unstract/sdk1/src/unstract/sdk1/llm.py
+++ b/unstract/sdk1/src/unstract/sdk1/llm.py
@@ -363,6 +363,96 @@ def complete(self, prompt: str, **kwargs: object) -> dict[str, object]:
                 message=error_msg, status_code=status_code, actual_err=e
             ) from e
 
+    @capture_metrics
+    def complete_vision(
+        self,
+        messages: list[dict[str, Any]],
+        **kwargs: object,
+    ) -> dict[str, object]:
+        """Chat completion with multimodal (text + image) messages.
+
+        Accepts pre-built messages with image_url content blocks::
+
+            [
+                {
+                    "role": "user",
+                    "content": [
+                        {"type": "text", "text": "..."},
+                        {
+                            "type": "image_url",
+                            "image_url": {"url": "data:image/png;base64,..."},
+                        },
+                    ],
+                }
+            ]
+
+        LiteLLM auto-translates the OpenAI-style image format for
+        Anthropic, Bedrock, Vertex, and other providers.
+
+        Same error handling, usage tracking, and metrics as complete().
+
+        Args:
+            messages: List of message dicts with multimodal content.
+            **kwargs: Additional arguments passed to litellm.completion().
+
+        Returns:
+            dict with "response" key containing LLMResponseCompat.
+        """
+        try:
+            litellm.drop_params = True
+
+            logger.debug(
+                f"[sdk1][LLM]Invoking {self.adapter.get_provider()} "
+                f"vision completion API"
+            )
+
+            completion_kwargs = self.adapter.validate({**self.kwargs, **kwargs})
+            completion_kwargs.pop("cost_model", None)
+
+            response: dict[str, object] = litellm.completion(
+                messages=messages,
+                **completion_kwargs,
+            )
+
+            response_text = response["choices"][0]["message"]["content"]
+            finish_reason = response["choices"][0].get("finish_reason")
+
+            self._record_usage(
+                self._cost_model or self.kwargs["model"],
+                messages,
+                response.get("usage"),
+                "complete_vision",
+            )
+
+            if response_text is None:
+                self._raise_for_empty_response(finish_reason)
+
+            response_object = LLMResponseCompat(response_text)
+            response_object.raw = response
+            return {"response": response_object}
+
+        except LLMError:
+            raise
+        except SdkError:
+            raise
+        except Exception as e:
+            logger.error(f"[sdk1][LLM] Error during vision completion: {e}")
+
+            status_code = None
+            if hasattr(e, "status_code"):
+                status_code = e.status_code
+            elif hasattr(e, "http_status"):
+                status_code = e.http_status
+
+            error_msg = (
+                f"Error from LLM adapter '{self._get_adapter_info()}': "
+                f"{strip_litellm_prefix(str(e))}"
+            )
+
+            raise LLMError(
+                message=error_msg, status_code=status_code, actual_err=e
+            ) from e
+
     def stream_complete(
         self,
         prompt: str,
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 2a7dfc160d..3760aea067 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -1909,25 +1909,36 @@ def _apply_type_conversion(
         prompt_name = output[PSKeys.NAME]
         output_type = output[PSKeys.TYPE]
 
+        # Defensive guard: agentic_table prompts must be dispatched to
+        # the dedicated agentic_table executor by the worker (Layer 2 in
+        # workers/file_processing/structure_tool_task.py). If one ever
+        # reaches this method, the legacy fallthrough below would store
+        # the raw LLM completion as a string. Skip it and log a
+        # warning so the caller's existing entry (if any) survives.
+        if output_type == "agentic_table":
+            logger.warning(
+                "Skipping agentic_table prompt %s in legacy executor — "
+                "should have been dispatched to agentic_table executor",
+                prompt_name,
+            )
+            return
+
         if output_type == PSKeys.NUMBER:
             structured_output[prompt_name] = LegacyExecutor._convert_number_answer(
                 answer, llm, answer_prompt_svc
             )
 
         elif output_type == PSKeys.EMAIL:
-            if answer.lower() == "na":
-                structured_output[prompt_name] = answer
-            else:
-                email_prompt = (
-                    f"Extract the email from the following text:\n{answer}"
-                    f"\n\nOutput just the email. "
-                    f"The email should be directly assignable to a string "
-                    f"variable. No explanation is required. If you cannot "
-                    f'extract the email, output "NA".'
-                )
-                structured_output[prompt_name] = answer_prompt_svc.run_completion(
-                    llm=llm, prompt=email_prompt
-                )
+            email_prompt = (
+                f"Extract the email from the following text:\n{answer}"
+                f"\n\nOutput just the email. "
+                f"The email should be directly assignable to a string "
+                f"variable. No explanation is required. If you cannot "
+                f'extract the email, output "NA".'
+            )
+            structured_output[prompt_name] = LegacyExecutor._convert_scalar_answer(
+                answer, llm, answer_prompt_svc, email_prompt
+            )
 
         elif output_type == PSKeys.DATE:
             date_prompt = (
diff --git a/workers/executor/executors/retrievers/fusion.py b/workers/executor/executors/retrievers/fusion.py
index 7449ddb8e6..be6810ad28 100644
--- a/workers/executor/executors/retrievers/fusion.py
+++ b/workers/executor/executors/retrievers/fusion.py
@@ -64,7 +64,7 @@ def retrieve(self) -> set[str]:
                 mode="simple",  # Use simple fusion mode (reciprocal rank fusion)
                 use_async=False,
                 verbose=True,
-                llm=llm,
+                llm=llm,  # LLM generates query variations
             )
 
             # Retrieve nodes using fusion technique
diff --git a/workers/executor/executors/retrievers/keyword_table.py b/workers/executor/executors/retrievers/keyword_table.py
index 912b2fb7f8..5c7db9ab4e 100644
--- a/workers/executor/executors/retrievers/keyword_table.py
+++ b/workers/executor/executors/retrievers/keyword_table.py
@@ -48,7 +48,7 @@ def retrieve(self) -> set[str]:
             keyword_index = KeywordTableIndex(
                 nodes=[node.node for node in all_nodes],
                 show_progress=True,
-                llm=llm,
+                llm=llm,  # Use the provided LLM instead of defaulting to OpenAI
             )
 
             # Create retriever from keyword index
diff --git a/workers/file_processing/structure_tool_task.py b/workers/file_processing/structure_tool_task.py
index 87c9426376..c0fdee1c00 100644
--- a/workers/file_processing/structure_tool_task.py
+++ b/workers/file_processing/structure_tool_task.py
@@ -301,7 +301,35 @@ def _execute_structure_tool_impl(params: dict) -> dict:
 
     tool_id = tool_metadata[_SK.TOOL_ID]
     tool_settings = tool_metadata[_SK.TOOL_SETTINGS]
-    outputs = tool_metadata[_SK.OUTPUTS]
+    all_outputs = tool_metadata[_SK.OUTPUTS]
+
+    # ---- Partition prompts by enforce_type ----
+    # Agentic table prompts run via a dedicated executor (page-by-page
+    # extraction + Agent-5 schema cleanup). Regular prompts continue
+    # through the legacy structure_pipeline. Use local variables so
+    # tool_metadata[_SK.OUTPUTS] is preserved for METADATA.json
+    # serialization downstream in _write_tool_result.
+    agentic_table_outputs = [o for o in all_outputs if o.get("type") == "agentic_table"]
+    regular_outputs = [o for o in all_outputs if o.get("type") != "agentic_table"]
+
+    # Validate readiness for each agentic_table prompt: if the export
+    # step did not populate agentic_table_settings, fail loudly so the
+    # user knows to re-export the tool instead of producing the
+    # legacy stringified-truncated output.
+    for at_output in agentic_table_outputs:
+        at_settings = at_output.get("agentic_table_settings") or {}
+        if not at_settings.get("target_table") or not at_settings.get("json_structure"):
+            return ExecutionResult.failure(
+                error=(
+                    f"Agentic table prompt '{at_output[_SK.NAME]}' is missing "
+                    f"agentic_table_settings in the exported tool metadata. "
+                    f"Re-export the tool from Prompt Studio after the fix is "
+                    f"deployed to populate target_table / json_structure / "
+                    f"instructions."
+                )
+            ).to_dict()
+
+    outputs = regular_outputs
 
     # Inject workflow-level settings into tool_settings
     tool_settings[_SK.CHALLENGE_LLM] = challenge_llm
@@ -388,42 +416,103 @@ def _execute_structure_tool_impl(params: dict) -> dict:
             "prompt_keys": prompt_keys,
         }
 
-    # ---- Step 6: Single dispatch to executor ----
-    logger.info(
-        "Dispatching structure_pipeline: tool_id=%s "
-        "skip_extract=%s summarize=%s single_pass=%s",
-        tool_id,
-        skip_extraction_and_indexing,
-        is_summarization_enabled,
-        is_single_pass_enabled,
-    )
-
-    pipeline_ctx = ExecutionContext(
-        executor_name="legacy",
-        operation="structure_pipeline",
-        run_id=file_execution_id,
-        execution_source="tool",
-        organization_id=organization_id,
-        request_id=file_execution_id,
-        log_events_id=StateStore.get("LOG_EVENTS_ID") or "",
-        execution_id=execution_id,
-        file_execution_id=file_execution_id,
-        executor_params={
-            "extract_params": extract_params,
-            "index_template": index_template,
-            "answer_params": answer_params,
-            "pipeline_options": pipeline_options,
-            "summarize_params": summarize_params,
-        },
-    )
-    pipeline_start = time.monotonic()
-    pipeline_result = dispatcher.dispatch(pipeline_ctx, timeout=EXECUTOR_TIMEOUT)
-    pipeline_elapsed = time.monotonic() - pipeline_start
-
-    if not pipeline_result.success:
-        return pipeline_result.to_dict()
+    # ---- Step 6a: Dispatch agentic_table prompts ----
+    # Each agentic_table prompt runs in its own executor invocation.
+    # The executor handles X2Text extraction internally; we just
+    # forward the document path and the per-prompt settings unpacked
+    # from agentic_table_settings (populated by Layer 1 export).
+    #
+    # Important: read from SOURCE, not INFILE. INFILE gets overwritten
+    # with JSON output at the end of this function, so any
+    # subsequent reuse of the same file_execution_dir would surface JSON
+    # bytes to the agentic_table executor and fail PDF parsing
+    # ("PDFium: Data format error"). SOURCE is the immutable original
+    # PDF written alongside INFILE by the source connector.
+    agentic_source_path = str(execution_run_data_folder / "SOURCE")
+    agentic_results: dict[str, Any] = {}
+    for at_output in agentic_table_outputs:
+        at_settings = at_output.get("agentic_table_settings") or {}
+        json_structure = at_settings.get("json_structure")
+        if isinstance(json_structure, dict):
+            json_structure = json.dumps(json_structure)
+        agentic_params = {
+            "llm_adapter_instance_id": at_output["llm"],
+            "lite_llm_adapter_instance_id": at_settings.get(
+                "lite_llm_adapter_instance_id", ""
+            ),
+            "x2text_adapter_instance_id": tool_settings[_SK.X2TEXT_ADAPTER],
+            "input_file": agentic_source_path,
+            "source_file_name": source_file_name,
+            "target_table": at_settings.get("target_table", ""),
+            "json_structure": json_structure,
+            "instructions": at_settings.get("instructions", ""),
+            "starting_page": at_settings.get("start_page", 1),
+            "ending_page": at_settings.get("end_page") or None,
+            "parallel_pages": at_settings.get("parallel_pages", 4),
+            "execution_id": execution_id,
+            "PLATFORM_SERVICE_API_KEY": platform_service_api_key,
+        }
+        at_ctx = ExecutionContext(
+            executor_name="agentic_table",
+            operation="table_extract",
+            run_id=file_execution_id,
+            execution_source="tool",
+            organization_id=organization_id,
+            request_id=file_execution_id,
+            executor_params=agentic_params,
+        )
+        at_result = dispatcher.dispatch(at_ctx, timeout=EXECUTOR_TIMEOUT)
+        if not at_result.success:
+            return at_result.to_dict()
+        at_output_data = at_result.data.get("output", {}) or {}
+        agentic_results[at_output[_SK.NAME]] = at_output_data.get("tables", [])
+
+    # ---- Step 6b: Dispatch legacy structure_pipeline ----
+    # Skipped entirely when every prompt is agentic_table — the legacy
+    # pipeline has no work to do and the agentic_table executor does
+    # its own X2Text inside the runner.
+    if regular_outputs:
+        logger.info(
+            "Dispatching structure_pipeline: tool_id=%s "
+            "skip_extract=%s summarize=%s single_pass=%s",
+            tool_id,
+            skip_extraction_and_indexing,
+            is_summarization_enabled,
+            is_single_pass_enabled,
+        )
 
-    structured_output = pipeline_result.data
+        pipeline_ctx = ExecutionContext(
+            executor_name="legacy",
+            operation="structure_pipeline",
+            run_id=file_execution_id,
+            execution_source="tool",
+            organization_id=organization_id,
+            request_id=file_execution_id,
+            executor_params={
+                "extract_params": extract_params,
+                "index_template": index_template,
+                "answer_params": answer_params,
+                "pipeline_options": pipeline_options,
+                "summarize_params": summarize_params,
+            },
+        )
+        pipeline_start = time.monotonic()
+        pipeline_result = dispatcher.dispatch(pipeline_ctx, timeout=EXECUTOR_TIMEOUT)
+        pipeline_elapsed = time.monotonic() - pipeline_start
+
+        if not pipeline_result.success:
+            return pipeline_result.to_dict()
+
+        structured_output = pipeline_result.data
+        if agentic_results:
+            structured_output.setdefault("output", {}).update(agentic_results)
+    else:
+        # All-agentic case: skip the legacy pipeline entirely.
+        structured_output = {
+            "output": agentic_results,
+            "metadata": {"agentic_only": True},
+        }
+        pipeline_elapsed = 0.0
 
     # ---- Step 7: Write output files ----
     # (metadata/metrics merging already done by executor pipeline)
diff --git a/workers/ide_callback/tasks.py b/workers/ide_callback/tasks.py
index cb610678b1..d0dbce2563 100644
--- a/workers/ide_callback/tasks.py
+++ b/workers/ide_callback/tasks.py
@@ -392,6 +392,16 @@ def ide_prompt_complete(
         outputs = _json_safe(data.get("output", {}))
         metadata = _json_safe(data.get("metadata", {}))
 
+        # Agentic table executor returns {"tables": [...], "page_count": ...,
+        # "headers": [...], ...}, but OutputManagerHelper expects
+        # outputs[prompt.prompt_key] to be the value for that prompt. Reshape
+        # so the table list lands under the prompt key.
+        if cb.get("is_agentic_table"):
+            prompt_key = cb.get("prompt_key", "")
+            if prompt_key:
+                tables = outputs.get("tables", []) if isinstance(outputs, dict) else []
+                outputs = {prompt_key: tables}
+
         logger.info(
             "ide_prompt_complete: operation=%s output_keys=%s prompt_ids=%s "
             "doc=%s profile=%s",
diff --git a/workers/tests/test_answer_prompt.py b/workers/tests/test_answer_prompt.py
index 6c9fb9fce9..4b58c4c1ea 100644
--- a/workers/tests/test_answer_prompt.py
+++ b/workers/tests/test_answer_prompt.py
@@ -622,8 +622,8 @@ def test_invalid_strategy_skips_retrieval(
         )
         result = executor._handle_answer_prompt(ctx)
 
-        # Answer stays "NA" (top-level NA is preserved, not sanitized)
-        assert result.data[PSKeys.OUTPUT]["field_a"] == "NA"
+        # Answer stays "NA" which gets sanitized to None
+        assert result.data[PSKeys.OUTPUT]["field_a"] is None
 
 
 class TestHandleAnswerPromptMultiPrompt:
@@ -747,21 +747,21 @@ def test_vectordb_closed(self, mock_shim_cls, mock_deps):
 class TestNullSanitization:
     """Tests for _sanitize_null_values."""
 
-    def test_na_string_preserved(self):
-        """Top-level 'NA' string is preserved (not sanitized to None)."""
+    def test_na_string_becomes_none(self):
+        """Top-level 'NA' string → None."""
         from executor.executors.legacy_executor import LegacyExecutor
 
         output = {"field": "NA"}
         result = LegacyExecutor._sanitize_null_values(output)
-        assert result["field"] == "NA"
+        assert result["field"] is None
 
-    def test_na_case_insensitive_preserved(self):
-        """Top-level 'na' (lowercase) is preserved (not sanitized to None)."""
+    def test_na_case_insensitive(self):
+        """'na' (lowercase) → None."""
         from executor.executors.legacy_executor import LegacyExecutor
 
         output = {"field": "na"}
         result = LegacyExecutor._sanitize_null_values(output)
-        assert result["field"] == "na"
+        assert result["field"] is None
 
     def test_nested_list_na(self):
         """NA in nested list items → None."""

From 5d591dc4e35447bd67081f770a488f9fd88cc878 Mon Sep 17 00:00:00 2001
From: Kirtiman Mishra
 <110175055+kirtimanmishrazipstack@users.noreply.github.com>
Date: Tue, 28 Apr 2026 17:08:43 +0530
Subject: [PATCH 05/27] UN-3358 [FIX] Drop cross-region S3 buckets from
 connector listing (#1931)

* list bucket

* greptile review
---
 .../filesystems/minio/exceptions.py           | 12 ++++++----
 .../tests/filesystems/test_miniofs.py         | 22 ++++++++++++++++---
 2 files changed, 27 insertions(+), 7 deletions(-)

diff --git a/unstract/connectors/src/unstract/connectors/filesystems/minio/exceptions.py b/unstract/connectors/src/unstract/connectors/filesystems/minio/exceptions.py
index 2a4149ecaa..dd46e61b16 100644
--- a/unstract/connectors/src/unstract/connectors/filesystems/minio/exceptions.py
+++ b/unstract/connectors/src/unstract/connectors/filesystems/minio/exceptions.py
@@ -8,20 +8,24 @@
 class BucketProbeDisposition(Enum):
     """Action for a `list_objects_v2` probe failure, per S3 error code."""
 
-    DROP = "drop"  # Hide the bucket (no access, or bucket gone).
-    FAIL_OPEN = "fail_open"  # Region mismatch — keep bucket visible.
+    DROP = "drop"  # Hide the bucket (no access, bucket gone, or unreachable).
+    FAIL_OPEN = "fail_open"  # Keep the bucket visible despite the probe error.
     RETRY_FAIL_OPEN = "retry_fail_open"  # Throttled — retry once, then keep.
 
 
 # S3 `Error.Code` → probe disposition. Unlisted codes propagate.
 # `RequestTimeTooSkewed` is omitted deliberately: it's a system-wide clock
 # issue, not a bucket outcome — let it surface via `handle_s3fs_exception`.
+# `PermanentRedirect` / `IllegalLocationConstraintException` are dropped: the
+# connector is pinned to one `endpoint_url`, so cross-region buckets can't
+# be browsed through it regardless of IAM — listing them only surfaces a
+# confusing `[Errno 78]` on click.
 BUCKET_PROBE_DISPOSITION: dict[str, BucketProbeDisposition] = {
     "AccessDenied": BucketProbeDisposition.DROP,
     "AllAccessDisabled": BucketProbeDisposition.DROP,
     "NoSuchBucket": BucketProbeDisposition.DROP,
-    "PermanentRedirect": BucketProbeDisposition.FAIL_OPEN,
-    "IllegalLocationConstraintException": BucketProbeDisposition.FAIL_OPEN,
+    "PermanentRedirect": BucketProbeDisposition.DROP,
+    "IllegalLocationConstraintException": BucketProbeDisposition.DROP,
     "SlowDown": BucketProbeDisposition.RETRY_FAIL_OPEN,
     "Throttling": BucketProbeDisposition.RETRY_FAIL_OPEN,
     "ThrottlingException": BucketProbeDisposition.RETRY_FAIL_OPEN,
diff --git a/unstract/connectors/tests/filesystems/test_miniofs.py b/unstract/connectors/tests/filesystems/test_miniofs.py
index 3cf9ade1f2..9da9a1dcf0 100644
--- a/unstract/connectors/tests/filesystems/test_miniofs.py
+++ b/unstract/connectors/tests/filesystems/test_miniofs.py
@@ -104,15 +104,31 @@ def test_no_such_bucket_is_dropped(self) -> None:
         ):
             self.assertFalse(asyncio.run(fs._is_bucket_accessible("deleted")))
 
-    def test_permanent_redirect_bucket_is_kept(self) -> None:
-        # Fail-open: region mismatch keeps the bucket listed.
+    def test_permanent_redirect_bucket_is_dropped(self) -> None:
+        # Connector pins one endpoint_url; cross-region buckets are unreachable
+        # via this connector regardless of IAM, so drop them rather than fail
+        # later with [Errno 78] on click.
         fs = self._make_fs()
         with patch.object(
             fs,
             "_call_s3",
             new=AsyncMock(side_effect=_translated_error("PermanentRedirect")),
         ):
-            self.assertTrue(asyncio.run(fs._is_bucket_accessible("other-region")))
+            self.assertFalse(asyncio.run(fs._is_bucket_accessible("other-region")))
+
+    def test_illegal_location_constraint_bucket_is_dropped(self) -> None:
+        # Companion to PermanentRedirect: same cross-region condition surfaced
+        # as a 400 instead of a 301. Guards against a future edit reverting
+        # only one of the two cross-region entries in BUCKET_PROBE_DISPOSITION.
+        fs = self._make_fs()
+        with patch.object(
+            fs,
+            "_call_s3",
+            new=AsyncMock(
+                side_effect=_translated_error("IllegalLocationConstraintException")
+            ),
+        ):
+            self.assertFalse(asyncio.run(fs._is_bucket_accessible("wrong-region")))
 
     def test_throttling_retries_then_fails_open(self) -> None:
         fs = self._make_fs()

From 019f33ccf4cab9da8ce9c258bb3c1b6fcca92660 Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Tue, 5 May 2026 20:49:03 +0530
Subject: [PATCH 06/27] payload metadata in api deployment

---
 backend/api_v2/notification.py                |  46 +++--
 backend/notification_v2/enums.py              |  12 --
 backend/notification_v2/internal_api_views.py | 195 ++++++++++--------
 .../migrations/0002_notification_notify_on.py |  30 ---
 .../0002_notification_notify_on_failures.py   |  23 +++
 backend/notification_v2/models.py             |  15 +-
 backend/notification_v2/serializers.py        |   8 +-
 backend/pipeline_v2/dto.py                    |  11 +-
 backend/pipeline_v2/notification.py           |  73 +++++--
 .../workflow_manager/internal_serializers.py  |   2 +
 backend/workflow_manager/internal_views.py    |  13 +-
 .../0020_workflowexecution_file_counts.py     |  36 ++++
 .../workflow_v2/models/execution.py           |  31 ++-
 .../notification-modal/CreateNotification.jsx |  23 +--
 .../core/src/unstract/core/data_models.py     |  12 ++
 workers/callback/tasks.py                     |   4 +
 workers/scheduler/tasks.py                    |   1 +
 workers/shared/api/internal_client.py         |   4 +
 workers/shared/clients/execution_client.py    |   8 +
 .../shared/patterns/notification/helper.py    |  33 ++-
 20 files changed, 361 insertions(+), 219 deletions(-)
 delete mode 100644 backend/notification_v2/migrations/0002_notification_notify_on.py
 create mode 100644 backend/notification_v2/migrations/0002_notification_notify_on_failures.py
 create mode 100644 backend/workflow_manager/workflow_v2/migrations/0020_workflowexecution_file_counts.py

diff --git a/backend/api_v2/notification.py b/backend/api_v2/notification.py
index a41ebc3000..57e810c0e9 100644
--- a/backend/api_v2/notification.py
+++ b/backend/api_v2/notification.py
@@ -1,6 +1,5 @@
 import logging
 
-from notification_v2.enums import NotificationTrigger
 from notification_v2.helper import NotificationHelper
 from notification_v2.models import Notification
 from pipeline_v2.dto import PipelineStatusPayload
@@ -12,6 +11,9 @@
 logger = logging.getLogger(__name__)
 
 
+_FAILURE_STATUSES = {ExecutionStatus.ERROR.value, ExecutionStatus.STOPPED.value}
+
+
 class APINotification:
     def __init__(self, api: APIDeployment, workflow_execution: WorkflowExecution) -> None:
         self.notifications = Notification.objects.filter(api=api, is_active=True)
@@ -19,31 +21,32 @@ def __init__(self, api: APIDeployment, workflow_execution: WorkflowExecution) ->
         self.workflow_execution = workflow_execution
 
     def send(self) -> None:
-        # Partition notifications by the run outcome so each row's notify_on
-        # preference is honored. STOPPED and any other non-terminal status
-        # fire only for ALL — explicit opt-ins to FAILURES/SUCCESS shouldn't.
-        status = self.workflow_execution.status
-        if status == ExecutionStatus.ERROR.value:
-            self.notifications = self.notifications.exclude(
-                notify_on=NotificationTrigger.SUCCESS_ONLY.value
-            )
-        elif status == ExecutionStatus.COMPLETED.value:
-            self.notifications = self.notifications.exclude(
-                notify_on=NotificationTrigger.FAILURES_ONLY.value
-            )
-        else:
-            self.notifications = self.notifications.filter(
-                notify_on=NotificationTrigger.ALL.value
-            )
+        # Failure if the run hit a non-success terminal state OR any file errored.
+        # Partial-success runs land as status=COMPLETED with failed_files>0, so the
+        # status check alone misses them — see callback aggregation rules.
+        failed_files = self.workflow_execution.failed_files or 0
+        is_failure = (
+            self.workflow_execution.status in _FAILURE_STATUSES or failed_files > 0
+        )
+        if not is_failure:
+            # Success path: skip rows that opted into failure-only alerts.
+            self.notifications = self.notifications.filter(notify_on_failures=False)
 
         if not self.notifications.exists():
             logger.info(
-                "No notifications to dispatch for api %s (status=%s)",
+                "No notifications to dispatch for api %s (status=%s, failed_files=%s)",
                 self.api,
-                status,
+                self.workflow_execution.status,
+                failed_files,
             )
             return
-        logger.info("Sending api status notification for api %s", self.api)
+        logger.info(
+            "Sending api status notification for api %s (status=%s, successful=%s, failed=%s)",
+            self.api,
+            self.workflow_execution.status,
+            self.workflow_execution.successful_files or 0,
+            failed_files,
+        )
 
         payload_dto = PipelineStatusPayload(
             type="API",
@@ -52,6 +55,9 @@ def send(self) -> None:
             status=self.workflow_execution.status,
             execution_id=self.workflow_execution.id,
             error_message=self.workflow_execution.error_message,
+            total_files=self.workflow_execution.total_files,
+            successful_files=self.workflow_execution.successful_files,
+            failed_files=failed_files,
         )
 
         NotificationHelper.send_notification(
diff --git a/backend/notification_v2/enums.py b/backend/notification_v2/enums.py
index 516b34074b..991b08cac9 100644
--- a/backend/notification_v2/enums.py
+++ b/backend/notification_v2/enums.py
@@ -36,15 +36,3 @@ class PlatformType(Enum):
     @classmethod
     def choices(cls):
         return [(e.value, e.name.replace("_", " ").capitalize()) for e in cls]
-
-
-class NotificationTrigger(Enum):
-    """Controls which run outcomes fire a notification."""
-
-    ALL = "ALL"
-    FAILURES_ONLY = "FAILURES_ONLY"
-    SUCCESS_ONLY = "SUCCESS_ONLY"
-
-    @classmethod
-    def choices(cls):
-        return [(e.value, e.name.replace("_", " ").capitalize()) for e in cls]
diff --git a/backend/notification_v2/internal_api_views.py b/backend/notification_v2/internal_api_views.py
index 6843d5a50c..3e3f386b17 100644
--- a/backend/notification_v2/internal_api_views.py
+++ b/backend/notification_v2/internal_api_views.py
@@ -10,14 +10,18 @@
 """
 
 import logging
+from typing import Any, cast
 
 from api_v2.models import APIDeployment
-from django.http import JsonResponse
+from django.db.models import QuerySet
+from django.http import HttpRequest, JsonResponse
 from django.shortcuts import get_object_or_404
 from django.views.decorators.csrf import csrf_exempt
 from django.views.decorators.http import require_http_methods
 from pipeline_v2.models import Pipeline
 from utils.organization_utils import filter_queryset_by_organization
+from workflow_manager.workflow_v2.enums import ExecutionStatus
+from workflow_manager.workflow_v2.models.execution import WorkflowExecution
 
 from notification_v2.models import Notification
 
@@ -26,10 +30,71 @@
 # Constants for error messages
 INTERNAL_SERVER_ERROR_MSG = "Internal server error"
 
+_FAILURE_STATUSES = {ExecutionStatus.ERROR.value, ExecutionStatus.STOPPED.value}
+
+
+def _load_execution(execution_id: str | None) -> WorkflowExecution | None:
+    """Best-effort lookup; returns None on missing id or unknown row."""
+    if not execution_id:
+        return None
+    try:
+        return cast(WorkflowExecution, WorkflowExecution.objects.get(id=execution_id))
+    except WorkflowExecution.DoesNotExist:
+        logger.warning("WorkflowExecution %s not found", execution_id)
+        return None
+
+
+def _apply_failure_filter(
+    notifications_qs: QuerySet[Notification],
+    execution: WorkflowExecution | None,
+) -> QuerySet[Notification]:
+    """Drop notify_on_failures=True rows on success runs.
+
+    Mirrors the dispatch-side rule in backend/api_v2/notification.py and
+    backend/pipeline_v2/notification.py so both code paths agree on what
+    counts as a failure (status ∈ {ERROR, STOPPED} OR any file errored).
+
+    No execution (execution_id absent or row not found) → no filter, keeping
+    the legacy "return every active row" behavior.
+    """
+    if execution is None:
+        return notifications_qs
+    failed_files = execution.failed_files or 0
+    is_failure = execution.status in _FAILURE_STATUSES or failed_files > 0
+    if not is_failure:
+        notifications_qs = notifications_qs.filter(notify_on_failures=False)
+    return notifications_qs
+
+
+def _execution_counts(execution: WorkflowExecution | None) -> dict[str, int]:
+    """File counts surfaced into webhook payloads. Empty dict on no execution."""
+    if execution is None:
+        return {}
+    return {
+        "total_files": execution.total_files or 0,
+        "successful_files": execution.successful_files or 0,
+        "failed_files": execution.failed_files or 0,
+    }
+
+
+def _serialize_notification(n: Notification) -> dict[str, Any]:
+    return {
+        "id": str(n.id),
+        "notification_type": n.notification_type,
+        "platform": n.platform,
+        "url": n.url,
+        "authorization_type": n.authorization_type,
+        "authorization_key": n.authorization_key,
+        "authorization_header": n.authorization_header,
+        "max_retries": n.max_retries,
+        "is_active": n.is_active,
+        "notify_on_failures": n.notify_on_failures,
+    }
+
 
 @csrf_exempt  # Safe: Internal API with Bearer token auth, service-to-service only
 @require_http_methods(["GET"])
-def get_pipeline_notifications(request, pipeline_id):
+def get_pipeline_notifications(request: HttpRequest, pipeline_id: str) -> JsonResponse:
     """Get active notifications for a pipeline or API deployment.
 
     Used by callback worker to fetch notification configuration.
@@ -41,83 +106,53 @@ def get_pipeline_notifications(request, pipeline_id):
             pipeline_queryset, request, "organization"
         )
 
+        execution = _load_execution(request.GET.get("execution_id"))
+        counts = _execution_counts(execution)
+
         if pipeline_queryset.exists():
             pipeline = pipeline_queryset.first()
-
-            # Get active notifications for this pipeline
             notifications = Notification.objects.filter(pipeline=pipeline, is_active=True)
-
-            notifications_data = []
-            for notification in notifications:
-                notifications_data.append(
-                    {
-                        "id": str(notification.id),
-                        "notification_type": notification.notification_type,
-                        "platform": notification.platform,
-                        "url": notification.url,
-                        "authorization_type": notification.authorization_type,
-                        "authorization_key": notification.authorization_key,
-                        "authorization_header": notification.authorization_header,
-                        "max_retries": notification.max_retries,
-                        "is_active": notification.is_active,
-                    }
-                )
-
+            notifications = _apply_failure_filter(notifications, execution)
+            serialized = [_serialize_notification(n) for n in notifications]
             return JsonResponse(
                 {
                     "status": "success",
                     "pipeline_id": str(pipeline.id),
                     "pipeline_name": pipeline.pipeline_name,
                     "pipeline_type": pipeline.pipeline_type,
-                    "notifications": notifications_data,
+                    "notifications": serialized,
+                    "execution_counts": counts,
                 }
             )
-        else:
-            # If not found in Pipeline, try APIDeployment model
-            api_queryset = APIDeployment.objects.filter(id=pipeline_id)
-            api_queryset = filter_queryset_by_organization(
-                api_queryset, request, "organization"
+
+        # If not found in Pipeline, try APIDeployment model
+        api_queryset = APIDeployment.objects.filter(id=pipeline_id)
+        api_queryset = filter_queryset_by_organization(
+            api_queryset, request, "organization"
+        )
+        if api_queryset.exists():
+            api = api_queryset.first()
+            notifications = Notification.objects.filter(api=api, is_active=True)
+            notifications = _apply_failure_filter(notifications, execution)
+            serialized = [_serialize_notification(n) for n in notifications]
+            return JsonResponse(
+                {
+                    "status": "success",
+                    "pipeline_id": str(api.id),
+                    "pipeline_name": api.api_name,
+                    "pipeline_type": "API",
+                    "notifications": serialized,
+                    "execution_counts": counts,
+                }
             )
 
-            if api_queryset.exists():
-                api = api_queryset.first()
-
-                # Get active notifications for this API deployment
-                notifications = Notification.objects.filter(api=api, is_active=True)
-
-                notifications_data = []
-                for notification in notifications:
-                    notifications_data.append(
-                        {
-                            "id": str(notification.id),
-                            "notification_type": notification.notification_type,
-                            "platform": notification.platform,
-                            "url": notification.url,
-                            "authorization_type": notification.authorization_type,
-                            "authorization_key": notification.authorization_key,
-                            "authorization_header": notification.authorization_header,
-                            "max_retries": notification.max_retries,
-                            "is_active": notification.is_active,
-                        }
-                    )
-
-                return JsonResponse(
-                    {
-                        "status": "success",
-                        "pipeline_id": str(api.id),
-                        "pipeline_name": api.api_name,
-                        "pipeline_type": "API",
-                        "notifications": notifications_data,
-                    }
-                )
-            else:
-                return JsonResponse(
-                    {
-                        "status": "error",
-                        "message": "Pipeline or API deployment not found",
-                    },
-                    status=404,
-                )
+        return JsonResponse(
+            {
+                "status": "error",
+                "message": "Pipeline or API deployment not found",
+            },
+            status=404,
+        )
     except Exception as e:
         logger.error(f"Error getting pipeline notifications for {pipeline_id}: {e}")
         return JsonResponse(
@@ -127,7 +162,7 @@ def get_pipeline_notifications(request, pipeline_id):
 
 @csrf_exempt  # Safe: Internal API with Bearer token auth, service-to-service only
 @require_http_methods(["GET"])
-def get_api_notifications(request, api_id):
+def get_api_notifications(request: HttpRequest, api_id: str) -> JsonResponse:
     """Get active notifications for an API deployment.
 
     Used by callback worker to fetch notification configuration.
@@ -140,24 +175,9 @@ def get_api_notifications(request, api_id):
         )
         api = get_object_or_404(api_queryset)
 
-        # Get active notifications for this API
+        execution = _load_execution(request.GET.get("execution_id"))
         notifications = Notification.objects.filter(api=api, is_active=True)
-
-        notifications_data = []
-        for notification in notifications:
-            notifications_data.append(
-                {
-                    "id": str(notification.id),
-                    "notification_type": notification.notification_type,
-                    "platform": notification.platform,
-                    "url": notification.url,
-                    "authorization_type": notification.authorization_type,
-                    "authorization_key": notification.authorization_key,
-                    "authorization_header": notification.authorization_header,
-                    "max_retries": notification.max_retries,
-                    "is_active": notification.is_active,
-                }
-            )
+        notifications = _apply_failure_filter(notifications, execution)
 
         return JsonResponse(
             {
@@ -165,7 +185,8 @@ def get_api_notifications(request, api_id):
                 "api_id": str(api.id),
                 "api_name": api.api_name,
                 "display_name": api.display_name,
-                "notifications": notifications_data,
+                "notifications": [_serialize_notification(n) for n in notifications],
+                "execution_counts": _execution_counts(execution),
             }
         )
 
@@ -182,7 +203,7 @@ def get_api_notifications(request, api_id):
 
 @csrf_exempt  # Safe: Internal API with Bearer token auth, service-to-service only
 @require_http_methods(["GET"])
-def get_pipeline_data(request, pipeline_id):
+def get_pipeline_data(request: HttpRequest, pipeline_id: str) -> JsonResponse:
     """Get basic pipeline data for notification purposes.
 
     Used by callback worker to determine pipeline type and name.
@@ -218,7 +239,7 @@ def get_pipeline_data(request, pipeline_id):
 
 @csrf_exempt  # Safe: Internal API with Bearer token auth, service-to-service only
 @require_http_methods(["GET"])
-def get_api_data(request, api_id):
+def get_api_data(request: HttpRequest, api_id: str) -> JsonResponse:
     """Get basic API deployment data for notification purposes.
 
     Used by callback worker to determine API name and details.
diff --git a/backend/notification_v2/migrations/0002_notification_notify_on.py b/backend/notification_v2/migrations/0002_notification_notify_on.py
deleted file mode 100644
index 53c1180126..0000000000
--- a/backend/notification_v2/migrations/0002_notification_notify_on.py
+++ /dev/null
@@ -1,30 +0,0 @@
-from django.db import migrations, models
-
-
-class Migration(migrations.Migration):
-    dependencies = [
-        ("notification_v2", "0001_initial"),
-    ]
-
-    operations = [
-        migrations.AddField(
-            model_name="notification",
-            name="notify_on",
-            field=models.CharField(
-                max_length=50,
-                choices=[
-                    ("ALL", "All"),
-                    ("FAILURES_ONLY", "Failures only"),
-                    ("SUCCESS_ONLY", "Success only"),
-                ],
-                default="ALL",
-                db_comment=(
-                    "Controls which run outcomes trigger this notification. ALL "
-                    "(default) preserves the historical 'notify on every "
-                    "completion' behavior; FAILURES_ONLY fires only on failed "
-                    "runs (ERROR for API deployments, FAILURE for ETL "
-                    "pipelines); SUCCESS_ONLY fires only on successful runs."
-                ),
-            ),
-        ),
-    ]
diff --git a/backend/notification_v2/migrations/0002_notification_notify_on_failures.py b/backend/notification_v2/migrations/0002_notification_notify_on_failures.py
new file mode 100644
index 0000000000..ce0c3535b5
--- /dev/null
+++ b/backend/notification_v2/migrations/0002_notification_notify_on_failures.py
@@ -0,0 +1,23 @@
+from django.db import migrations, models
+
+
+class Migration(migrations.Migration):
+    dependencies = [
+        ("notification_v2", "0001_initial"),
+    ]
+
+    operations = [
+        migrations.AddField(
+            model_name="notification",
+            name="notify_on_failures",
+            field=models.BooleanField(
+                default=False,
+                db_comment=(
+                    "When True, fire only on failed runs — terminal status "
+                    "ERROR/STOPPED or any file in the run errored (partial "
+                    "failure). When False (default), fire on every terminal "
+                    "completion."
+                ),
+            ),
+        ),
+    ]
diff --git a/backend/notification_v2/models.py b/backend/notification_v2/models.py
index 4fe21cd6c4..e5238ec176 100644
--- a/backend/notification_v2/models.py
+++ b/backend/notification_v2/models.py
@@ -5,7 +5,7 @@
 from pipeline_v2.models import Pipeline
 from utils.models.base_model import BaseModel
 
-from .enums import AuthorizationType, NotificationTrigger, NotificationType, PlatformType
+from .enums import AuthorizationType, NotificationType, PlatformType
 
 NOTIFICATION_NAME_MAX_LENGTH = 255
 
@@ -47,15 +47,12 @@ class Notification(BaseModel):
         default=True,
         db_comment="Flag indicating whether the notification is active or not.",
     )
-    notify_on = models.CharField(
-        max_length=50,
-        choices=NotificationTrigger.choices(),
-        default=NotificationTrigger.ALL.value,
+    notify_on_failures = models.BooleanField(
+        default=False,
         db_comment=(
-            "Controls which run outcomes trigger this notification. ALL (default) "
-            "preserves the historical 'notify on every completion' behavior; "
-            "FAILURES_ONLY fires only on failed runs (ERROR for API deployments, "
-            "FAILURE for ETL pipelines); SUCCESS_ONLY fires only on successful runs."
+            "When True, fire only on failed runs — terminal status ERROR/STOPPED "
+            "or any file in the run errored (partial failure). When False "
+            "(default), fire on every terminal completion."
         ),
     )
     # Foreign keys to specific models
diff --git a/backend/notification_v2/serializers.py b/backend/notification_v2/serializers.py
index 784ec75413..4cb4f3c4cb 100644
--- a/backend/notification_v2/serializers.py
+++ b/backend/notification_v2/serializers.py
@@ -1,7 +1,7 @@
 from rest_framework import serializers
 from utils.input_sanitizer import validate_name_field
 
-from .enums import AuthorizationType, NotificationTrigger, NotificationType, PlatformType
+from .enums import AuthorizationType, NotificationType, PlatformType
 from .models import Notification
 
 
@@ -12,11 +12,7 @@ class NotificationSerializer(serializers.ModelSerializer):
     max_retries = serializers.IntegerField(
         max_value=4, min_value=0, default=0, required=False
     )
-    notify_on = serializers.ChoiceField(
-        choices=NotificationTrigger.choices(),
-        default=NotificationTrigger.ALL.value,
-        required=False,
-    )
+    notify_on_failures = serializers.BooleanField(default=False, required=False)
 
     class Meta:
         model = Notification
diff --git a/backend/pipeline_v2/dto.py b/backend/pipeline_v2/dto.py
index 5a87ba0825..b8ad7c8707 100644
--- a/backend/pipeline_v2/dto.py
+++ b/backend/pipeline_v2/dto.py
@@ -10,6 +10,9 @@ def __init__(
         status: str,
         execution_id: str | None = None,
         error_message: str | None = None,
+        total_files: int | None = None,
+        successful_files: int | None = None,
+        failed_files: int | None = None,
     ):
         self.type = type
         self.pipeline_id = pipeline_id
@@ -17,14 +20,20 @@ def __init__(
         self.status = status
         self.execution_id = execution_id
         self.error_message = error_message
+        self.total_files = total_files
+        self.successful_files = successful_files
+        self.failed_files = failed_files
 
     def to_dict(self) -> dict[str, Any]:
         """Convert the payload DTO to a dictionary."""
-        payload = {
+        payload: dict[str, Any] = {
             "type": self.type,
             "pipeline_id": str(self.pipeline_id),
             "pipeline_name": self.pipeline_name,
             "status": self.status,
+            "total_files": self.total_files or 0,
+            "successful_files": self.successful_files or 0,
+            "failed_files": self.failed_files or 0,
         }
         if self.execution_id:
             payload["execution_id"] = str(self.execution_id)
diff --git a/backend/pipeline_v2/notification.py b/backend/pipeline_v2/notification.py
index 64df6f1126..ec82145054 100644
--- a/backend/pipeline_v2/notification.py
+++ b/backend/pipeline_v2/notification.py
@@ -1,8 +1,9 @@
 import logging
 
-from notification_v2.enums import NotificationTrigger
 from notification_v2.helper import NotificationHelper
 from notification_v2.models import Notification
+from workflow_manager.workflow_v2.enums import ExecutionStatus
+from workflow_manager.workflow_v2.models.execution import WorkflowExecution
 
 from pipeline_v2.dto import PipelineStatusPayload
 from pipeline_v2.models import Pipeline
@@ -10,6 +11,9 @@
 logger = logging.getLogger(__name__)
 
 
+_FAILURE_STATUSES = {ExecutionStatus.ERROR.value, ExecutionStatus.STOPPED.value}
+
+
 class PipelineNotification:
     def __init__(
         self,
@@ -24,33 +28,57 @@ def __init__(
         self.error_message = error_message
         self.execution_id = execution_id
 
-    def send(self) -> None:
-        # Partition notifications by the run outcome so each row's notify_on
-        # preference is honored. PipelineUtils.update_pipeline_status collapses
-        # both ERROR and STOPPED execution statuses into PipelineStatus.FAILURE,
-        # so FAILURES_ONLY subscribers get alerts for both on the pipeline side.
-        status = self.pipeline.last_run_status
-        if status == Pipeline.PipelineStatus.FAILURE:
-            self.notifications = self.notifications.exclude(
-                notify_on=NotificationTrigger.SUCCESS_ONLY.value
-            )
-        elif status == Pipeline.PipelineStatus.SUCCESS:
-            self.notifications = self.notifications.exclude(
-                notify_on=NotificationTrigger.FAILURES_ONLY.value
-            )
-        else:
-            self.notifications = self.notifications.filter(
-                notify_on=NotificationTrigger.ALL.value
+    def _load_execution(self) -> WorkflowExecution | None:
+        """Load the WorkflowExecution row for this dispatch, if available.
+
+        Returns None when no execution_id was supplied (e.g. legacy callers)
+        or no matching row exists; callers must handle the None case.
+        """
+        if not self.execution_id:
+            return None
+        try:
+            return WorkflowExecution.objects.get(id=self.execution_id)
+        except WorkflowExecution.DoesNotExist:
+            logger.warning(
+                "WorkflowExecution %s not found for pipeline notification",
+                self.execution_id,
             )
+            return None
+
+    def send(self) -> None:
+        execution = self._load_execution()
+        # Source of truth for partial-failure detection is the per-run aggregate
+        # written by the worker callback. Pipeline.last_run_status is a coarse
+        # collapse (ERROR/STOPPED → FAILURE) that hides per-file errors when
+        # at least one file succeeded.
+        failed_files = (execution.failed_files or 0) if execution else 0
+        execution_status = execution.status if execution else None
+        is_failure = (
+            execution_status in _FAILURE_STATUSES
+            or failed_files > 0
+            or self.pipeline.last_run_status == Pipeline.PipelineStatus.FAILURE
+        )
+        if not is_failure:
+            self.notifications = self.notifications.filter(notify_on_failures=False)
 
         if not self.notifications.exists():
             logger.info(
-                "No notifications to dispatch for pipeline %s (status=%s)",
+                "No notifications to dispatch for pipeline %s (status=%s, failed_files=%s)",
                 self.pipeline,
-                status,
+                self.pipeline.last_run_status,
+                failed_files,
             )
             return
-        logger.info("Sending pipeline status notification for pipeline %s", self.pipeline)
+        successful_files = (execution.successful_files or 0) if execution else 0
+        total_files = execution.total_files if execution else None
+        logger.info(
+            "Sending pipeline status notification for pipeline %s "
+            "(status=%s, successful=%s, failed=%s)",
+            self.pipeline,
+            self.pipeline.last_run_status,
+            successful_files,
+            failed_files,
+        )
         payload_dto = PipelineStatusPayload(
             type=self.pipeline.pipeline_type,
             pipeline_id=str(self.pipeline.id),
@@ -58,6 +86,9 @@ def send(self) -> None:
             status=self.pipeline.last_run_status,
             execution_id=self.execution_id,
             error_message=self.error_message,
+            total_files=total_files,
+            successful_files=successful_files,
+            failed_files=failed_files,
         )
 
         NotificationHelper.send_notification(
diff --git a/backend/workflow_manager/internal_serializers.py b/backend/workflow_manager/internal_serializers.py
index bed98c6853..cd221470cb 100644
--- a/backend/workflow_manager/internal_serializers.py
+++ b/backend/workflow_manager/internal_serializers.py
@@ -178,6 +178,8 @@ class WorkflowExecutionStatusUpdateSerializer(serializers.Serializer):
     total_files = serializers.IntegerField(
         required=False, min_value=0
     )  # Allow 0 but backend will only update if > 0
+    successful_files = serializers.IntegerField(required=False, min_value=0)
+    failed_files = serializers.IntegerField(required=False, min_value=0)
     attempts = serializers.IntegerField(required=False, min_value=0)
     execution_time = serializers.FloatField(required=False, min_value=0)
 
diff --git a/backend/workflow_manager/internal_views.py b/backend/workflow_manager/internal_views.py
index c822e5e7b5..52f100196a 100644
--- a/backend/workflow_manager/internal_views.py
+++ b/backend/workflow_manager/internal_views.py
@@ -513,10 +513,19 @@ def update_status(self, request, id=None):
                     increment_attempt=increment_attempt,
                 )
 
-                # Update total_files separately (not handled by update_execution)
+                # Update total_files / per-file aggregates separately (not handled by update_execution)
+                update_fields: list[str] = []
                 if validated_data.get("total_files") is not None:
                     execution.total_files = validated_data["total_files"]
-                    execution.save()
+                    update_fields.append("total_files")
+                if validated_data.get("successful_files") is not None:
+                    execution.successful_files = validated_data["successful_files"]
+                    update_fields.append("successful_files")
+                if validated_data.get("failed_files") is not None:
+                    execution.failed_files = validated_data["failed_files"]
+                    update_fields.append("failed_files")
+                if update_fields:
+                    execution.save(update_fields=update_fields)
 
                 logger.info(
                     f"Updated workflow execution {id} status to {validated_data['status']}"
diff --git a/backend/workflow_manager/workflow_v2/migrations/0020_workflowexecution_file_counts.py b/backend/workflow_manager/workflow_v2/migrations/0020_workflowexecution_file_counts.py
new file mode 100644
index 0000000000..6dba25f5be
--- /dev/null
+++ b/backend/workflow_manager/workflow_v2/migrations/0020_workflowexecution_file_counts.py
@@ -0,0 +1,36 @@
+from django.db import migrations, models
+
+
+class Migration(migrations.Migration):
+    dependencies = [
+        ("workflow_v2", "0019_remove_filehistory_trigram_index"),
+    ]
+
+    operations = [
+        migrations.AddField(
+            model_name="workflowexecution",
+            name="successful_files",
+            field=models.PositiveIntegerField(
+                blank=True,
+                null=True,
+                db_comment=(
+                    "Per-run aggregate of files that completed successfully. "
+                    "Written by the worker callback at terminal state. Null on "
+                    "rows created before this column was added."
+                ),
+            ),
+        ),
+        migrations.AddField(
+            model_name="workflowexecution",
+            name="failed_files",
+            field=models.PositiveIntegerField(
+                blank=True,
+                null=True,
+                db_comment=(
+                    "Per-run aggregate of files that errored. Written by the "
+                    "worker callback at terminal state. Null on rows created "
+                    "before this column was added."
+                ),
+            ),
+        ),
+    ]
diff --git a/backend/workflow_manager/workflow_v2/models/execution.py b/backend/workflow_manager/workflow_v2/models/execution.py
index 45886bd64e..4e3656b68d 100644
--- a/backend/workflow_manager/workflow_v2/models/execution.py
+++ b/backend/workflow_manager/workflow_v2/models/execution.py
@@ -16,7 +16,6 @@
 
 from workflow_manager.execution.dto import ExecutionCache
 from workflow_manager.execution.execution_cache_utils import ExecutionCacheUtils
-from workflow_manager.file_execution.models import WorkflowFileExecution
 from workflow_manager.workflow_v2.enums import ExecutionStatus
 from workflow_manager.workflow_v2.models import Workflow
 
@@ -174,6 +173,24 @@ class Type(models.TextChoices):
     total_files = models.PositiveIntegerField(
         default=0, verbose_name="Total files", db_comment="Number of files to process"
     )
+    successful_files = models.PositiveIntegerField(
+        null=True,
+        blank=True,
+        db_comment=(
+            "Per-run aggregate of files that completed successfully. Written by "
+            "the worker callback at terminal state. Null on rows created before "
+            "this column was added."
+        ),
+    )
+    failed_files = models.PositiveIntegerField(
+        null=True,
+        blank=True,
+        db_comment=(
+            "Per-run aggregate of files that errored. Written by the worker "
+            "callback at terminal state. Null on rows created before this "
+            "column was added."
+        ),
+    )
     error_message = models.CharField(
         max_length=EXECUTION_ERROR_LENGTH,
         blank=True,
@@ -420,16 +437,8 @@ def get_last_run_statuses(cls, pipeline_id: uuid.UUID, limit: int = 5) -> list[d
 
         result = []
         for e in executions:
-            # TODO: Optimize by storing successful/failed counts directly in
-            # WorkflowExecution model. Current approach causes N+1 queries
-            # (2 queries per execution). Denormalized counts would eliminate
-            # these queries entirely.
-            successful = WorkflowFileExecution.objects.filter(
-                workflow_execution_id=e.id, status="COMPLETED"
-            ).count()
-            failed = WorkflowFileExecution.objects.filter(
-                workflow_execution_id=e.id, status="ERROR"
-            ).count()
+            successful = e.successful_files or 0
+            failed = e.failed_files or 0
 
             # Compute display_status: PARTIAL_SUCCESS if completed with mixed results
             display_status = e.status
diff --git a/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx b/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
index 9302f9f1dc..65460376d4 100644
--- a/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
+++ b/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
@@ -1,4 +1,4 @@
-import { Button, Form, Input, Select, Space } from "antd";
+import { Button, Checkbox, Form, Input, Select, Space } from "antd";
 import PropTypes from "prop-types";
 import { useEffect, useState } from "react";
 import { getBackendErrorDetail } from "../../../helpers/GetStaticData";
@@ -12,7 +12,7 @@ const DEFAULT_FORM_DETAILS = {
   authorization_key: "",
   is_active: false,
   max_retries: 0,
-  notify_on: "ALL",
+  notify_on_failures: false,
   pipeline: "",
   api: "",
   url: "",
@@ -55,12 +55,6 @@ const AUTHORIZATION_TYPES = [
   },
 ];
 
-const NOTIFY_ON_OPTIONS = [
-  { value: "ALL", label: "On every completion" },
-  { value: "FAILURES_ONLY", label: "On failures only" },
-  { value: "SUCCESS_ONLY", label: "On success only" },
-];
-
 function CreateNotification({
   setIsForm,
   type,
@@ -199,12 +193,6 @@ function CreateNotification({
       tooltip:
         "Specify the maximum number of times the notification should be retried if it fails.",
     },
-    {
-      label: "Notify on",
-      name: "notify_on",
-      component: <Select options={NOTIFY_ON_OPTIONS} />,
-      tooltip: "Choose which run outcomes should trigger this webhook.",
-    },
   ];
 
   return (
@@ -233,6 +221,13 @@ function CreateNotification({
             </Form.Item>
           ),
       )}
+      <Form.Item
+        name="notify_on_failures"
+        valuePropName="checked"
+        tooltip="When enabled, only runs with at least one failed file or a run-level error/stop trigger this notification. Otherwise notifications fire on every completion."
+      >
+        <Checkbox>Notify on failures only</Checkbox>
+      </Form.Item>
       <Form.Item className="display-flex-right">
         <Space>
           <Button onClick={() => setIsForm(false)}>Cancel</Button>
diff --git a/unstract/core/src/unstract/core/data_models.py b/unstract/core/src/unstract/core/data_models.py
index 7e8e984a04..82da16a72e 100644
--- a/unstract/core/src/unstract/core/data_models.py
+++ b/unstract/core/src/unstract/core/data_models.py
@@ -510,6 +510,12 @@ class NotificationPayload:
     error_message: str | None = None
     organization_id: str | None = None
 
+    # Per-run file aggregates surfaced into webhook payloads.
+    # Default 0 lets receivers switch on a numeric value without None-checks.
+    total_files: int = 0
+    successful_files: int = 0
+    failed_files: int = 0
+
     # Metadata
     timestamp: datetime = field(default_factory=lambda: datetime.now(UTC))
     additional_data: dict[str, Any] = field(default_factory=dict)
@@ -565,6 +571,9 @@ def from_execution_status(
         error_message: str | None = None,
         organization_id: str | None = None,
         additional_data: dict[str, Any] | None = None,
+        total_files: int = 0,
+        successful_files: int = 0,
+        failed_files: int = 0,
     ) -> "NotificationPayload":
         """Create notification payload from execution status.
 
@@ -607,6 +616,9 @@ def from_execution_status(
             execution_id=execution_id,
             error_message=error_message,
             organization_id=organization_id,
+            total_files=total_files,
+            successful_files=successful_files,
+            failed_files=failed_files,
             additional_data=additional_data or {},
             _source=source,
         )
diff --git a/workers/callback/tasks.py b/workers/callback/tasks.py
index 42599f0659..eee5b97da3 100644
--- a/workers/callback/tasks.py
+++ b/workers/callback/tasks.py
@@ -381,12 +381,16 @@ def _update_execution_status_unified(
     try:
         # Consistent workflow execution status update across all callback types
         total_files = aggregated_results.get("total_files", 0)
+        successful_files = aggregated_results.get("successful_files", 0)
+        failed_files = aggregated_results.get("failed_files", 0)
 
         # Make the unified API call
         api_client.update_workflow_execution_status(
             execution_id=execution_id,
             status=final_status,
             total_files=total_files,
+            successful_files=successful_files,
+            failed_files=failed_files,
             organization_id=organization_id,
             error_message=error_message,
         )
diff --git a/workers/scheduler/tasks.py b/workers/scheduler/tasks.py
index 2e22946a58..65e5bd7af1 100644
--- a/workers/scheduler/tasks.py
+++ b/workers/scheduler/tasks.py
@@ -81,6 +81,7 @@ def _send_pipeline_status_notification(
             pipeline_id=pipeline_id,
             pipeline_name=pipeline_name,
             notification_payload=notification,
+            execution_id=execution_id,
         )
         logger.info(f"Notification sent successfully for {pipeline_type} {pipeline_id}")
     except Exception as notification_error:
diff --git a/workers/shared/api/internal_client.py b/workers/shared/api/internal_client.py
index def90bd86a..4964a2b377 100644
--- a/workers/shared/api/internal_client.py
+++ b/workers/shared/api/internal_client.py
@@ -603,6 +603,8 @@ def update_workflow_execution_status(
         status: str,
         error_message: str | None = None,
         total_files: int | None = None,
+        successful_files: int | None = None,
+        failed_files: int | None = None,
         attempts: int | None = None,
         execution_time: float | None = None,
         organization_id: str | None = None,
@@ -613,6 +615,8 @@ def update_workflow_execution_status(
             status,
             error_message,
             total_files,
+            successful_files,
+            failed_files,
             attempts,
             execution_time,
             organization_id,
diff --git a/workers/shared/clients/execution_client.py b/workers/shared/clients/execution_client.py
index 80e9ca6568..e1373eb9f5 100644
--- a/workers/shared/clients/execution_client.py
+++ b/workers/shared/clients/execution_client.py
@@ -265,6 +265,8 @@ def update_workflow_execution_status(
         status: str | TaskStatus,
         error_message: str | None = None,
         total_files: int | None = None,
+        successful_files: int | None = None,
+        failed_files: int | None = None,
         attempts: int | None = None,
         execution_time: float | None = None,
         organization_id: str | None = None,
@@ -276,6 +278,8 @@ def update_workflow_execution_status(
             status: New status (TaskStatus enum or string)
             error_message: Optional error message
             total_files: Optional total files count
+            successful_files: Optional count of files that completed successfully
+            failed_files: Optional count of files that errored
             attempts: Optional attempts count
             execution_time: Optional execution time
             organization_id: Optional organization ID override
@@ -292,6 +296,10 @@ def update_workflow_execution_status(
             data["error_message"] = error_message
         if total_files is not None:
             data["total_files"] = total_files
+        if successful_files is not None:
+            data["successful_files"] = successful_files
+        if failed_files is not None:
+            data["failed_files"] = failed_files
         if attempts is not None:
             data["attempts"] = attempts
         if execution_time is not None:
diff --git a/workers/shared/patterns/notification/helper.py b/workers/shared/patterns/notification/helper.py
index 977f5a875f..c4f4c5d518 100644
--- a/workers/shared/patterns/notification/helper.py
+++ b/workers/shared/patterns/notification/helper.py
@@ -104,6 +104,7 @@ def trigger_notification(
     pipeline_id: str,
     pipeline_name: str,
     notification_payload: NotificationPayload,
+    execution_id: str | None = None,
 ) -> None:
     """Trigger notifications for pipeline status updates.
 
@@ -111,10 +112,13 @@ def trigger_notification(
     Uses API client to fetch notification configuration.
     """
     try:
-        # Fetch pipeline notifications via API
+        # Pass execution_id so the backend filter respects notify_on_failures
+        # (see trigger_pipeline_notifications for the rationale).
+        params = {"execution_id": execution_id} if execution_id else None
         response_data = api_client._make_request(
             method="GET",
             endpoint=f"v1/webhook/pipeline/{pipeline_id}/notifications/",
+            params=params,
             timeout=10,
         )
 
@@ -176,10 +180,14 @@ def trigger_pipeline_notifications(
         return
 
     try:
-        # Fetch pipeline notifications via API
+        # Pass execution_id so the backend can drop notify_on_failures=True rows
+        # on success runs. Without it the endpoint is a no-op and we'd fire on
+        # every active row regardless of trigger preference.
+        params = {"execution_id": execution_id} if execution_id else None
         response_data = api_client._make_request(
             method="GET",
             endpoint=f"v1/webhook/pipeline/{pipeline_id}/notifications/",
+            params=params,
             timeout=10,
         )
 
@@ -204,7 +212,9 @@ def trigger_pipeline_notifications(
         else:
             workflow_type = WorkflowType.ETL  # Default fallback
 
-        # Create notification payload using dataclass
+        # File counts come from WorkflowExecution via the same endpoint so
+        # webhook receivers (Slack, raw API) see partial-success breakdowns.
+        counts = response_data.get("execution_counts") or {}
         payload = NotificationPayload.from_execution_status(
             pipeline_id=pipeline_id,
             pipeline_name=pipeline_name,
@@ -213,6 +223,9 @@ def trigger_pipeline_notifications(
             source=NotificationSource.CALLBACK_WORKER,
             execution_id=execution_id,
             error_message=error_message,
+            total_files=counts.get("total_files", 0),
+            successful_files=counts.get("successful_files", 0),
+            failed_files=counts.get("failed_files", 0),
         )
 
         logger.info(
@@ -261,9 +274,14 @@ def trigger_api_notifications(
         return
 
     try:
-        # Fetch API notifications via API
+        # See trigger_pipeline_notifications: execution_id powers the backend
+        # filter that respects notify_on_failures.
+        params = {"execution_id": execution_id} if execution_id else None
         response_data = api_client._make_request(
-            method="GET", endpoint=f"v1/webhook/api/{api_id}/notifications/", timeout=10
+            method="GET",
+            endpoint=f"v1/webhook/api/{api_id}/notifications/",
+            params=params,
+            timeout=10,
         )
 
         # _make_request already handles status codes and returns parsed data
@@ -277,7 +295,7 @@ def trigger_api_notifications(
             logger.info(f"No active notifications found for API {api_id}")
             return
 
-        # Create notification payload using dataclass
+        counts = response_data.get("execution_counts") or {}
         payload = NotificationPayload.from_execution_status(
             pipeline_id=api_id,
             pipeline_name=api_name,
@@ -286,6 +304,9 @@ def trigger_api_notifications(
             source=NotificationSource.CALLBACK_WORKER,
             execution_id=execution_id,
             error_message=error_message,
+            total_files=counts.get("total_files", 0),
+            successful_files=counts.get("successful_files", 0),
+            failed_files=counts.get("failed_files", 0),
         )
 
         logger.info(

From 9cd8eb1984891231e9cb1e673c0225be24534a55 Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Tue, 5 May 2026 22:39:48 +0530
Subject: [PATCH 07/27] slack webhook payload

---
 .../tests/test_notification_filter.py         | 321 ------------------
 backend/pipeline_v2/dto.py                    |  14 +-
 .../core/src/unstract/core/data_models.py     |  24 +-
 .../notification/providers/slack_webhook.py   |   9 +-
 .../shared/patterns/notification/helper.py    |   3 +-
 5 files changed, 30 insertions(+), 341 deletions(-)
 delete mode 100644 backend/notification_v2/tests/test_notification_filter.py

diff --git a/backend/notification_v2/tests/test_notification_filter.py b/backend/notification_v2/tests/test_notification_filter.py
deleted file mode 100644
index 7f887be500..0000000000
--- a/backend/notification_v2/tests/test_notification_filter.py
+++ /dev/null
@@ -1,321 +0,0 @@
-"""Unit tests for the ``notify_on`` dispatch partition on notifications.
-
-Covers both dispatch paths that fan out to ``NotificationHelper.send_notification``:
-
-* ``APINotification.send`` — keyed on ``ExecutionStatus`` (ERROR, COMPLETED, STOPPED)
-* ``PipelineNotification.send`` — keyed on ``Pipeline.PipelineStatus``
-  (FAILURE, SUCCESS, INPROGRESS)
-
-Follows the repo convention (see ``usage_v2/tests/test_helper.py``) of stubbing
-Django-heavy modules at import time so the tests run without a live DB.
-"""
-
-from __future__ import annotations
-
-import sys
-import types
-from unittest.mock import MagicMock, patch
-
-
-# ---------------------------------------------------------------------------
-# Module-level stubs — must be installed BEFORE importing the modules under
-# test so Django's ORM imports resolve to our MagicMock-backed fakes.
-# ---------------------------------------------------------------------------
-
-
-def _ensure_mod(name: str) -> types.ModuleType:
-    """Force-install a fresh stub module in ``sys.modules``."""
-    mod = types.ModuleType(name)
-    sys.modules[name] = mod
-    return mod
-
-
-def _install_stubs() -> None:
-    # Only stub leaf modules that pull in Django ORM. Parent packages
-    # (api_v2, pipeline_v2, notification_v2, workflow_manager*) load normally.
-
-    exec_enums = _ensure_mod("workflow_manager.workflow_v2.enums")
-
-    class _ExecStatusNS:
-        class ERROR:
-            value = "ERROR"
-
-        class COMPLETED:
-            value = "COMPLETED"
-
-        class STOPPED:
-            value = "STOPPED"
-
-    exec_enums.ExecutionStatus = _ExecStatusNS  # type: ignore[attr-defined]
-
-    exec_models = _ensure_mod("workflow_manager.workflow_v2.models.execution")
-    exec_models.WorkflowExecution = MagicMock(name="WorkflowExecution")  # type: ignore[attr-defined]
-
-    api_models = _ensure_mod("api_v2.models")
-    api_models.APIDeployment = MagicMock(name="APIDeployment")  # type: ignore[attr-defined]
-
-    # notification_v2.models.Notification with a patchable ``objects``.
-    notif_models = _ensure_mod("notification_v2.models")
-
-    class _FakeNotification:
-        objects = MagicMock(name="Notification.objects")
-
-    notif_models.Notification = _FakeNotification  # type: ignore[attr-defined]
-
-    # notification_v2.helper.NotificationHelper
-    notif_helper = _ensure_mod("notification_v2.helper")
-
-    class _FakeHelper:
-        send_notification = MagicMock(name="NotificationHelper.send_notification")
-
-    notif_helper.NotificationHelper = _FakeHelper  # type: ignore[attr-defined]
-
-    # pipeline_v2.dto.PipelineStatusPayload
-    pipeline_dto = _ensure_mod("pipeline_v2.dto")
-    pipeline_dto.PipelineStatusPayload = MagicMock(name="PipelineStatusPayload")  # type: ignore[attr-defined]
-
-    # pipeline_v2.models.Pipeline with a PipelineStatus text-choices surface.
-    pipeline_models = _ensure_mod("pipeline_v2.models")
-
-    class _PipelineStatus:
-        SUCCESS = "SUCCESS"
-        FAILURE = "FAILURE"
-        INPROGRESS = "INPROGRESS"
-
-    class _FakePipeline:
-        PipelineStatus = _PipelineStatus
-
-    pipeline_models.Pipeline = _FakePipeline  # type: ignore[attr-defined]
-
-
-_install_stubs()
-
-
-# Now safe to import the modules under test.
-from api_v2 import notification as api_notification_mod  # noqa: E402
-from notification_v2.enums import NotificationTrigger  # noqa: E402
-from notification_v2.helper import NotificationHelper  # noqa: E402
-from notification_v2.models import Notification  # noqa: E402
-from pipeline_v2 import notification as pipeline_notification_mod  # noqa: E402
-from pipeline_v2.models import Pipeline  # noqa: E402
-
-
-# ---------------------------------------------------------------------------
-# Test helpers
-# ---------------------------------------------------------------------------
-
-
-def _make_queryset(notifications: list[MagicMock]) -> MagicMock:
-    """Return a MagicMock that mimics the chained QuerySet surface we use.
-
-    Supports:
-        qs.filter(notify_on=<value>)   -> qs with matching rows
-        qs.exclude(notify_on=<value>)  -> qs with non-matching rows
-        qs.exists()                    -> bool based on contents
-        iter(qs)                       -> notifications
-    """
-    qs = MagicMock(name="qs")
-    qs.__iter__ = lambda self: iter(notifications)
-
-    def _filter(**kwargs):
-        if "notify_on" in kwargs:
-            target = kwargs["notify_on"]
-            kept = [n for n in notifications if n.notify_on == target]
-            return _make_queryset(kept)
-        return _make_queryset(notifications)
-
-    def _exclude(**kwargs):
-        if "notify_on" in kwargs:
-            target = kwargs["notify_on"]
-            kept = [n for n in notifications if n.notify_on != target]
-            return _make_queryset(kept)
-        return _make_queryset(notifications)
-
-    qs.filter.side_effect = _filter
-    qs.exclude.side_effect = _exclude
-    qs.exists.return_value = bool(notifications)
-    qs.count.return_value = len(notifications)
-    return qs
-
-
-def _make_notification(*, notify_on: str) -> MagicMock:
-    n = MagicMock(name="Notification")
-    n.notify_on = notify_on
-    return n
-
-
-# ---------------------------------------------------------------------------
-# APINotification — 3 modes × 3 statuses
-# ---------------------------------------------------------------------------
-
-
-class TestAPINotificationFilter:
-    def _setup(self, *, status: str, notifications: list[MagicMock]):
-        Notification.objects.filter.reset_mock()
-        Notification.objects.filter.side_effect = None
-        Notification.objects.filter.return_value = _make_queryset(notifications)
-        NotificationHelper.send_notification.reset_mock()
-
-        api = MagicMock(name="APIDeployment")
-        api.api_name = "test-api"
-        api.id = "api-uuid"
-
-        execution = MagicMock(name="WorkflowExecution")
-        execution.status = status
-        execution.id = "exec-uuid"
-        execution.error_message = "boom" if status == "ERROR" else None
-
-        return api_notification_mod.APINotification(api=api, workflow_execution=execution)
-
-    # --- ALL: fires on every status ---
-    def test_all_fires_on_completed(self):
-        n = _make_notification(notify_on=NotificationTrigger.ALL.value)
-        self._setup(status="COMPLETED", notifications=[n]).send()
-        assert NotificationHelper.send_notification.call_count == 1
-
-    def test_all_fires_on_error(self):
-        n = _make_notification(notify_on=NotificationTrigger.ALL.value)
-        self._setup(status="ERROR", notifications=[n]).send()
-        assert NotificationHelper.send_notification.call_count == 1
-
-    def test_all_fires_on_stopped(self):
-        n = _make_notification(notify_on=NotificationTrigger.ALL.value)
-        self._setup(status="STOPPED", notifications=[n]).send()
-        assert NotificationHelper.send_notification.call_count == 1
-
-    # --- FAILURES_ONLY: fires on ERROR only ---
-    def test_failures_only_suppressed_on_completed(self):
-        n = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
-        self._setup(status="COMPLETED", notifications=[n]).send()
-        NotificationHelper.send_notification.assert_not_called()
-
-    def test_failures_only_fires_on_error(self):
-        n = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
-        self._setup(status="ERROR", notifications=[n]).send()
-        assert NotificationHelper.send_notification.call_count == 1
-
-    def test_failures_only_suppressed_on_stopped(self):
-        n = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
-        self._setup(status="STOPPED", notifications=[n]).send()
-        NotificationHelper.send_notification.assert_not_called()
-
-    # --- SUCCESS_ONLY: fires on COMPLETED only ---
-    def test_success_only_fires_on_completed(self):
-        n = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
-        self._setup(status="COMPLETED", notifications=[n]).send()
-        assert NotificationHelper.send_notification.call_count == 1
-
-    def test_success_only_suppressed_on_error(self):
-        n = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
-        self._setup(status="ERROR", notifications=[n]).send()
-        NotificationHelper.send_notification.assert_not_called()
-
-    def test_success_only_suppressed_on_stopped(self):
-        n = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
-        self._setup(status="STOPPED", notifications=[n]).send()
-        NotificationHelper.send_notification.assert_not_called()
-
-    # --- Mixed partition on a COMPLETED run: ALL + SUCCESS_ONLY fire, FAILURES_ONLY doesn't ---
-    def test_mixed_partition_on_completed(self):
-        all_mode = _make_notification(notify_on=NotificationTrigger.ALL.value)
-        failures_only = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
-        success_only = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
-        notifier = self._setup(
-            status="COMPLETED", notifications=[all_mode, failures_only, success_only]
-        )
-        with patch.object(api_notification_mod, "PipelineStatusPayload") as payload_cls:
-            payload_cls.return_value.to_dict.return_value = {}
-            notifier.send()
-
-        assert NotificationHelper.send_notification.call_count == 1
-        kwargs = NotificationHelper.send_notification.call_args.kwargs
-        dispatched = sorted(n.notify_on for n in kwargs["notifications"])
-        assert dispatched == ["ALL", "SUCCESS_ONLY"]
-
-
-# ---------------------------------------------------------------------------
-# PipelineNotification — 3 modes × 3 statuses
-# ---------------------------------------------------------------------------
-
-
-class TestPipelineNotificationFilter:
-    def _setup(self, *, last_run_status: str, notifications: list[MagicMock]):
-        Notification.objects.filter.reset_mock()
-        Notification.objects.filter.side_effect = None
-        Notification.objects.filter.return_value = _make_queryset(notifications)
-        NotificationHelper.send_notification.reset_mock()
-
-        pipeline = MagicMock(name="Pipeline")
-        pipeline.id = "pipeline-uuid"
-        pipeline.pipeline_name = "test-pipeline"
-        pipeline.pipeline_type = "ETL"
-        pipeline.last_run_status = last_run_status
-
-        return pipeline_notification_mod.PipelineNotification(
-            pipeline=pipeline, execution_id="exec-uuid", error_message=None
-        )
-
-    # --- ALL ---
-    def test_all_fires_on_success(self):
-        n = _make_notification(notify_on=NotificationTrigger.ALL.value)
-        self._setup(
-            last_run_status=Pipeline.PipelineStatus.SUCCESS, notifications=[n]
-        ).send()
-        assert NotificationHelper.send_notification.call_count == 1
-
-    def test_all_fires_on_failure(self):
-        n = _make_notification(notify_on=NotificationTrigger.ALL.value)
-        self._setup(
-            last_run_status=Pipeline.PipelineStatus.FAILURE, notifications=[n]
-        ).send()
-        assert NotificationHelper.send_notification.call_count == 1
-
-    # --- FAILURES_ONLY ---
-    def test_failures_only_suppressed_on_success(self):
-        n = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
-        self._setup(
-            last_run_status=Pipeline.PipelineStatus.SUCCESS, notifications=[n]
-        ).send()
-        NotificationHelper.send_notification.assert_not_called()
-
-    def test_failures_only_fires_on_failure(self):
-        n = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
-        self._setup(
-            last_run_status=Pipeline.PipelineStatus.FAILURE, notifications=[n]
-        ).send()
-        assert NotificationHelper.send_notification.call_count == 1
-
-    # --- SUCCESS_ONLY ---
-    def test_success_only_fires_on_success(self):
-        n = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
-        self._setup(
-            last_run_status=Pipeline.PipelineStatus.SUCCESS, notifications=[n]
-        ).send()
-        assert NotificationHelper.send_notification.call_count == 1
-
-    def test_success_only_suppressed_on_failure(self):
-        n = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
-        self._setup(
-            last_run_status=Pipeline.PipelineStatus.FAILURE, notifications=[n]
-        ).send()
-        NotificationHelper.send_notification.assert_not_called()
-
-    # --- Mixed partition on a SUCCESS run ---
-    def test_mixed_partition_on_success(self):
-        all_mode = _make_notification(notify_on=NotificationTrigger.ALL.value)
-        failures_only = _make_notification(notify_on=NotificationTrigger.FAILURES_ONLY.value)
-        success_only = _make_notification(notify_on=NotificationTrigger.SUCCESS_ONLY.value)
-        notifier = self._setup(
-            last_run_status=Pipeline.PipelineStatus.SUCCESS,
-            notifications=[all_mode, failures_only, success_only],
-        )
-        with patch.object(
-            pipeline_notification_mod, "PipelineStatusPayload"
-        ) as payload_cls:
-            payload_cls.return_value.to_dict.return_value = {}
-            notifier.send()
-
-        assert NotificationHelper.send_notification.call_count == 1
-        kwargs = NotificationHelper.send_notification.call_args.kwargs
-        dispatched = sorted(n.notify_on for n in kwargs["notifications"])
-        assert dispatched == ["ALL", "SUCCESS_ONLY"]
diff --git a/backend/pipeline_v2/dto.py b/backend/pipeline_v2/dto.py
index b8ad7c8707..d0f27e7943 100644
--- a/backend/pipeline_v2/dto.py
+++ b/backend/pipeline_v2/dto.py
@@ -25,15 +25,21 @@ def __init__(
         self.failed_files = failed_files
 
     def to_dict(self) -> dict[str, Any]:
-        """Convert the payload DTO to a dictionary."""
+        """Convert the payload DTO to a dictionary.
+
+        File counts are nested in `additional_data` to match the worker-path
+        payload shape (NotificationPayload.from_execution_status).
+        """
         payload: dict[str, Any] = {
             "type": self.type,
             "pipeline_id": str(self.pipeline_id),
             "pipeline_name": self.pipeline_name,
             "status": self.status,
-            "total_files": self.total_files or 0,
-            "successful_files": self.successful_files or 0,
-            "failed_files": self.failed_files or 0,
+            "additional_data": {
+                "total_files": self.total_files or 0,
+                "successful_files": self.successful_files or 0,
+                "failed_files": self.failed_files or 0,
+            },
         }
         if self.execution_id:
             payload["execution_id"] = str(self.execution_id)
diff --git a/unstract/core/src/unstract/core/data_models.py b/unstract/core/src/unstract/core/data_models.py
index 82da16a72e..7642aa9ce1 100644
--- a/unstract/core/src/unstract/core/data_models.py
+++ b/unstract/core/src/unstract/core/data_models.py
@@ -510,14 +510,10 @@ class NotificationPayload:
     error_message: str | None = None
     organization_id: str | None = None
 
-    # Per-run file aggregates surfaced into webhook payloads.
-    # Default 0 lets receivers switch on a numeric value without None-checks.
-    total_files: int = 0
-    successful_files: int = 0
-    failed_files: int = 0
-
     # Metadata
     timestamp: datetime = field(default_factory=lambda: datetime.now(UTC))
+    # Per-run file aggregates (total/successful/failed) are nested here
+    # so receivers see them grouped rather than as top-level keys.
     additional_data: dict[str, Any] = field(default_factory=dict)
 
     # Internal tracking (not sent to external webhooks)
@@ -608,6 +604,17 @@ def from_execution_status(
                 f"Cannot create notification for non-final status: {execution_status}"
             )
 
+        # File counts are bundled inside additional_data so receivers see
+        # them grouped (e.g. Slack renders one "Additional Data" section).
+        # Caller-supplied additional_data takes precedence on key conflict.
+        merged_additional = {
+            "total_files": total_files,
+            "successful_files": successful_files,
+            "failed_files": failed_files,
+        }
+        if additional_data:
+            merged_additional.update(additional_data)
+
         return cls(
             type=workflow_type,
             pipeline_id=pipeline_id,
@@ -616,10 +623,7 @@ def from_execution_status(
             execution_id=execution_id,
             error_message=error_message,
             organization_id=organization_id,
-            total_files=total_files,
-            successful_files=successful_files,
-            failed_files=failed_files,
-            additional_data=additional_data or {},
+            additional_data=merged_additional,
             _source=source,
         )
 
diff --git a/workers/notification/providers/slack_webhook.py b/workers/notification/providers/slack_webhook.py
index 89206646a5..04e3532fa3 100644
--- a/workers/notification/providers/slack_webhook.py
+++ b/workers/notification/providers/slack_webhook.py
@@ -199,11 +199,10 @@ def _format_value(self, value: Any) -> str:
         elif isinstance(value, (list, tuple)):
             return "\n• " + "\n• ".join(str(item) for item in value)
         elif isinstance(value, dict):
-            # Format nested dictionary
-            items = []
-            for k, v in value.items():
-                items.append(f"  • {self._format_key(k)}: {v}")
-            return "\n" + "\n".join(items)
+            # Inline {Key: Value, Key: Value} so the receiver sees the
+            # whole dict on one line instead of a bulleted block.
+            items = [f"{self._format_key(k)}: {v}" for k, v in value.items()]
+            return "{" + ", ".join(items) + "}"
         elif value is None:
             return "_Not specified_"
         else:
diff --git a/workers/shared/patterns/notification/helper.py b/workers/shared/patterns/notification/helper.py
index c4f4c5d518..19f78fbb99 100644
--- a/workers/shared/patterns/notification/helper.py
+++ b/workers/shared/patterns/notification/helper.py
@@ -5,6 +5,7 @@
 """
 
 import logging
+from typing import Any
 
 from celery import current_app
 
@@ -335,7 +336,7 @@ def trigger_api_notifications(
 
 
 def handle_status_notifications(
-    api_client,
+    api_client: Any,
     pipeline_id: str,
     status: str,
     execution_id: str | None = None,

From aad0fa99bc5f1e3b6ad547f68207c381594f830f Mon Sep 17 00:00:00 2001
From: Kirtiman Mishra
 <110175055+kirtimanmishrazipstack@users.noreply.github.com>
Date: Thu, 7 May 2026 23:49:29 +0530
Subject: [PATCH 08/27] Uns 611 clubbed notification dispatch (#1951)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* UN-3439 [FIX] Accept wildcard subdomain origins in SocketIO and Django CORS (#1938)

* UN-3439 [FIX] Accept wildcard subdomain origins in SocketIO and Django CORS

Production socket connections were failing for `*.env.us-central.unstract.com`
because python-socketio does exact-string comparison on `cors_allowed_origins`,
so a literal `*` pattern silently rejected every real subdomain.

- Add `CORS_ALLOWED_ORIGIN_REGEXES` derived from `WEB_APP_ORIGIN_URL_WITH_WILD_CARD`.
- Wire SocketIO via `_RegexOrigin` whose `__eq__` does the regex match — single
  list entry covers all wildcard subdomains, no library subclass needed.
- Normalize `WEB_APP_ORIGIN_URL` through `urlparse` so trailing slashes / paths
  in env are stripped (also fixes the `…com//oauth-status/` double-slash).
- Add startup guard for malformed env values.

Resolves item #1 of UN-3439. Items #2/#3 (decoupling indexing from Socket.io,
fallback) are owned separately.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* UN-3439 [FIX] Address PR review: canonical origin, fullmatch, unhashable RegexOrigin, tests

Addresses five review comments on #1938:

1. coderabbitai (Major) — RFC 6454 canonicalization. Browsers serialize
   `Origin` headers with a lowercase host and no explicit default ports;
   `parsed_url.netloc` preserved both, so `https://APP.EXAMPLE.COM:443`
   would silently fail to match the browser's `https://app.example.com`.
   Switch to `parsed_url.hostname` + drop default ports, and reject
   non-http(s) schemes at startup.

2. greptile (P2) — `re.fullmatch` instead of `re.match`. With `re.match`
   plus `$`, a candidate ending in `\n` matches because `$` is allowed
   before an optional trailing newline. `fullmatch` removes the ambiguity.

3. self — `_RegexOrigin.__hash__` violated `a == b ⇒ hash(a) == hash(b)`
   (one fixed pattern hash vs. many matching strings). Today this is
   masked because python-socketio uses linear `__eq__` on a list, but if
   the allow-list is ever wrapped in a set, every legitimate subdomain
   would silently be rejected — exactly the failure mode UN-3439 closes.
   Make instances unhashable so the contract can't be broken.

4. self — No regression tests. Add `backend/utils/tests/test_cors_origin.py`
   (33 cases) covering: regex match/no-match, lookalike spoofing, scheme
   mismatch, trailing-newline rejection, non-string equality protocol,
   unhashability, ReDoS bounds, URL normalization (case, default ports,
   trailing slash, paths, queries), startup-guard rejections (empty,
   no-scheme, non-browser-scheme, no-host), and end-to-end via the same
   `RegexOrigin` path SocketIO uses.

5. self — Over-clever wildcard-to-regex builder. The
   `split('*').join(re.escape, ...)` construction generalised to N
   wildcards but the input has exactly one; replace with a direct rf-string
   that's self-evident on review.

Refactor for testability: extract `RegexOrigin` and `normalize_web_app_origin`
into `backend/utils/cors_origin.py` (Django-free, importable from settings
and tests). Settings now delegates to one helper call; `log_events.py`
imports `RegexOrigin`. No behavioural change beyond what each comment fixes.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* UN-3439 [FIX] Address SonarCloud quality gate

The Sonar quality gate failed with C reliability + 5 security hotspots, all
on the new test file:

- S905 (Bug, Major) — `{ro}` flagged as no-side-effect statement (Sonar
  doesn't see the implicit `__hash__` call). Drove the C reliability rating.
  Fix: use `len({ro})` so the side effect is via an explicit function call;
  test still asserts the same `TypeError`.
- S5727 (Code Smell, Critical) — `assert ro != None` is tautological and
  doesn't exercise `__eq__`. Switch to `(ro == None) is False` which directly
  tests that `NotImplemented` falls back to identity-equality.
- S5332 × 5 (Hotspots) — `http://` and `ftp://` literals in test data.
  These are intentional inputs proving the rejection logic. Annotate with
  `# NOSONAR` and an explanatory comment so the hotspots can be marked
  reviewed.

No production code changed; tests still 33/33 passing.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* UN-3439 [FIX] Remove last S5727 code smell — test __eq__ via dunder

Sonar S5727 correctly inferred that ``ro == None`` is statically always
False (NotImplemented falls back to identity), making the assertion look
tautological. The intent is to lock the protocol contract: ``__eq__`` must
return the ``NotImplemented`` sentinel for non-strings. Test that directly
via ``ro.__eq__(None) is NotImplemented`` instead of going through ``==``.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* UN-3439 [FIX] Address remaining CodeRabbit nits — port validation, ReDoS bound

Two minor follow-ups from the second CodeRabbit pass:

- `parsed.port` is a property that raises ValueError on malformed/out-of-range
  inputs (e.g. `:abc`, `:99999`). That bypassed our normalized config-error
  message and surfaced as a stack trace. Wrap the access and re-raise with
  the same actionable text. Adds two test cases (`https://example.com:abc`,
  `https://example.com:99999`) to lock the new behaviour.

- The 50ms ReDoS timing bound is too tight for noisy CI runners. Loosen to
  500ms — still orders of magnitude below what catastrophic backtracking
  would produce.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* ReverseMerge: V0.161.4 hotfix (#1943)

* Change csp to report only

* [HOTFIX] Bool-parse ENABLE_HIGHLIGHT_API_DEPLOYMENT env var (v0.161.4) (#1939)

[HOTFIX] Bool-parse ENABLE_HIGHLIGHT_API_DEPLOYMENT env var (#1937)

[FIX] Bool-parse ENABLE_HIGHLIGHT_API_DEPLOYMENT env var

os.environ.get returns the raw string when the variable is set, so
ENABLE_HIGHLIGHT_API_DEPLOYMENT="False" was truthy in Python (any
non-empty string is truthy). Wrap in CommonUtils.str_to_bool so
"False" / "false" / "0" actually evaluate to False.

The setting is consumed by the cloud configuration plugin's spec
default (ConfigSpec.default in plugins/configuration/cloud_config.py)
on cloud and on-prem builds. With this fix, an admin who explicitly
sets the env var to a falsy string sees highlight data stripped as
expected.

Co-authored-by: vishnuszipstack <117254672+vishnuszipstack@users.noreply.github.com>
Co-authored-by: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

---------

Co-authored-by: Deepak K <89829542+Deepak-Kesavan@users.noreply.github.com>
Co-authored-by: vishnuszipstack <117254672+vishnuszipstack@users.noreply.github.com>
Co-authored-by: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* UN-3448 [FIX] Remove vestigial `uv pip install` line in uv-lock-automation workflow (#1941)

* UN-3448 [FIX] Add --system flag to uv pip install in uv-lock-automation workflow

Modern uv requires uv pip install to run inside a virtual environment OR
with the explicit --system flag. The workflow currently has neither, so
it errors out:

  error: No virtual environment found for Python 3.12.9; run `uv venv`
  to create an environment, or pass `--system` to install into a
  non-virtual environment

This breaks every PR that touches a pyproject.toml (the workflow's
paths filter triggers on those). Last successful run was 2026-04-01,
before a behaviour change in uv or astral-sh/setup-uv@v7.

The --system flag is exactly what the error message suggests and is
correct here — we install pip into the runner's system Python; the
downstream uv-lock.sh script creates its own venvs as needed.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* UN-3448 [FIX] Remove vestigial `uv pip install` line per review

Per @jaseemjaskp's review: the pre-step `uv pip install ... pip` does
nothing useful for this workflow. The downstream uv-lock.sh script
uses uv sync at line 74, which manages its own venvs internally and
never invokes pip directly:

  $ grep -rn 'pip' docker/scripts/uv-lock-gen/
  docker/scripts/uv-lock-gen/uv-lock.sh:2:set -o pipefail

Only match is pipefail (shell option), no real pip references.

Removing the line entirely is cleaner than papering over with --system.
The line was likely copy-pasted from a sibling workflow that legitimately
needed pip in the system Python.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* ReverseMerge: V0.163.2 hotfix (#1946)

* [HOTFIX] Use importlib.util.find_spec for pluggable worker discovery (#1918)

* [FIX] Use importlib.util.find_spec for pluggable worker discovery

_verify_pluggable_worker_exists() previously checked for the literal file
`pluggable_worker/<name>/worker.py` on disk, which breaks when the plugin
has been compiled to a .so (Nuitka, Cython, or any C extension) — the
module is perfectly importable but the pre-check rejects it because only
the .py extension is considered.

Replace the filesystem check with importlib.util.find_spec(), which is
Python's standard way to ask "is this module resolvable by the import
system?". It honors every registered finder — source .py, compiled .so,
bytecode .pyc, namespace packages, zipimports — so the function now
matches what its docstring claims: verifying the module can be loaded,
not that a specific file extension is present.

Behavior is preserved for existing deployments:
- Images with no `pluggable_worker/<name>/` subpackage → find_spec
  raises ModuleNotFoundError (ImportError subclass) → returns False.
- Images with source .py → find_spec resolves the .py → returns True.
- Images with compiled .so → find_spec resolves the .so → returns True.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [FIX] Handle ValueError from find_spec in pluggable worker verification

Greptile-flagged edge case: importlib.util.find_spec() can raise
ValueError (not just ImportError) when sys.modules has a partially
initialised module entry with __spec__ = None from a prior failed import.
Broaden the except to catch both.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [FIX] Resolve api-deployment worker directory from enum import path

worker.py:452 did worker_type.value.replace("-", "_") to derive the
on-disk dir name. All WorkerType enum values already use underscores,
so the replace was a no-op; for API_DEPLOYMENT whose dir is
"api-deployment" (hyphen), it resolved to "api_deployment" and the
os.path.exists() check failed. Boot then logged a spurious
"❌ Worker directory not found: /app/api_deployment" at ERROR level.

The task registration path (builder + celery autodiscover via
to_import_path) is unaffected, so this was purely log noise — but
noise at ERROR level that masks real failures in log scans.

Fix: derive the directory from the authoritative to_import_path()
which already handles the hyphen case (api_deployment -> api-deployment).

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [HOTFIX] Add IAM Role / Instance Profile auth mode to AWS Bedrock adapter (#1944)

* [FEAT] Allow Bedrock to fall through to boto3's default credential chain

Match the S3/MinIO connector pattern: when AWS access keys are left blank
on the Bedrock LLM and embedding adapter forms, drop them from the kwargs
dict so boto3's default credential chain handles authentication. This
unlocks IAM role / instance profile / IRSA / AWS Profile scenarios on
hosts that already have ambient AWS credentials (e.g. EKS workers with
IRSA, EC2 with an instance profile).

- llm1/static/bedrock.json: clarify access-key descriptions to mention
  IRSA and instance profile (already non-required at v0.163.2 base).
- embedding1/static/bedrock.json: drop aws_access_key_id and
  aws_secret_access_key from top-level required; same description fix;
  expose aws_profile_name for parity with the LLM form.
- base1.py: AWSBedrockLLMParameters and AWSBedrockEmbeddingParameters
  now strip empty access-key values from the validated kwargs before
  returning, so empty strings don't override boto3's default chain.
  AWSBedrockEmbeddingParameters fields gain explicit None defaults
  and an aws_profile_name field.

Backward-compatible: existing adapters with access keys filled in
continue to work unchanged.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [FEAT] Add Authentication Type selector to Bedrock adapter form

Add an explicit `auth_type` selector with two options, making the auth
choice clear to users:

- "Access Keys" (default): existing flow, keys required
- "IAM Role / Instance Profile (on-prem AWS only)": no fields; relies on
  boto3's default credential chain (IRSA on EKS, task role on ECS,
  instance profile on EC2). Description on the selector explicitly notes
  this option is only for AWS-hosted Unstract deployments.

The form-only auth_type field is stripped before LiteLLM validation in
both AWSBedrockLLMParameters.validate() and
AWSBedrockEmbeddingParameters.validate(). Empty access keys continue to
be stripped so boto3 falls through to the default chain even when the
access_keys arm is selected without values (matches the S3/MinIO
connector pattern).

Backward-compatible: legacy adapters without auth_type behave as
"Access Keys" mode (the default), and existing keys are forwarded
unchanged.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [REVIEW] Address Bedrock auth_type review feedback

Fixes the P0/P1 issues raised by greptile-apps and jaseemjaskp on
PR #1944.

Behaviour fixes:
- Stale-key leak in IAM Role mode: switching an existing adapter from
  Access Keys to IAM Role would carry truthy stored access keys through
  the strip-empty-only loop, so boto3 silently authenticated with the
  old long-lived credentials instead of falling through to the host's
  IRSA / instance-profile identity. Both LLM and embedding paths were
  affected.
- Silent acceptance of unknown auth_type: a typo (e.g. "access_key") or
  a malformed payload from a non-UI client passed through the dict
  comprehension untouched, with no enum guard.
- Cross-field validation gap: explicit Access Keys mode with blank or
  whitespace-only values silently fell through to the default
  credential chain instead of surfacing the misconfiguration.

Implementation:
- Add a module-level _resolve_bedrock_aws_credentials helper used by
  both AWSBedrockLLMParameters.validate() and
  AWSBedrockEmbeddingParameters.validate(), so the auth-type contract
  is expressed once.
  - Validates auth_type against an allowlist (None | "access_keys" |
    "iam_role"); raises ValueError on anything else.
  - iam_role: unconditionally drops aws_access_key_id and
    aws_secret_access_key.
  - access_keys (explicit): requires non-blank values; raises ValueError
    if either is empty or whitespace-only.
  - Legacy (auth_type absent): retains the lenient strip behaviour so
    pre-PR adapter configurations continue to deserialise unchanged.
- Restore aws_region_name as required (no `= None` default) on
  AWSBedrockEmbeddingParameters; only credentials may legitimately be
  absent.
- Drop the orphan aws_profile_name field from
  embedding1/static/bedrock.json: it was added for parity with the LLM
  form but lives outside the auth_type oneOf and contradicts the
  selector's "no further input" semantics. The LLM form already had
  aws_profile_name pre-PR and is left alone for backwards compatibility.

Tests:
- New tests/test_bedrock_adapter.py covers 15 cases across LLM and
  embedding adapters: legacy-no-auth-type, explicit access_keys with
  valid/blank/whitespace keys, iam_role with stale/no keys, unknown
  auth_type rejection, cross-field validation, and preservation of
  unrelated params (model_id, aws_profile_name, region, thinking).

Skipped (P2 nice-to-have):
- Comment-scope clarification, MinIO reference rewording,
  validate-mutates-caller's-dict, and the LLM form description nit
  about aws_profile_name visibility. These don't change behaviour
  and can be addressed in a follow-up.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

* [pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci

---------

Co-authored-by: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>

---------

Co-authored-by: Chandrasekharan M <117059509+chandrasekharan-zipstack@users.noreply.github.com>
Co-authored-by: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Co-authored-by: Athul <89829560+athul-rs@users.noreply.github.com>

* batch notification

---------

Co-authored-by: ali <117142933+muhammad-ali-e@users.noreply.github.com>
Co-authored-by: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Co-authored-by: Ritwik G <100672805+ritwik-g@users.noreply.github.com>
Co-authored-by: Deepak K <89829542+Deepak-Kesavan@users.noreply.github.com>
Co-authored-by: vishnuszipstack <117254672+vishnuszipstack@users.noreply.github.com>
Co-authored-by: Praveen Kumar <praveen@zipstack.com>
Co-authored-by: Chandrasekharan M <117059509+chandrasekharan-zipstack@users.noreply.github.com>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Co-authored-by: Athul <89829560+athul-rs@users.noreply.github.com>
---
 .github/workflows/uv-lock-automation.yaml     |   2 -
 backend/api_v2/notification.py                |   8 +-
 backend/backend/settings/base.py              |  30 +-
 backend/configuration/enums.py                |   6 +
 backend/notification_v2/clubbed_renderer.py   | 138 +++++++++
 backend/notification_v2/enums.py              |  34 +++
 backend/notification_v2/helper.py             | 228 +++++++++++++--
 backend/notification_v2/internal_api_views.py | 265 +++++++++++++++++-
 .../notification_v2/internal_serializers.py   |   1 +
 backend/notification_v2/internal_urls.py      |  11 +
 .../0003_add_notification_buffer.py           | 148 ++++++++++
 backend/notification_v2/models.py             | 109 ++++++-
 backend/notification_v2/serializers.py        |  15 +-
 backend/notification_v2/tasks.py              |  51 ++++
 backend/notification_v2/tests/__init__.py     |   0
 backend/notification_v2/urls.py               |   9 +-
 backend/notification_v2/views.py              |  60 +++-
 backend/pipeline_v2/notification.py           |   9 +-
 backend/utils/cors_origin.py                  |  81 ++++++
 backend/utils/log_events.py                   |   8 +-
 backend/utils/tests/test_cors_origin.py       | 197 +++++++++++++
 .../notification-modal/CreateNotification.jsx |  63 ++++-
 .../settings/platform/PlatformSettings.jsx    |  95 ++++++-
 .../sdk1/src/unstract/sdk1/adapters/base1.py  |  93 +++++-
 .../adapters/embedding1/static/bedrock.json   |  68 ++++-
 .../sdk1/adapters/llm1/static/bedrock.json    |  66 ++++-
 unstract/sdk1/tests/test_bedrock_adapter.py   | 246 ++++++++++++++++
 .../process_notification_buffer.py            |  83 ++++++
 workers/log_consumer/scheduler.sh             |  48 ++--
 .../shared/patterns/notification/helper.py    | 129 ++++++---
 30 files changed, 2168 insertions(+), 133 deletions(-)
 create mode 100644 backend/notification_v2/clubbed_renderer.py
 create mode 100644 backend/notification_v2/migrations/0003_add_notification_buffer.py
 create mode 100644 backend/notification_v2/tasks.py
 delete mode 100644 backend/notification_v2/tests/__init__.py
 create mode 100644 backend/utils/cors_origin.py
 create mode 100644 backend/utils/tests/test_cors_origin.py
 create mode 100644 unstract/sdk1/tests/test_bedrock_adapter.py
 create mode 100755 workers/log_consumer/process_notification_buffer.py

diff --git a/.github/workflows/uv-lock-automation.yaml b/.github/workflows/uv-lock-automation.yaml
index 8cfc2f9ca2..52c3364386 100644
--- a/.github/workflows/uv-lock-automation.yaml
+++ b/.github/workflows/uv-lock-automation.yaml
@@ -36,8 +36,6 @@ jobs:
           version: "0.6.14"
           python-version: 3.12.9
 
-      - run: uv pip install --python=3.12.9 pip
-
       - name: Generate UV lockfiles
         env:
           GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
diff --git a/backend/api_v2/notification.py b/backend/api_v2/notification.py
index 57e810c0e9..4cefe92d24 100644
--- a/backend/api_v2/notification.py
+++ b/backend/api_v2/notification.py
@@ -1,6 +1,6 @@
 import logging
 
-from notification_v2.helper import NotificationHelper
+from notification_v2.helper import dispatch_with_delivery_mode
 from notification_v2.models import Notification
 from pipeline_v2.dto import PipelineStatusPayload
 from workflow_manager.workflow_v2.enums import ExecutionStatus
@@ -60,6 +60,8 @@ def send(self) -> None:
             failed_files=failed_files,
         )
 
-        NotificationHelper.send_notification(
-            notifications=self.notifications, payload=payload_dto.to_dict()
+        dispatch_with_delivery_mode(
+            list(self.notifications),
+            payload_dto.to_dict(),
+            error_context=f"api={self.api.id}",
         )
diff --git a/backend/backend/settings/base.py b/backend/backend/settings/base.py
index 2d493a91c3..f20109203f 100644
--- a/backend/backend/settings/base.py
+++ b/backend/backend/settings/base.py
@@ -12,11 +12,12 @@
 import logging
 import os
 from pathlib import Path
-from urllib.parse import quote, urlparse
+from urllib.parse import quote
 
 import httpx
 from dotenv import find_dotenv, load_dotenv
 from utils.common_utils import CommonUtils
+from utils.cors_origin import normalize_web_app_origin
 
 missing_settings = []
 
@@ -68,10 +69,18 @@ def get_required_setting(setting_key: str, default: str | None = None) -> str |
 )
 # Maximum number of files allowed per workflow page execution
 WORKFLOW_PAGE_MAX_FILES = int(os.environ.get("WORKFLOW_PAGE_MAX_FILES", 2))
-WEB_APP_ORIGIN_URL = os.environ.get("WEB_APP_ORIGIN_URL", "http://localhost:3000")
-parsed_url = urlparse(WEB_APP_ORIGIN_URL)
-WEB_APP_ORIGIN_URL_WITH_WILD_CARD = f"{parsed_url.scheme}://*.{parsed_url.netloc}"
+(
+    WEB_APP_ORIGIN_URL,
+    WEB_APP_ORIGIN_URL_WITH_WILD_CARD,
+    _CORS_SUBDOMAIN_REGEX,
+) = normalize_web_app_origin(
+    os.environ.get("WEB_APP_ORIGIN_URL", "http://localhost:3000")
+)
 CORS_ALLOWED_ORIGINS = [WEB_APP_ORIGIN_URL]
+# Wildcard subdomain regex consumed by django-cors-headers and (via the
+# RegexOrigin wrapper in utils/log_events.py) by the SocketIO engine.io
+# handshake — a single source of truth so HTTP and WS CORS cannot diverge.
+CORS_ALLOWED_ORIGIN_REGEXES = [_CORS_SUBDOMAIN_REGEX]
 
 DJANGO_APP_BACKEND_URL = os.environ.get("DJANGO_APP_BACKEND_URL", "http://localhost:8000")
 INTERNAL_SERVICE_API_KEY = os.environ.get("INTERNAL_SERVICE_API_KEY")
@@ -210,6 +219,15 @@ def get_required_setting(setting_key: str, default: str | None = None) -> str |
 
 INDEXING_FLAG_TTL = int(get_required_setting("INDEXING_FLAG_TTL"))
 NOTIFICATION_TIMEOUT = int(get_required_setting("NOTIFICATION_TIMEOUT", "5"))
+# Window for clubbing BATCHED notifications — also the flush cadence (seconds).
+# Default 1800 (30 min). Per-notification buffer rows precompute flush_after at
+# enqueue time, so changing this only affects rows enqueued after the restart.
+NOTIFICATION_CLUB_INTERVAL = int(os.environ.get("NOTIFICATION_CLUB_INTERVAL", "1800"))
+# Retention for terminal NotificationBuffer rows (DISPATCHED / DEAD_LETTER).
+# PENDING rows are never GC'd regardless of age.
+NOTIFICATION_BUFFER_RETENTION_DAYS = int(
+    os.environ.get("NOTIFICATION_BUFFER_RETENTION_DAYS", "7")
+)
 ATOMIC_REQUESTS = CommonUtils.str_to_bool(
     os.environ.get("DJANGO_ATOMIC_REQUESTS", "False")
 )
@@ -689,4 +707,6 @@ def filter(self, record):
     )
     raise ValueError(ERROR_MESSAGE)
 
-ENABLE_HIGHLIGHT_API_DEPLOYMENT = os.environ.get("ENABLE_HIGHLIGHT_API_DEPLOYMENT", False)
+ENABLE_HIGHLIGHT_API_DEPLOYMENT = CommonUtils.str_to_bool(
+    os.environ.get("ENABLE_HIGHLIGHT_API_DEPLOYMENT", "False")
+)
diff --git a/backend/configuration/enums.py b/backend/configuration/enums.py
index f35033a9f7..a11a0b58e7 100644
--- a/backend/configuration/enums.py
+++ b/backend/configuration/enums.py
@@ -61,6 +61,12 @@ class ConfigKey(Enum):
         max_value=settings.MAX_PARALLEL_FILE_BATCHES_MAX_VALUE,
     )
 
+    NOTIFICATION_CLUB_INTERVAL = ConfigSpec(
+        default=settings.NOTIFICATION_CLUB_INTERVAL,
+        value_type=ConfigType.INT,
+        help_text="Window (seconds) for clubbing BATCHED notifications.",
+    )
+
     def cast_value(self, raw_value: Any):
         converters = {
             ConfigType.INT: int,
diff --git a/backend/notification_v2/clubbed_renderer.py b/backend/notification_v2/clubbed_renderer.py
new file mode 100644
index 0000000000..6fd0de0a84
--- /dev/null
+++ b/backend/notification_v2/clubbed_renderer.py
@@ -0,0 +1,138 @@
+"""Clubbed notification renderer.
+
+Builds one canonical JSON envelope from a group of buffered execution events
+and emits the platform-appropriate dispatch payload. Stays separate from the
+single-event SlackWebhook / APIWebhook providers so immediate-dispatch behavior
+stays untouched.
+
+Envelope shape (always the same — single-event groups use this too so consumers
+never need to branch on "is this batched?"):
+
+    {
+        "kind": "batch",
+        "summary": {
+            "pipeline": "<name>",
+            "interval_minutes": 30,
+            "total": N, "succeeded": S, "failed": F
+        },
+        "events": [{"execution_id": ..., "status": ..., "error": ...?}, ...]
+    }
+"""
+
+from __future__ import annotations
+
+import logging
+from typing import Any
+
+from notification_v2.enums import PlatformType
+
+logger = logging.getLogger(__name__)
+
+# Hard cap on events per dispatch — extras roll over to the next flush tick.
+# Bounds memory + payload size and prevents a runaway backlog from creating an
+# unbounded HTTP body.
+MAX_BATCH_SIZE = 500
+# How many events Slack renders inline before collapsing the rest under a
+# "… and K more" footer. Slack tolerates much larger payloads, but readability
+# tanks past ~25 lines.
+SLACK_MAX_DISPLAY_EVENTS = 25
+
+_SUCCESS_STATUSES = {"COMPLETED", "SUCCESS"}
+
+
+def _is_success(status: str | None) -> bool:
+    if not status:
+        return False
+    return status.upper() in _SUCCESS_STATUSES
+
+
+def _event_from_payload(payload: dict[str, Any]) -> dict[str, Any]:
+    event: dict[str, Any] = {
+        "execution_id": payload.get("execution_id"),
+        "status": payload.get("status"),
+    }
+    error_message = payload.get("error_message")
+    if error_message:
+        event["error"] = error_message
+    return event
+
+
+def build_envelope(
+    payloads: list[dict[str, Any]], interval_seconds: int
+) -> dict[str, Any]:
+    """Build the canonical batch envelope.
+
+    Caps the events list at MAX_BATCH_SIZE; oldest-first ordering is the
+    caller's responsibility (the flush job sorts by created_at).
+    """
+    capped = payloads[:MAX_BATCH_SIZE]
+    succeeded = sum(1 for p in capped if _is_success(p.get("status")))
+    failed = len(capped) - succeeded
+    # Multiple pipelines can share an (org, url, auth_sig) group; we surface
+    # the first one's name as a representative. Mixed-pipeline batches are
+    # rare in practice and a v2 enhancement would aggregate distinct names.
+    pipeline_name = capped[0].get("pipeline_name") if capped else None
+    return {
+        "kind": "batch",
+        "summary": {
+            "pipeline": pipeline_name,
+            "interval_minutes": max(1, interval_seconds // 60),
+            "total": len(capped),
+            "succeeded": succeeded,
+            "failed": failed,
+        },
+        "events": [_event_from_payload(p) for p in capped],
+    }
+
+
+def _slack_event_line(event: dict[str, Any]) -> str:
+    parts = [f"— {event.get('execution_id') or 'unknown'}: {event.get('status')}"]
+    if event.get("error"):
+        parts.append(f"({event['error']})")
+    return " ".join(parts)
+
+
+def render_for_slack(envelope: dict[str, Any]) -> dict[str, Any]:
+    """Format the envelope as a Slack-compatible payload dict.
+
+    Returns the body shape Slack incoming webhooks expect (`text` field with
+    mrkdwn). Truncates inline events at SLACK_MAX_DISPLAY_EVENTS.
+    """
+    summary = envelope["summary"]
+    events: list[dict[str, Any]] = envelope["events"]
+    pipeline = summary.get("pipeline") or "pipeline"
+
+    header = f"*[Unstract] {summary['total']} executions for `{pipeline}`*"
+    counts = f"✅ {summary['succeeded']} succeeded  ❌ {summary['failed']} failed"
+
+    visible = events[:SLACK_MAX_DISPLAY_EVENTS]
+    lines = [_slack_event_line(e) for e in visible]
+    overflow = len(events) - len(visible)
+    if overflow > 0:
+        lines.append(f"… and {overflow} more executions")
+
+    body = "\n".join([header, counts, *lines])
+    return {"text": body}
+
+
+def render_clubbed_message(
+    payloads: list[dict[str, Any]], platform: str, interval_seconds: int
+) -> dict[str, Any]:
+    """Top-level entry point — returns the dispatch body for ``platform``.
+
+    Slack receives the rendered text payload; raw API webhooks receive the
+    canonical envelope unchanged so downstream consumers can parse it
+    programmatically.
+    """
+    envelope = build_envelope(payloads, interval_seconds)
+    if platform == PlatformType.SLACK.value:
+        return render_for_slack(envelope)
+    if platform == PlatformType.API.value:
+        return envelope
+    # Unknown platform — fall back to the raw envelope and warn so misrouted
+    # rows don't drop silently.
+    logger.warning(
+        "Unknown platform %s for clubbed dispatch; returning raw envelope",
+        platform,
+    )
+    return envelope
diff --git a/backend/notification_v2/enums.py b/backend/notification_v2/enums.py
index 991b08cac9..d6fed8b485 100644
--- a/backend/notification_v2/enums.py
+++ b/backend/notification_v2/enums.py
@@ -36,3 +36,37 @@ class PlatformType(Enum):
     @classmethod
     def choices(cls):
         return [(e.value, e.name.replace("_", " ").capitalize()) for e in cls]
+
+
+class DeliveryMode(Enum):
+    """Per-notification dispatch mode.
+
+    IMMEDIATE fires on every workflow completion (pre-existing behavior).
+    BATCHED buffers events into NotificationBuffer and flushes them as one
+    clubbed message per (org, webhook_url, auth_sig) every
+    NOTIFICATION_CLUB_INTERVAL seconds.
+    """
+
+    IMMEDIATE = "IMMEDIATE"
+    BATCHED = "BATCHED"
+
+    @classmethod
+    def choices(cls):
+        return [(e.value, e.name.replace("_", " ").capitalize()) for e in cls]
+
+
+class BufferStatus(Enum):
+    """Lifecycle states for a NotificationBuffer row.
+
+    PENDING       — waiting for the next flush tick.
+    DISPATCHED    — successfully sent as part of a clubbed message.
+    DEAD_LETTER   — Celery exhausted retries; terminal, never re-picked.
+    """
+
+    PENDING = "PENDING"
+    DISPATCHED = "DISPATCHED"
+    DEAD_LETTER = "DEAD_LETTER"
+
+    @classmethod
+    def choices(cls):
+        return [(e.value, e.name.replace("_", " ").capitalize()) for e in cls]
diff --git a/backend/notification_v2/helper.py b/backend/notification_v2/helper.py
index a454b9d82b..f217f2da18 100644
--- a/backend/notification_v2/helper.py
+++ b/backend/notification_v2/helper.py
@@ -1,35 +1,223 @@
+import hashlib
 import logging
+from collections.abc import Iterable
+from datetime import timedelta
 from typing import Any
 
-from notification_v2.enums import NotificationType, PlatformType
-from notification_v2.models import Notification
+from account_v2.models import Organization
+from django.utils import timezone
+
+from notification_v2.enums import (
+    AuthorizationType,
+    BufferStatus,
+    DeliveryMode,
+    NotificationType,
+    PlatformType,
+)
+from notification_v2.models import Notification, NotificationBuffer
 from notification_v2.provider.notification_provider import NotificationProvider
 from notification_v2.provider.registry import get_notification_provider
 
 logger = logging.getLogger(__name__)
 
+# Placeholder for an unset auth field in the salt-free SHA-256 grouping input;
+# collisions are vanishingly improbable and the digest is never a security primitive.
+_AUTH_SIG_NONE = ""
+
+
+def compute_auth_sig(notification: Notification) -> str:
+    """Return the grouping signature for a notification's auth config.
+
+    The signature is the SHA-256 hex digest of auth type, key and header
+    joined with "|", so raw credentials never reach the buffer table. Equal
+    configs share a signature and club together; different ones split.
+    """
+    auth_parts = (
+        notification.authorization_type,
+        notification.authorization_key,
+        notification.authorization_header,
+    )
+    joined = "|".join(part or _AUTH_SIG_NONE for part in auth_parts)
+    return hashlib.sha256(joined.encode("utf-8")).hexdigest()
+
+
+def webhook_url_hash(url: str | None) -> str:
+    """Log-safe URL fingerprint: first 8 hex chars of SHA-256, or "none"."""
+    if url:
+        return hashlib.sha256(url.encode("utf-8")).hexdigest()[:8]
+    return "none"
+
+
+def get_org_club_interval_seconds(organization: Organization) -> int:
+    """Return the clubbing interval, in seconds, that applies to ``organization``.
+
+    Looks up ConfigKey.NOTIFICATION_CLUB_INTERVAL in the generic configuration
+    KV table; an org without an override gets the env-derived default.
+
+    Callers read this at enqueue time and bake it into the row's flush_after
+    (mfbt §EC-2 / §EC-8), so a changed override only affects later rows.
+    """
+    # Imported lazily: configuration needs Django settings at import time,
+    # while notification_v2.helper is already imported during app boot.
+    from configuration.enums import ConfigKey
+    from configuration.models import Configuration
+
+    configured_value = Configuration.get_value_by_organization(
+        ConfigKey.NOTIFICATION_CLUB_INTERVAL, organization
+    )
+    return int(configured_value)
+
+
+def build_webhook_headers(notification: Notification) -> dict[str, str]:
+    """Return the HTTP headers for dispatching to this notification's webhook.
+
+    Kept in step with ``provider/webhook/webhook.py`` and the worker-side
+    ``get_webhook_headers`` so clubbed and immediate dispatches send identical
+    headers for the same auth config.
+    """
+    scheme = (notification.authorization_type or "").upper()
+    secret = notification.authorization_key
+    custom_name = notification.authorization_header
+    headers = {"Content-Type": "application/json"}
+    if not secret:
+        # Every auth scheme needs a key; without one only Content-Type is sent.
+        return headers
+    if scheme == AuthorizationType.BEARER.value:
+        headers["Authorization"] = f"Bearer {secret}"
+    elif scheme == AuthorizationType.API_KEY.value:
+        headers["Authorization"] = secret
+    elif scheme == AuthorizationType.CUSTOM_HEADER.value and custom_name:
+        # Custom scheme: the key travels under the caller-chosen header name.
+        headers[custom_name] = secret
+    return headers
+
+
+def _resolve_organization(notification: Notification) -> Organization | None:
+    """Return the owning org via the pipeline FK, else the api FK, else None."""
+    # Notification has no direct organization FK, so go through its parents.
+    for fk_name in ("pipeline", "api"):
+        # getattr keeps the api lookup lazy: it only runs if pipeline fails.
+        owner = getattr(notification, fk_name)
+        if owner and owner.organization_id:
+            return owner.organization
+    return None
+
+
+def split_by_delivery_mode(
+    notifications: "Iterable[Notification]",
+) -> tuple[list[Notification], list[Notification]]:
+    """Split into (immediate, batched); non-BATCHED modes count as IMMEDIATE."""
+    immediate: list[Notification] = []
+    batched: list[Notification] = []
+    batched_value = DeliveryMode.BATCHED.value
+    for item in notifications:
+        # Anything that is not explicitly BATCHED takes the immediate path.
+        bucket = batched if item.delivery_mode == batched_value else immediate
+        bucket.append(item)
+    return immediate, batched
+
+
+def dispatch_with_delivery_mode(
+    notifications: "Iterable[Notification]",
+    payload: dict[str, Any],
+    *,
+    error_context: str = "",
+) -> None:
+    """Route each notification down its IMMEDIATE or BATCHED path.
+
+    IMMEDIATE rows go to NotificationHelper.send_notification in one call.
+    BATCHED rows are enqueued into NotificationBuffer one by one; a failed
+    enqueue is logged and the loop moves on to the remaining notifications.
+    ``error_context`` is appended to that log line so callers can tag the
+    dispatch source (pipeline id, api id) for easier triage.
+    """
+    immediate, batched = split_by_delivery_mode(notifications)
+    if immediate:
+        NotificationHelper.send_notification(notifications=immediate, payload=payload)
+    context_suffix = f" ({error_context})" if error_context else ""
+    for notification in batched:
+        try:
+            enqueue(notification, payload)
+        except Exception:
+            logger.exception(
+                "Failed to enqueue BATCHED notification %s%s",
+                notification.id,
+                context_suffix,
+            )
+
+
+def enqueue(notification: Notification, payload: dict[str, Any]) -> NotificationBuffer:
+    """Persist one execution event as a PENDING NotificationBuffer row.
+
+    auth_sig and flush_after are frozen at write time, so rows already
+    PENDING keep their cadence and grouping even if
+    NOTIFICATION_CLUB_INTERVAL or the notification's auth changes mid-window.
+
+    Returns the persisted row. Raises ValueError when no organization can be
+    resolved (defensive — the pipeline/api FK chain provides one in practice).
+    """
+    owner_org = _resolve_organization(notification)
+    if owner_org is None:
+        raise ValueError(
+            f"Notification {notification.id} has no resolvable organization "
+            "(neither pipeline nor api FK populated)"
+        )
+
+    club_window = timedelta(seconds=get_org_club_interval_seconds(owner_org))
+    due_at = timezone.now() + club_window
+    auth_signature = compute_auth_sig(notification)
+    target_platform = notification.platform or PlatformType.API.value
+
+    row = NotificationBuffer.objects.create(
+        notification=notification,
+        organization=owner_org,
+        webhook_url=notification.url,
+        payload=payload,
+        platform=target_platform,
+        auth_sig=auth_signature,
+        flush_after=due_at,
+        status=BufferStatus.PENDING.value,
+    )
+
+    # Structured log for metrics consumers that grep on metric=. Carries the
+    # org id and a URL fingerprint only — never the raw URL or auth tuple.
+    logger.info(
+        "metric=notification_buffer_enqueued_total platform=%s org_id=%s "
+        "webhook_url_hash=%s notification_id=%s buffer_id=%s flush_after=%s",
+        target_platform,
+        owner_org.organization_id,
+        webhook_url_hash(notification.url),
+        notification.id,
+        row.id,
+        due_at.isoformat(),
+    )
+    return row
+
 
 class NotificationHelper:
     @classmethod
     def send_notification(cls, notifications: list[Notification], payload: Any) -> None:
-        """Send notification Sends notifications using the appropriate provider
-        based on the notification type and platform.
+        """Dispatch IMMEDIATE notifications via the registered provider.
 
-        This method iterates through a list of `Notification` objects, determines the
-        appropriate notification provider based on the notification's type and
-        platform, and sends the notification with the provided payload. If an error
-        occurs due to an invalid notification type or platform, it logs the error.
+        Iterates over notifications, resolves the provider for each
+        (notification_type, platform) pair, and fires the webhook task. BATCHED
+        notifications must be routed to ``enqueue()`` instead — callers branch
+        on ``notification.delivery_mode`` before reaching this method.
 
         Args:
-            notifications (list[Notification]): A list of `Notification` instances to
-                be processed and sent.
-            payload (Any): The data to be sent with the notification. This can be any
-                format expected by the provider
-
-        Returns:
-                None
+            notifications: Active Notification rows to dispatch synchronously.
+            payload: Provider-specific payload (typically a dict).
         """
         for notification in notifications:
+            if notification.delivery_mode == DeliveryMode.BATCHED.value:
+                # Callers should not reach here for BATCHED — log loudly so
+                # routing regressions are visible without breaking dispatch.
+                logger.warning(
+                    "BATCHED notification %s reached IMMEDIATE dispatch path; "
+                    "skipping. Caller must branch on delivery_mode.",
+                    notification.id,
+                )
+                continue
             notification_type = NotificationType(notification.notification_type)
             platform_type = PlatformType(notification.platform)
             try:
@@ -40,9 +228,13 @@ def send_notification(cls, notifications: list[Notification], payload: Any) -> N
                     notification=notification, payload=payload
                 )
                 notifier.send()
-                logger.info(f"Sending notification to {notification}")
+                logger.info("Sending notification to %s", notification)
             except ValueError as e:
                 logger.error(
-                    f"Error in notification type {notification_type} and platform "
-                    f"{platform_type} for notification {notification}: {e}"
+                    "Error in notification type %s and platform %s for "
+                    "notification %s: %s",
+                    notification_type,
+                    platform_type,
+                    notification,
+                    e,
                 )
diff --git a/backend/notification_v2/internal_api_views.py b/backend/notification_v2/internal_api_views.py
index 3e3f386b17..396bfb2081 100644
--- a/backend/notification_v2/internal_api_views.py
+++ b/backend/notification_v2/internal_api_views.py
@@ -9,13 +9,18 @@
 - These endpoints are not accessible from browsers and don't use session cookies
 """
 
+import json
 import logging
+from datetime import timedelta
 from typing import Any, cast
 
 from api_v2.models import APIDeployment
-from django.db.models import QuerySet
+from django.conf import settings
+from django.db import transaction
+from django.db.models import Min, QuerySet
 from django.http import HttpRequest, JsonResponse
 from django.shortcuts import get_object_or_404
+from django.utils import timezone
 from django.views.decorators.csrf import csrf_exempt
 from django.views.decorators.http import require_http_methods
 from pipeline_v2.models import Pipeline
@@ -23,7 +28,16 @@
 from workflow_manager.workflow_v2.enums import ExecutionStatus
 from workflow_manager.workflow_v2.models.execution import WorkflowExecution
 
-from notification_v2.models import Notification
+from backend.celery_service import app as celery_app
+from notification_v2.clubbed_renderer import render_clubbed_message
+from notification_v2.enums import BufferStatus, DeliveryMode
+from notification_v2.helper import (
+    build_webhook_headers,
+    enqueue,
+    get_org_club_interval_seconds,
+    webhook_url_hash,
+)
+from notification_v2.models import Notification, NotificationBuffer
 
 logger = logging.getLogger(__name__)
 
@@ -89,6 +103,9 @@ def _serialize_notification(n: Notification) -> dict[str, Any]:
         "max_retries": n.max_retries,
         "is_active": n.is_active,
         "notify_on_failures": n.notify_on_failures,
+        # Drives the worker-side IMMEDIATE-vs-BATCHED branch in
+        # workers/shared/patterns/notification/helper.py.
+        "delivery_mode": n.delivery_mode,
     }
 
 
@@ -271,3 +288,247 @@ def get_api_data(request: HttpRequest, api_id: str) -> JsonResponse:
         return JsonResponse(
             {"status": "error", "message": INTERNAL_SERVER_ERROR_MSG}, status=500
         )
+
+
+# Fields the enqueue endpoint requires in its JSON body; a field that is
+# absent or falsy is reported as missing. Worker-side serialization supplies
+# them — keep in sync with workers/shared/patterns/notification/helper.py.
+_ENQUEUE_REQUIRED_FIELDS = (
+    "notification_id",
+    "execution_id",
+    "pipeline_id",
+    "pipeline_name",
+    "status",
+    "platform",
+)
+
+
+@csrf_exempt  # Safe: Internal API with Bearer token auth, service-to-service only
+@require_http_methods(["POST"])
+def enqueue_notification_buffer(request: HttpRequest) -> JsonResponse:
+    """Buffer one execution event from a callback worker.
+
+    Worker code is model-free: it forwards a notification_id + structured
+    payload here and lets the backend write the NotificationBuffer row.
+    Rejects rows whose source notification is not BATCHED so a worker
+    routing bug cannot silently divert IMMEDIATE traffic into the buffer.
+
+    Responses: 201 with buffer_row_id on success; 400 for a body that is not
+    a JSON object, misses required fields, or has no resolvable org; 404 for
+    an unknown or malformed notification_id; 409 for a non-BATCHED one.
+    """
+    # Local import: ValidationError is only needed by this view.
+    from django.core.exceptions import ValidationError
+
+    try:
+        body = json.loads(request.body.decode("utf-8") or "{}")
+    except ValueError:
+        # JSONDecodeError and UnicodeDecodeError are both ValueError subclasses.
+        body = None
+    if not isinstance(body, dict):
+        # Valid JSON that is not an object has no .get(); return 400, not a 500.
+        return JsonResponse(
+            {"status": "error", "message": "Invalid JSON body"}, status=400
+        )
+
+    missing = [f for f in _ENQUEUE_REQUIRED_FIELDS if not body.get(f)]
+    if missing:
+        message = f"Missing required fields: {', '.join(missing)}"
+        return JsonResponse({"status": "error", "message": message}, status=400)
+
+    try:
+        notification = Notification.objects.get(id=body["notification_id"])
+    except (Notification.DoesNotExist, ValidationError, ValueError):
+        # A malformed id (e.g. not a valid UUID) can never match a row.
+        return JsonResponse(
+            {"status": "error", "message": "Notification not found"}, status=404
+        )
+
+    if notification.delivery_mode != DeliveryMode.BATCHED.value:
+        # Hard-fail rather than silently auto-correcting — surfaces worker
+        # routing regressions instead of letting them drain into the buffer.
+        message = "Notification delivery_mode is not BATCHED; refuse to enqueue"
+        return JsonResponse({"status": "error", "message": message}, status=409)
+
+    payload = {
+        "execution_id": body["execution_id"],
+        "pipeline_id": body["pipeline_id"],
+        "pipeline_name": body["pipeline_name"],
+        "status": body["status"],
+        "error_message": body.get("error_message"),
+        "platform": body["platform"],
+    }
+    try:
+        buffer_row = enqueue(notification, payload)
+    except ValueError as e:
+        return JsonResponse({"status": "error", "message": str(e)}, status=400)
+
+    return JsonResponse(
+        {"status": "success", "buffer_row_id": str(buffer_row.id)}, status=201
+    )
+
+
+def _gc_terminal_rows() -> int:
+    """Purge DISPATCHED / DEAD_LETTER rows older than the retention window.
+
+    PENDING rows stay regardless of age — the flush job still owns them.
+    """
+    retention_days = settings.NOTIFICATION_BUFFER_RETENTION_DAYS
+    oldest_kept = timezone.now() - timedelta(days=retention_days)
+    terminal = [BufferStatus.DISPATCHED.value, BufferStatus.DEAD_LETTER.value]
+    expired = NotificationBuffer.objects.filter(
+        status__in=terminal, created_at__lt=oldest_kept
+    )
+    return int(expired.delete()[0])
+
+
+def _dispatch_group(
+    org_id: Any,
+    webhook_url: str,
+    auth_sig: str,
+) -> tuple[int, int]:
+    """Dispatch a single (org, url, auth_sig) group; returns (rows, succeeded).
+
+    Caller already filtered groups to MIN(flush_after) <= now. Rows are locked
+    with SKIP LOCKED so a sibling replica skips them rather than blocking, and
+    auth is read live from the source Notification (it may have been edited
+    since enqueue). Returns (0, 0) if nothing was locked or the broker failed.
+    """
+    with transaction.atomic():
+        rows = list(
+            NotificationBuffer.objects.select_for_update(skip_locked=True)
+            .filter(
+                status=BufferStatus.PENDING.value,
+                organization_id=org_id,
+                webhook_url=webhook_url,
+                auth_sig=auth_sig,
+            )
+            .order_by("created_at")[:_PROCESS_BUFFER_CAP]
+        )
+        if not rows:
+            # Either another replica claimed the rows (SKIP LOCKED) or they
+            # transitioned out of PENDING between the GROUP BY scan and the
+            # row-level lock. Either way: nothing to do here.
+            return 0, 0
+
+        # Live auth — read from the FIRST row's notification. If multiple
+        # notifications collide on (url, auth_sig) we have, by definition,
+        # identical auth, so this is safe.
+        first_notification = rows[0].notification
+        platform = rows[0].platform
+        payloads = [r.payload for r in rows]
+        # Per-org interval read here is cosmetic — used only for the
+        # `interval_minutes` field in the rendered message body. The
+        # cadence-controlling read happened at enqueue time and is
+        # already baked into each row's flush_after (mfbt §EC-2).
+        interval_seconds = get_org_club_interval_seconds(rows[0].organization)
+        body = render_clubbed_message(payloads, platform, interval_seconds)
+        headers = build_webhook_headers(first_notification)
+
+        buffer_ids = [str(r.id) for r in rows]
+        try:
+            celery_app.send_task(
+                "send_webhook_notification",
+                args=[
+                    first_notification.url,
+                    body,
+                    headers,
+                    settings.NOTIFICATION_TIMEOUT,
+                ],
+                kwargs={
+                    "max_retries": first_notification.max_retries,
+                    "retry_delay": 10,
+                    "platform": platform,
+                },
+                queue="notifications",
+                link_error=celery_app.signature(
+                    "notification_v2.mark_buffer_dead_letter",
+                    kwargs={"buffer_row_ids": buffer_ids},
+                ),
+            )
+        except Exception:
+            # Broker hiccup — leave rows PENDING for the next tick rather
+            # than mark them DEAD_LETTER. `exception` keeps stack context.
+            logger.exception(
+                "Broker dispatch failed for group org=%s url_hash=%s",
+                org_id,
+                webhook_url_hash(webhook_url),
+            )
+            return 0, 0
+
+        now = timezone.now()
+        NotificationBuffer.objects.filter(id__in=buffer_ids).update(
+            status=BufferStatus.DISPATCHED.value,
+            dispatched_at=now,
+        )
+        logger.info(
+            "metric=notification_batch_dispatched_total platform=%s result=success "
+            "org_id=%s webhook_url_hash=%s rows=%d",
+            platform,
+            org_id,
+            webhook_url_hash(webhook_url),
+            len(rows),
+        )
+        return len(rows), len(rows)
+
+
+# Per-group row cap, read by _dispatch_group at call time. Matches the
+# renderer's MAX_BATCH_SIZE so rendered events and dispatched rows stay in
+# lock-step; anything beyond it rolls into the next flush tick.
+_PROCESS_BUFFER_CAP = 500
+
+
+@csrf_exempt  # Safe: Internal API with Bearer token auth, service-to-service only
+@require_http_methods(["POST"])
+def process_notification_buffer(request: HttpRequest) -> JsonResponse:
+    """Flush every due PENDING group, then garbage-collect terminal rows.
+
+    Steps:
+    1. GROUP BY (org, url, auth_sig), HAVING MIN(flush_after) <= NOW().
+    2. Hand each group to _dispatch_group, which locks, renders, queues one
+       Celery task and marks the rows DISPATCHED in its own transaction.
+    3. Sweep terminal rows older than NOTIFICATION_BUFFER_RETENTION_DAYS.
+
+    Parallel calls are safe: SELECT FOR UPDATE SKIP LOCKED lets each replica
+    skip rows another worker is already dispatching.
+    """
+    now = timezone.now()
+    # A group is due once its earliest row has reached flush_after.
+    pending = NotificationBuffer.objects.filter(status=BufferStatus.PENDING.value)
+    due_groups = list(
+        pending.values("organization_id", "webhook_url", "auth_sig")
+        .annotate(earliest_flush=Min("flush_after"))
+        .filter(earliest_flush__lte=now)
+    )
+
+    group_total = 0
+    row_total = 0
+    for due in due_groups:
+        org_id, url = due["organization_id"], due["webhook_url"]
+        try:
+            handled, _succeeded = _dispatch_group(
+                org_id=org_id, webhook_url=url, auth_sig=due["auth_sig"]
+            )
+        except Exception:
+            # One failing group must not block the remaining groups.
+            logger.exception(
+                "Failed dispatching group org=%s url_hash=%s",
+                org_id,
+                webhook_url_hash(url),
+            )
+            continue
+        if handled > 0:
+            group_total += 1
+            row_total += handled
+
+    gc_deleted = _gc_terminal_rows()
+    summary = {
+        "status": "success",
+        "dispatched_groups": group_total,
+        "dispatched_rows": row_total,
+        # DEAD_LETTER transitions are async (Celery link_error) — this
+        # response only covers transitions visible to this request.
+        "dead_letter_rows": 0,
+        "gc_deleted_rows": gc_deleted,
+    }
+    return JsonResponse(summary)
diff --git a/backend/notification_v2/internal_serializers.py b/backend/notification_v2/internal_serializers.py
index 94669d64a4..db7a35ab32 100644
--- a/backend/notification_v2/internal_serializers.py
+++ b/backend/notification_v2/internal_serializers.py
@@ -23,6 +23,7 @@ class Meta:
             "platform",
             "max_retries",
             "is_active",
+            "delivery_mode",
             "created_at",
             "modified_at",
             "pipeline",
diff --git a/backend/notification_v2/internal_urls.py b/backend/notification_v2/internal_urls.py
index 0414761089..a0f87f0250 100644
--- a/backend/notification_v2/internal_urls.py
+++ b/backend/notification_v2/internal_urls.py
@@ -21,6 +21,17 @@
 router.register(r"", WebhookInternalViewSet, basename="webhook-internal")
 
 urlpatterns = [
+    # Buffered (clubbed) notification dispatch endpoints
+    path(
+        "buffer/enqueue/",
+        internal_api_views.enqueue_notification_buffer,
+        name="enqueue_notification_buffer",
+    ),
+    path(
+        "buffer/process/",
+        internal_api_views.process_notification_buffer,
+        name="process_notification_buffer",
+    ),
     # Notification data endpoints for workers
     path(
         "pipeline/<str:pipeline_id>/notifications/",
diff --git a/backend/notification_v2/migrations/0003_add_notification_buffer.py b/backend/notification_v2/migrations/0003_add_notification_buffer.py
new file mode 100644
index 0000000000..7f5224849f
--- /dev/null
+++ b/backend/notification_v2/migrations/0003_add_notification_buffer.py
@@ -0,0 +1,148 @@
+import uuid
+
+import django.db.models.deletion
+from django.db import migrations, models
+
+
+class Migration(migrations.Migration):
+    dependencies = [
+        ("account_v2", "0001_initial"),
+        ("notification_v2", "0002_notification_notify_on_failures"),
+    ]
+    # Adds Notification.delivery_mode, then NotificationBuffer and its PENDING index.
+    operations = [
+        migrations.AddField(
+            model_name="notification",
+            name="delivery_mode",
+            field=models.CharField(
+                choices=[("IMMEDIATE", "Immediate"), ("BATCHED", "Batched")],
+                default="IMMEDIATE",
+                max_length=16,
+                db_comment=(
+                    "IMMEDIATE fires on every completion (default, unchanged "
+                    "behavior). BATCHED buffers events and dispatches a single "
+                    "clubbed message per (org, webhook_url, auth_sig) every "
+                    "NOTIFICATION_CLUB_INTERVAL."
+                ),
+            ),
+        ),
+        migrations.CreateModel(
+            name="NotificationBuffer",
+            fields=[
+                ("created_at", models.DateTimeField(auto_now_add=True)),
+                ("modified_at", models.DateTimeField(auto_now=True)),
+                (
+                    "id",
+                    models.UUIDField(
+                        default=uuid.uuid4,
+                        editable=False,
+                        primary_key=True,
+                        serialize=False,
+                    ),
+                ),
+                (
+                    "webhook_url",
+                    models.URLField(
+                        db_comment="Denormalized destination URL; grouping key.",
+                    ),
+                ),
+                (
+                    "payload",
+                    models.JSONField(
+                        db_comment=(
+                            "Pre-structured execution data (execution_id, status, "
+                            "error_message, pipeline_name, pipeline_type) — NOT a "
+                            "final rendered message. The renderer formats this at "
+                            "dispatch time."
+                        ),
+                    ),
+                ),
+                (
+                    "platform",
+                    models.CharField(
+                        choices=[("SLACK", "Slack"), ("API", "Api")],
+                        max_length=50,
+                        db_comment=(
+                            "SLACK / API — drives renderer selection at flush time."
+                        ),
+                    ),
+                ),
+                (
+                    "auth_sig",
+                    models.CharField(
+                        max_length=64,
+                        db_comment=(
+                            "SHA-256 hex of (auth_type + auth_key + auth_header), "
+                            "computed at enqueue time. Grouping key — never store "
+                            "raw credentials here."
+                        ),
+                    ),
+                ),
+                (
+                    "flush_after",
+                    models.DateTimeField(
+                        db_comment=(
+                            "created_at + NOTIFICATION_CLUB_INTERVAL, precomputed "
+                            "at enqueue. Read-at-enqueue contract: changing the "
+                            "env var only affects rows enqueued after the restart."
+                        ),
+                    ),
+                ),
+                ("dispatched_at", models.DateTimeField(blank=True, null=True)),
+                (
+                    "status",
+                    models.CharField(
+                        choices=[
+                            ("PENDING", "Pending"),
+                            ("DISPATCHED", "Dispatched"),
+                            ("DEAD_LETTER", "Dead letter"),
+                        ],
+                        default="PENDING",
+                        max_length=16,
+                        db_comment=(
+                            "PENDING -> DISPATCHED on success, "
+                            "PENDING -> DEAD_LETTER on retry exhaustion."
+                        ),
+                    ),
+                ),
+                (
+                    "notification",
+                    models.ForeignKey(
+                        on_delete=django.db.models.deletion.CASCADE,
+                        related_name="buffer_rows",
+                        to="notification_v2.notification",
+                        db_comment=(
+                            "Source Notification. Cascade-delete is intentional: "
+                            "removing a Notification expresses intent to stop all "
+                            "future deliveries, including buffered ones."
+                        ),
+                    ),
+                ),
+                (
+                    "organization",
+                    models.ForeignKey(
+                        on_delete=django.db.models.deletion.CASCADE,
+                        related_name="notification_buffer_rows",
+                        to="account_v2.organization",
+                        db_comment=(
+                            "Tenant scope. Mandatory grouping key — prevents "
+                            "cross-tenant leakage at flush time."
+                        ),
+                    ),
+                ),
+            ],
+            options={
+                "verbose_name": "Notification Buffer",
+                "verbose_name_plural": "Notification Buffers",
+                "db_table": "notification_buffer",
+            },
+        ),
+        migrations.AddIndex(
+            model_name="notificationbuffer",
+            index=models.Index(
+                condition=models.Q(("status", "PENDING")),
+                fields=["organization", "webhook_url", "auth_sig", "flush_after"],
+                name="idx_notif_buffer_pending",
+            ),
+        ),
+    ]
diff --git a/backend/notification_v2/models.py b/backend/notification_v2/models.py
index e5238ec176..a8b077f339 100644
--- a/backend/notification_v2/models.py
+++ b/backend/notification_v2/models.py
@@ -1,13 +1,21 @@
 import uuid
 
+from account_v2.models import Organization
 from api_v2.models import APIDeployment
 from django.db import models
 from pipeline_v2.models import Pipeline
 from utils.models.base_model import BaseModel
 
-from .enums import AuthorizationType, NotificationType, PlatformType
+from .enums import (
+    AuthorizationType,
+    BufferStatus,
+    DeliveryMode,
+    NotificationType,
+    PlatformType,
+)
 
 NOTIFICATION_NAME_MAX_LENGTH = 255
+AUTH_SIG_LENGTH = 64  # SHA-256 hex digest
 
 
 class Notification(BaseModel):
@@ -55,6 +63,16 @@ class Notification(BaseModel):
             "(default), fire on every terminal completion."
         ),
     )
+    delivery_mode = models.CharField(
+        max_length=16,
+        choices=DeliveryMode.choices(),
+        default=DeliveryMode.IMMEDIATE.value,
+        db_comment=(
+            "IMMEDIATE fires on every completion (default, unchanged behavior). "
+            "BATCHED buffers events and dispatches a single clubbed message per "
+            "(org, webhook_url, auth_sig) every NOTIFICATION_CLUB_INTERVAL."
+        ),
+    )
     # Foreign keys to specific models
     pipeline = models.ForeignKey(
         Pipeline,
@@ -100,3 +118,92 @@ def __str__(self):
             f"Notification {self.id}: (Type: {self.notification_type}, "
             f"Platform: {self.platform}, Url: {self.url}))"
         )
+
+
+class NotificationBuffer(BaseModel):
+    """Per-execution event buffered for a BATCHED notification.
+
+    One row is written per workflow completion when the source Notification
+    has delivery_mode=BATCHED. The flush job groups rows by
+    (organization, webhook_url, auth_sig), renders one clubbed message per
+    group, and dispatches via the existing send_webhook_notification Celery
+    task. Group key includes auth_sig because two notifications may share the
+    same URL but use different credentials — they must dispatch separately.
+    """
+
+    id = models.UUIDField(primary_key=True, default=uuid.uuid4, editable=False)
+    notification = models.ForeignKey(
+        Notification,
+        on_delete=models.CASCADE,
+        related_name="buffer_rows",
+        db_comment=(
+            "Source Notification. Cascade-delete is intentional: removing a "
+            "Notification expresses intent to stop all future deliveries, "
+            "including buffered ones."
+        ),
+    )
+    organization = models.ForeignKey(
+        Organization,
+        on_delete=models.CASCADE,
+        related_name="notification_buffer_rows",
+        db_comment=(
+            "Tenant scope. Mandatory grouping key — prevents cross-tenant "
+            "leakage at flush time."
+        ),
+    )
+    webhook_url = models.URLField(
+        db_comment="Denormalized destination URL; grouping key.",
+    )
+    payload = models.JSONField(
+        db_comment=(
+            "Pre-structured execution data (execution_id, status, error_message, "
+            "pipeline_name, pipeline_type) — NOT a final rendered message. The "
+            "renderer formats this at dispatch time."
+        ),
+    )
+    platform = models.CharField(
+        max_length=50,
+        choices=PlatformType.choices(),
+        db_comment="SLACK / API — drives renderer selection at flush time.",
+    )
+    auth_sig = models.CharField(
+        max_length=AUTH_SIG_LENGTH,
+        db_comment=(
+            "SHA-256 hex of (auth_type + auth_key + auth_header), computed at "
+            "enqueue time. Grouping key — never store raw credentials here."
+        ),
+    )
+    flush_after = models.DateTimeField(
+        db_comment=(
+            "created_at + NOTIFICATION_CLUB_INTERVAL, precomputed at enqueue. "
+            "Read-at-enqueue contract: changing the env var only affects rows "
+            "enqueued after the restart."
+        ),
+    )
+    # NOTE(review): presumably set when the row's clubbed message is sent — confirm.
+    dispatched_at = models.DateTimeField(null=True, blank=True)
+    status = models.CharField(
+        max_length=16,
+        choices=BufferStatus.choices(),
+        default=BufferStatus.PENDING.value,
+        db_comment="PENDING -> DISPATCHED on success, PENDING -> DEAD_LETTER on retry exhaustion.",
+    )
+
+    class Meta:
+        verbose_name = "Notification Buffer"
+        verbose_name_plural = "Notification Buffers"
+        db_table = "notification_buffer"
+        indexes = [
+            # Partial index on the flush grouping key; only PENDING rows are indexed.
+            models.Index(
+                fields=["organization", "webhook_url", "auth_sig", "flush_after"],
+                name="idx_notif_buffer_pending",
+                condition=models.Q(status=BufferStatus.PENDING.value),
+            ),
+        ]
+
+    def __str__(self) -> str:
+        return (
+            f"NotificationBuffer {self.id}: status={self.status} "
+            f"flush_after={self.flush_after.isoformat() if self.flush_after else 'n/a'}"
+        )
diff --git a/backend/notification_v2/serializers.py b/backend/notification_v2/serializers.py
index 4cb4f3c4cb..b2602929fe 100644
--- a/backend/notification_v2/serializers.py
+++ b/backend/notification_v2/serializers.py
@@ -1,10 +1,18 @@
 from rest_framework import serializers
 from utils.input_sanitizer import validate_name_field
 
-from .enums import AuthorizationType, NotificationType, PlatformType
+from .enums import AuthorizationType, DeliveryMode, NotificationType, PlatformType
 from .models import Notification
 
 
+class NotificationSettingsSerializer(serializers.Serializer):
+    """Org-scoped notification batching settings (UNS-611 v2)."""
+
+    # Only positivity is enforced (a zero/negative interval cannot batch, and the
+    # UI already rejects it); product-level min/max bounds remain a follow-up.
+    club_interval_seconds = serializers.IntegerField(min_value=1)
+
+
 class NotificationSerializer(serializers.ModelSerializer):
     notification_type = serializers.ChoiceField(choices=NotificationType.choices())
     authorization_type = serializers.ChoiceField(choices=AuthorizationType.choices())
@@ -13,6 +21,11 @@ class NotificationSerializer(serializers.ModelSerializer):
         max_value=4, min_value=0, default=0, required=False
     )
     notify_on_failures = serializers.BooleanField(default=False, required=False)
+    delivery_mode = serializers.ChoiceField(
+        choices=DeliveryMode.choices(),
+        default=DeliveryMode.IMMEDIATE.value,
+        required=False,
+    )
 
     class Meta:
         model = Notification
diff --git a/backend/notification_v2/tasks.py b/backend/notification_v2/tasks.py
new file mode 100644
index 0000000000..a143f9295e
--- /dev/null
+++ b/backend/notification_v2/tasks.py
@@ -0,0 +1,51 @@
+"""Celery tasks owned by notification_v2.
+
+Currently hosts ``mark_buffer_dead_letter`` — a thin task attached as a
+Celery ``link_error`` to the clubbed dispatch chain. When the underlying
+``send_webhook_notification`` task exhausts retries, this task converts
+the buffered rows from PENDING/DISPATCHED to terminal DEAD_LETTER so the
+flush job will not re-pick them.
+"""
+
+from __future__ import annotations
+
+import logging
+from collections.abc import Iterable
+from typing import Any
+
+from backend.celery_service import app as celery_app
+from notification_v2.enums import BufferStatus
+from notification_v2.models import NotificationBuffer
+
+logger = logging.getLogger(__name__)
+
+
+@celery_app.task(name="notification_v2.mark_buffer_dead_letter")
+def mark_buffer_dead_letter(
+    request: Any,
+    exc: Any = None,
+    traceback: Any = None,
+    *,
+    buffer_row_ids: Iterable[str] | None = None,
+) -> int:
+    """Flip the buffered rows of a failed clubbed dispatch to DEAD_LETTER.
+
+    Attached as a Celery ``link_error`` callback, so the positional
+    ``(request, exc, traceback)`` arguments come from Celery, while
+    ``buffer_row_ids`` is bound as a task kwarg at dispatch time. Returns the
+    number of rows updated (0 when no ids were supplied).
+    """
+    if not buffer_row_ids:
+        logger.warning(
+            "mark_buffer_dead_letter invoked without buffer_row_ids — nothing to do"
+        )
+        return 0
+    # Materialize first: the ids may arrive as any iterable.
+    failed_rows = NotificationBuffer.objects.filter(id__in=list(buffer_row_ids))
+    row_count: int = failed_rows.update(status=BufferStatus.DEAD_LETTER.value)
+    logger.warning(
+        "metric=notification_batch_dispatched_total result=dead_letter rows=%d exc=%r",
+        row_count,
+        exc,
+    )
+    return row_count
diff --git a/backend/notification_v2/tests/__init__.py b/backend/notification_v2/tests/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/backend/notification_v2/urls.py b/backend/notification_v2/urls.py
index 2e356b4003..e41bb00f3a 100644
--- a/backend/notification_v2/urls.py
+++ b/backend/notification_v2/urls.py
@@ -1,7 +1,7 @@
 from django.urls import path
 from rest_framework.urlpatterns import format_suffix_patterns
 
-from .views import NotificationViewSet
+from .views import NotificationSettingsView, NotificationViewSet
 
 notification_list = NotificationViewSet.as_view({"get": "list", "post": "create"})
 notification_detail = NotificationViewSet.as_view(
@@ -16,6 +16,13 @@
 urlpatterns = format_suffix_patterns(
     [
         path("", notification_list, name="notification-list"),
+        # Org-scoped notification batching settings (UNS-611 v2). Mounted
+        # before the <uuid:pk> route so "settings" is not interpreted as a UUID.
+        path(
+            "settings/",
+            NotificationSettingsView.as_view(),
+            name="notification-settings",
+        ),
         path("<uuid:pk>/", notification_detail, name="notification-detail"),
         path(
             "pipeline/<uuid:pipeline_uuid>/",
diff --git a/backend/notification_v2/views.py b/backend/notification_v2/views.py
index 1410256ab6..207d4acc6b 100644
--- a/backend/notification_v2/views.py
+++ b/backend/notification_v2/views.py
@@ -1,14 +1,26 @@
+import logging
+
 from api_v2.deployment_helper import DeploymentHelper
 from api_v2.exceptions import APINotFound
+from configuration.enums import ConfigKey
+from configuration.models import Configuration
 from pipeline_v2.exceptions import PipelineNotFound
 from pipeline_v2.models import Pipeline
 from pipeline_v2.pipeline_processor import PipelineProcessor
-from rest_framework import viewsets
+from platform_api.permissions import IsOrganizationAdmin
+from rest_framework import status, viewsets
+from rest_framework.permissions import IsAuthenticated
+from rest_framework.request import Request
+from rest_framework.response import Response
+from rest_framework.views import APIView
+from utils.user_context import UserContext
 
 from notification_v2.constants import NotificationUrlConstant
 
 from .models import Notification
-from .serializers import NotificationSerializer
+from .serializers import NotificationSerializer, NotificationSettingsSerializer
+
+logger = logging.getLogger(__name__)
 
 
 class NotificationViewSet(viewsets.ModelViewSet):
@@ -39,3 +51,47 @@ def get_queryset(self):
             queryset = queryset.filter(api=api)
 
         return queryset
+
+
+class NotificationSettingsView(APIView):
+    """Read and update the org-scoped notification batching (club) interval.
+
+    GET returns the org's effective interval (override or env-derived default).
+    PATCH upserts the org's override row in the generic configuration KV table.
+
+    Read-at-enqueue contract (mfbt §EC-2 / §EC-8): a new interval only applies
+    to notifications enqueued after the change; rows that are already PENDING
+    keep the flush_after they were given.
+    """
+
+    permission_classes = [IsAuthenticated, IsOrganizationAdmin]
+
+    def get(self, request: Request) -> Response:
+        """Return the current organization's club interval, in seconds."""
+        interval = Configuration.get_value_by_organization(
+            ConfigKey.NOTIFICATION_CLUB_INTERVAL, UserContext.get_organization()
+        )
+        return Response({"club_interval_seconds": int(interval)})
+
+    def patch(self, request: Request) -> Response:
+        """Validate and store a new club interval (seconds) for the current org."""
+        serializer = NotificationSettingsSerializer(data=request.data, partial=True)
+        serializer.is_valid(raise_exception=True)
+        organization = UserContext.get_organization()
+        interval = serializer.validated_data.get("club_interval_seconds")
+        if interval is None:
+            return Response(
+                {"detail": "club_interval_seconds is required."},
+                status=status.HTTP_400_BAD_REQUEST,
+            )
+        try:
+            # cast_value enforces type + any future bounds; answer 400, not 500.
+            ConfigKey.NOTIFICATION_CLUB_INTERVAL.cast_value(interval)
+        except ValueError as exc:
+            return Response({"detail": str(exc)}, status=status.HTTP_400_BAD_REQUEST)
+        Configuration.objects.update_or_create(
+            organization=organization,
+            key=ConfigKey.NOTIFICATION_CLUB_INTERVAL.name,
+            defaults={"value": str(interval), "enabled": True},
+        )
+        return Response({"club_interval_seconds": int(interval)})
diff --git a/backend/pipeline_v2/notification.py b/backend/pipeline_v2/notification.py
index ec82145054..5a40a37506 100644
--- a/backend/pipeline_v2/notification.py
+++ b/backend/pipeline_v2/notification.py
@@ -1,6 +1,6 @@
 import logging
 
-from notification_v2.helper import NotificationHelper
+from notification_v2.helper import dispatch_with_delivery_mode
 from notification_v2.models import Notification
 from workflow_manager.workflow_v2.enums import ExecutionStatus
 from workflow_manager.workflow_v2.models.execution import WorkflowExecution
@@ -90,7 +90,8 @@ def send(self) -> None:
             successful_files=successful_files,
             failed_files=failed_files,
         )
-
-        NotificationHelper.send_notification(
-            notifications=self.notifications, payload=payload_dto.to_dict()
+        dispatch_with_delivery_mode(
+            list(self.notifications),
+            payload_dto.to_dict(),
+            error_context=f"pipeline={self.pipeline.id}",
         )
diff --git a/backend/utils/cors_origin.py b/backend/utils/cors_origin.py
new file mode 100644
index 0000000000..aa640c6bc6
--- /dev/null
+++ b/backend/utils/cors_origin.py
@@ -0,0 +1,81 @@
+"""CORS origin helpers used by Django settings and SocketIO log events.
+
+Kept free of Django imports so the matching/normalization logic can be unit
+tested without bootstrapping the full project.
+"""
+
+from __future__ import annotations
+
+import re
+from urllib.parse import urlparse
+
+
+class RegexOrigin:
+    """Allow-list entry that equals every origin string its regex fully matches.
+
+    python-socketio checks CORS with ``origin in allowed_origins`` during the
+    engine.io handshake, so customizing ``__eq__`` lets one list entry stand in
+    for a wildcard subdomain and reject bad origins before ``connect`` runs.
+
+    Instances are deliberately unhashable. Hashable objects must satisfy
+    ``a == b ⇒ hash(a) == hash(b)``, which cannot hold here: one instance equals
+    many different strings. Inside a ``set``/``frozenset`` it would silently
+    break the CORS gate, so ``__hash__`` is disabled and hashing raises
+    ``TypeError`` instead.
+
+    ``fullmatch`` (not ``match``) is used so a ``$`` anchor cannot accept a
+    trailing newline — defense in depth even though WSGI strips them upstream.
+    """
+
+    def __init__(self, pattern: str) -> None:
+        self._regex = re.compile(pattern)
+
+    def __eq__(self, other: object) -> bool:
+        if not isinstance(other, str):
+            return NotImplemented
+        return bool(self._regex.fullmatch(other))
+
+    __hash__ = None  # see class docstring
+
+
+def normalize_web_app_origin(env_value: str) -> tuple[str, str, str]:
+    """Parse and canonicalize ``WEB_APP_ORIGIN_URL`` for CORS/CSRF allow-lists.
+
+    Returns ``(origin, wildcard_origin, subdomain_regex)``:
+
+    - ``origin``: ``scheme://host[:port]`` form. Hostname is lowercased, IPv6
+      literals keep their brackets, and explicit default ports (:80 for http,
+      :443 for https) are dropped, matching what browsers serialize (RFC 6454).
+    - ``wildcard_origin``: same with a literal ``*.`` subdomain prefix, for
+      Django's ``CSRF_TRUSTED_ORIGINS`` (which accepts a leading ``*.``).
+    - ``subdomain_regex``: anchored pattern matching any subdomain of the
+      configured netloc, for ``CORS_ALLOWED_ORIGIN_REGEXES`` and SocketIO
+      via ``RegexOrigin``.
+
+    Raises:
+        ValueError: if the env value is not an http(s) URL with a host.
+    """
+    # Both urlparse (bad IPv6 brackets) and `parsed.port` (`:abc`, `:99999`) raise
+    # ValueError; re-raise with the same actionable message as other failures.
+    try:
+        parsed = urlparse(env_value)
+        port = parsed.port
+    except ValueError as exc:
+        raise ValueError(
+            f"WEB_APP_ORIGIN_URL must be of the form http(s)://host[:port], "
+            f"got: {env_value!r}"
+        ) from exc
+    if parsed.scheme not in {"http", "https"} or not parsed.hostname:
+        raise ValueError(
+            f"WEB_APP_ORIGIN_URL must be of the form http(s)://host[:port], "
+            f"got: {env_value!r}"
+        )
+    default_port = {"http": 80, "https": 443}[parsed.scheme]
+    # `hostname` drops the brackets of an IPv6 literal; an origin needs them back.
+    netloc = f"[{parsed.hostname}]" if ":" in parsed.hostname else parsed.hostname
+    if port and port != default_port:
+        netloc = f"{netloc}:{port}"
+    origin = f"{parsed.scheme}://{netloc}"
+    wildcard = f"{parsed.scheme}://*.{netloc}"
+    subdomain_regex = rf"^{re.escape(parsed.scheme)}://[^/]+\.{re.escape(netloc)}$"
+    return origin, wildcard, subdomain_regex
diff --git a/backend/utils/log_events.py b/backend/utils/log_events.py
index f2ff725820..dcb66ed81c 100644
--- a/backend/utils/log_events.py
+++ b/backend/utils/log_events.py
@@ -11,9 +11,15 @@
 from unstract.core.data_models import LogDataDTO
 from unstract.core.log_utils import get_validated_log_data, store_execution_log
 from utils.constants import ExecutionLogConstants
+from utils.cors_origin import RegexOrigin
 
 logger = logging.getLogger(__name__)
 
+
+_cors_allowed_origins: list[Any] = list(settings.CORS_ALLOWED_ORIGINS)
+_origin_regexes = getattr(settings, "CORS_ALLOWED_ORIGIN_REGEXES", [])
+_cors_allowed_origins.extend(RegexOrigin(_pattern) for _pattern in _origin_regexes)
+
 _kombu_kwargs: dict[str, Any] = {"url": settings.SOCKET_IO_MANAGER_URL}
 if getattr(settings, "SOCKET_IO_TRANSPORT_OPTIONS", None):
     _kombu_kwargs["connection_options"] = {
@@ -23,7 +29,7 @@
 sio = socketio.Server(
     # Allowed values: {threading, eventlet, gevent, gevent_uwsgi}
     async_mode="threading",
-    cors_allowed_origins=settings.CORS_ALLOWED_ORIGINS,
+    cors_allowed_origins=_cors_allowed_origins,
     logger=False,
     engineio_logger=False,
     always_connect=True,
diff --git a/backend/utils/tests/test_cors_origin.py b/backend/utils/tests/test_cors_origin.py
new file mode 100644
index 0000000000..65628b4405
--- /dev/null
+++ b/backend/utils/tests/test_cors_origin.py
@@ -0,0 +1,197 @@
+"""Regression tests for utils.cors_origin — the CORS origin matcher and
+URL normalizer that gate browser ``Origin`` headers on every Django request
+and SocketIO handshake.
+
+UN-3439: production socket connections silently failed for wildcard subdomains
+because python-socketio does exact-string comparison. These tests pin the
+contract so the next refactor can't reopen the hole.
+"""
+
+from __future__ import annotations
+
+import time
+
+import pytest
+
+from utils.cors_origin import RegexOrigin, normalize_web_app_origin
+
+
+class TestRegexOrigin:
+    SUBDOMAIN_PATTERN = r"^https://[^/]+\.example\.com$"
+
+    def test_subdomain_matches(self):
+        matcher = RegexOrigin(self.SUBDOMAIN_PATTERN)
+        assert ("https://app.example.com" == matcher) is True
+        assert ("https://api.example.com" == matcher) is True
+
+    def test_deep_subdomain_matches(self):
+        """Multi-level subdomains are accepted — DNS-owned by the same party."""
+        matcher = RegexOrigin(self.SUBDOMAIN_PATTERN)
+        assert ("https://dev.env.example.com" == matcher) is True
+
+    def test_apex_does_not_match(self):
+        """The apex is covered by the exact-match CORS_ALLOWED_ORIGINS entry,
+        so the wildcard regex must not match it."""
+        matcher = RegexOrigin(self.SUBDOMAIN_PATTERN)
+        assert ("https://example.com" == matcher) is False
+
+    def test_lookalike_rejected(self):
+        matcher = RegexOrigin(self.SUBDOMAIN_PATTERN)
+        assert ("https://attacker-example.com" == matcher) is False
+        assert ("https://example.com.attacker.com" == matcher) is False
+        assert ("https://x.example.com.attacker.com" == matcher) is False
+
+    def test_wrong_scheme_rejected(self):
+        matcher = RegexOrigin(self.SUBDOMAIN_PATTERN)
+        # NOSONAR — the `http://` URL is intentional test data: we are
+        # asserting it is *rejected* by an https-scoped pattern.
+        assert ("http://app.example.com" == matcher) is False  # NOSONAR
+
+    def test_trailing_newline_rejected(self):
+        """``fullmatch`` (not ``match``) is required so ``$`` doesn't permit
+        a trailing ``\\n`` per Python regex semantics."""
+        matcher = RegexOrigin(self.SUBDOMAIN_PATTERN)
+        assert ("https://app.example.com\n" == matcher) is False
+
+    def test_in_operator_routes_to_eq(self):
+        """``origin in allowed_origins`` is exactly how python-socketio gates
+        the engine.io handshake — verify Python's reflected ``__eq__`` kicks in."""
+        allowed = [RegexOrigin(self.SUBDOMAIN_PATTERN)]
+        assert "https://app.example.com" in allowed
+        assert "https://evil.com" not in allowed
+
+    def test_non_string_returns_not_implemented(self):
+        """``__eq__`` must return the ``NotImplemented`` sentinel (not
+        ``False``) for non-strings so Python can try the reflected comparison
+        and then fall back to identity. Called as a dunder directly because
+        the ``==`` operator never surfaces ``NotImplemented`` to the caller."""
+        matcher = RegexOrigin(r"^x$")
+        assert matcher.__eq__(None) is NotImplemented
+        assert matcher.__eq__(42) is NotImplemented
+        assert matcher.__eq__([]) is NotImplemented
+
+    def test_unhashable(self):
+        """``__hash__ = None`` prevents the equality/hash contract from being
+        violated if anyone wraps the allow-list in a ``set``/``frozenset``."""
+        matcher = RegexOrigin(r"^x$")
+        with pytest.raises(TypeError):
+            hash(matcher)
+        with pytest.raises(TypeError):
+            # Building the set calls __hash__; wrapping it in `len(...)` keeps ruff
+            # and Sonar from treating the bare set display as a no-op statement.
+            len({matcher})
+
+    def test_no_redos(self):
+        """Hostile input must not trigger catastrophic backtracking — ``[^/]+``
+        has no nested quantifiers. The 500ms budget is generous so noisy CI
+        runners don't flake; ReDoS would overshoot it by orders of magnitude."""
+        matcher = RegexOrigin(self.SUBDOMAIN_PATTERN)
+        hostile = "https://" + "a" * 10000 + ".evil.com"
+        started = time.perf_counter()
+        _ = hostile in [matcher]
+        assert time.perf_counter() - started < 0.5
+
+
+class TestNormalizeWebAppOrigin:
+    def test_basic_https(self):
+        origin, wildcard = normalize_web_app_origin("https://example.com")[:2]
+        assert origin == "https://example.com"
+        assert wildcard == "https://*.example.com"
+
+    def test_strips_trailing_slash(self):
+        origin = normalize_web_app_origin("https://example.com/")[0]
+        assert origin == "https://example.com"
+
+    def test_strips_path_and_query(self):
+        origin = normalize_web_app_origin("https://example.com/path?q=1")[0]
+        assert origin == "https://example.com"
+
+    def test_lowercases_hostname(self):
+        """Browsers serialize ``Origin`` with a lowercase host (RFC 6454) and
+        django-cors-headers compares strings case-sensitively, so the env
+        value has to be lowercased before it can match."""
+        origin = normalize_web_app_origin("https://APP.EXAMPLE.COM")[0]
+        assert origin == "https://app.example.com"
+
+    def test_drops_default_https_port(self):
+        """Browsers omit the explicit default port from ``Origin`` per
+        RFC 6454 — keeping ``:443`` would silently break exact match."""
+        origin = normalize_web_app_origin("https://example.com:443")[0]
+        assert origin == "https://example.com"
+
+    def test_drops_default_http_port(self):
+        # NOSONAR — `http://` URLs are intentional test data for the port
+        # normalization logic, not a runtime use of the insecure protocol.
+        origin = normalize_web_app_origin("http://example.com:80")[0]  # NOSONAR
+        assert origin == "http://example.com"  # NOSONAR
+
+    def test_keeps_non_default_port(self):
+        origin, wildcard = normalize_web_app_origin("https://example.com:8443")[:2]
+        assert origin == "https://example.com:8443"
+        assert wildcard == "https://*.example.com:8443"
+
+    def test_localhost_default(self):
+        origin = normalize_web_app_origin("http://localhost:3000")[0]  # NOSONAR
+        assert origin == "http://localhost:3000"  # NOSONAR
+
+    @pytest.mark.parametrize(
+        "bad",
+        [
+            "",
+            "not-a-url",
+            "example.com",  # missing scheme
+            "//example.com",  # protocol-relative
+            "https://",  # missing host
+            "ftp://example.com",  # non-browser scheme  # NOSONAR — test input asserting ftp is rejected
+            "ws://example.com",  # not a top-level browser scheme
+            "https://example.com:abc",  # malformed port — urlparse raises on .port access
+            "https://example.com:99999",  # out-of-range port
+        ],
+    )
+    def test_rejects_misconfigured(self, bad):
+        """Fail fast at startup so misconfigured envs can't silently produce
+        CORS rules that match nothing real."""
+        with pytest.raises(ValueError, match="WEB_APP_ORIGIN_URL"):
+            normalize_web_app_origin(bad)
+
+
+class TestSubdomainRegexEndToEnd:
+    """End-to-end: the regex produced by ``normalize_web_app_origin`` is the
+    one that gates production, so it is exercised through ``RegexOrigin``
+    membership checks (same path as SocketIO uses)."""
+
+    def test_apex_env_accepts_subdomains(self):
+        regex = normalize_web_app_origin("https://us-central.unstract.com")[-1]
+        allowed = [RegexOrigin(regex)]
+        # The exact failing origins from UN-3439:
+        assert "https://dev.env.us-central.unstract.com" in allowed
+        assert "https://test.env.us-central.unstract.com" in allowed
+
+    def test_apex_rejected_by_regex(self):
+        """Apex itself is *not* matched by the wildcard regex — that's the
+        exact-match CORS_ALLOWED_ORIGINS entry's job."""
+        regex = normalize_web_app_origin("https://example.com")[-1]
+        allowed = [RegexOrigin(regex)]
+        assert "https://example.com" not in allowed
+
+    @pytest.mark.parametrize(
+        "spoof",
+        [
+            "https://attacker-example.com",
+            "https://x.example.com.attacker.com",
+            "https://example.com.attacker.com",
+            "http://app.example.com",  # wrong scheme  # NOSONAR — test input asserting http is rejected
+            "https://app.example.com\n",  # trailing newline
+        ],
+    )
+    def test_spoofed_origins_rejected(self, spoof):
+        regex = normalize_web_app_origin("https://example.com")[-1]
+        allowed = [RegexOrigin(regex)]
+        assert spoof not in allowed, f"should reject {spoof!r}"
+
+    def test_uppercase_env_still_accepts_lowercase_origin(self):
+        """Browser sends lowercase even if the env was set with uppercase;
+        normalization must canonicalize before regex compilation."""
+        regex = normalize_web_app_origin("https://APP.EXAMPLE.COM")[-1]
+        allowed = [RegexOrigin(regex)]
+        assert "https://sub.app.example.com" in allowed
diff --git a/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx b/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
index 65460376d4..17066ed06b 100644
--- a/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
+++ b/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
@@ -2,6 +2,12 @@ import { Button, Checkbox, Form, Input, Select, Space } from "antd";
 import PropTypes from "prop-types";
 import { useEffect, useState } from "react";
 import { getBackendErrorDetail } from "../../../helpers/GetStaticData";
+import { useAxiosPrivate } from "../../../hooks/useAxiosPrivate";
+import { useSessionStore } from "../../../store/session-store";
+
+// Used only when the org's batch interval can't be fetched (network or auth
+// failure). Backend's env-derived default is also 30 min, so this matches.
+const FALLBACK_BATCH_INTERVAL_MINUTES = 30;
 
 const DEFAULT_FORM_DETAILS = {
   name: "",
@@ -13,6 +19,7 @@ const DEFAULT_FORM_DETAILS = {
   is_active: false,
   max_retries: 0,
   notify_on_failures: false,
+  delivery_mode: "IMMEDIATE",
   pipeline: "",
   api: "",
   url: "",
@@ -68,6 +75,37 @@ function CreateNotification({
   const [formDetails, setFormDetails] = useState(DEFAULT_FORM_DETAILS);
   const [backendErrors, setBackendErrors] = useState(null);
   const [resetForm, setResetForm] = useState(false);
+  const [batchIntervalMinutes, setBatchIntervalMinutes] = useState(
+    FALLBACK_BATCH_INTERVAL_MINUTES,
+  );
+  const axiosPrivate = useAxiosPrivate();
+  const { sessionDetails } = useSessionStore();
+
+  useEffect(() => {
+    // Read live org-scoped interval (UNS-611 v2). Fall back silently to the
+    // hardcoded 30-min default — the dropdown still labels something useful.
+    if (!sessionDetails?.orgId) {
+      return;
+    }
+    axiosPrivate({
+      method: "GET",
+      url: `/api/v1/unstract/${sessionDetails.orgId}/notifications/settings/`,
+    })
+      .then((res) => {
+        const seconds = res?.data?.club_interval_seconds;
+        if (typeof seconds === "number" && seconds > 0) {
+          setBatchIntervalMinutes(Math.max(1, Math.round(seconds / 60)));
+        }
+      })
+      .catch(() => {
+        // Non-fatal — keep fallback.
+      });
+  }, [sessionDetails?.orgId]);
+
+  const deliveryModes = [
+    { value: "IMMEDIATE", label: "Immediate" },
+    { value: "BATCHED", label: "Batched" },
+  ];
 
   useEffect(() => {
     if (editDetails) {
@@ -84,7 +122,18 @@ function CreateNotification({
   }, [formDetails]);
 
   const handleInputChange = (changedValues, allValues) => {
-    setFormDetails({ ...formDetails, ...allValues });
+    let nextValues = { ...formDetails, ...allValues };
+    // Failure alerts must not be delayed by the batch window — auto-select
+    // IMMEDIATE the moment the box is checked. The user can still override
+    // to BATCHED afterward and that choice will stick.
+    if (
+      Object.hasOwn(changedValues, "notify_on_failures") &&
+      changedValues.notify_on_failures === true
+    ) {
+      nextValues = { ...nextValues, delivery_mode: "IMMEDIATE" };
+      form.setFieldsValue({ delivery_mode: "IMMEDIATE" });
+    }
+    setFormDetails(nextValues);
     const changedFieldName = Object.keys(changedValues)[0];
     form.setFields([
       {
@@ -228,6 +277,18 @@ function CreateNotification({
       >
         <Checkbox>Notify on failures only</Checkbox>
       </Form.Item>
+      <Form.Item
+        label="Delivery Mode"
+        name="delivery_mode"
+        tooltip="Immediate fires on every completion. Batched buffers events and dispatches a single clubbed message per webhook every batch interval."
+        extra={
+          formDetails.delivery_mode === "BATCHED"
+            ? `Notifications will be batched and sent every ${batchIntervalMinutes} minutes. Org admins can change this in Platform Settings.`
+            : null
+        }
+      >
+        <Select options={deliveryModes} />
+      </Form.Item>
       <Form.Item className="display-flex-right">
         <Space>
           <Button onClick={() => setIsForm(false)}>Cancel</Button>
diff --git a/frontend/src/components/settings/platform/PlatformSettings.jsx b/frontend/src/components/settings/platform/PlatformSettings.jsx
index f255da6a73..0b39cebecf 100644
--- a/frontend/src/components/settings/platform/PlatformSettings.jsx
+++ b/frontend/src/components/settings/platform/PlatformSettings.jsx
@@ -3,7 +3,17 @@ import {
   CopyOutlined,
   DeleteOutlined,
 } from "@ant-design/icons";
-import { Button, Col, Divider, Input, Radio, Row, Typography } from "antd";
+import {
+  Button,
+  Col,
+  Divider,
+  Input,
+  InputNumber,
+  Radio,
+  Row,
+  Space,
+  Typography,
+} from "antd";
 import { useEffect, useState } from "react";
 import { useNavigate } from "react-router-dom";
 
@@ -38,6 +48,9 @@ function PlatformSettings() {
   const [keys, setKeys] = useState(defaultKeys);
   const [isLoadingIndex, setLoadingIndex] = useState(null);
   const [isDeletingIndex, setDeletingIndex] = useState(null);
+  // UI shows minutes; wire format (and ConfigSpec.value) is seconds.
+  const [batchIntervalMinutes, setBatchIntervalMinutes] = useState(null);
+  const [isSavingInterval, setIsSavingInterval] = useState(false);
   const { sessionDetails } = useSessionStore();
   const { setAlertDetails } = useAlertStore();
   const axiosPrivate = useAxiosPrivate();
@@ -45,6 +58,64 @@ function PlatformSettings() {
   const handleException = useExceptionHandler();
   const { setPostHogCustomEvent } = usePostHogEvents();
 
+  useEffect(() => {
+    // Load org-scoped batch interval (UNS-611 v2). Falls back silently to
+    // null on failure so the rest of the page still renders.
+    axiosPrivate({
+      method: "GET",
+      url: `/api/v1/unstract/${sessionDetails?.orgId}/notifications/settings/`,
+    })
+      .then((res) => {
+        const seconds = res?.data?.club_interval_seconds;
+        if (typeof seconds === "number" && seconds > 0) {
+          // Clamp to 1: anything under 30s would otherwise round to 0,
+          // which is below the input's minimum and is rejected on save.
+          setBatchIntervalMinutes(Math.max(1, Math.round(seconds / 60)));
+        }
+      })
+      .catch(() => {
+        // Non-fatal — admin just won't see a pre-filled value.
+      });
+  }, []);
+
+  // Validates the minutes value, converts it to seconds and PATCHes the
+  // org's notification settings, reporting the outcome via the alert store.
+  const handleSaveInterval = () => {
+    if (!batchIntervalMinutes || batchIntervalMinutes < 1) {
+      setAlertDetails({
+        type: "error",
+        content: "Batch interval must be a positive number of minutes.",
+      });
+      return;
+    }
+    setIsSavingInterval(true);
+    axiosPrivate({
+      method: "PATCH",
+      url: `/api/v1/unstract/${sessionDetails?.orgId}/notifications/settings/`,
+      headers: {
+        "X-CSRFToken": sessionDetails?.csrfToken,
+        "Content-Type": "application/json",
+      },
+      // Round after converting: fractional minutes pick up float noise
+      // (1.1 * 60 === 66.00000000000001) and the field is named in seconds.
+      data: { club_interval_seconds: Math.round(batchIntervalMinutes * 60) },
+    })
+      .then(() => {
+        setAlertDetails({
+          type: "success",
+          content: "Notification batch interval updated.",
+        });
+      })
+      .catch((err) => {
+        setAlertDetails(
+          handleException(err, "Failed to update batch interval"),
+        );
+      })
+      .finally(() => {
+        setIsSavingInterval(false);
+      });
+  };
+
   useEffect(() => {
     const requestOptions = {
       method: "GET",
@@ -331,6 +396,34 @@ function PlatformSettings() {
                   );
                 })}
               </div>
+              <Divider />
+              <div className="plt-set-batch-interval">
+                <Typography.Title level={5}>
+                  Notification batching
+                </Typography.Title>
+                <Typography.Text type="secondary">
+                  Batched notifications enqueued after a change pick up the new
+                  value; in-flight rows keep their original cadence.
+                </Typography.Text>
+                <div style={{ marginTop: 12 }}>
+                  <Space>
+                    <Typography.Text>Batch interval (minutes)</Typography.Text>
+                    <InputNumber
+                      min={1}
+                      value={batchIntervalMinutes}
+                      onChange={(v) => setBatchIntervalMinutes(v)}
+                      placeholder="e.g. 30"
+                    />
+                    <Button
+                      type="primary"
+                      onClick={handleSaveInterval}
+                      loading={isSavingInterval}
+                    >
+                      Save
+                    </Button>
+                  </Space>
+                </div>
+              </div>
             </div>
           </IslandLayout>
         </div>
diff --git a/unstract/sdk1/src/unstract/sdk1/adapters/base1.py b/unstract/sdk1/src/unstract/sdk1/adapters/base1.py
index cb1c738cf4..d1aa475ec4 100644
--- a/unstract/sdk1/src/unstract/sdk1/adapters/base1.py
+++ b/unstract/sdk1/src/unstract/sdk1/adapters/base1.py
@@ -474,6 +474,86 @@ def validate_model(adapter_metadata: dict[str, "Any"]) -> str:
             return f"vertex_ai/{model}"
 
 
+# AWS Bedrock auth helpers: shared by LLM and Embedding param classes.
+# `auth_type` is a UI-only selector (Access Keys vs IAM Role / Instance
+# Profile) that drives form rendering. The backend translates the user's
+# choice into actual credential handling here so that both validate()
+# methods stay symmetric and a single bug fix applies to both paths.
+_BEDROCK_AWS_KEY_FIELDS: tuple[str, ...] = (
+    "aws_access_key_id",
+    "aws_secret_access_key",
+)
+_BEDROCK_VALID_AUTH_TYPES: frozenset[str | None] = frozenset(
+    {None, "access_keys", "iam_role"}
+)
+
+
+def _resolve_bedrock_aws_credentials(
+    adapter_metadata: dict[str, "Any"],
+    validated: dict[str, "Any"],
+) -> dict[str, "Any"]:
+    """Apply auth_type semantics to the validated LiteLLM kwargs.
+
+    Three cases:
+    - ``auth_type == "iam_role"``: drop access keys unconditionally so a
+      previously-saved adapter switched into IAM Role mode does not leak
+      stale long-lived credentials. boto3's default credential chain
+      (IRSA / instance profile / env vars / AWS Profile) takes over.
+    - ``auth_type == "access_keys"`` (explicit): require non-blank values.
+      A blank submission must surface as a clear error rather than
+      silently fall through to the default chain (which would hide the
+      mistake and authenticate with whatever ambient creds the host has).
+    - ``auth_type is None`` (legacy adapters created before this field
+      existed): lenient strip of empty/missing keys. Preserves backwards
+      compatibility for stored configurations.
+
+    Args:
+        adapter_metadata: Raw adapter configuration; only ``auth_type`` is
+            read from it.
+        validated: Validated LiteLLM kwargs. Mutated in place.
+
+    Returns:
+        The same ``validated`` dict, with the credential keys removed
+        where the selected mode calls for it.
+
+    Raises:
+        ValueError: on unknown or non-string ``auth_type`` (typo / non-UI
+            client) or on blank credentials when
+            ``auth_type == "access_keys"``.
+    """
+    auth_type = adapter_metadata.get("auth_type")
+    # Type-check before the set lookup: an unhashable value (e.g. a list
+    # sent by a non-UI client) would otherwise escape as TypeError instead
+    # of the documented ValueError.
+    if auth_type is not None and (
+        not isinstance(auth_type, str) or auth_type not in _BEDROCK_VALID_AUTH_TYPES
+    ):
+        raise ValueError(
+            f"Unknown auth_type {auth_type!r}; expected one of "
+            f"{sorted(t for t in _BEDROCK_VALID_AUTH_TYPES if t)!r} or absent."
+        )
+
+    if auth_type == "iam_role":
+        for key in _BEDROCK_AWS_KEY_FIELDS:
+            validated.pop(key, None)
+        return validated
+
+    if auth_type == "access_keys":
+        for key in _BEDROCK_AWS_KEY_FIELDS:
+            value = validated.get(key)
+            if not isinstance(value, str) or not value.strip():
+                raise ValueError(f"{key} is required when auth_type is 'access_keys'.")
+        return validated
+
+    # Legacy adapters with no auth_type: strip blanks silently to
+    # preserve the pre-PR behaviour where empty key fields fell through
+    # to boto3's default chain.
+    for key in _BEDROCK_AWS_KEY_FIELDS:
+        if not validated.get(key):
+            validated.pop(key, None)
+    return validated
+
+
 class AWSBedrockLLMParameters(BaseChatCompletionParameters):
     """See https://docs.litellm.ai/docs/providers/bedrock."""
 
@@ -525,11 +590,12 @@ def validate(adapter_metadata: dict[str, "Any"]) -> dict[str, "Any"]:
                 result_metadata["thinking"] = thinking_config
                 result_metadata["temperature"] = 1
 
-        # Create validation metadata excluding control fields
+        # Create validation metadata excluding control fields. `auth_type` is
+        # a UI-only selector that drives form rendering; LiteLLM never sees it.
         validation_metadata = {
             k: v
             for k, v in result_metadata.items()
-            if k not in ("enable_thinking", "budget_tokens", "thinking")
+            if k not in ("enable_thinking", "budget_tokens", "thinking", "auth_type")
         }
 
         validated = AWSBedrockLLMParameters(**validation_metadata).model_dump()
@@ -538,7 +604,11 @@ def validate(adapter_metadata: dict[str, "Any"]) -> dict[str, "Any"]:
         if enable_thinking and "thinking" in result_metadata:
             validated["thinking"] = result_metadata["thinking"]
 
-        return validated
+        # Apply Bedrock auth semantics: IAM Role mode drops keys, Access
+        # Keys mode requires non-blank values, legacy (no auth_type) is
+        # lenient. Reads auth_type from result_metadata since validation_
+        # metadata strips it before Pydantic.
+        return _resolve_bedrock_aws_credentials(result_metadata, validated)
 
     @staticmethod
     def validate_model(adapter_metadata: dict[str, "Any"]) -> str:
@@ -959,8 +1029,10 @@ def validate_model(adapter_metadata: dict[str, "Any"]) -> str:
 class AWSBedrockEmbeddingParameters(BaseEmbeddingParameters):
     """See https://docs.litellm.ai/docs/providers/bedrock."""
 
-    aws_access_key_id: str | None
-    aws_secret_access_key: str | None
+    # Region is still mandatory — credentials are the only fields that
+    # may be absent (IAM Role / Instance Profile mode).
+    aws_access_key_id: str | None = None
+    aws_secret_access_key: str | None = None
     aws_region_name: str | None
 
     @staticmethod
@@ -973,7 +1045,16 @@ def validate(adapter_metadata: dict[str, "Any"]) -> dict[str, "Any"]:
         ):
             adapter_metadata["aws_region_name"] = adapter_metadata["region_name"]
 
-        return AWSBedrockEmbeddingParameters(**adapter_metadata).model_dump()
+        # `auth_type` is a UI-only selector; strip before LiteLLM kwargs.
+        validation_metadata = {
+            k: v for k, v in adapter_metadata.items() if k != "auth_type"
+        }
+
+        validated = AWSBedrockEmbeddingParameters(**validation_metadata).model_dump()
+
+        # Apply Bedrock auth semantics: IAM Role drops keys, Access Keys
+        # requires non-blank values, legacy (no auth_type) is lenient.
+        return _resolve_bedrock_aws_credentials(adapter_metadata, validated)
 
     @staticmethod
     def validate_model(adapter_metadata: dict[str, "Any"]) -> str:
diff --git a/unstract/sdk1/src/unstract/sdk1/adapters/embedding1/static/bedrock.json b/unstract/sdk1/src/unstract/sdk1/adapters/embedding1/static/bedrock.json
index 81829a0f49..200d8f5bfb 100644
--- a/unstract/sdk1/src/unstract/sdk1/adapters/embedding1/static/bedrock.json
+++ b/unstract/sdk1/src/unstract/sdk1/adapters/embedding1/static/bedrock.json
@@ -2,9 +2,7 @@
     "title": "Bedrock Embeddings",
     "type": "object",
     "required": [
-      "aws_secret_access_key",
       "region_name",
-      "aws_access_key_id",
       "model",
       "adapter_name"
     ],
@@ -21,18 +19,6 @@
         "default": "amazon.titan-embed-text-v2:0",
         "description": "Model name. Refer to [Bedrock's documentation](https://docs.aws.amazon.com/bedrock/latest/userguide/models-supported.html) for the list of available models."
       },
-      "aws_access_key_id": {
-        "type": "string",
-        "title": "AWS Access Key ID",
-        "description": "Provide your AWS Access Key ID",
-        "format": "password"
-      },
-      "aws_secret_access_key": {
-        "type": "string",
-        "title": "AWS Secret Access Key",
-        "description": "Provide your AWS Secret Access Key",
-        "format": "password"
-      },
       "region_name": {
         "type": "string",
         "title": "AWS Region name",
@@ -53,6 +39,60 @@
         "title": "Timeout",
         "default": 900,
         "description": "Timeout in seconds"
+      },
+      "auth_type": {
+        "type": "string",
+        "title": "Authentication Type",
+        "enum": [
+          "access_keys",
+          "iam_role"
+        ],
+        "enumNames": [
+          "Access Keys",
+          "IAM Role / Instance Profile (on-prem AWS only)"
+        ],
+        "default": "access_keys",
+        "description": "Choose **Access Keys** for any deployment (provide your AWS Access Key ID and Secret). Choose **IAM Role / Instance Profile** only when Unstract is hosted on AWS infrastructure that already has ambient credentials — for example EKS pods with IRSA, ECS tasks with a task role, or EC2 instances with an instance profile. The on-prem option requires no further input; boto3 picks up the host's identity automatically."
+      }
+    },
+    "dependencies": {
+      "auth_type": {
+        "oneOf": [
+          {
+            "properties": {
+              "auth_type": {
+                "enum": [
+                  "access_keys"
+                ]
+              },
+              "aws_access_key_id": {
+                "type": "string",
+                "title": "AWS Access Key ID",
+                "description": "Provide your AWS Access Key ID.",
+                "format": "password"
+              },
+              "aws_secret_access_key": {
+                "type": "string",
+                "title": "AWS Secret Access Key",
+                "description": "Provide your AWS Secret Access Key.",
+                "format": "password"
+              }
+            },
+            "required": [
+              "aws_access_key_id",
+              "aws_secret_access_key"
+            ]
+          },
+          {
+            "properties": {
+              "auth_type": {
+                "enum": [
+                  "iam_role"
+                ]
+              }
+            }
+          }
+        ]
       }
     }
   }
diff --git a/unstract/sdk1/src/unstract/sdk1/adapters/llm1/static/bedrock.json b/unstract/sdk1/src/unstract/sdk1/adapters/llm1/static/bedrock.json
index 9adb8b8ceb..03f23d1376 100644
--- a/unstract/sdk1/src/unstract/sdk1/adapters/llm1/static/bedrock.json
+++ b/unstract/sdk1/src/unstract/sdk1/adapters/llm1/static/bedrock.json
@@ -19,18 +19,6 @@
       "default": "amazon.titan-text-express-v1",
       "description": "Model name. Refer to [Bedrock's documentation](https://docs.aws.amazon.com/bedrock/latest/userguide/models-supported.html) for the list of available models."
     },
-    "aws_access_key_id": {
-      "type": "string",
-      "title": "AWS Access Key ID",
-      "description": "Provide your AWS Access Key ID. Leave empty if using AWS Profile or IAM role.",
-      "format": "password"
-    },
-    "aws_secret_access_key": {
-      "type": "string",
-      "title": "AWS Secret Access Key",
-      "description": "Provide your AWS Secret Access Key. Leave empty if using AWS Profile or IAM role.",
-      "format": "password"
-    },
     "region_name": {
       "type": "string",
       "title": "AWS Region Name",
@@ -75,6 +63,60 @@
       "title": "Enable Extended Thinking",
       "default": false,
       "description": "Enhance reasoning for complex tasks with step-by-step transparency. Available only for Claude 3.7 Sonnet."
+    },
+    "auth_type": {
+      "type": "string",
+      "title": "Authentication Type",
+      "enum": [
+        "access_keys",
+        "iam_role"
+      ],
+      "enumNames": [
+        "Access Keys",
+        "IAM Role / Instance Profile (on-prem AWS only)"
+      ],
+      "default": "access_keys",
+      "description": "Choose **Access Keys** for any deployment (provide your AWS Access Key ID and Secret). Choose **IAM Role / Instance Profile** only when Unstract is hosted on AWS infrastructure that already has ambient credentials — for example EKS pods with IRSA, ECS tasks with a task role, or EC2 instances with an instance profile. The on-prem option requires no further input; boto3 picks up the host's identity automatically."
+    }
+  },
+  "dependencies": {
+    "auth_type": {
+      "oneOf": [
+        {
+          "properties": {
+            "auth_type": {
+              "enum": [
+                "access_keys"
+              ]
+            },
+            "aws_access_key_id": {
+              "type": "string",
+              "title": "AWS Access Key ID",
+              "description": "Provide your AWS Access Key ID.",
+              "format": "password"
+            },
+            "aws_secret_access_key": {
+              "type": "string",
+              "title": "AWS Secret Access Key",
+              "description": "Provide your AWS Secret Access Key.",
+              "format": "password"
+            }
+          },
+          "required": [
+            "aws_access_key_id",
+            "aws_secret_access_key"
+          ]
+        },
+        {
+          "properties": {
+            "auth_type": {
+              "enum": [
+                "iam_role"
+              ]
+            }
+          }
+        }
+      ]
     }
   },
   "allOf": [
diff --git a/unstract/sdk1/tests/test_bedrock_adapter.py b/unstract/sdk1/tests/test_bedrock_adapter.py
new file mode 100644
index 0000000000..4d4b7c1cd7
--- /dev/null
+++ b/unstract/sdk1/tests/test_bedrock_adapter.py
@@ -0,0 +1,254 @@
+"""Unit tests for the AWS Bedrock LLM and embedding adapters.
+
+Covers the auth_type selector behaviour added alongside the IAM Role /
+Instance Profile mode, plus backwards compatibility for legacy adapter
+configurations stored before auth_type existed.
+"""
+
+import pytest
+from unstract.sdk1.adapters.base1 import (
+    AWSBedrockEmbeddingParameters,
+    AWSBedrockLLMParameters,
+)
+
+# ── LLM: validate auth_type semantics ────────────────────────────────────────
+
+
+def test_llm_legacy_no_auth_type_keeps_keys() -> None:
+    """Legacy adapters without auth_type must keep working unchanged."""
+    out = AWSBedrockLLMParameters.validate(
+        {
+            "model": "anthropic.claude-3-haiku-20240307-v1:0",
+            "region_name": "us-east-1",
+            "aws_access_key_id": "AKIAFAKE",
+            "aws_secret_access_key": "secret",
+        }
+    )
+    assert out["aws_access_key_id"] == "AKIAFAKE"
+    assert out["aws_secret_access_key"] == "secret"
+    assert out["aws_region_name"] == "us-east-1"
+    assert "auth_type" not in out
+
+
+def test_llm_access_keys_mode_keeps_keys_and_strips_auth_type() -> None:
+    """Explicit access_keys mode returns both keys and omits auth_type."""
+    out = AWSBedrockLLMParameters.validate(
+        {
+            "auth_type": "access_keys",
+            "model": "anthropic.claude-3-haiku-20240307-v1:0",
+            "region_name": "us-east-1",
+            "aws_access_key_id": "AKIAFAKE",
+            "aws_secret_access_key": "secret",
+        }
+    )
+    assert out["aws_access_key_id"] == "AKIAFAKE"
+    assert out["aws_secret_access_key"] == "secret"
+    assert "auth_type" not in out
+
+
+def test_llm_iam_role_mode_drops_keys_even_when_present() -> None:
+    """IAM Role mode unconditionally drops access keys.
+
+    A saved adapter switched into IAM mode must not silently leak the
+    previously stored long-lived credentials.
+    """
+    out = AWSBedrockLLMParameters.validate(
+        {
+            "auth_type": "iam_role",
+            "model": "us.anthropic.claude-haiku-4-5-20251001-v1:0",
+            "region_name": "us-east-1",
+            "aws_access_key_id": "STALE_KEY",
+            "aws_secret_access_key": "STALE_SECRET",
+        }
+    )
+    assert "aws_access_key_id" not in out
+    assert "aws_secret_access_key" not in out
+    assert out["aws_region_name"] == "us-east-1"
+    assert "auth_type" not in out
+
+
+def test_llm_iam_role_mode_with_no_keys() -> None:
+    """IAM Role mode with no key fields supplied yields no key entries."""
+    out = AWSBedrockLLMParameters.validate(
+        {
+            "auth_type": "iam_role",
+            "model": "us.anthropic.claude-haiku-4-5-20251001-v1:0",
+            "region_name": "us-east-1",
+        }
+    )
+    assert "aws_access_key_id" not in out
+    assert "aws_secret_access_key" not in out
+
+
+def test_llm_access_keys_mode_blank_keys_raises() -> None:
+    """Blank values must surface a clear error.
+
+    Falling through to boto3's default chain would hide the user's
+    misconfiguration and authenticate with whatever ambient creds the
+    host happens to have.
+    """
+    with pytest.raises(ValueError, match="aws_access_key_id is required"):
+        AWSBedrockLLMParameters.validate(
+            {
+                "auth_type": "access_keys",
+                "model": "anthropic.claude-3-haiku-20240307-v1:0",
+                "region_name": "us-east-1",
+                "aws_access_key_id": "",
+                "aws_secret_access_key": "",
+            }
+        )
+
+
+def test_llm_access_keys_mode_whitespace_keys_raises() -> None:
+    """A whitespace-only secret is rejected just like an empty one."""
+    with pytest.raises(ValueError, match="aws_secret_access_key is required"):
+        AWSBedrockLLMParameters.validate(
+            {
+                "auth_type": "access_keys",
+                "model": "anthropic.claude-3-haiku-20240307-v1:0",
+                "region_name": "us-east-1",
+                "aws_access_key_id": "AKIAFAKE",
+                "aws_secret_access_key": "   ",
+            }
+        )
+
+
+def test_llm_unknown_auth_type_raises() -> None:
+    """A typo or non-UI client must not silently fall through."""
+    with pytest.raises(ValueError, match="Unknown auth_type"):
+        AWSBedrockLLMParameters.validate(
+            {
+                "auth_type": "access_key",  # typo: missing 's'
+                "model": "anthropic.claude-3-haiku-20240307-v1:0",
+                "region_name": "us-east-1",
+                "aws_access_key_id": "AKIAFAKE",
+                "aws_secret_access_key": "secret",
+            }
+        )
+
+
+def test_llm_other_params_preserved_through_strip() -> None:
+    """Non-credential params survive the auth-type handling.
+
+    model_id, aws_profile_name, region, and thinking config must pass
+    through both the strip and the resolver unchanged.
+    """
+    out = AWSBedrockLLMParameters.validate(
+        {
+            "auth_type": "iam_role",
+            "model": "anthropic.claude-3-7-sonnet-20250219-v1:0",
+            "region_name": "us-east-1",
+            "aws_profile_name": "dev-profile",
+            "model_id": (
+                "arn:aws:bedrock:us-east-1:1234:application-inference-profile/abc"
+            ),
+            "enable_thinking": True,
+            "budget_tokens": 4096,
+        }
+    )
+    assert out["aws_profile_name"] == "dev-profile"
+    assert out["aws_region_name"] == "us-east-1"
+    assert out["model_id"].endswith("application-inference-profile/abc")
+    assert out["thinking"] == {"type": "enabled", "budget_tokens": 4096}
+
+
+# ── Embedding: same auth_type matrix ─────────────────────────────────────────
+
+
+def test_embedding_legacy_no_auth_type_keeps_keys() -> None:
+    """Embedding config without auth_type keeps both keys in the output."""
+    out = AWSBedrockEmbeddingParameters.validate(
+        {
+            "model": "amazon.titan-embed-text-v2:0",
+            "region_name": "us-east-1",
+            "aws_access_key_id": "AKIAFAKE",
+            "aws_secret_access_key": "secret",
+        }
+    )
+    assert out["aws_access_key_id"] == "AKIAFAKE"
+    assert out["aws_secret_access_key"] == "secret"
+    assert "auth_type" not in out
+
+
+def test_embedding_access_keys_mode_keeps_keys() -> None:
+    """Explicit access_keys mode keeps both keys and omits auth_type."""
+    out = AWSBedrockEmbeddingParameters.validate(
+        {
+            "auth_type": "access_keys",
+            "model": "amazon.titan-embed-text-v2:0",
+            "region_name": "us-east-1",
+            "aws_access_key_id": "AKIAFAKE",
+            "aws_secret_access_key": "secret",
+        }
+    )
+    assert out["aws_access_key_id"] == "AKIAFAKE"
+    assert out["aws_secret_access_key"] == "secret"
+    assert "auth_type" not in out
+
+
+def test_embedding_iam_role_mode_drops_stale_keys() -> None:
+    """Embedding-side parity with the LLM stale-key fix."""
+    out = AWSBedrockEmbeddingParameters.validate(
+        {
+            "auth_type": "iam_role",
+            "model": "amazon.titan-embed-text-v2:0",
+            "region_name": "us-east-1",
+            "aws_access_key_id": "STALE_KEY",
+            "aws_secret_access_key": "STALE_SECRET",
+        }
+    )
+    assert "aws_access_key_id" not in out
+    assert "aws_secret_access_key" not in out
+    assert out["aws_region_name"] == "us-east-1"
+
+
+def test_embedding_iam_role_mode_with_no_keys() -> None:
+    """IAM Role mode with no key fields supplied yields no key entries."""
+    out = AWSBedrockEmbeddingParameters.validate(
+        {
+            "auth_type": "iam_role",
+            "model": "amazon.titan-embed-text-v2:0",
+            "region_name": "us-east-1",
+        }
+    )
+    assert "aws_access_key_id" not in out
+    assert "aws_secret_access_key" not in out
+
+
+def test_embedding_access_keys_mode_blank_keys_raises() -> None:
+    """Empty keys in access_keys mode raise ValueError naming the key."""
+    with pytest.raises(ValueError, match="aws_access_key_id is required"):
+        AWSBedrockEmbeddingParameters.validate(
+            {
+                "auth_type": "access_keys",
+                "model": "amazon.titan-embed-text-v2:0",
+                "region_name": "us-east-1",
+                "aws_access_key_id": "",
+                "aws_secret_access_key": "",
+            }
+        )
+
+
+def test_embedding_unknown_auth_type_raises() -> None:
+    """An unrecognised auth_type value raises ValueError."""
+    with pytest.raises(ValueError, match="Unknown auth_type"):
+        AWSBedrockEmbeddingParameters.validate(
+            {
+                "auth_type": "iamrole",  # typo
+                "model": "amazon.titan-embed-text-v2:0",
+                "region_name": "us-east-1",
+            }
+        )
+
+
+def test_embedding_region_required_when_absent() -> None:
+    """aws_region_name is still mandatory even though credentials are not."""
+    from pydantic import ValidationError
+
+    with pytest.raises(ValidationError):
+        AWSBedrockEmbeddingParameters.validate(
+            {
+                "auth_type": "iam_role",
+                "model": "amazon.titan-embed-text-v2:0",
+            }
+        )
diff --git a/workers/log_consumer/process_notification_buffer.py b/workers/log_consumer/process_notification_buffer.py
new file mode 100755
index 0000000000..7f93a8dfe6
--- /dev/null
+++ b/workers/log_consumer/process_notification_buffer.py
@@ -0,0 +1,110 @@
+#!/usr/bin/env python3
+"""Trigger backend processing of the notification buffer.
+
+Mirrors process_log_history.py: a thin wrapper around an internal API call
+that the log_consumer scheduler.sh fires on every tick. The backend owns the
+actual GROUP BY / SKIP LOCKED / dispatch logic. Idempotent — safe to run
+under multiple replicas (the backend's row-level lock prevents duplicate
+dispatch).
+
+Usage:
+    python process_notification_buffer.py
+"""
+
+import logging
+import os
+import sys
+
+import httpx
+
+logger = logging.getLogger(__name__)
+
+# Endpoint must match the URL registered in
+# backend/notification_v2/internal_urls.py + backend/backend/internal_base_urls.py
+PROCESS_BUFFER_ENDPOINT = "v1/webhook/buffer/process/"
+
+
+def process_notification_buffer() -> bool:
+    """Hit the backend's process-buffer endpoint; return True on success.
+
+    Reads INTERNAL_API_BASE_URL and INTERNAL_SERVICE_API_KEY from the
+    environment and POSTs to the endpoint with a bearer token.
+
+    Returns:
+        True when the backend answers 200 with a JSON object body. False on
+        a missing env var, a transport error, a non-200 status, or a body
+        that is not a JSON object, so the calling scheduler can log the
+        failure and proceed to the next tick. Never raises — the scheduler
+        is supposed to keep ticking.
+    """
+    internal_api_base_url = os.getenv("INTERNAL_API_BASE_URL")
+    internal_api_key = os.getenv("INTERNAL_SERVICE_API_KEY")
+
+    if not internal_api_base_url:
+        logger.error("INTERNAL_API_BASE_URL environment variable not set")
+        return False
+    if not internal_api_key:
+        logger.error("INTERNAL_SERVICE_API_KEY environment variable not set")
+        return False
+
+    url = f"{internal_api_base_url.rstrip('/')}/{PROCESS_BUFFER_ENDPOINT}"
+    # Longer timeout than process_log_history (60s vs 30s): a flush tick can
+    # involve multiple Celery dispatches, GC, and per-group rendering.
+    transport = httpx.HTTPTransport(retries=3)
+    try:
+        with httpx.Client(transport=transport) as client:
+            response = client.post(
+                url,
+                headers={"Authorization": f"Bearer {internal_api_key}"},
+                timeout=60.0,
+            )
+    except httpx.HTTPError as e:
+        logger.error("HTTP error calling process-buffer: %s", e)
+        return False
+    except Exception:
+        logger.exception("Unexpected error calling process-buffer")
+        return False
+
+    if response.status_code != 200:
+        logger.error(
+            "Backend returned status %s on process-buffer: %s",
+            response.status_code,
+            response.text[:500],
+        )
+        return False
+
+    # A 200 whose body is not a JSON object (e.g. a proxy's HTML page) must
+    # surface as a failed tick, not as an exception escaping this function.
+    try:
+        result = response.json()
+    except ValueError:
+        result = None
+    if not isinstance(result, dict):
+        logger.error(
+            "Backend returned an unexpected body on process-buffer: %s",
+            response.text[:500],
+        )
+        return False
+
+    dispatched_groups = result.get("dispatched_groups", 0)
+    gc_deleted_rows = result.get("gc_deleted_rows", 0)
+    # Truthiness rather than "> 0": still silent on idle ticks, and cannot
+    # raise if a counter comes back as null.
+    if dispatched_groups or gc_deleted_rows:
+        logger.info(
+            "Notification buffer flush: groups=%s rows=%s gc=%s",
+            dispatched_groups,
+            result.get("dispatched_rows", 0),
+            gc_deleted_rows,
+        )
+    return True
+
+
+if __name__ == "__main__":
+    # With no handler configured, logging's last-resort handler only emits
+    # WARNING and above, so the INFO flush summary would never be printed.
+    # Root stays at WARNING so only this module's INFO records are added.
+    logging.basicConfig(level=logging.WARNING)
+    logger.setLevel(logging.INFO)
+    success = process_notification_buffer()
+    sys.exit(0 if success else 1)
diff --git a/workers/log_consumer/scheduler.sh b/workers/log_consumer/scheduler.sh
index a5572b21eb..0bf7dca96d 100755
--- a/workers/log_consumer/scheduler.sh
+++ b/workers/log_consumer/scheduler.sh
@@ -1,19 +1,26 @@
 #!/usr/bin/env bash
-set -euo pipefail
+set -uo pipefail
+# Note: pipefail without -e — one task's failure must not abort the loop.
 
 INTERVAL="${LOG_HISTORY_CONSUMER_INTERVAL:-5}"
-TASK_NAME="process_log_history"
 
-# Task trigger command - can be overridden via environment variable
-DEFAULT_TRIGGER_CMD="/app/.venv/bin/python /app/log_consumer/process_log_history.py"
-TRIGGER_CMD="${TASK_TRIGGER_COMMAND:-$DEFAULT_TRIGGER_CMD}"
+# Task 1: log history consumer (existing).
+DEFAULT_LOG_HISTORY_CMD="/app/.venv/bin/python /app/log_consumer/process_log_history.py"
+LOG_HISTORY_CMD="${TASK_TRIGGER_COMMAND:-$DEFAULT_LOG_HISTORY_CMD}"
+
+# Task 2: notification buffer flush (UNS-611 clubbed dispatch).
+# The endpoint short-circuits on an empty PENDING set, so polling on the same
+# 5s tick is cheap. Real dispatch cadence is gated by NOTIFICATION_CLUB_INTERVAL
+# on the backend (rows precompute flush_after at enqueue time).
+DEFAULT_BUFFER_FLUSH_CMD="/app/.venv/bin/python /app/log_consumer/process_notification_buffer.py"
+BUFFER_FLUSH_CMD="${NOTIFICATION_BUFFER_TASK_COMMAND:-$DEFAULT_BUFFER_FLUSH_CMD}"
 
 echo "=========================================="
-echo "Log History Scheduler Starting"
+echo "Log Consumer Scheduler Starting"
 echo "=========================================="
-echo "Task: ${TASK_NAME}"
 echo "Interval: ${INTERVAL} seconds"
-echo "Trigger Command: ${TRIGGER_CMD}"
+echo "Task 1 (log history): ${LOG_HISTORY_CMD}"
+echo "Task 2 (notification buffer flush): ${BUFFER_FLUSH_CMD}"
 echo "=========================================="
 
 cleanup() {
@@ -27,20 +34,27 @@ cleanup() {
 
 trap cleanup SIGTERM SIGINT
 
+run_task() {
+    # $1 = display name, $2 = command. Runs the command via eval and logs
+    # success or the failing exit code; the exit code is not returned.
+    local task_name="$1"
+    local cmd="$2"
+    echo "[$(date '+%Y-%m-%d %H:%M:%S')] [Run #${run_count}] Triggering ${task_name}..."
+    if eval "${cmd}" 2>&1; then
+        echo "[$(date '+%Y-%m-%d %H:%M:%S')] [Run #${run_count}] ✓ ${task_name} OK"
+    else
+        local exit_code=$?
+        echo "[$(date '+%Y-%m-%d %H:%M:%S')] [Run #${run_count}] ✗ ${task_name} failed with exit code ${exit_code}"
+    fi
+}
+
 run_count=0
 
 while true; do
     run_count=$((run_count + 1))
 
-    echo "[$(date '+%Y-%m-%d %H:%M:%S')] [Run #${run_count}] Triggering ${TASK_NAME}..."
-
-    if eval "${TRIGGER_CMD}" 2>&1; then
-        echo "[$(date '+%Y-%m-%d %H:%M:%S')] [Run #${run_count}] ✓ Task completed successfully"
-    else
-        exit_code=$?
-        echo "[$(date '+%Y-%m-%d %H:%M:%S')] [Run #${run_count}] ✗ Task failed with exit code ${exit_code}"
-        echo "[$(date '+%Y-%m-%d %H:%M:%S')] [Run #${run_count}] Will retry after ${INTERVAL} seconds"
-    fi
+    run_task "process_log_history" "${LOG_HISTORY_CMD}"
+    run_task "process_notification_buffer" "${BUFFER_FLUSH_CMD}"
 
     echo "[$(date '+%Y-%m-%d %H:%M:%S')] Sleeping for ${INTERVAL} seconds..."
     echo ""
diff --git a/workers/shared/patterns/notification/helper.py b/workers/shared/patterns/notification/helper.py
index 19f78fbb99..f46385bf0b 100644
--- a/workers/shared/patterns/notification/helper.py
+++ b/workers/shared/patterns/notification/helper.py
@@ -19,6 +19,90 @@
 
 logger = logging.getLogger(__name__)
 
+# Mirrors notification_v2.enums.DeliveryMode.BATCHED. Worker stays string-only
+# so it does not import Django enums.
+DELIVERY_MODE_BATCHED = "BATCHED"
+ENQUEUE_BUFFER_ENDPOINT = "v1/webhook/buffer/enqueue/"
+
+
+def _enqueue_to_buffer(
+    api_client: Any,
+    notification: dict[str, Any],
+    payload: NotificationPayload,
+) -> bool:
+    """POST a single execution event to the backend's buffer endpoint.
+
+    Worker writes nothing to the DB itself — the backend owns NotificationBuffer
+    rows. Returns True on success and False on any failure (logged, not raised).
+    The caller currently ignores the result and deliberately does NOT fall back
+    to immediate dispatch, so a misconfigured or outage-mode backend can't
+    silently turn BATCHED into IMMEDIATE.
+    """
+    try:
+        api_client._make_request(
+            method="POST",
+            endpoint=ENQUEUE_BUFFER_ENDPOINT,
+            data={
+                "notification_id": notification["id"],
+                "execution_id": payload.execution_id,
+                "pipeline_id": payload.pipeline_id,
+                "pipeline_name": payload.pipeline_name,
+                "status": payload.status.value
+                if hasattr(payload.status, "value")
+                else payload.status,
+                "error_message": payload.error_message,
+                "platform": notification.get("platform"),
+            },
+            timeout=10,
+        )
+        logger.info(
+            "Enqueued BATCHED notification %s for pipeline %s execution %s",
+            notification["id"],
+            payload.pipeline_id,
+            payload.execution_id,
+        )
+        return True
+    except Exception as e:
+        logger.error(
+            "Failed to enqueue BATCHED notification %s for pipeline %s: %s",
+            notification["id"],
+            payload.pipeline_id,
+            e,
+        )
+        return False
+
+
+def _route_notification(
+    api_client: Any,
+    notification: dict[str, Any],
+    payload: NotificationPayload,
+) -> None:
+    """IMMEDIATE -> existing worker queue; BATCHED -> backend enqueue endpoint.
+
+    Defaults to IMMEDIATE when delivery_mode is missing so older backend
+    builds (pre-UNS-611) keep working unchanged.
+    """
+    if notification.get("notification_type") != "WEBHOOK":
+        logger.debug(
+            "Skipping non-webhook notification type: %s",
+            notification.get("notification_type"),
+        )
+        return
+
+    if notification.get("delivery_mode") == DELIVERY_MODE_BATCHED:
+        _enqueue_to_buffer(api_client, notification, payload)
+        return
+
+    send_notification_to_worker(
+        url=notification["url"],
+        payload=payload,
+        auth_type=notification.get("authorization_type", "NONE"),
+        auth_key=notification.get("authorization_key"),
+        auth_header=notification.get("authorization_header"),
+        max_retries=notification.get("max_retries", 0),
+        platform=notification.get("platform"),
+    )
+
 
 def get_webhook_headers(
     auth_type: str, auth_key: str | None, auth_header: str | None
@@ -140,20 +224,7 @@ def trigger_notification(
 
         # Send each notification
         for notification in active_notifications:
-            if notification.get("notification_type") == "WEBHOOK":
-                send_notification_to_worker(
-                    url=notification["url"],
-                    payload=notification_payload,
-                    auth_type=notification.get("authorization_type", "NONE"),
-                    auth_key=notification.get("authorization_key"),
-                    auth_header=notification.get("authorization_header"),
-                    max_retries=notification.get("max_retries", 0),
-                    platform=notification.get("platform"),
-                )
-            else:
-                logger.debug(
-                    f"Skipping non-webhook notification type: {notification.get('notification_type')}"
-                )
+            _route_notification(api_client, notification, notification_payload)
 
     except Exception as e:
         logger.error(f"Error triggering pipeline notifications for {pipeline_id}: {e}")
@@ -235,20 +306,7 @@ def trigger_pipeline_notifications(
 
         # Send each notification
         for notification in active_notifications:
-            if notification.get("notification_type") == "WEBHOOK":
-                send_notification_to_worker(
-                    url=notification["url"],
-                    payload=payload,
-                    auth_type=notification.get("authorization_type", "NONE"),
-                    auth_key=notification.get("authorization_key"),
-                    auth_header=notification.get("authorization_header"),
-                    max_retries=notification.get("max_retries", 0),
-                    platform=notification.get("platform"),
-                )
-            else:
-                logger.debug(
-                    f"Skipping non-webhook notification type: {notification.get('notification_type')}"
-                )
+            _route_notification(api_client, notification, payload)
 
     except Exception as e:
         logger.error(f"Error triggering pipeline notifications for {pipeline_id}: {e}")
@@ -316,20 +374,7 @@ def trigger_api_notifications(
 
         # Send each notification
         for notification in active_notifications:
-            if notification.get("notification_type") == "WEBHOOK":
-                send_notification_to_worker(
-                    url=notification["url"],
-                    payload=payload,
-                    auth_type=notification.get("authorization_type", "NONE"),
-                    auth_key=notification.get("authorization_key"),
-                    auth_header=notification.get("authorization_header"),
-                    max_retries=notification.get("max_retries", 0),
-                    platform=notification.get("platform"),
-                )
-            else:
-                logger.debug(
-                    f"Skipping non-webhook notification type: {notification.get('notification_type')}"
-                )
+            _route_notification(api_client, notification, payload)
 
     except Exception as e:
         logger.error(f"Error triggering API notifications for {api_id}: {e}")

From b8bf719fc58f2fef7a7cfed8add1cf3b1a254428 Mon Sep 17 00:00:00 2001
From: Kirtiman Mishra
 <110175055+kirtimanmishrazipstack@users.noreply.github.com>
Date: Tue, 12 May 2026 17:36:07 +0530
Subject: [PATCH 09/27] Uns 611 clubbed notification dispatch (#1959)

* batch notification

* notification slack
---
 backend/notification_v2/clubbed_renderer.py   | 193 +++++++++++------
 backend/notification_v2/helper.py             |   8 +
 backend/notification_v2/internal_api_views.py |   6 +
 .../provider/webhook/api_webhook.py           |  23 ++-
 .../provider/webhook/slack_webhook.py         |  55 ++---
 .../provider/webhook/webhook.py               |   6 +-
 .../notification/providers/_clubbed_format.py | 139 +++++++++++++
 workers/notification/providers/api_webhook.py |  36 ++--
 .../notification/providers/slack_webhook.py   | 194 ++----------------
 .../shared/patterns/notification/helper.py    |  18 +-
 10 files changed, 384 insertions(+), 294 deletions(-)
 create mode 100644 workers/notification/providers/_clubbed_format.py

diff --git a/backend/notification_v2/clubbed_renderer.py b/backend/notification_v2/clubbed_renderer.py
index 6fd0de0a84..ee1ca0c355 100644
--- a/backend/notification_v2/clubbed_renderer.py
+++ b/backend/notification_v2/clubbed_renderer.py
@@ -1,26 +1,39 @@
-"""Clubbed notification renderer.
+"""Canonical envelope + renderer for every dispatch — IMMEDIATE and BATCHED.
 
-Builds one canonical JSON envelope from a group of buffered execution events
-and emits the platform-appropriate dispatch payload. Stays separate from the
-single-event SlackWebhook / APIWebhook providers so immediate-dispatch behavior
-stays untouched.
-
-Envelope shape (always the same — single-event groups use this too so consumers
-never need to branch on "is this batched?"):
+The same envelope shape feeds every channel × mode cell so receivers never
+need to branch on "is this batched?":
 
     {
-        "kind": "batch",
         "summary": {
-            "pipeline": "<name>",
-            "interval_minutes": 30,
-            "total": N, "succeeded": S, "failed": F
+            "total": N, "succeeded": S, "failed": F,
+            "interval_minutes": int | None,   # None for IMMEDIATE
         },
-        "events": [{"execution_id": ..., "status": ..., "error": ...?}, ...]
+        "events": [
+            {
+                "type": "ETL" | "TASK" | "API",
+                "pipeline_name": "...",
+                "status": "ERROR" | "SUCCESS" | ...,
+                "execution_id": "...",
+                "timestamp": "2026-05-05T17:03:34+00:00",
+                "additional_data": {
+                    "total_files": int,
+                    "successful_files": int,
+                    "failed_files": int,
+                },
+                "error_message": "...",   # only on failure
+            },
+            ...
+        ]
     }
+
+Slack receives `{"text": "<mrkdwn>"}` pre-rendered from this envelope; API
+receivers see the envelope unchanged so programmatic consumers always parse
+the same shape. `pipeline_id` is intentionally absent from every event dict.
 """
 
 from __future__ import annotations
 
+import datetime
 import logging
 from typing import Any
 
@@ -28,17 +41,25 @@
 
 logger = logging.getLogger(__name__)
 
-# Hard cap on events per dispatch — extras roll over to the next flush tick.
-# Bounds memory + payload size and prevents a runaway backlog from creating an
-# unbounded HTTP body.
+# Hard cap on events per dispatch; the rest roll into the next flush tick.
 MAX_BATCH_SIZE = 500
-# How many events Slack renders inline before collapsing the rest under a
-# "… and K more" footer. Slack tolerates much larger payloads, but readability
-# tanks past ~25 lines.
+# Slack inlines this many events before collapsing the rest under an
+# "_… and K more_" footer. Slack tolerates much larger payloads, but
+# readability tanks past ~25 lines.
 SLACK_MAX_DISPLAY_EVENTS = 25
 
 _SUCCESS_STATUSES = {"COMPLETED", "SUCCESS"}
 
+# Middle dot (U+00B7) padded by single spaces — the per-event field separator.
+_SEPARATOR = " · "
+_MISSING = "—"  # em-dash placeholder for missing fields
+_DIVIDER = "———"  # triple em-dash divider between header and events
+
+# Slack emoji shortcodes — render the same as the literal unicode glyphs and
+# stay readable in source.
+_EMOJI_SUCCESS = ":white_check_mark:"
+_EMOJI_FAILURE = ":x:"
+
 
 def _is_success(status: str | None) -> bool:
     if not status:
@@ -46,83 +67,139 @@ def _is_success(status: str | None) -> bool:
     return status.upper() in _SUCCESS_STATUSES
 
 
+def _humanize_timestamp(iso: str | None) -> str:
+    """Render an ISO timestamp as `2026 May 11 11:38:31 AM` (unpadded day).
+
+    Returns the missing placeholder on falsy / unparseable input so a partial
+    row still renders. The day comes from `dt.day`, not non-portable `%-d`.
+    """
+    if not iso:
+        return _MISSING
+    try:
+        dt = datetime.datetime.fromisoformat(iso)
+    except (TypeError, ValueError):
+        return _MISSING
+    return f"{dt:%Y %b} {dt.day} {dt:%I:%M:%S %p}"
+
+
+def _format_file_count(event: dict[str, Any]) -> str:
+    """Render the file-count summary; empty string when no totals available."""
+    counts = event.get("additional_data") or {}
+    total = counts.get("total_files")
+    if total is None:
+        return ""
+    if _is_success(event.get("status")):
+        successful = counts.get("successful_files", 0)
+        return f"{_EMOJI_SUCCESS} {successful}/{total} files"
+    failed = counts.get("failed_files", 0)
+    return f"{_EMOJI_FAILURE} {failed}/{total} files"
+
+
+def _format_event_line(event: dict[str, Any]) -> str:
+    """Format one event as a single Slack mrkdwn line.
+
+    Fields are middle-dot separated; the file-count column is omitted when
+    `additional_data` has no `total_files`, so the line has 5 fields, not 6.
+    """
+    parts = [
+        _humanize_timestamp(event.get("timestamp")),
+        f"*{event.get('execution_id') or _MISSING}*",
+        event.get("type") or _MISSING,
+        event.get("pipeline_name") or _MISSING,
+        event.get("status") or _MISSING,
+    ]
+    file_count = _format_file_count(event)
+    if file_count:
+        parts.append(file_count)
+    return _SEPARATOR.join(parts)
+
+
 def _event_from_payload(payload: dict[str, Any]) -> dict[str, Any]:
+    """Project a buffered payload into the canonical per-event dict.
+
+    Unified shape across Slack/API and IMMEDIATE/BATCHED. `pipeline_id` is
+    intentionally dropped here — neither channel surfaces it. Missing keys
+    fall back to empty values so partial rows from older enqueue builds
+    still render.
+    """
     event: dict[str, Any] = {
-        "execution_id": payload.get("execution_id"),
-        "status": payload.get("status"),
+        "type": payload.get("type") or "",
+        "pipeline_name": payload.get("pipeline_name") or "",
+        "status": payload.get("status") or "",
+        "execution_id": payload.get("execution_id") or "",
+        "timestamp": payload.get("timestamp") or "",
+        "additional_data": payload.get("additional_data") or {},
     }
     error_message = payload.get("error_message")
     if error_message:
-        event["error"] = error_message
+        event["error_message"] = error_message
     return event
 
 
 def build_envelope(
-    payloads: list[dict[str, Any]], interval_seconds: int
+    payloads: list[dict[str, Any]],
+    interval_seconds: int | None,
 ) -> dict[str, Any]:
-    """Build the canonical batch envelope.
+    """Build the canonical envelope used by every dispatch path.
 
-    Caps the events list at MAX_BATCH_SIZE; oldest-first ordering is the
-    caller's responsibility (the flush job sorts by created_at).
+    `interval_seconds=None` signals IMMEDIATE — `summary.interval_minutes`
+    becomes null so consumers can distinguish modes if they need to. For
+    BATCHED, pass the per-org cadence in seconds (rendered as minutes).
     """
     capped = payloads[:MAX_BATCH_SIZE]
     succeeded = sum(1 for p in capped if _is_success(p.get("status")))
     failed = len(capped) - succeeded
-    # Multiple pipelines can share an (org, url, auth_sig) group; we surface
-    # the first one's name as a representative. Mixed-pipeline batches are
-    # rare in practice and a v2 enhancement would aggregate distinct names.
-    pipeline_name = capped[0].get("pipeline_name") if capped else None
+    interval_minutes: int | None
+    if interval_seconds is None:
+        interval_minutes = None
+    else:
+        interval_minutes = max(1, interval_seconds // 60)
     return {
-        "kind": "batch",
         "summary": {
-            "pipeline": pipeline_name,
-            "interval_minutes": max(1, interval_seconds // 60),
             "total": len(capped),
             "succeeded": succeeded,
             "failed": failed,
+            "interval_minutes": interval_minutes,
         },
         "events": [_event_from_payload(p) for p in capped],
     }
 
 
-def _slack_event_line(event: dict[str, Any]) -> str:
-    parts = [f"— {event.get('execution_id') or 'unknown'}: {event.get('status')}"]
-    if event.get("error"):
-        parts.append(f"({event['error']})")
-    return " ".join(parts)
-
-
 def render_for_slack(envelope: dict[str, Any]) -> dict[str, Any]:
-    """Format the envelope as a Slack-compatible payload dict.
+    """Render the envelope as `{"text": "<mrkdwn>"}` for Slack.
 
-    Returns the body shape Slack incoming webhooks expect (`text` field with
-    mrkdwn). Truncates inline events at SLACK_MAX_DISPLAY_EVENTS.
+    Header + divider are emitted for every dispatch — IMMEDIATE, BATCHED N=1,
+    and BATCHED N>1 all share the same shape. Visible events are capped at
+    SLACK_MAX_DISPLAY_EVENTS with an `_… and K more_` overflow footer.
     """
     summary = envelope["summary"]
     events: list[dict[str, Any]] = envelope["events"]
-    pipeline = summary.get("pipeline") or "pipeline"
-
-    header = f"*[Unstract] {summary['total']} executions for `{pipeline}`*"
-    counts = f"✅ {summary['succeeded']} succeeded  ❌ {summary['failed']} failed"
-
+    total = summary["total"]
+    noun = "execution" if total == 1 else "executions"
+    header = (
+        f"*{total} {noun}* "
+        f"({_EMOJI_SUCCESS} {summary['succeeded']} succeeded  "
+        f"{_EMOJI_FAILURE} {summary['failed']} failed)"
+    )
     visible = events[:SLACK_MAX_DISPLAY_EVENTS]
-    lines = [_slack_event_line(e) for e in visible]
+    sections: list[str] = [header, _DIVIDER]
+    sections.extend(_format_event_line(e) for e in visible)
     overflow = len(events) - len(visible)
     if overflow > 0:
-        lines.append(f"… and {overflow} more executions")
-
-    body = "\n".join([header, counts, *lines])
-    return {"text": body}
+        sections.append(_DIVIDER)
+        sections.append(f"_… and {overflow} more executions_")
+    return {"text": "\n".join(sections)}
 
 
 def render_clubbed_message(
-    payloads: list[dict[str, Any]], platform: str, interval_seconds: int
+    payloads: list[dict[str, Any]],
+    platform: str,
+    interval_seconds: int | None,
 ) -> dict[str, Any]:
-    """Top-level entry point — returns the dispatch body for ``platform``.
+    """Top-level entry — returns the dispatch body for `platform`.
 
-    Slack receives the rendered text payload; raw API webhooks receive the
-    canonical envelope unchanged so downstream consumers can parse it
-    programmatically.
+    Used by every dispatch site (BATCHED flush, IMMEDIATE backend providers)
+    so the receiver-visible payload is identical regardless of mode.
     """
     envelope = build_envelope(payloads, interval_seconds)
     if platform == PlatformType.SLACK.value:
diff --git a/backend/notification_v2/helper.py b/backend/notification_v2/helper.py
index f217f2da18..908c0dd993 100644
--- a/backend/notification_v2/helper.py
+++ b/backend/notification_v2/helper.py
@@ -168,6 +168,14 @@ def enqueue(notification: Notification, payload: dict[str, Any]) -> Notification
     auth_sig = compute_auth_sig(notification)
     platform = notification.platform or PlatformType.API.value
 
+    # Stamp a buffered-at timestamp so renderers can surface it consistently
+    # alongside IMMEDIATE. Worker callers already supply one; backend
+    # dispatchers (PipelineStatusPayload.to_dict) don't, so default here.
+    payload = {
+        **payload,
+        "timestamp": payload.get("timestamp") or timezone.now().isoformat(),
+    }
+
     buffer_row = NotificationBuffer.objects.create(
         notification=notification,
         organization=organization,
diff --git a/backend/notification_v2/internal_api_views.py b/backend/notification_v2/internal_api_views.py
index 396bfb2081..09f3a83f5d 100644
--- a/backend/notification_v2/internal_api_views.py
+++ b/backend/notification_v2/internal_api_views.py
@@ -350,13 +350,19 @@ def enqueue_notification_buffer(request: HttpRequest) -> JsonResponse:
             status=409,
         )
 
+    # type / timestamp / additional_data stay optional during rollout — older
+    # worker builds that don't forward them still produce a usable row
+    # (renderer shows "—" for a missing type and omits the file-count column).
     payload = {
+        "type": body.get("type", ""),
         "execution_id": body["execution_id"],
         "pipeline_id": body["pipeline_id"],
         "pipeline_name": body["pipeline_name"],
         "status": body["status"],
         "error_message": body.get("error_message"),
         "platform": body["platform"],
+        "timestamp": body.get("timestamp"),
+        "additional_data": body.get("additional_data") or {},
     }
     try:
         buffer_row = enqueue(notification, payload)
diff --git a/backend/notification_v2/provider/webhook/api_webhook.py b/backend/notification_v2/provider/webhook/api_webhook.py
index 9f1264b9e7..f1b2d347c0 100644
--- a/backend/notification_v2/provider/webhook/api_webhook.py
+++ b/backend/notification_v2/provider/webhook/api_webhook.py
@@ -1,13 +1,30 @@
+from typing import Any
+
+from notification_v2.clubbed_renderer import build_envelope
 from notification_v2.provider.webhook.webhook import Webhook
 
 
 class APIWebhook(Webhook):
-    def send(self):
-        """Send the API webhook notification."""
+    def send(self) -> None:
+        """Send the API webhook notification.
+
+        Wraps the IMMEDIATE event in the canonical envelope before queueing
+        so the receiver-visible JSON shape matches BATCHED dispatches —
+        `{"summary": {...}, "events": [{...}]}`.
+        """
+        self.payload = self.format_payload()
         super().send()
 
-    def get_headers(self):
+    def get_headers(self) -> dict[str, str]:
         """API-specific headers."""
         headers = super().get_headers()
         headers["Content-Type"] = "application/json"
         return headers
+
+    def format_payload(self) -> dict[str, Any]:
+        """Wrap a single IMMEDIATE event in the canonical envelope.
+
+        `interval_seconds=None` -> `summary.interval_minutes` is null;
+        receivers can use that to distinguish IMMEDIATE from BATCHED.
+        """
+        return build_envelope(payloads=[self.payload], interval_seconds=None)
diff --git a/backend/notification_v2/provider/webhook/slack_webhook.py b/backend/notification_v2/provider/webhook/slack_webhook.py
index 45e260b680..4eb8c599d2 100644
--- a/backend/notification_v2/provider/webhook/slack_webhook.py
+++ b/backend/notification_v2/provider/webhook/slack_webhook.py
@@ -1,60 +1,35 @@
 import logging
+from typing import Any
 
+from notification_v2.clubbed_renderer import render_clubbed_message
+from notification_v2.enums import PlatformType
 from notification_v2.provider.webhook.webhook import Webhook
 
 logger = logging.getLogger(__name__)
 
 
 class SlackWebhook(Webhook):
-    def send(self):
+    def send(self) -> None:
         """Send the Slack webhook notification."""
         formatted_payload = self.format_payload()
         self.payload = formatted_payload
         super().send()
 
-    def get_headers(self):
+    def get_headers(self) -> dict[str, str]:
         """Slack-specific headers."""
         headers = super().get_headers()
         headers["Content-Type"] = "application/json"
         return headers
 
-    def format_payload(self) -> dict:
-        """Format the payload to match Slack's expected structure."""
-        if "text" not in self.payload:
-            # Construct a basic Slack message with 'text' field
-            formatted_payload = {
-                "text": "Notification",
-                "blocks": self.create_blocks_from_payload(),
-            }
-        else:
-            # If 'text' is already present, format accordingly
-            formatted_payload = {
-                "text": self.payload.pop("text"),
-                "blocks": self.create_blocks_from_payload(),
-            }
-        return formatted_payload
+    def format_payload(self) -> dict[str, Any]:
+        """Render the IMMEDIATE event through the canonical envelope.
 
-    def create_blocks_from_payload(self) -> list:
-        """Create Slack blocks from the given payload."""
-        blocks = []
-        # Header
-        blocks.append(
-            {
-                "type": "section",
-                "text": {"type": "mrkdwn", "text": "*Unstract Update:*"},
-            }
+        Single shared renderer for IMMEDIATE and BATCHED so receivers see the
+        same Slack body shape regardless of delivery mode. `interval_seconds`
+        is None for IMMEDIATE — `summary.interval_minutes` resolves to null.
+        """
+        return render_clubbed_message(
+            payloads=[self.payload],
+            platform=PlatformType.SLACK.value,
+            interval_seconds=None,
         )
-        # Add a divider for separation
-        blocks.append({"type": "divider"})
-        # Add each key-value pair to the blocks
-        for key, value in self.payload.items():
-            formatted_key = key.replace("_", " ").title()
-            blocks.append(
-                {
-                    "type": "section",
-                    "text": {"type": "mrkdwn", "text": f"*{formatted_key}:* {value}"},
-                }
-            )
-        # Footer
-        blocks.append({"type": "section", "text": {"type": "mrkdwn", "text": "*---*"}})
-        return blocks
diff --git a/backend/notification_v2/provider/webhook/webhook.py b/backend/notification_v2/provider/webhook/webhook.py
index 549336a5f9..40ddc53e61 100644
--- a/backend/notification_v2/provider/webhook/webhook.py
+++ b/backend/notification_v2/provider/webhook/webhook.py
@@ -17,7 +17,7 @@ class HeaderConstants:
 
 
 class Webhook(NotificationProvider):
-    def send(self):
+    def send(self) -> None:
         """Send the webhook notification."""
         try:
             headers = self.get_headers()
@@ -51,7 +51,7 @@ def validate(self):
             raise ValueError("Payload is required.")
         return super().validate()
 
-    def get_headers(self):
+    def get_headers(self) -> dict[str, str]:
         """Get the headers for the notification based on the authorization type and key.
 
         Raises:
@@ -60,7 +60,7 @@ def get_headers(self):
         Returns:
             dict[str, str]: A dictionary containing the headers.
         """
-        headers = {}
+        headers: dict[str, str] = {}
         try:
             authorization_type = AuthorizationType(
                 self.notification.authorization_type.upper()
diff --git a/workers/notification/providers/_clubbed_format.py b/workers/notification/providers/_clubbed_format.py
new file mode 100644
index 0000000000..dfcfa4add8
--- /dev/null
+++ b/workers/notification/providers/_clubbed_format.py
@@ -0,0 +1,139 @@
+"""Worker-side mirror of backend/notification_v2/clubbed_renderer.
+
+Produces the same envelope shape and Slack mrkdwn body the backend renders
+so worker-callback IMMEDIATE payloads (flat per-event dicts) match the
+canonical wire format used by backend BATCHED dispatches. Backend pre-renders
+for its own dispatches — this module covers only the worker-callback IMMEDIATE
+path. Keep the constants and string output byte-identical to
+`backend/notification_v2/clubbed_renderer.py`; promote to `unstract/core/` if
+a third site ever needs the same logic.
+"""
+
+from __future__ import annotations
+
+import datetime
+from typing import Any
+
+MAX_BATCH_SIZE = 500
+SLACK_MAX_DISPLAY_EVENTS = 25
+
+_SUCCESS_STATUSES = {"COMPLETED", "SUCCESS"}
+_SEPARATOR = " · "
+_MISSING = "—"
+_DIVIDER = "———"
+_EMOJI_SUCCESS = ":white_check_mark:"
+_EMOJI_FAILURE = ":x:"
+
+
+def _is_success(status: str | None) -> bool:
+    if not status:
+        return False
+    return status.upper() in _SUCCESS_STATUSES
+
+
+def _humanize_timestamp(iso: str | None) -> str:
+    """Render ISO `iso` like `2026 May 11 11:38:31 AM`; `_MISSING` if unusable."""
+    try:
+        dt = datetime.datetime.fromisoformat(iso or "")
+    except (TypeError, ValueError):
+        return _MISSING
+    # dt.day instead of "%-d": the no-padding flag is not portable strftime.
+    return f"{dt:%Y %b} {dt.day} {dt:%I:%M:%S %p}"
+
+
+def _format_file_count(event: dict[str, Any]) -> str:
+    counts = event.get("additional_data") or {}
+    total = counts.get("total_files")
+    if total is None:
+        return ""
+    if _is_success(event.get("status")):
+        successful = counts.get("successful_files", 0)
+        return f"{_EMOJI_SUCCESS} {successful}/{total} files"
+    failed = counts.get("failed_files", 0)
+    return f"{_EMOJI_FAILURE} {failed}/{total} files"
+
+
+def _format_event_line(event: dict[str, Any]) -> str:
+    parts = [
+        _humanize_timestamp(event.get("timestamp")),
+        f"*{event.get('execution_id') or _MISSING}*",
+        event.get("type") or _MISSING,
+        event.get("pipeline_name") or _MISSING,
+        event.get("status") or _MISSING,
+    ]
+    file_count = _format_file_count(event)
+    if file_count:
+        parts.append(file_count)
+    return _SEPARATOR.join(parts)
+
+
+def _event_from_payload(payload: dict[str, Any]) -> dict[str, Any]:
+    """Project a flat per-event payload into the canonical shape.
+
+    Drops `pipeline_id` and `_source` — neither appears in receiver-visible
+    output. Mirrors the backend projection so renderer input is identical.
+    """
+    event: dict[str, Any] = {
+        "type": payload.get("type") or "",
+        "pipeline_name": payload.get("pipeline_name") or "",
+        "status": payload.get("status") or "",
+        "execution_id": payload.get("execution_id") or "",
+        "timestamp": payload.get("timestamp") or "",
+        "additional_data": payload.get("additional_data") or {},
+    }
+    error_message = payload.get("error_message")
+    if error_message:
+        event["error_message"] = error_message
+    return event
+
+
+def build_envelope(
+    payloads: list[dict[str, Any]],
+    interval_seconds: int | None,
+) -> dict[str, Any]:
+    """Build the canonical `{summary, events}` envelope.
+
+    `interval_seconds=None` for IMMEDIATE -> `summary.interval_minutes` null.
+    """
+    capped = payloads[:MAX_BATCH_SIZE]
+    succeeded = sum(1 for p in capped if _is_success(p.get("status")))
+    failed = len(capped) - succeeded
+    interval_minutes: int | None
+    if interval_seconds is None:
+        interval_minutes = None
+    else:
+        interval_minutes = max(1, interval_seconds // 60)
+    return {
+        "summary": {
+            "total": len(capped),
+            "succeeded": succeeded,
+            "failed": failed,
+            "interval_minutes": interval_minutes,
+        },
+        "events": [_event_from_payload(p) for p in capped],
+    }
+
+
+def render_slack_text(envelope: dict[str, Any]) -> str:
+    """Render the envelope as Slack mrkdwn body text.
+
+    Always emits header + divider regardless of event count so IMMEDIATE,
+    BATCHED N=1, and BATCHED N>1 all share the same shape.
+    """
+    summary = envelope["summary"]
+    events: list[dict[str, Any]] = envelope["events"]
+    total = summary["total"]
+    noun = "execution" if total == 1 else "executions"
+    header = (
+        f"*{total} {noun}* "
+        f"({_EMOJI_SUCCESS} {summary['succeeded']} succeeded  "
+        f"{_EMOJI_FAILURE} {summary['failed']} failed)"
+    )
+    visible = events[:SLACK_MAX_DISPLAY_EVENTS]
+    sections: list[str] = [header, _DIVIDER]
+    sections.extend(_format_event_line(e) for e in visible)
+    overflow = len(events) - len(visible)
+    if overflow > 0:
+        sections.append(_DIVIDER)
+        sections.append(f"_… and {overflow} more executions_")
+    return "\n".join(sections)
diff --git a/workers/notification/providers/api_webhook.py b/workers/notification/providers/api_webhook.py
index 8c54d2d19d..19ff1d12c3 100644
--- a/workers/notification/providers/api_webhook.py
+++ b/workers/notification/providers/api_webhook.py
@@ -1,10 +1,14 @@
 """API Webhook Notification Provider
 
-Standard API webhook provider for generic webhook endpoints.
+Wraps worker-callback IMMEDIATE payloads (flat per-event dict) in the
+canonical envelope so API webhook receivers always see the same
+``{"summary": {...}, "events": [...]}`` shape — IMMEDIATE or BATCHED.
+Backend dispatches already arrive in envelope form and pass through.
 """
 
 from typing import Any
 
+from notification.providers._clubbed_format import build_envelope
 from notification.providers.webhook_provider import WebhookProvider
 from shared.infrastructure.logging import WorkerLogger
 
@@ -14,11 +18,12 @@
 class APIWebhook(WebhookProvider):
     """Standard API webhook provider.
 
-    Handles generic webhook notifications without platform-specific formatting.
-    Sends the payload as-is in JSON format.
+    Normalises the payload to the canonical envelope before POSTing so
+    programmatic consumers parse one schema regardless of how the
+    notification was produced.
     """
 
-    def __init__(self):
+    def __init__(self) -> None:
         """Initialize API webhook provider."""
         super().__init__()
         self.provider_name = "APIWebhook"
@@ -26,16 +31,17 @@ def __init__(self):
     def prepare_data(self, notification_data: dict[str, Any]) -> dict[str, Any]:
         """Prepare API webhook data.
 
-        For standard API webhooks, we send the payload as-is without
-        any special formatting.
+        Wraps a flat per-event payload in the canonical envelope; payloads
+        already in envelope shape (backend-built) pass through.
+        """
+        prepared_data = super().prepare_data(notification_data)
 
-        Args:
-            notification_data: Raw notification data
+        if "payload" in prepared_data:
+            payload = prepared_data["payload"]
+            if isinstance(payload, dict) and "events" not in payload:
+                prepared_data["payload"] = build_envelope(
+                    payloads=[payload], interval_seconds=None
+                )
 
-        Returns:
-            Prepared notification data
-        """
-        logger.debug(
-            f"Preparing standard API webhook data for {notification_data.get('url')}"
-        )
-        return super().prepare_data(notification_data)
+        logger.debug(f"Prepared API webhook data for {notification_data.get('url')}")
+        return prepared_data
diff --git a/workers/notification/providers/slack_webhook.py b/workers/notification/providers/slack_webhook.py
index 04e3532fa3..4532af5672 100644
--- a/workers/notification/providers/slack_webhook.py
+++ b/workers/notification/providers/slack_webhook.py
@@ -1,11 +1,17 @@
 """Slack Webhook Notification Provider
 
-This provider handles Slack-specific webhook notifications with proper
-payload formatting for Slack's Block Kit API.
+Renders worker-callback IMMEDIATE payloads (flat per-event dict) into the
+same single-line Slack body the backend produces for IMMEDIATE/BATCHED via
+clubbed_renderer. Backend-rendered payloads (`{"text": "<mrkdwn>"}`) pass
+through unchanged.
 """
 
 from typing import Any
 
+from notification.providers._clubbed_format import (
+    build_envelope,
+    render_slack_text,
+)
 from notification.providers.webhook_provider import WebhookProvider
 from shared.infrastructure.logging import WorkerLogger
 
@@ -15,11 +21,11 @@
 class SlackWebhook(WebhookProvider):
     """Slack-specific webhook provider.
 
-    Formats payloads according to Slack's expected structure,
-    including support for Block Kit formatting.
+    Renders flat IMMEDIATE payloads via the worker-side mirror of the backend
+    clubbed renderer, then sends them as Slack-native ``text`` mrkdwn.
     """
 
-    def __init__(self):
+    def __init__(self) -> None:
         """Initialize Slack webhook provider."""
         super().__init__()
         self.provider_name = "SlackWebhook"
@@ -27,9 +33,6 @@ def __init__(self):
     def prepare_data(self, notification_data: dict[str, Any]) -> dict[str, Any]:
         """Prepare Slack-specific webhook data.
 
-        Formats the payload to match Slack's expected structure
-        with 'text' field and optional Block Kit blocks.
-
         Args:
             notification_data: Raw notification data
 
@@ -38,7 +41,6 @@ def prepare_data(self, notification_data: dict[str, Any]) -> dict[str, Any]:
         """
         prepared_data = super().prepare_data(notification_data)
 
-        # Format payload for Slack
         if "payload" in prepared_data:
             prepared_data["payload"] = self.format_payload(prepared_data["payload"])
 
@@ -47,170 +49,18 @@ def prepare_data(self, notification_data: dict[str, Any]) -> dict[str, Any]:
     def format_payload(self, payload: dict[str, Any]) -> dict[str, Any]:
         """Format the payload to match Slack's expected structure.
 
-        Args:
-            payload: Original payload
-
-        Returns:
-            Slack-formatted payload with 'text' field and optional blocks
-        """
-        # If payload already has 'text' field, enhance it with blocks
-        if "text" in payload:
-            formatted_payload = {
-                "text": payload.pop("text"),
-                "blocks": self.create_blocks_from_payload(payload),
-            }
-        else:
-            # Construct a Slack message from the payload
-            formatted_payload = {
-                "text": self._get_summary_text(payload),
-                "blocks": self.create_blocks_from_payload(payload),
-            }
-
-        return formatted_payload
-
-    def create_blocks_from_payload(self, payload: dict[str, Any]) -> list[dict[str, Any]]:
-        """Create Slack Block Kit blocks from the payload.
-
-        Args:
-            payload: Payload to convert to blocks
-
-        Returns:
-            List of Slack Block Kit blocks
+        Two input shapes are accepted:
+        - Backend-rendered ``{"text": "<mrkdwn>"}`` (BATCHED dispatch and
+          backend IMMEDIATE through ``clubbed_renderer``) — passed through.
+        - Flat per-event dict from the worker-callback IMMEDIATE path —
+          wrapped in a single-event envelope and rendered to the canonical
+          single-line mrkdwn body.
         """
-        blocks = []
-
-        # Header block
-        blocks.append(
-            {
-                "type": "section",
-                "text": {"type": "mrkdwn", "text": "*Unstract Notification*"},
-            }
-        )
-
-        # Add divider for visual separation
-        blocks.append({"type": "divider"})
-
-        # Add each key-value pair as a section
-        for key, value in payload.items():
-            if value is None or value == "":
-                continue
-
-            # Format key for display
-            formatted_key = self._format_key(key)
-
-            # Format value based on type
-            formatted_value = self._format_value(value)
-
-            # Create section block with inline format
-            blocks.append(
-                {
-                    "type": "section",
-                    "text": {
-                        "type": "mrkdwn",
-                        "text": f"*{formatted_key}:* {formatted_value}",
-                    },
-                }
-            )
-
-        # Add timestamp footer if not already present
-        if not any("timestamp" in str(block).lower() for block in blocks):
-            from datetime import datetime
-
-            blocks.append({"type": "divider"})
-            blocks.append(
-                {
-                    "type": "context",
-                    "elements": [
-                        {
-                            "type": "mrkdwn",
-                            "text": f"_Sent at {datetime.now().strftime('%Y-%m-%d %H:%M:%S UTC')}_",
-                        }
-                    ],
-                }
-            )
-
-        return blocks
-
-    def _get_summary_text(self, payload: dict[str, Any]) -> str:
-        """Generate summary text from payload.
+        if "text" in payload and len(payload) == 1:
+            return {"text": payload["text"]}
 
-        Args:
-            payload: Payload to summarize
-
-        Returns:
-            Summary text for Slack notification
-        """
-        # Priority order for summary fields
-        summary_fields = [
-            "message",
-            "status",
-            "pipeline_name",
-            "workflow_name",
-            "api_name",
-            "error",
-            "result",
-            "summary",
-        ]
-
-        for field in summary_fields:
-            if field in payload and payload[field]:
-                return str(payload[field])
-
-        # Default summary
-        return "Unstract Notification"
-
-    def _format_key(self, key: str) -> str:
-        """Format dictionary key for display.
-
-        Args:
-            key: Raw key name
-
-        Returns:
-            Formatted key for display
-        """
-        # Replace underscores with spaces and capitalize
-        formatted = key.replace("_", " ").title()
-
-        # Special formatting for known keys
-        key_mapping = {
-            "Pipeline Name": "Pipeline Name",
-            "Api Name": "API Name",
-            "Workflow Name": "Workflow Name",
-            "Status": "Status",
-            "Error": "Error",
-            "Success": "Success",
-            "Execution Id": "Execution Id",
-            "Organization Id": "Organization Id",
-        }
-
-        return key_mapping.get(formatted, formatted)
-
-    def _format_value(self, value: Any) -> str:
-        """Format value for Slack display.
-
-        Args:
-            value: Value to format
-
-        Returns:
-            Formatted value string
-        """
-        if isinstance(value, bool):
-            return "✅ Yes" if value else "❌ No"
-        elif isinstance(value, (list, tuple)):
-            return "\n• " + "\n• ".join(str(item) for item in value)
-        elif isinstance(value, dict):
-            # Inline {Key: Value, Key: Value} so the receiver sees the
-            # whole dict on one line instead of a bulleted block.
-            items = [f"{self._format_key(k)}: {v}" for k, v in value.items()]
-            return "{" + ", ".join(items) + "}"
-        elif value is None:
-            return "_Not specified_"
-        else:
-            # Format long strings
-            value_str = str(value)
-            if len(value_str) > 500:
-                return value_str[:497] + "..."
-            return value_str
+        envelope = build_envelope(payloads=[payload], interval_seconds=None)
+        return {"text": render_slack_text(envelope)}
 
     def get_destination(self, notification_data: dict[str, Any]) -> str:
         """Extract webhook URL from notification data with masking for security."""
@@ -229,4 +79,4 @@ def get_destination(self, notification_data: dict[str, Any]) -> str:
                 # Mask long URLs that might contain tokens
                 return url[:30] + "..." + url[-10:]
 
-        return url
+        return str(url)
diff --git a/workers/shared/patterns/notification/helper.py b/workers/shared/patterns/notification/helper.py
index f46385bf0b..0148bc2f5f 100644
--- a/workers/shared/patterns/notification/helper.py
+++ b/workers/shared/patterns/notification/helper.py
@@ -39,19 +39,31 @@ def _enqueue_to_buffer(
     outage-mode backend can't silently turn BATCHED into IMMEDIATE.
     """
     try:
+        # Forward the full per-event shape so the backend renderer can match
+        # IMMEDIATE's KV layout per event (Type / Pipeline Id / Pipeline Name
+        # / Status / Execution Id / Timestamp / Additional Data). Older
+        # backend builds that ignore the extra fields stay unaffected.
+        payload_type = (
+            payload.type.value if hasattr(payload.type, "value") else payload.type
+        )
+        payload_status = (
+            payload.status.value if hasattr(payload.status, "value") else payload.status
+        )
+        payload_timestamp = payload.timestamp.isoformat() if payload.timestamp else None
         api_client._make_request(
             method="POST",
             endpoint=ENQUEUE_BUFFER_ENDPOINT,
             data={
                 "notification_id": notification["id"],
+                "type": payload_type,
                 "execution_id": payload.execution_id,
                 "pipeline_id": payload.pipeline_id,
                 "pipeline_name": payload.pipeline_name,
-                "status": payload.status.value
-                if hasattr(payload.status, "value")
-                else payload.status,
+                "status": payload_status,
                 "error_message": payload.error_message,
                 "platform": notification.get("platform"),
+                "timestamp": payload_timestamp,
+                "additional_data": payload.additional_data or {},
             },
             timeout=10,
         )

From 37930d22fc82a6c1d8d9ca67843cb6cae531fc6f Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Tue, 12 May 2026 18:57:24 +0530
Subject: [PATCH 10/27] notification API

---
 backend/notification_v2/clubbed_renderer.py   | 36 ++++++-------------
 backend/notification_v2/internal_api_views.py |  8 +----
 .../provider/webhook/api_webhook.py           |  6 ++--
 .../provider/webhook/slack_webhook.py         |  4 +--
 .../notification/providers/_clubbed_format.py | 21 ++++-------
 workers/notification/providers/api_webhook.py |  4 +--
 .../notification/providers/slack_webhook.py   |  2 +-
 7 files changed, 25 insertions(+), 56 deletions(-)

diff --git a/backend/notification_v2/clubbed_renderer.py b/backend/notification_v2/clubbed_renderer.py
index ee1ca0c355..fc85120f7a 100644
--- a/backend/notification_v2/clubbed_renderer.py
+++ b/backend/notification_v2/clubbed_renderer.py
@@ -4,17 +4,14 @@
 need to branch on "is this batched?":
 
     {
-        "summary": {
-            "total": N, "succeeded": S, "failed": F,
-            "interval_minutes": int | None,   # None for IMMEDIATE
-        },
+        "summary": {"total": N, "succeeded": S, "failed": F},
         "events": [
             {
                 "type": "ETL" | "TASK" | "API",
                 "pipeline_name": "...",
                 "status": "ERROR" | "SUCCESS" | ...,
                 "execution_id": "...",
-                "timestamp": "2026-05-05T17:03:34+00:00",
+                "timestamp": "2026 May 5 5:03:34 PM",
                 "additional_data": {
                     "total_files": int,
                     "successful_files": int,
@@ -102,7 +99,7 @@ def _format_event_line(event: dict[str, Any]) -> str:
     `additional_data` is empty so the line collapses to 5 fields, not 6.
     """
     parts = [
-        _humanize_timestamp(event.get("timestamp")),
+        event.get("timestamp") or _MISSING,
         f"*{event.get('execution_id') or _MISSING}*",
         event.get("type") or _MISSING,
         event.get("pipeline_name") or _MISSING,
@@ -118,16 +115,16 @@ def _event_from_payload(payload: dict[str, Any]) -> dict[str, Any]:
     """Project a buffered payload into the canonical per-event dict.
 
     Unified shape across Slack/API and IMMEDIATE/BATCHED. `pipeline_id` is
-    intentionally dropped here — neither channel surfaces it. Missing keys
-    fall back to empty values so partial rows from older enqueue builds
-    still render.
+    intentionally dropped here — neither channel surfaces it. Timestamps are
+    humanized once at projection so Slack and API consumers see the same
+    string (implicit UTC, no timezone suffix).
     """
     event: dict[str, Any] = {
         "type": payload.get("type") or "",
         "pipeline_name": payload.get("pipeline_name") or "",
         "status": payload.get("status") or "",
         "execution_id": payload.get("execution_id") or "",
-        "timestamp": payload.get("timestamp") or "",
+        "timestamp": _humanize_timestamp(payload.get("timestamp")),
         "additional_data": payload.get("additional_data") or {},
     }
     error_message = payload.get("error_message")
@@ -136,30 +133,20 @@ def _event_from_payload(payload: dict[str, Any]) -> dict[str, Any]:
     return event
 
 
-def build_envelope(
-    payloads: list[dict[str, Any]],
-    interval_seconds: int | None,
-) -> dict[str, Any]:
+def build_envelope(payloads: list[dict[str, Any]]) -> dict[str, Any]:
     """Build the canonical envelope used by every dispatch path.
 
-    `interval_seconds=None` signals IMMEDIATE — `summary.interval_minutes`
-    becomes null so consumers can distinguish modes if they need to. For
-    BATCHED, pass the per-org cadence in seconds (rendered as minutes).
+    Summary carries only `{total, succeeded, failed}` — same shape for
+    IMMEDIATE and BATCHED so receivers parse one envelope, not two.
     """
     capped = payloads[:MAX_BATCH_SIZE]
     succeeded = sum(1 for p in capped if _is_success(p.get("status")))
     failed = len(capped) - succeeded
-    interval_minutes: int | None
-    if interval_seconds is None:
-        interval_minutes = None
-    else:
-        interval_minutes = max(1, interval_seconds // 60)
     return {
         "summary": {
             "total": len(capped),
             "succeeded": succeeded,
             "failed": failed,
-            "interval_minutes": interval_minutes,
         },
         "events": [_event_from_payload(p) for p in capped],
     }
@@ -194,14 +181,13 @@ def render_for_slack(envelope: dict[str, Any]) -> dict[str, Any]:
 def render_clubbed_message(
     payloads: list[dict[str, Any]],
     platform: str,
-    interval_seconds: int | None,
 ) -> dict[str, Any]:
     """Top-level entry — returns the dispatch body for `platform`.
 
     Used by every dispatch site (BATCHED flush, IMMEDIATE backend providers)
     so the receiver-visible payload is identical regardless of mode.
     """
-    envelope = build_envelope(payloads, interval_seconds)
+    envelope = build_envelope(payloads)
     if platform == PlatformType.SLACK.value:
         return render_for_slack(envelope)
     if platform == PlatformType.API.value:
diff --git a/backend/notification_v2/internal_api_views.py b/backend/notification_v2/internal_api_views.py
index 09f3a83f5d..bf07e2c9c4 100644
--- a/backend/notification_v2/internal_api_views.py
+++ b/backend/notification_v2/internal_api_views.py
@@ -34,7 +34,6 @@
 from notification_v2.helper import (
     build_webhook_headers,
     enqueue,
-    get_org_club_interval_seconds,
     webhook_url_hash,
 )
 from notification_v2.models import Notification, NotificationBuffer
@@ -423,12 +422,7 @@ def _dispatch_group(
         first_notification = rows[0].notification
         platform = rows[0].platform
         payloads = [r.payload for r in rows]
-        # Per-org interval read here is cosmetic — used only for the
-        # `interval_minutes` field in the rendered message body. The
-        # cadence-controlling read happened at enqueue time and is
-        # already baked into each row's flush_after (mfbt §EC-2).
-        interval_seconds = get_org_club_interval_seconds(rows[0].organization)
-        body = render_clubbed_message(payloads, platform, interval_seconds)
+        body = render_clubbed_message(payloads, platform)
         headers = build_webhook_headers(first_notification)
 
         buffer_ids = [str(r.id) for r in rows]
diff --git a/backend/notification_v2/provider/webhook/api_webhook.py b/backend/notification_v2/provider/webhook/api_webhook.py
index f1b2d347c0..9864d84a4a 100644
--- a/backend/notification_v2/provider/webhook/api_webhook.py
+++ b/backend/notification_v2/provider/webhook/api_webhook.py
@@ -24,7 +24,7 @@ def get_headers(self) -> dict[str, str]:
     def format_payload(self) -> dict[str, Any]:
         """Wrap a single IMMEDIATE event in the canonical envelope.
 
-        `interval_seconds=None` -> `summary.interval_minutes` is null;
-        receivers can use that to distinguish IMMEDIATE from BATCHED.
+        Receivers parse the same `{summary, events}` shape regardless of
+        whether the dispatch was IMMEDIATE or BATCHED.
         """
-        return build_envelope(payloads=[self.payload], interval_seconds=None)
+        return build_envelope(payloads=[self.payload])
diff --git a/backend/notification_v2/provider/webhook/slack_webhook.py b/backend/notification_v2/provider/webhook/slack_webhook.py
index 4eb8c599d2..0fda635d74 100644
--- a/backend/notification_v2/provider/webhook/slack_webhook.py
+++ b/backend/notification_v2/provider/webhook/slack_webhook.py
@@ -25,11 +25,9 @@ def format_payload(self) -> dict[str, Any]:
         """Render the IMMEDIATE event through the canonical envelope.
 
         Single shared renderer for IMMEDIATE and BATCHED so receivers see the
-        same Slack body shape regardless of delivery mode. `interval_seconds`
-        is None for IMMEDIATE — `summary.interval_minutes` resolves to null.
+        same Slack body shape regardless of delivery mode.
         """
         return render_clubbed_message(
             payloads=[self.payload],
             platform=PlatformType.SLACK.value,
-            interval_seconds=None,
         )
diff --git a/workers/notification/providers/_clubbed_format.py b/workers/notification/providers/_clubbed_format.py
index dfcfa4add8..d489d76ec7 100644
--- a/workers/notification/providers/_clubbed_format.py
+++ b/workers/notification/providers/_clubbed_format.py
@@ -55,7 +55,7 @@ def _format_file_count(event: dict[str, Any]) -> str:
 
 def _format_event_line(event: dict[str, Any]) -> str:
     parts = [
-        _humanize_timestamp(event.get("timestamp")),
+        event.get("timestamp") or _MISSING,
         f"*{event.get('execution_id') or _MISSING}*",
         event.get("type") or _MISSING,
         event.get("pipeline_name") or _MISSING,
@@ -71,14 +71,15 @@ def _event_from_payload(payload: dict[str, Any]) -> dict[str, Any]:
     """Project a flat per-event payload into the canonical shape.
 
     Drops `pipeline_id` and `_source` — neither appears in receiver-visible
-    output. Mirrors the backend projection so renderer input is identical.
+    output. Mirrors the backend projection (including the humanized timestamp)
+    so renderer input is identical.
     """
     event: dict[str, Any] = {
         "type": payload.get("type") or "",
         "pipeline_name": payload.get("pipeline_name") or "",
         "status": payload.get("status") or "",
         "execution_id": payload.get("execution_id") or "",
-        "timestamp": payload.get("timestamp") or "",
+        "timestamp": _humanize_timestamp(payload.get("timestamp")),
         "additional_data": payload.get("additional_data") or {},
     }
     error_message = payload.get("error_message")
@@ -87,28 +88,20 @@ def _event_from_payload(payload: dict[str, Any]) -> dict[str, Any]:
     return event
 
 
-def build_envelope(
-    payloads: list[dict[str, Any]],
-    interval_seconds: int | None,
-) -> dict[str, Any]:
+def build_envelope(payloads: list[dict[str, Any]]) -> dict[str, Any]:
     """Build the canonical `{summary, events}` envelope.
 
-    `interval_seconds=None` for IMMEDIATE -> `summary.interval_minutes` null.
+    Summary carries only `{total, succeeded, failed}` — identical shape for
+    IMMEDIATE and BATCHED.
     """
     capped = payloads[:MAX_BATCH_SIZE]
     succeeded = sum(1 for p in capped if _is_success(p.get("status")))
     failed = len(capped) - succeeded
-    interval_minutes: int | None
-    if interval_seconds is None:
-        interval_minutes = None
-    else:
-        interval_minutes = max(1, interval_seconds // 60)
     return {
         "summary": {
             "total": len(capped),
             "succeeded": succeeded,
             "failed": failed,
-            "interval_minutes": interval_minutes,
         },
         "events": [_event_from_payload(p) for p in capped],
     }
diff --git a/workers/notification/providers/api_webhook.py b/workers/notification/providers/api_webhook.py
index 19ff1d12c3..1e652e9464 100644
--- a/workers/notification/providers/api_webhook.py
+++ b/workers/notification/providers/api_webhook.py
@@ -39,9 +39,7 @@ def prepare_data(self, notification_data: dict[str, Any]) -> dict[str, Any]:
         if "payload" in prepared_data:
             payload = prepared_data["payload"]
             if isinstance(payload, dict) and "events" not in payload:
-                prepared_data["payload"] = build_envelope(
-                    payloads=[payload], interval_seconds=None
-                )
+                prepared_data["payload"] = build_envelope(payloads=[payload])
 
         logger.debug(f"Prepared API webhook data for {notification_data.get('url')}")
         return prepared_data
diff --git a/workers/notification/providers/slack_webhook.py b/workers/notification/providers/slack_webhook.py
index 4532af5672..01f272b024 100644
--- a/workers/notification/providers/slack_webhook.py
+++ b/workers/notification/providers/slack_webhook.py
@@ -59,7 +59,7 @@ def format_payload(self, payload: dict[str, Any]) -> dict[str, Any]:
         if "text" in payload and len(payload) == 1:
             return {"text": payload["text"]}
 
-        envelope = build_envelope(payloads=[payload], interval_seconds=None)
+        envelope = build_envelope(payloads=[payload])
         return {"text": render_slack_text(envelope)}
 
     def get_destination(self, notification_data: dict[str, Any]) -> str:

From f8052dbdcac3e34fff7618815c1e0ba1b305fb1b Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 11:33:21 +0530
Subject: [PATCH 11/27] delivery mode batch by default

---
 .../migrations/0003_add_notification_buffer.py     |  8 ++++----
 backend/notification_v2/models.py                  |  8 ++++----
 backend/notification_v2/serializers.py             |  2 +-
 .../notification-modal/CreateNotification.jsx      | 14 ++------------
 4 files changed, 11 insertions(+), 21 deletions(-)

diff --git a/backend/notification_v2/migrations/0003_add_notification_buffer.py b/backend/notification_v2/migrations/0003_add_notification_buffer.py
index 7f5224849f..fd66f014ba 100644
--- a/backend/notification_v2/migrations/0003_add_notification_buffer.py
+++ b/backend/notification_v2/migrations/0003_add_notification_buffer.py
@@ -16,13 +16,13 @@ class Migration(migrations.Migration):
             name="delivery_mode",
             field=models.CharField(
                 choices=[("IMMEDIATE", "Immediate"), ("BATCHED", "Batched")],
-                default="IMMEDIATE",
+                default="BATCHED",
                 max_length=16,
                 db_comment=(
-                    "IMMEDIATE fires on every completion (default, unchanged "
-                    "behavior). BATCHED buffers events and dispatches a single "
+                    "BATCHED (default) buffers events and dispatches a single "
                     "clubbed message per (org, webhook_url, auth_sig) every "
-                    "NOTIFICATION_CLUB_INTERVAL."
+                    "NOTIFICATION_CLUB_INTERVAL. IMMEDIATE fires on every "
+                    "completion."
                 ),
             ),
         ),
diff --git a/backend/notification_v2/models.py b/backend/notification_v2/models.py
index a8b077f339..9c7d136534 100644
--- a/backend/notification_v2/models.py
+++ b/backend/notification_v2/models.py
@@ -66,11 +66,11 @@ class Notification(BaseModel):
     delivery_mode = models.CharField(
         max_length=16,
         choices=DeliveryMode.choices(),
-        default=DeliveryMode.IMMEDIATE.value,
+        default=DeliveryMode.BATCHED.value,
         db_comment=(
-            "IMMEDIATE fires on every completion (default, unchanged behavior). "
-            "BATCHED buffers events and dispatches a single clubbed message per "
-            "(org, webhook_url, auth_sig) every NOTIFICATION_CLUB_INTERVAL."
+            "BATCHED (default) buffers events and dispatches a single clubbed "
+            "message per (org, webhook_url, auth_sig) every "
+            "NOTIFICATION_CLUB_INTERVAL. IMMEDIATE fires on every completion."
         ),
     )
     # Foreign keys to specific models
diff --git a/backend/notification_v2/serializers.py b/backend/notification_v2/serializers.py
index b2602929fe..158108bed1 100644
--- a/backend/notification_v2/serializers.py
+++ b/backend/notification_v2/serializers.py
@@ -23,7 +23,7 @@ class NotificationSerializer(serializers.ModelSerializer):
     notify_on_failures = serializers.BooleanField(default=False, required=False)
     delivery_mode = serializers.ChoiceField(
         choices=DeliveryMode.choices(),
-        default=DeliveryMode.IMMEDIATE.value,
+        default=DeliveryMode.BATCHED.value,
         required=False,
     )
 
diff --git a/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx b/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
index 17066ed06b..2d2e548768 100644
--- a/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
+++ b/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
@@ -19,7 +19,7 @@ const DEFAULT_FORM_DETAILS = {
   is_active: false,
   max_retries: 0,
   notify_on_failures: false,
-  delivery_mode: "IMMEDIATE",
+  delivery_mode: "BATCHED",
   pipeline: "",
   api: "",
   url: "",
@@ -122,17 +122,7 @@ function CreateNotification({
   }, [formDetails]);
 
   const handleInputChange = (changedValues, allValues) => {
-    let nextValues = { ...formDetails, ...allValues };
-    // Failure alerts must not be delayed by the batch window — auto-select
-    // IMMEDIATE the moment the box is checked. The user can still override
-    // to BATCHED afterward and that choice will stick.
-    if (
-      Object.hasOwn(changedValues, "notify_on_failures") &&
-      changedValues.notify_on_failures === true
-    ) {
-      nextValues = { ...nextValues, delivery_mode: "IMMEDIATE" };
-      form.setFieldsValue({ delivery_mode: "IMMEDIATE" });
-    }
+    const nextValues = { ...formDetails, ...allValues };
     setFormDetails(nextValues);
     const changedFieldName = Object.keys(changedValues)[0];
     form.setFields([

From 879873780ec03e5faf26e3dcff8fc74c298be66c Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 13:24:20 +0530
Subject: [PATCH 12/27] UI change

---
 backend/backend/settings/base.py              |  4 +-
 backend/configuration/enums.py                |  2 +
 backend/notification_v2/serializers.py        |  6 +-
 .../notification-modal/CreateNotification.jsx | 58 ++-----------------
 .../settings/platform/PlatformSettings.jsx    | 28 +++++----
 5 files changed, 30 insertions(+), 68 deletions(-)

diff --git a/backend/backend/settings/base.py b/backend/backend/settings/base.py
index fafbad60e3..73969ec13d 100644
--- a/backend/backend/settings/base.py
+++ b/backend/backend/settings/base.py
@@ -220,9 +220,9 @@ def get_required_setting(setting_key: str, default: str | None = None) -> str |
 INDEXING_FLAG_TTL = int(get_required_setting("INDEXING_FLAG_TTL"))
 NOTIFICATION_TIMEOUT = int(get_required_setting("NOTIFICATION_TIMEOUT", "5"))
 # Window for clubbing BATCHED notifications — also the flush cadence (seconds).
-# Default 1800 (30 min). Per-notification buffer rows precompute flush_after at
+# Default 300 (5 min). Per-notification buffer rows precompute flush_after at
 # enqueue time, so changing this only affects rows enqueued after the restart.
-NOTIFICATION_CLUB_INTERVAL = int(os.environ.get("NOTIFICATION_CLUB_INTERVAL", "1800"))
+NOTIFICATION_CLUB_INTERVAL = int(os.environ.get("NOTIFICATION_CLUB_INTERVAL", "300"))
 # Retention for terminal NotificationBuffer rows (DISPATCHED / DEAD_LETTER).
 # PENDING rows are never GC'd regardless of age.
 NOTIFICATION_BUFFER_RETENTION_DAYS = int(
diff --git a/backend/configuration/enums.py b/backend/configuration/enums.py
index a11a0b58e7..78bbeb7dfd 100644
--- a/backend/configuration/enums.py
+++ b/backend/configuration/enums.py
@@ -65,6 +65,8 @@ class ConfigKey(Enum):
         default=settings.NOTIFICATION_CLUB_INTERVAL,
         value_type=ConfigType.INT,
         help_text="Window (seconds) for clubbing BATCHED notifications.",
+        min_value=60,
+        max_value=7200,
     )
 
     def cast_value(self, raw_value: Any):
diff --git a/backend/notification_v2/serializers.py b/backend/notification_v2/serializers.py
index 158108bed1..956a25b86e 100644
--- a/backend/notification_v2/serializers.py
+++ b/backend/notification_v2/serializers.py
@@ -8,9 +8,9 @@
 class NotificationSettingsSerializer(serializers.Serializer):
     """Org-scoped notification batching settings (UNS-611 v2)."""
 
-    # No min/max here: mfbt is silent on bounds. Backend ConfigSpec accepts
-    # any int; constraining is a follow-up if/when product gives a number.
-    club_interval_seconds = serializers.IntegerField()
+    # Bounds (1 min – 2 h) mirror ConfigKey.NOTIFICATION_CLUB_INTERVAL so DRF
+    # returns a structured 400 before ConfigKey.cast_value re-raises.
+    club_interval_seconds = serializers.IntegerField(min_value=60, max_value=7200)
 
 
 class NotificationSerializer(serializers.ModelSerializer):
diff --git a/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx b/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
index 2d2e548768..d9577f9c39 100644
--- a/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
+++ b/frontend/src/components/pipelines-or-deployments/notification-modal/CreateNotification.jsx
@@ -2,12 +2,6 @@ import { Button, Checkbox, Form, Input, Select, Space } from "antd";
 import PropTypes from "prop-types";
 import { useEffect, useState } from "react";
 import { getBackendErrorDetail } from "../../../helpers/GetStaticData";
-import { useAxiosPrivate } from "../../../hooks/useAxiosPrivate";
-import { useSessionStore } from "../../../store/session-store";
-
-// Used only when the org's batch interval can't be fetched (network or auth
-// failure). Backend's env-derived default is also 30 min, so this matches.
-const FALLBACK_BATCH_INTERVAL_MINUTES = 30;
 
 const DEFAULT_FORM_DETAILS = {
   name: "",
@@ -19,7 +13,6 @@ const DEFAULT_FORM_DETAILS = {
   is_active: false,
   max_retries: 0,
   notify_on_failures: false,
-  delivery_mode: "BATCHED",
   pipeline: "",
   api: "",
   url: "",
@@ -75,37 +68,6 @@ function CreateNotification({
   const [formDetails, setFormDetails] = useState(DEFAULT_FORM_DETAILS);
   const [backendErrors, setBackendErrors] = useState(null);
   const [resetForm, setResetForm] = useState(false);
-  const [batchIntervalMinutes, setBatchIntervalMinutes] = useState(
-    FALLBACK_BATCH_INTERVAL_MINUTES,
-  );
-  const axiosPrivate = useAxiosPrivate();
-  const { sessionDetails } = useSessionStore();
-
-  useEffect(() => {
-    // Read live org-scoped interval (UNS-611 v2). Fall back silently to the
-    // hardcoded 30-min default — the dropdown still labels something useful.
-    if (!sessionDetails?.orgId) {
-      return;
-    }
-    axiosPrivate({
-      method: "GET",
-      url: `/api/v1/unstract/${sessionDetails.orgId}/notifications/settings/`,
-    })
-      .then((res) => {
-        const seconds = res?.data?.club_interval_seconds;
-        if (typeof seconds === "number" && seconds > 0) {
-          setBatchIntervalMinutes(Math.max(1, Math.round(seconds / 60)));
-        }
-      })
-      .catch(() => {
-        // Non-fatal — keep fallback.
-      });
-  }, [sessionDetails?.orgId]);
-
-  const deliveryModes = [
-    { value: "IMMEDIATE", label: "Immediate" },
-    { value: "BATCHED", label: "Batched" },
-  ];
 
   useEffect(() => {
     if (editDetails) {
@@ -263,21 +225,13 @@ function CreateNotification({
       <Form.Item
         name="notify_on_failures"
         valuePropName="checked"
-        tooltip="When enabled, only runs with at least one failed file or a run-level error/stop trigger this notification. Otherwise notifications fire on every completion."
-      >
-        <Checkbox>Notify on failures only</Checkbox>
-      </Form.Item>
-      <Form.Item
-        label="Delivery Mode"
-        name="delivery_mode"
-        tooltip="Immediate fires on every completion. Batched buffers events and dispatches a single clubbed message per webhook every batch interval."
-        extra={
-          formDetails.delivery_mode === "BATCHED"
-            ? `Notifications will be batched and sent every ${batchIntervalMinutes} minutes. Org admins can change this in Platform Settings.`
-            : null
-        }
+        extra="Notification interval can be configured in Platform settings."
       >
-        <Select options={deliveryModes} />
+        <Checkbox>
+          <span style={{ fontSize: 14, color: "rgba(0, 0, 0, 0.88)" }}>
+            Notify on failures only
+          </span>
+        </Checkbox>
       </Form.Item>
       <Form.Item className="display-flex-right">
         <Space>
diff --git a/frontend/src/components/settings/platform/PlatformSettings.jsx b/frontend/src/components/settings/platform/PlatformSettings.jsx
index 0b39cebecf..0bbcb641b6 100644
--- a/frontend/src/components/settings/platform/PlatformSettings.jsx
+++ b/frontend/src/components/settings/platform/PlatformSettings.jsx
@@ -77,10 +77,14 @@ function PlatformSettings() {
   }, []);
 
   const handleSaveInterval = () => {
-    if (!batchIntervalMinutes || batchIntervalMinutes < 1) {
+    if (
+      !batchIntervalMinutes ||
+      batchIntervalMinutes < 1 ||
+      batchIntervalMinutes > 120
+    ) {
       setAlertDetails({
         type: "error",
-        content: "Batch interval must be a positive number of minutes.",
+        content: "Notification interval must be between 1 and 120 minutes.",
       });
       return;
     }
@@ -318,6 +322,7 @@ function PlatformSettings() {
           <IslandLayout>
             <div className="plt-set-layout-2">
               <div>
+                <Typography.Title level={5}>Internal API Keys</Typography.Title>
                 {keys.map((keyDetails, keyIndex) => {
                   return (
                     <div key={keyDetails?.keyName}>
@@ -398,21 +403,17 @@ function PlatformSettings() {
               </div>
               <Divider />
               <div className="plt-set-batch-interval">
-                <Typography.Title level={5}>
-                  Notification batching
-                </Typography.Title>
-                <Typography.Text type="secondary">
-                  Batched notifications enqueued after a change pick up the new
-                  value; in-flight rows keep their original cadence.
-                </Typography.Text>
+                <Typography.Title level={5}>Notifications</Typography.Title>
                 <div style={{ marginTop: 12 }}>
                   <Space>
-                    <Typography.Text>Batch interval (minutes)</Typography.Text>
+                    <Typography.Text>
+                      Notification interval (minutes, 1–120)
+                    </Typography.Text>
                     <InputNumber
                       min={1}
+                      max={120}
                       value={batchIntervalMinutes}
                       onChange={(v) => setBatchIntervalMinutes(v)}
-                      placeholder="e.g. 30"
                     />
                     <Button
                       type="primary"
@@ -422,6 +423,11 @@ function PlatformSettings() {
                       Save
                     </Button>
                   </Space>
+                  <div style={{ marginTop: 4 }}>
+                    <Typography.Text type="secondary">
+                      Allowed: 1–120 minutes. Default: 5 minutes.
+                    </Typography.Text>
+                  </div>
                 </div>
               </div>
             </div>

From 50917e8289def43671447a3104e79d2ddf8270a9 Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 14:44:20 +0530
Subject: [PATCH 13/27] PR reviews

---
 backend/api_v2/notification.py                |   7 +-
 backend/notification_v2/clubbed_renderer.py   |   2 +-
 backend/notification_v2/enums.py              |   7 +
 backend/notification_v2/helper.py             |  12 +-
 backend/notification_v2/internal_api_views.py | 132 +++++++++++-------
 .../0003_add_notification_buffer.py           |   8 +-
 backend/notification_v2/models.py             |  10 +-
 backend/notification_v2/tasks.py              |   2 +-
 backend/pipeline_v2/notification.py           |   7 +-
 .../workflow_manager/internal_serializers.py  |  34 +++++
 .../settings/platform/PlatformSettings.jsx    |   7 +-
 .../shared/patterns/notification/helper.py    |  60 ++++----
 12 files changed, 191 insertions(+), 97 deletions(-)

diff --git a/backend/api_v2/notification.py b/backend/api_v2/notification.py
index 4cefe92d24..d5d2dca9df 100644
--- a/backend/api_v2/notification.py
+++ b/backend/api_v2/notification.py
@@ -1,9 +1,9 @@
 import logging
 
+from notification_v2.enums import FAILURE_STATUSES
 from notification_v2.helper import dispatch_with_delivery_mode
 from notification_v2.models import Notification
 from pipeline_v2.dto import PipelineStatusPayload
-from workflow_manager.workflow_v2.enums import ExecutionStatus
 from workflow_manager.workflow_v2.models.execution import WorkflowExecution
 
 from api_v2.models import APIDeployment
@@ -11,9 +11,6 @@
 logger = logging.getLogger(__name__)
 
 
-_FAILURE_STATUSES = {ExecutionStatus.ERROR.value, ExecutionStatus.STOPPED.value}
-
-
 class APINotification:
     def __init__(self, api: APIDeployment, workflow_execution: WorkflowExecution) -> None:
         self.notifications = Notification.objects.filter(api=api, is_active=True)
@@ -26,7 +23,7 @@ def send(self) -> None:
         # status check alone misses them — see callback aggregation rules.
         failed_files = self.workflow_execution.failed_files or 0
         is_failure = (
-            self.workflow_execution.status in _FAILURE_STATUSES or failed_files > 0
+            self.workflow_execution.status in FAILURE_STATUSES or failed_files > 0
         )
         if not is_failure:
             # Success path: skip rows that opted into failure-only alerts.
diff --git a/backend/notification_v2/clubbed_renderer.py b/backend/notification_v2/clubbed_renderer.py
index fc85120f7a..1974a896d3 100644
--- a/backend/notification_v2/clubbed_renderer.py
+++ b/backend/notification_v2/clubbed_renderer.py
@@ -1,6 +1,6 @@
 """Canonical envelope + renderer for every dispatch — IMMEDIATE and BATCHED.
 
-The same envelope shape feeds every channel × mode cell so receivers never
+The same envelope shape feeds every channel x mode cell so receivers never
 need to branch on "is this batched?":
 
     {
diff --git a/backend/notification_v2/enums.py b/backend/notification_v2/enums.py
index d6fed8b485..9e694e128f 100644
--- a/backend/notification_v2/enums.py
+++ b/backend/notification_v2/enums.py
@@ -1,5 +1,12 @@
 from enum import Enum
 
+from workflow_manager.workflow_v2.enums import ExecutionStatus
+
+# Single source of truth for "did this run fail for notification routing?".
+# STOPPED is intentionally a failure here per migrations/0002_…notify_on_failures
+# db_comment ("terminal status ERROR/STOPPED or any file in the run errored").
+FAILURE_STATUSES = frozenset({ExecutionStatus.ERROR.value, ExecutionStatus.STOPPED.value})
+
 
 class NotificationType(Enum):
     WEBHOOK = "WEBHOOK"
diff --git a/backend/notification_v2/helper.py b/backend/notification_v2/helper.py
index 908c0dd993..4a6c5cc907 100644
--- a/backend/notification_v2/helper.py
+++ b/backend/notification_v2/helper.py
@@ -1,4 +1,5 @@
 import hashlib
+import json
 import logging
 from collections.abc import Iterable
 from datetime import timedelta
@@ -26,17 +27,20 @@
 
 
 def compute_auth_sig(notification: Notification) -> str:
-    """SHA-256 hex of (auth_type + auth_key + auth_header) — never raw creds.
+    """SHA-256 hex of (auth_type, auth_key, auth_header) — never raw creds.
 
     Identical auth configs produce the same sig (so grouping clubs them);
-    differing configs split into separate groups.
+    differing configs split into separate groups. The tuple is JSON-encoded
+    before hashing so a literal delimiter byte inside auth_key/header cannot
+    cause two distinct tuples to collapse to the same digest.
     """
-    raw = "|".join(
+    raw = json.dumps(
         [
             notification.authorization_type or _AUTH_SIG_NONE,
             notification.authorization_key or _AUTH_SIG_NONE,
             notification.authorization_header or _AUTH_SIG_NONE,
-        ]
+        ],
+        separators=(",", ":"),
     )
     return hashlib.sha256(raw.encode("utf-8")).hexdigest()
 
diff --git a/backend/notification_v2/internal_api_views.py b/backend/notification_v2/internal_api_views.py
index bf07e2c9c4..9a9c0e4a71 100644
--- a/backend/notification_v2/internal_api_views.py
+++ b/backend/notification_v2/internal_api_views.py
@@ -25,12 +25,11 @@
 from django.views.decorators.http import require_http_methods
 from pipeline_v2.models import Pipeline
 from utils.organization_utils import filter_queryset_by_organization
-from workflow_manager.workflow_v2.enums import ExecutionStatus
 from workflow_manager.workflow_v2.models.execution import WorkflowExecution
 
 from backend.celery_service import app as celery_app
 from notification_v2.clubbed_renderer import render_clubbed_message
-from notification_v2.enums import BufferStatus, DeliveryMode
+from notification_v2.enums import FAILURE_STATUSES, BufferStatus, DeliveryMode
 from notification_v2.helper import (
     build_webhook_headers,
     enqueue,
@@ -43,8 +42,6 @@
 # Constants for error messages
 INTERNAL_SERVER_ERROR_MSG = "Internal server error"
 
-_FAILURE_STATUSES = {ExecutionStatus.ERROR.value, ExecutionStatus.STOPPED.value}
-
 
 def _load_execution(execution_id: str | None) -> WorkflowExecution | None:
     """Best-effort lookup; returns None on missing id or unknown row."""
@@ -73,7 +70,7 @@ def _apply_failure_filter(
     if execution is None:
         return notifications_qs
     failed_files = execution.failed_files or 0
-    is_failure = execution.status in _FAILURE_STATUSES or failed_files > 0
+    is_failure = execution.status in FAILURE_STATUSES or failed_files > 0
     if not is_failure:
         notifications_qs = notifications_qs.filter(notify_on_failures=False)
     return notifications_qs
@@ -387,12 +384,71 @@ def _gc_terminal_rows() -> int:
     return int(deleted_count)
 
 
+def _send_clubbed(
+    *,
+    url: str,
+    body: Any,
+    headers: dict[str, str],
+    platform: str,
+    max_retries: int,
+    buffer_ids: list[str],
+    org_id: Any,
+) -> None:
+    """Send the clubbed Celery task after the DB transition has committed.
+
+    Runs as a ``transaction.on_commit`` callback so a rolled-back UPDATE can
+    never leave a broker-queued message orphaned (the prior order — send
+    then update — risked duplicate delivery if the UPDATE failed). On broker
+    failure we revert rows back to PENDING in a separate transaction so the
+    next flush tick retries cleanly.
+    """
+    try:
+        celery_app.send_task(
+            "send_webhook_notification",
+            args=[url, body, headers, settings.NOTIFICATION_TIMEOUT],
+            kwargs={
+                "max_retries": max_retries,
+                "retry_delay": 10,
+                "platform": platform,
+            },
+            queue="notifications",
+            link_error=celery_app.signature(
+                "notification_v2.mark_buffer_dead_letter",
+                kwargs={"buffer_row_ids": buffer_ids},
+            ),
+        )
+        logger.info(
+            "metric=notification_batch_dispatched_total platform=%s result=success "
+            "org_id=%s webhook_url_hash=%s rows=%d",
+            platform,
+            org_id,
+            webhook_url_hash(url),
+            len(buffer_ids),
+        )
+    except Exception:
+        logger.exception(
+            "metric=notification_batch_dispatched_total platform=%s "
+            "result=broker_failure org_id=%s webhook_url_hash=%s rows=%d",
+            platform,
+            org_id,
+            webhook_url_hash(url),
+            len(buffer_ids),
+        )
+        # Revert outside the committed transaction so a transient broker
+        # outage degrades to "retried next tick" rather than "stuck DISPATCHED".
+        NotificationBuffer.objects.filter(id__in=buffer_ids).update(
+            status=BufferStatus.PENDING.value,
+            dispatched_at=None,
+        )
+
+
 def _dispatch_group(
     org_id: Any,
     webhook_url: str,
     auth_sig: str,
+    platform: str,
 ) -> tuple[int, int]:
-    """Dispatch a single (org, url, auth_sig) group; returns (rows, succeeded).
+    """Dispatch a single (org, url, auth_sig, platform) group; returns (rows, succeeded).
 
     Caller already filtered groups to MIN(flush_after) <= now. Locks rows
     with SKIP LOCKED so a sibling replica skips them rather than blocking.
@@ -407,6 +463,7 @@ def _dispatch_group(
                 organization_id=org_id,
                 webhook_url=webhook_url,
                 auth_sig=auth_sig,
+                platform=platform,
             )
             .order_by("created_at")[:_PROCESS_BUFFER_CAP]
         )
@@ -417,57 +474,33 @@ def _dispatch_group(
             return 0, 0
 
         # Live auth — read from the FIRST row's notification. If multiple
-        # notifications collide on (url, auth_sig) we have, by definition,
-        # identical auth, so this is safe.
+        # notifications collide on (url, auth_sig, platform) we have, by
+        # definition, identical auth + format, so this is safe.
         first_notification = rows[0].notification
-        platform = rows[0].platform
         payloads = [r.payload for r in rows]
         body = render_clubbed_message(payloads, platform)
         headers = build_webhook_headers(first_notification)
-
         buffer_ids = [str(r.id) for r in rows]
-        try:
-            celery_app.send_task(
-                "send_webhook_notification",
-                args=[
-                    first_notification.url,
-                    body,
-                    headers,
-                    settings.NOTIFICATION_TIMEOUT,
-                ],
-                kwargs={
-                    "max_retries": first_notification.max_retries,
-                    "retry_delay": 10,
-                    "platform": platform,
-                },
-                queue="notifications",
-                link_error=celery_app.signature(
-                    "notification_v2.mark_buffer_dead_letter",
-                    kwargs={"buffer_row_ids": buffer_ids},
-                ),
-            )
-        except Exception:
-            # Broker hiccup — leave rows PENDING for the next tick rather
-            # than mark them DEAD_LETTER. `exception` keeps stack context.
-            logger.exception(
-                "Broker dispatch failed for group org=%s url_hash=%s",
-                org_id,
-                webhook_url_hash(webhook_url),
-            )
-            return 0, 0
 
+        # Mark DISPATCHED first; if commit succeeds the on_commit hook
+        # publishes the broker task. If commit fails, rows stay PENDING and
+        # no task is published — eliminates the broker-vs-DB duplicate-send
+        # race that bit us when the order was reversed.
         now = timezone.now()
         NotificationBuffer.objects.filter(id__in=buffer_ids).update(
             status=BufferStatus.DISPATCHED.value,
             dispatched_at=now,
         )
-        logger.info(
-            "metric=notification_batch_dispatched_total platform=%s result=success "
-            "org_id=%s webhook_url_hash=%s rows=%d",
-            platform,
-            org_id,
-            webhook_url_hash(webhook_url),
-            len(rows),
+        transaction.on_commit(
+            lambda: _send_clubbed(
+                url=first_notification.url,
+                body=body,
+                headers=headers,
+                platform=platform,
+                max_retries=first_notification.max_retries,
+                buffer_ids=buffer_ids,
+                org_id=org_id,
+            )
         )
         return len(rows), len(rows)
 
@@ -484,9 +517,9 @@ def process_notification_buffer(request: HttpRequest) -> JsonResponse:
     """Flush PENDING groups that have hit their flush_after; then GC.
 
     Algorithm:
-    1. GROUP BY (org, url, auth_sig), HAVING MIN(flush_after) <= NOW()
+    1. GROUP BY (org, url, auth_sig, platform), HAVING MIN(flush_after) <= NOW()
     2. For each group, in its own transaction: lock-skip-locked rows,
-       render, dispatch a single Celery task, mark rows DISPATCHED.
+       render, mark rows DISPATCHED, on_commit-dispatch a single Celery task.
     3. Sweep terminal rows older than NOTIFICATION_BUFFER_RETENTION_DAYS.
 
     Concurrency: SELECT FOR UPDATE SKIP LOCKED makes parallel calls safe —
@@ -495,7 +528,7 @@ def process_notification_buffer(request: HttpRequest) -> JsonResponse:
     now = timezone.now()
     groups = list(
         NotificationBuffer.objects.filter(status=BufferStatus.PENDING.value)
-        .values("organization_id", "webhook_url", "auth_sig")
+        .values("organization_id", "webhook_url", "auth_sig", "platform")
         .annotate(earliest_flush=Min("flush_after"))
         .filter(earliest_flush__lte=now)
     )
@@ -508,6 +541,7 @@ def process_notification_buffer(request: HttpRequest) -> JsonResponse:
                 org_id=group["organization_id"],
                 webhook_url=group["webhook_url"],
                 auth_sig=group["auth_sig"],
+                platform=group["platform"],
             )
         except Exception:
             logger.exception(
diff --git a/backend/notification_v2/migrations/0003_add_notification_buffer.py b/backend/notification_v2/migrations/0003_add_notification_buffer.py
index fd66f014ba..5090eff18a 100644
--- a/backend/notification_v2/migrations/0003_add_notification_buffer.py
+++ b/backend/notification_v2/migrations/0003_add_notification_buffer.py
@@ -141,7 +141,13 @@ class Migration(migrations.Migration):
             model_name="notificationbuffer",
             index=models.Index(
                 condition=models.Q(("status", "PENDING")),
-                fields=["organization", "webhook_url", "auth_sig", "flush_after"],
+                fields=[
+                    "organization",
+                    "webhook_url",
+                    "auth_sig",
+                    "platform",
+                    "flush_after",
+                ],
                 name="idx_notif_buffer_pending",
             ),
         ),
diff --git a/backend/notification_v2/models.py b/backend/notification_v2/models.py
index 9c7d136534..ea8b68f4ad 100644
--- a/backend/notification_v2/models.py
+++ b/backend/notification_v2/models.py
@@ -195,8 +195,16 @@ class Meta:
         indexes = [
             # Partial covering index — supports Index Only Scans on the flush
             # GROUP BY query and bounds index size to live PENDING backlog.
+            # `platform` is part of the grouping key so SLACK and API rows on
+            # the same (org, url, auth) split into separate dispatches.
             models.Index(
-                fields=["organization", "webhook_url", "auth_sig", "flush_after"],
+                fields=[
+                    "organization",
+                    "webhook_url",
+                    "auth_sig",
+                    "platform",
+                    "flush_after",
+                ],
                 name="idx_notif_buffer_pending",
                 condition=models.Q(status=BufferStatus.PENDING.value),
             ),
diff --git a/backend/notification_v2/tasks.py b/backend/notification_v2/tasks.py
index a143f9295e..f14a07ec55 100644
--- a/backend/notification_v2/tasks.py
+++ b/backend/notification_v2/tasks.py
@@ -44,7 +44,7 @@ def mark_buffer_dead_letter(
         status=BufferStatus.DEAD_LETTER.value
     )
     logger.warning(
-        "metric=notification_batch_dispatched_total result=dead_letter rows=%d " "exc=%r",
+        "metric=notification_batch_dispatched_total result=dead_letter rows=%d exc=%r",
         updated,
         exc,
     )
diff --git a/backend/pipeline_v2/notification.py b/backend/pipeline_v2/notification.py
index 5a40a37506..9537cad47b 100644
--- a/backend/pipeline_v2/notification.py
+++ b/backend/pipeline_v2/notification.py
@@ -1,8 +1,8 @@
 import logging
 
+from notification_v2.enums import FAILURE_STATUSES
 from notification_v2.helper import dispatch_with_delivery_mode
 from notification_v2.models import Notification
-from workflow_manager.workflow_v2.enums import ExecutionStatus
 from workflow_manager.workflow_v2.models.execution import WorkflowExecution
 
 from pipeline_v2.dto import PipelineStatusPayload
@@ -11,9 +11,6 @@
 logger = logging.getLogger(__name__)
 
 
-_FAILURE_STATUSES = {ExecutionStatus.ERROR.value, ExecutionStatus.STOPPED.value}
-
-
 class PipelineNotification:
     def __init__(
         self,
@@ -54,7 +51,7 @@ def send(self) -> None:
         failed_files = (execution.failed_files or 0) if execution else 0
         execution_status = execution.status if execution else None
         is_failure = (
-            execution_status in _FAILURE_STATUSES
+            execution_status in FAILURE_STATUSES
             or failed_files > 0
             or self.pipeline.last_run_status == Pipeline.PipelineStatus.FAILURE
         )
diff --git a/backend/workflow_manager/internal_serializers.py b/backend/workflow_manager/internal_serializers.py
index cd221470cb..951bf1e54d 100644
--- a/backend/workflow_manager/internal_serializers.py
+++ b/backend/workflow_manager/internal_serializers.py
@@ -183,6 +183,40 @@ class WorkflowExecutionStatusUpdateSerializer(serializers.Serializer):
     attempts = serializers.IntegerField(required=False, min_value=0)
     execution_time = serializers.FloatField(required=False, min_value=0)
 
+    def validate(self, attrs):
+        """Reject impossible file-count aggregates.
+
+        Per-field min_value=0 catches negatives, but a component larger than
+        total (or successful + failed > total) would slip through and skew
+        the outcome-based notification filter downstream.
+        """
+        total = attrs.get("total_files")
+        successful = attrs.get("successful_files")
+        failed = attrs.get("failed_files")
+
+        if total is None:
+            if successful is not None or failed is not None:
+                raise serializers.ValidationError(
+                    {
+                        "total_files": "total_files is required when file aggregates are provided."
+                    }
+                )
+            return attrs
+
+        if successful is not None and successful > total:
+            raise serializers.ValidationError(
+                {"successful_files": "successful_files cannot exceed total_files."}
+            )
+        if failed is not None and failed > total:
+            raise serializers.ValidationError(
+                {"failed_files": "failed_files cannot exceed total_files."}
+            )
+        if successful is not None and failed is not None and successful + failed > total:
+            raise serializers.ValidationError(
+                "successful_files + failed_files cannot exceed total_files."
+            )
+        return attrs
+
 
 class OrganizationContextSerializer(serializers.Serializer):
     """Serializer for organization context information."""
diff --git a/frontend/src/components/settings/platform/PlatformSettings.jsx b/frontend/src/components/settings/platform/PlatformSettings.jsx
index 0bbcb641b6..2b08c8e0ba 100644
--- a/frontend/src/components/settings/platform/PlatformSettings.jsx
+++ b/frontend/src/components/settings/platform/PlatformSettings.jsx
@@ -59,6 +59,11 @@ function PlatformSettings() {
   const { setPostHogCustomEvent } = usePostHogEvents();
 
   useEffect(() => {
+    // Wait for session hydration — without this guard the first render
+    // fires GET against /api/v1/unstract/undefined/... and silently 404s.
+    if (!sessionDetails?.orgId) {
+      return;
+    }
     // Load org-scoped batch interval (UNS-611 v2). Falls back silently to
     // null on failure so the rest of the page still renders.
     axiosPrivate({
@@ -74,7 +79,7 @@ function PlatformSettings() {
       .catch(() => {
         // Non-fatal — admin just won't see a pre-filled value.
       });
-  }, []);
+  }, [sessionDetails?.orgId]);
 
   const handleSaveInterval = () => {
     if (
diff --git a/workers/shared/patterns/notification/helper.py b/workers/shared/patterns/notification/helper.py
index 0148bc2f5f..460c308146 100644
--- a/workers/shared/patterns/notification/helper.py
+++ b/workers/shared/patterns/notification/helper.py
@@ -29,27 +29,23 @@ def _enqueue_to_buffer(
     api_client: Any,
     notification: dict[str, Any],
     payload: NotificationPayload,
-) -> bool:
+) -> None:
     """POST a single execution event to the backend's buffer endpoint.
 
     Worker writes nothing to the DB itself — the backend owns NotificationBuffer
-    rows. Returns True on success so callers can fall back to immediate dispatch
-    if the buffer endpoint is unavailable. The fallback decision is opinionated:
-    we keep behavior conservative and DON'T fall back so a misconfigured or
-    outage-mode backend can't silently turn BATCHED into IMMEDIATE.
+    rows. Logs and re-raises on any failure so the caller (_route_notification)
+    can report the drop instead of silently treating BATCHED delivery as sent.
     """
+    # Forward the full per-event shape so the backend renderer can match
+    # IMMEDIATE's KV layout per event (Type / Pipeline Id / Pipeline Name /
+    # Status / Execution Id / Timestamp / Additional Data). Older backend
+    # builds that ignore the extra fields stay unaffected.
+    payload_type = payload.type.value if hasattr(payload.type, "value") else payload.type
+    payload_status = (
+        payload.status.value if hasattr(payload.status, "value") else payload.status
+    )
+    payload_timestamp = payload.timestamp.isoformat() if payload.timestamp else None
     try:
-        # Forward the full per-event shape so the backend renderer can match
-        # IMMEDIATE's KV layout per event (Type / Pipeline Id / Pipeline Name
-        # / Status / Execution Id / Timestamp / Additional Data). Older
-        # backend builds that ignore the extra fields stay unaffected.
-        payload_type = (
-            payload.type.value if hasattr(payload.type, "value") else payload.type
-        )
-        payload_status = (
-            payload.status.value if hasattr(payload.status, "value") else payload.status
-        )
-        payload_timestamp = payload.timestamp.isoformat() if payload.timestamp else None
         api_client._make_request(
             method="POST",
             endpoint=ENQUEUE_BUFFER_ENDPOINT,
@@ -67,21 +63,19 @@ def _enqueue_to_buffer(
             },
             timeout=10,
         )
-        logger.info(
-            "Enqueued BATCHED notification %s for pipeline %s execution %s",
-            notification["id"],
-            payload.pipeline_id,
-            payload.execution_id,
-        )
-        return True
-    except Exception as e:
-        logger.error(
-            "Failed to enqueue BATCHED notification %s for pipeline %s: %s",
+    except Exception:  # noqa: BLE001 — propagate any failure, don't classify
+        logger.exception(
+            "Failed to enqueue BATCHED notification %s for pipeline %s",
             notification["id"],
             payload.pipeline_id,
-            e,
         )
-        return False
+        raise
+    logger.info(
+        "Enqueued BATCHED notification %s for pipeline %s execution %s",
+        notification["id"],
+        payload.pipeline_id,
+        payload.execution_id,
+    )
 
 
 def _route_notification(
@@ -102,7 +96,15 @@ def _route_notification(
         return
 
     if notification.get("delivery_mode") == DELIVERY_MODE_BATCHED:
-        _enqueue_to_buffer(api_client, notification, payload)
+        try:
+            _enqueue_to_buffer(api_client, notification, payload)
+        except Exception:  # noqa: BLE001 — already logged with stack inside
+            # Surface but don't abort the outer trigger_* loop — sibling
+            # BATCHED notifications still deserve their enqueue attempt.
+            logger.warning(
+                "BATCHED enqueue failed for notification %s; continuing with others",
+                notification.get("id"),
+            )
         return
 
     send_notification_to_worker(

From 92ad063e4991ba8d3bfeca95d185402148e118cf Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 15:59:27 +0530
Subject: [PATCH 14/27] sonar issues

---
 backend/notification_v2/clubbed_renderer.py   | 185 ++----------------
 .../workflow_manager/internal_serializers.py  |   4 +-
 .../settings/platform/PlatformSettings.jsx    |   2 +
 .../core/notification_clubbed_renderer.py     |  85 ++++++--
 workers/notification/providers/api_webhook.py |   3 +-
 .../notification/providers/slack_webhook.py   |   9 +-
 6 files changed, 94 insertions(+), 194 deletions(-)
 rename workers/notification/providers/_clubbed_format.py => unstract/core/src/unstract/core/notification_clubbed_renderer.py (53%)

diff --git a/backend/notification_v2/clubbed_renderer.py b/backend/notification_v2/clubbed_renderer.py
index 1974a896d3..a0096197bd 100644
--- a/backend/notification_v2/clubbed_renderer.py
+++ b/backend/notification_v2/clubbed_renderer.py
@@ -1,195 +1,46 @@
-"""Canonical envelope + renderer for every dispatch — IMMEDIATE and BATCHED.
-
-The same envelope shape feeds every channel x mode cell so receivers never
-need to branch on "is this batched?":
-
-    {
-        "summary": {"total": N, "succeeded": S, "failed": F},
-        "events": [
-            {
-                "type": "ETL" | "TASK" | "API",
-                "pipeline_name": "...",
-                "status": "ERROR" | "SUCCESS" | ...,
-                "execution_id": "...",
-                "timestamp": "2026 May 5 5:03:34 PM",
-                "additional_data": {
-                    "total_files": int,
-                    "successful_files": int,
-                    "failed_files": int,
-                },
-                "error_message": "...",   # only on failure
-            },
-            ...
-        ]
-    }
-
-Slack receives `{"text": "<mrkdwn>"}` pre-rendered from this envelope; API
-receivers see the envelope unchanged so programmatic consumers always parse
-the same shape. `pipeline_id` is intentionally absent from every event dict.
+"""Backend dispatch entry for clubbed-notification rendering.
+
+Delegates the canonical envelope + Slack body to
+``unstract.core.notification_clubbed_renderer`` so backend dispatches and
+worker IMMEDIATE callbacks emit byte-identical receiver-visible payloads.
+This thin shim keeps the ``render_clubbed_message`` platform dispatcher
+(uses ``PlatformType`` enum) backend-side; everything else lives in the
+shared module.
 """
 
 from __future__ import annotations
 
-import datetime
 import logging
 from typing import Any
 
 from notification_v2.enums import PlatformType
+from unstract.core.notification_clubbed_renderer import (
+    build_envelope,
+    render_slack_text,
+)
 
 logger = logging.getLogger(__name__)
 
-# Hard cap on events per dispatch; the rest roll into the next flush tick.
-MAX_BATCH_SIZE = 500
-# Slack inlines this many events before collapsing the rest under an
-# "_… and K more_" footer. Slack tolerates much larger payloads, but
-# readability tanks past ~25 lines.
-SLACK_MAX_DISPLAY_EVENTS = 25
-
-_SUCCESS_STATUSES = {"COMPLETED", "SUCCESS"}
-
-# Middle dot (U+00B7) padded by single spaces — the per-event field separator.
-_SEPARATOR = " · "
-_MISSING = "—"  # em-dash placeholder for missing fields
-_DIVIDER = "———"  # triple em-dash divider between header and events
-
-# Slack emoji shortcodes — render the same as the literal unicode glyphs and
-# stay readable in source.
-_EMOJI_SUCCESS = ":white_check_mark:"
-_EMOJI_FAILURE = ":x:"
-
-
-def _is_success(status: str | None) -> bool:
-    if not status:
-        return False
-    return status.upper() in _SUCCESS_STATUSES
-
-
-def _humanize_timestamp(iso: str | None) -> str:
-    """Render an ISO timestamp as `2026 May 11 11:38:31 AM` (POSIX `%-d`).
-
-    Falls back to the missing placeholder on falsy / unparseable input so a
-    partial row still renders without raising.
-    """
-    if not iso:
-        return _MISSING
-    try:
-        dt = datetime.datetime.fromisoformat(iso)
-    except (TypeError, ValueError):
-        return _MISSING
-    return dt.strftime("%Y %b %-d %I:%M:%S %p")
-
-
-def _format_file_count(event: dict[str, Any]) -> str:
-    """Render the file-count summary; empty string when no totals available."""
-    counts = event.get("additional_data") or {}
-    total = counts.get("total_files")
-    if total is None:
-        return ""
-    if _is_success(event.get("status")):
-        successful = counts.get("successful_files", 0)
-        return f"{_EMOJI_SUCCESS} {successful}/{total} files"
-    failed = counts.get("failed_files", 0)
-    return f"{_EMOJI_FAILURE} {failed}/{total} files"
-
+__all__ = ["build_envelope", "render_clubbed_message"]
 
-def _format_event_line(event: dict[str, Any]) -> str:
-    """Format one event as a single Slack mrkdwn line.
 
-    Fields are middle-dot separated; the file-count column is omitted when
-    `additional_data` is empty so the line collapses to 5 fields, not 6.
-    """
-    parts = [
-        event.get("timestamp") or _MISSING,
-        f"*{event.get('execution_id') or _MISSING}*",
-        event.get("type") or _MISSING,
-        event.get("pipeline_name") or _MISSING,
-        event.get("status") or _MISSING,
-    ]
-    file_count = _format_file_count(event)
-    if file_count:
-        parts.append(file_count)
-    return _SEPARATOR.join(parts)
-
-
-def _event_from_payload(payload: dict[str, Any]) -> dict[str, Any]:
-    """Project a buffered payload into the canonical per-event dict.
-
-    Unified shape across Slack/API and IMMEDIATE/BATCHED. `pipeline_id` is
-    intentionally dropped here — neither channel surfaces it. Timestamps are
-    humanized once at projection so Slack and API consumers see the same
-    string (implicit UTC, no timezone suffix).
-    """
-    event: dict[str, Any] = {
-        "type": payload.get("type") or "",
-        "pipeline_name": payload.get("pipeline_name") or "",
-        "status": payload.get("status") or "",
-        "execution_id": payload.get("execution_id") or "",
-        "timestamp": _humanize_timestamp(payload.get("timestamp")),
-        "additional_data": payload.get("additional_data") or {},
-    }
-    error_message = payload.get("error_message")
-    if error_message:
-        event["error_message"] = error_message
-    return event
-
-
-def build_envelope(payloads: list[dict[str, Any]]) -> dict[str, Any]:
-    """Build the canonical envelope used by every dispatch path.
-
-    Summary carries only `{total, succeeded, failed}` — same shape for
-    IMMEDIATE and BATCHED so receivers parse one envelope, not two.
-    """
-    capped = payloads[:MAX_BATCH_SIZE]
-    succeeded = sum(1 for p in capped if _is_success(p.get("status")))
-    failed = len(capped) - succeeded
-    return {
-        "summary": {
-            "total": len(capped),
-            "succeeded": succeeded,
-            "failed": failed,
-        },
-        "events": [_event_from_payload(p) for p in capped],
-    }
-
-
-def render_for_slack(envelope: dict[str, Any]) -> dict[str, Any]:
-    """Render the envelope as `{"text": "<mrkdwn>"}` for Slack.
-
-    Header + divider are emitted for every dispatch — IMMEDIATE, BATCHED N=1,
-    and BATCHED N>1 all share the same shape. Visible events are capped at
-    SLACK_MAX_DISPLAY_EVENTS with an `_… and K more_` overflow footer.
-    """
-    summary = envelope["summary"]
-    events: list[dict[str, Any]] = envelope["events"]
-    total = summary["total"]
-    noun = "execution" if total == 1 else "executions"
-    header = (
-        f"*{total} {noun}* "
-        f"({_EMOJI_SUCCESS} {summary['succeeded']} succeeded  "
-        f"{_EMOJI_FAILURE} {summary['failed']} failed)"
-    )
-    visible = events[:SLACK_MAX_DISPLAY_EVENTS]
-    sections: list[str] = [header, _DIVIDER]
-    sections.extend(_format_event_line(e) for e in visible)
-    overflow = len(events) - len(visible)
-    if overflow > 0:
-        sections.append(_DIVIDER)
-        sections.append(f"_… and {overflow} more executions_")
-    return {"text": "\n".join(sections)}
+def _render_for_slack(envelope: dict[str, Any]) -> dict[str, Any]:
+    """Wrap the rendered Slack mrkdwn body in the dict shape Slack expects."""
+    return {"text": render_slack_text(envelope)}
 
 
 def render_clubbed_message(
     payloads: list[dict[str, Any]],
     platform: str,
 ) -> dict[str, Any]:
-    """Top-level entry — returns the dispatch body for `platform`.
+    """Top-level entry — returns the dispatch body for ``platform``.
 
     Used by every dispatch site (BATCHED flush, IMMEDIATE backend providers)
     so the receiver-visible payload is identical regardless of mode.
     """
     envelope = build_envelope(payloads)
     if platform == PlatformType.SLACK.value:
-        return render_for_slack(envelope)
+        return _render_for_slack(envelope)
     if platform == PlatformType.API.value:
         return envelope
     # Unknown platform — fall back to the raw envelope and warn so misrouted
diff --git a/backend/workflow_manager/internal_serializers.py b/backend/workflow_manager/internal_serializers.py
index 951bf1e54d..2e43f66630 100644
--- a/backend/workflow_manager/internal_serializers.py
+++ b/backend/workflow_manager/internal_serializers.py
@@ -213,7 +213,9 @@ def validate(self, attrs):
             )
         if successful is not None and failed is not None and successful + failed > total:
             raise serializers.ValidationError(
-                "successful_files + failed_files cannot exceed total_files."
+                {
+                    "non_field_errors": "successful_files + failed_files cannot exceed total_files."
+                }
             )
         return attrs
 
diff --git a/frontend/src/components/settings/platform/PlatformSettings.jsx b/frontend/src/components/settings/platform/PlatformSettings.jsx
index 2b08c8e0ba..f2eee087b0 100644
--- a/frontend/src/components/settings/platform/PlatformSettings.jsx
+++ b/frontend/src/components/settings/platform/PlatformSettings.jsx
@@ -417,6 +417,8 @@ function PlatformSettings() {
                     <InputNumber
                       min={1}
                       max={120}
+                      step={1}
+                      precision={0}
                       value={batchIntervalMinutes}
                       onChange={(v) => setBatchIntervalMinutes(v)}
                     />
diff --git a/workers/notification/providers/_clubbed_format.py b/unstract/core/src/unstract/core/notification_clubbed_renderer.py
similarity index 53%
rename from workers/notification/providers/_clubbed_format.py
rename to unstract/core/src/unstract/core/notification_clubbed_renderer.py
index d489d76ec7..9571bdfeb7 100644
--- a/workers/notification/providers/_clubbed_format.py
+++ b/unstract/core/src/unstract/core/notification_clubbed_renderer.py
@@ -1,12 +1,33 @@
-"""Worker-side mirror of backend/notification_v2/clubbed_renderer.
-
-Producing the same envelope shape and Slack mrkdwn body the backend renders
-so worker-callback IMMEDIATE payloads (flat per-event dicts) match the
-canonical wire format used by backend BATCHED dispatches. Backend pre-renders
-for its own dispatches — this module covers only the worker-callback IMMEDIATE
-path. Keep the constants and string output byte-identical to
-`backend/notification_v2/clubbed_renderer.py`; promote to `unstract/core/` if
-a third site ever needs the same logic.
+"""Shared clubbed-notification envelope + Slack renderer.
+
+Imported by both `backend/notification_v2/clubbed_renderer.py` and the
+worker `notification/providers/*_webhook.py` so the receiver-visible
+payload (envelope JSON for API, mrkdwn string for Slack) is byte-identical
+regardless of which side rendered it.
+
+Envelope shape:
+
+    {
+        "summary": {"total": N, "succeeded": S, "failed": F},
+        "events": [
+            {
+                "type": "ETL" | "TASK" | "API",
+                "pipeline_name": "...",
+                "status": "ERROR" | "SUCCESS" | ...,
+                "execution_id": "...",
+                "timestamp": "2026 May 5 05:03:34 PM",
+                "additional_data": {
+                    "total_files": int,
+                    "successful_files": int,
+                    "failed_files": int,
+                },
+                "error_message": "...",   # only on failure
+            },
+            ...
+        ]
+    }
+
+`pipeline_id` is intentionally absent — neither channel surfaces it.
 """
 
 from __future__ import annotations
@@ -14,13 +35,22 @@
 import datetime
 from typing import Any
 
+# Hard cap on events per dispatch; the rest roll into the next flush tick.
 MAX_BATCH_SIZE = 500
+# Slack inlines this many events before collapsing the rest under an
+# "_… and K more_" footer. Slack tolerates much larger payloads, but
+# readability tanks past ~25 lines.
 SLACK_MAX_DISPLAY_EVENTS = 25
 
-_SUCCESS_STATUSES = {"COMPLETED", "SUCCESS"}
+_SUCCESS_STATUSES = frozenset({"COMPLETED", "SUCCESS"})
+
+# Middle dot (U+00B7) padded by single spaces — the per-event field separator.
 _SEPARATOR = " · "
-_MISSING = "—"
-_DIVIDER = "———"
+_MISSING = "—"  # em-dash placeholder for missing fields
+_DIVIDER = "———"  # triple em-dash divider between header and events
+
+# Slack emoji shortcodes — render the same as the literal unicode glyphs and
+# stay readable in source.
 _EMOJI_SUCCESS = ":white_check_mark:"
 _EMOJI_FAILURE = ":x:"
 
@@ -32,6 +62,11 @@ def _is_success(status: str | None) -> bool:
 
 
 def _humanize_timestamp(iso: str | None) -> str:
+    """Render an ISO timestamp as `2026 May 11 11:38:31 AM` (POSIX `%-d`).
+
+    Falls back to the missing placeholder on falsy / unparseable input so a
+    partial row still renders without raising.
+    """
     if not iso:
         return _MISSING
     try:
@@ -42,6 +77,7 @@ def _humanize_timestamp(iso: str | None) -> str:
 
 
 def _format_file_count(event: dict[str, Any]) -> str:
+    """Render the file-count summary; empty string when no totals available."""
     counts = event.get("additional_data") or {}
     total = counts.get("total_files")
     if total is None:
@@ -54,6 +90,11 @@ def _format_file_count(event: dict[str, Any]) -> str:
 
 
 def _format_event_line(event: dict[str, Any]) -> str:
+    """Format one event as a single Slack mrkdwn line.
+
+    Fields are middle-dot separated; the file-count column is omitted when
+    `additional_data` is empty so the line collapses to 5 fields, not 6.
+    """
     parts = [
         event.get("timestamp") or _MISSING,
         f"*{event.get('execution_id') or _MISSING}*",
@@ -68,11 +109,12 @@ def _format_event_line(event: dict[str, Any]) -> str:
 
 
 def _event_from_payload(payload: dict[str, Any]) -> dict[str, Any]:
-    """Project a flat per-event payload into the canonical shape.
+    """Project a buffered payload into the canonical per-event dict.
 
-    Drops `pipeline_id` and `_source` — neither appears in receiver-visible
-    output. Mirrors the backend projection (including the humanized timestamp)
-    so renderer input is identical.
+    Unified shape across Slack/API and IMMEDIATE/BATCHED. `pipeline_id` is
+    intentionally dropped — neither channel surfaces it. Timestamps are
+    humanized once at projection so Slack and API consumers see the same
+    string (implicit UTC, no timezone suffix).
     """
     event: dict[str, Any] = {
         "type": payload.get("type") or "",
@@ -89,10 +131,10 @@ def _event_from_payload(payload: dict[str, Any]) -> dict[str, Any]:
 
 
 def build_envelope(payloads: list[dict[str, Any]]) -> dict[str, Any]:
-    """Build the canonical `{summary, events}` envelope.
+    """Build the canonical envelope used by every dispatch path.
 
-    Summary carries only `{total, succeeded, failed}` — identical shape for
-    IMMEDIATE and BATCHED.
+    Summary carries only `{total, succeeded, failed}` — same shape for
+    IMMEDIATE and BATCHED so receivers parse one envelope, not two.
     """
     capped = payloads[:MAX_BATCH_SIZE]
     succeeded = sum(1 for p in capped if _is_success(p.get("status")))
@@ -110,8 +152,9 @@ def build_envelope(payloads: list[dict[str, Any]]) -> dict[str, Any]:
 def render_slack_text(envelope: dict[str, Any]) -> str:
     """Render the envelope as Slack mrkdwn body text.
 
-    Always emits header + divider regardless of event count so IMMEDIATE,
-    BATCHED N=1, and BATCHED N>1 all share the same shape.
+    Header + divider are emitted for every dispatch — IMMEDIATE, BATCHED N=1,
+    and BATCHED N>1 all share the same shape. Visible events are capped at
+    SLACK_MAX_DISPLAY_EVENTS with an `_… and K more_` overflow footer.
     """
     summary = envelope["summary"]
     events: list[dict[str, Any]] = envelope["events"]
diff --git a/workers/notification/providers/api_webhook.py b/workers/notification/providers/api_webhook.py
index 1e652e9464..cbffc0a1d4 100644
--- a/workers/notification/providers/api_webhook.py
+++ b/workers/notification/providers/api_webhook.py
@@ -8,10 +8,11 @@
 
 from typing import Any
 
-from notification.providers._clubbed_format import build_envelope
 from notification.providers.webhook_provider import WebhookProvider
 from shared.infrastructure.logging import WorkerLogger
 
+from unstract.core.notification_clubbed_renderer import build_envelope
+
 logger = WorkerLogger.get_logger(__name__)
 
 
diff --git a/workers/notification/providers/slack_webhook.py b/workers/notification/providers/slack_webhook.py
index 01f272b024..2bb757662c 100644
--- a/workers/notification/providers/slack_webhook.py
+++ b/workers/notification/providers/slack_webhook.py
@@ -8,12 +8,13 @@
 
 from typing import Any
 
-from notification.providers._clubbed_format import (
+from notification.providers.webhook_provider import WebhookProvider
+from shared.infrastructure.logging import WorkerLogger
+
+from unstract.core.notification_clubbed_renderer import (
     build_envelope,
     render_slack_text,
 )
-from notification.providers.webhook_provider import WebhookProvider
-from shared.infrastructure.logging import WorkerLogger
 
 logger = WorkerLogger.get_logger(__name__)
 
@@ -56,7 +57,7 @@ def format_payload(self, payload: dict[str, Any]) -> dict[str, Any]:
           wrapped in a single-event envelope and rendered to the canonical
           single-line mrkdwn body.
         """
-        if "text" in payload and len(payload) == 1:
+        if "text" in payload and "events" not in payload:
             return {"text": payload["text"]}
 
         envelope = build_envelope(payloads=[payload])

From e6a87e48881adaebf49852560aede610aa97f43e Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 16:00:06 +0530
Subject: [PATCH 15/27] sonar issues

---
 backend/workflow_manager/internal_serializers.py | 7 ++-----
 1 file changed, 2 insertions(+), 5 deletions(-)

diff --git a/backend/workflow_manager/internal_serializers.py b/backend/workflow_manager/internal_serializers.py
index 2e43f66630..506d389ef8 100644
--- a/backend/workflow_manager/internal_serializers.py
+++ b/backend/workflow_manager/internal_serializers.py
@@ -212,11 +212,8 @@ def validate(self, attrs):
                 {"failed_files": "failed_files cannot exceed total_files."}
             )
         if successful is not None and failed is not None and successful + failed > total:
-            raise serializers.ValidationError(
-                {
-                    "non_field_errors": "successful_files + failed_files cannot exceed total_files."
-                }
-            )
+            msg = "successful_files + failed_files cannot exceed total_files."
+            raise serializers.ValidationError({"non_field_errors": msg})
         return attrs
 
 

From a736bf88e8e07abd9e37723b622c748da316b451 Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 16:17:38 +0530
Subject: [PATCH 16/27] code rabbit refactor

---
 .../core/notification_clubbed_renderer.py     | 31 +++++++++++++++++--
 1 file changed, 29 insertions(+), 2 deletions(-)

diff --git a/unstract/core/src/unstract/core/notification_clubbed_renderer.py b/unstract/core/src/unstract/core/notification_clubbed_renderer.py
index 9571bdfeb7..5a21bc65cb 100644
--- a/unstract/core/src/unstract/core/notification_clubbed_renderer.py
+++ b/unstract/core/src/unstract/core/notification_clubbed_renderer.py
@@ -61,6 +61,22 @@ def _is_success(status: str | None) -> bool:
     return status.upper() in _SUCCESS_STATUSES
 
 
+def _has_failed_files(counts: dict[str, Any]) -> bool:
+    """True when file-level aggregates show at least one failure."""
+    failed = counts.get("failed_files")
+    return isinstance(failed, int) and failed > 0
+
+
+def _is_effective_success(status: str | None, counts: dict[str, Any]) -> bool:
+    """Treat a COMPLETED run with any file failures as a partial failure.
+
+    Mirrors the failure-filter contract at dispatch time so renderer summary
+    counts and the per-event file-count emoji match the reason the alert
+    fired.
+    """
+    return _is_success(status) and not _has_failed_files(counts)
+
+
 def _humanize_timestamp(iso: str | None) -> str:
     """Render an ISO timestamp as `2026 May 11 11:38:31 AM` (POSIX `%-d`).
 
@@ -77,11 +93,18 @@ def _humanize_timestamp(iso: str | None) -> str:
 
 
 def _format_file_count(event: dict[str, Any]) -> str:
-    """Render the file-count summary; empty string when no totals available."""
+    """Render the file-count summary; empty string when no totals available.
+
+    A COMPLETED run with file failures short-circuits to the failure shape so
+    the rendered line matches why a failures-only notification fired.
+    """
     counts = event.get("additional_data") or {}
     total = counts.get("total_files")
     if total is None:
         return ""
+    if _has_failed_files(counts):
+        failed = counts.get("failed_files", 0)
+        return f"{_EMOJI_FAILURE} {failed}/{total} files"
     if _is_success(event.get("status")):
         successful = counts.get("successful_files", 0)
         return f"{_EMOJI_SUCCESS} {successful}/{total} files"
@@ -137,7 +160,11 @@ def build_envelope(payloads: list[dict[str, Any]]) -> dict[str, Any]:
     IMMEDIATE and BATCHED so receivers parse one envelope, not two.
     """
     capped = payloads[:MAX_BATCH_SIZE]
-    succeeded = sum(1 for p in capped if _is_success(p.get("status")))
+    succeeded = sum(
+        1
+        for p in capped
+        if _is_effective_success(p.get("status"), p.get("additional_data") or {})
+    )
     failed = len(capped) - succeeded
     return {
         "summary": {

From e6534949d63d1475f6a4581c16884bb87369027d Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 17:02:24 +0530
Subject: [PATCH 17/27] greptile comments resolve

---
 backend/notification_v2/internal_api_views.py | 9 ++++-----
 1 file changed, 4 insertions(+), 5 deletions(-)

diff --git a/backend/notification_v2/internal_api_views.py b/backend/notification_v2/internal_api_views.py
index 9a9c0e4a71..9eacba6c76 100644
--- a/backend/notification_v2/internal_api_views.py
+++ b/backend/notification_v2/internal_api_views.py
@@ -286,12 +286,11 @@ def get_api_data(request: HttpRequest, api_id: str) -> JsonResponse:
         )
 
 
-# Required fields on the enqueue endpoint body. Worker-side serialization
-# guarantees these — keep this list in sync with
-# workers/shared/patterns/notification/helper.py.
+# `execution_id` is intentionally optional: the scheduler INPROGRESS path
+# (workers/scheduler/tasks.py, UN-2850 / #1562) fires before WorkflowExecution
+# is created. Renderer falls back to `—` for missing values.
 _ENQUEUE_REQUIRED_FIELDS = (
     "notification_id",
-    "execution_id",
     "pipeline_id",
     "pipeline_name",
     "status",
@@ -351,7 +350,7 @@ def enqueue_notification_buffer(request: HttpRequest) -> JsonResponse:
     # (renderer falls back to "Type: —" / no Additional Data line).
     payload = {
         "type": body.get("type", ""),
-        "execution_id": body["execution_id"],
+        "execution_id": body.get("execution_id"),
         "pipeline_id": body["pipeline_id"],
         "pipeline_name": body["pipeline_name"],
         "status": body["status"],

From 724d280c6651a97d69ef14760b94eeeafbf4fc8a Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 17:55:05 +0530
Subject: [PATCH 18/27] UN-3056 Scope enqueue execution_id exemption to
 INPROGRESS

Keep execution_id in _ENQUEUE_REQUIRED_FIELDS as the canonical required
set; carve out the INPROGRESS exemption at the validator instead of
dropping it broadly. Non-INPROGRESS callers (COMPLETED / ERROR /
STOPPED / PARTIAL_SUCCESS) once again get a loud 400 if they omit
execution_id, addressing Greptile's silent-failure concern on e6534949d.

Extends the comment above the tuple to also flag the consumer-side gap:
INPROGRESS buffer rows ship with execution_id=null, so API receivers
cannot correlate them with execution logs until the producer-reorder
follow-up (UN-3056) lands.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 backend/notification_v2/internal_api_views.py | 24 +++++++++++++++----
 1 file changed, 19 insertions(+), 5 deletions(-)

diff --git a/backend/notification_v2/internal_api_views.py b/backend/notification_v2/internal_api_views.py
index 9eacba6c76..79f65193d8 100644
--- a/backend/notification_v2/internal_api_views.py
+++ b/backend/notification_v2/internal_api_views.py
@@ -286,15 +286,22 @@ def get_api_data(request: HttpRequest, api_id: str) -> JsonResponse:
         )
 
 
-# `execution_id` is intentionally optional: the scheduler INPROGRESS path
+# All fields are required at enqueue time. `execution_id` carries one
+# exemption (handled in the validator below): the scheduler INPROGRESS path
 # (workers/scheduler/tasks.py, UN-2850 / #1562) fires before WorkflowExecution
-# is created. Renderer falls back to `—` for missing values.
+# is created, so it has no execution_id to forward. Renderer falls back to
+# `—` for missing values. Long-term fix belongs at the producer.
+#
+# Consumer-side gap: INPROGRESS buffer rows ship with execution_id=null, so
+# API webhook receivers cannot correlate the event with execution logs until
+# the producer-reorder follow-up (UN-3056) lands.
 _ENQUEUE_REQUIRED_FIELDS = (
     "notification_id",
     "pipeline_id",
     "pipeline_name",
     "status",
     "platform",
+    "execution_id",
 )
 
 
@@ -315,12 +322,19 @@ def enqueue_notification_buffer(request: HttpRequest) -> JsonResponse:
             {"status": "error", "message": "Invalid JSON body"}, status=400
         )
 
-    missing = [f for f in _ENQUEUE_REQUIRED_FIELDS if not body.get(f)]
-    if missing:
+    missing_fields = [f for f in _ENQUEUE_REQUIRED_FIELDS if not body.get(f)]
+    # INPROGRESS is the one status legitimately allowed to omit execution_id
+    # (see comment on _ENQUEUE_REQUIRED_FIELDS).
+    if (
+        body.get("status") == Pipeline.PipelineStatus.INPROGRESS
+        and "execution_id" in missing_fields
+    ):
+        missing_fields.remove("execution_id")
+    if missing_fields:
         return JsonResponse(
             {
                 "status": "error",
-                "message": f"Missing required fields: {', '.join(missing)}",
+                "message": f"Missing required fields: {', '.join(missing_fields)}",
             },
             status=400,
         )

From 4104fafb25eccc5bcbb654cf1bf75976569114fe Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 17:57:18 +0530
Subject: [PATCH 19/27] greptile comments resolve

---
 backend/notification_v2/internal_api_views.py | 14 +++++---------
 1 file changed, 5 insertions(+), 9 deletions(-)

diff --git a/backend/notification_v2/internal_api_views.py b/backend/notification_v2/internal_api_views.py
index 79f65193d8..693e2a0400 100644
--- a/backend/notification_v2/internal_api_views.py
+++ b/backend/notification_v2/internal_api_views.py
@@ -286,15 +286,11 @@ def get_api_data(request: HttpRequest, api_id: str) -> JsonResponse:
         )
 
 
-# All fields are required at enqueue time. `execution_id` carries one
-# exemption (handled in the validator below): the scheduler INPROGRESS path
-# (workers/scheduler/tasks.py, UN-2850 / #1562) fires before WorkflowExecution
-# is created, so it has no execution_id to forward. Renderer falls back to
-# `—` for missing values. Long-term fix belongs at the producer.
-#
-# Consumer-side gap: INPROGRESS buffer rows ship with execution_id=null, so
-# API webhook receivers cannot correlate the event with execution logs until
-# the producer-reorder follow-up (UN-3056) lands.
+# `execution_id` is required except for INPROGRESS, which fires from the
+# scheduler (workers/scheduler/tasks.py, UN-2850) before WorkflowExecution
+# exists. INPROGRESS rows therefore store execution_id=null — receivers
+# cannot correlate with execution logs until the producer-reorder lands
+# (UN-3056).
 _ENQUEUE_REQUIRED_FIELDS = (
     "notification_id",
     "pipeline_id",

From 167d60f679602e575dceefa9507c81b18ffa8f22 Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 18:15:39 +0530
Subject: [PATCH 20/27] UN-3056 Skip deactivated notifications in BATCHED flush

_dispatch_group's lock query did not check notification.is_active, so
PENDING NotificationBuffer rows tied to a deactivated source notification
still dispatched on the next flush tick (up to one NOTIFICATION_CLUB_INTERVAL
of stale traffic). IMMEDIATE deactivation is instant because the GET
notifications endpoint filters by is_active=True; this restores the same
expectation for BATCHED.

Also adds select_related("notification") so the later rows[0].notification
read is part of the same query rather than a per-group round-trip.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 backend/notification_v2/internal_api_views.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/backend/notification_v2/internal_api_views.py b/backend/notification_v2/internal_api_views.py
index 693e2a0400..31d6dffe11 100644
--- a/backend/notification_v2/internal_api_views.py
+++ b/backend/notification_v2/internal_api_views.py
@@ -467,12 +467,14 @@ def _dispatch_group(
     with transaction.atomic():
         rows = list(
             NotificationBuffer.objects.select_for_update(skip_locked=True)
+            .select_related("notification")
             .filter(
                 status=BufferStatus.PENDING.value,
                 organization_id=org_id,
                 webhook_url=webhook_url,
                 auth_sig=auth_sig,
                 platform=platform,
+                notification__is_active=True,
             )
             .order_by("created_at")[:_PROCESS_BUFFER_CAP]
         )

From 77b7956c2c0b1bf89ef63c8732432871013c2e6f Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 18:22:47 +0530
Subject: [PATCH 21/27] greptile comments resolve

---
 backend/notification_v2/internal_api_views.py | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/backend/notification_v2/internal_api_views.py b/backend/notification_v2/internal_api_views.py
index 31d6dffe11..492ce42cbf 100644
--- a/backend/notification_v2/internal_api_views.py
+++ b/backend/notification_v2/internal_api_views.py
@@ -486,12 +486,16 @@ def _dispatch_group(
 
         # Live auth — read from the FIRST row's notification. If multiple
         # notifications collide on (url, auth_sig, platform) we have, by
-        # definition, identical auth + format, so this is safe.
+        # definition, identical auth + format, so this is safe. Retry budget
+        # is the MAX across rows: there's a single HTTP call per batch, so
+        # the most retry-tolerant subscriber's intent wins; using the first
+        # row's value would silently truncate everyone else's retry budget.
         first_notification = rows[0].notification
         payloads = [r.payload for r in rows]
         body = render_clubbed_message(payloads, platform)
         headers = build_webhook_headers(first_notification)
         buffer_ids = [str(r.id) for r in rows]
+        max_retries = max(r.notification.max_retries for r in rows)
 
         # Mark DISPATCHED first; if commit succeeds the on_commit hook
         # publishes the broker task. If commit fails, rows stay PENDING and
@@ -508,7 +512,7 @@ def _dispatch_group(
                 body=body,
                 headers=headers,
                 platform=platform,
-                max_retries=first_notification.max_retries,
+                max_retries=max_retries,
                 buffer_ids=buffer_ids,
                 org_id=org_id,
             )

From 780d51cf30e33a8700b093b79b6b86905a8e2b7a Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 19:26:52 +0530
Subject: [PATCH 22/27] remove immediate mode

---
 backend/notification_v2/clubbed_renderer.py   |  14 +-
 backend/notification_v2/enums.py              |  12 +-
 backend/notification_v2/helper.py             |  93 ++------------
 backend/notification_v2/internal_api_views.py |  20 +--
 backend/notification_v2/provider/__init__.py  |   0
 .../provider/notification_provider.py         |  30 -----
 backend/notification_v2/provider/registry.py  |  54 --------
 .../provider/webhook/__init__.py              |   0
 .../provider/webhook/api_webhook.py           |  30 -----
 .../provider/webhook/slack_webhook.py         |  33 -----
 .../provider/webhook/webhook.py               | 103 ---------------
 .../core/notification_clubbed_renderer.py     |  14 +-
 workers/notification/providers/api_webhook.py |   8 +-
 .../notification/providers/slack_webhook.py   |  22 ++--
 .../shared/patterns/notification/helper.py    | 120 ++----------------
 15 files changed, 64 insertions(+), 489 deletions(-)
 delete mode 100644 backend/notification_v2/provider/__init__.py
 delete mode 100644 backend/notification_v2/provider/notification_provider.py
 delete mode 100644 backend/notification_v2/provider/registry.py
 delete mode 100644 backend/notification_v2/provider/webhook/__init__.py
 delete mode 100644 backend/notification_v2/provider/webhook/api_webhook.py
 delete mode 100644 backend/notification_v2/provider/webhook/slack_webhook.py
 delete mode 100644 backend/notification_v2/provider/webhook/webhook.py

diff --git a/backend/notification_v2/clubbed_renderer.py b/backend/notification_v2/clubbed_renderer.py
index a0096197bd..af20007f76 100644
--- a/backend/notification_v2/clubbed_renderer.py
+++ b/backend/notification_v2/clubbed_renderer.py
@@ -1,11 +1,11 @@
 """Backend dispatch entry for clubbed-notification rendering.
 
 Delegates the canonical envelope + Slack body to
-``unstract.core.notification_clubbed_renderer`` so backend dispatches and
-worker IMMEDIATE callbacks emit byte-identical receiver-visible payloads.
-This thin shim keeps the ``render_clubbed_message`` platform dispatcher
-(uses ``PlatformType`` enum) backend-side; everything else lives in the
-shared module.
+``unstract.core.notification_clubbed_renderer`` so backend and worker
+callbacks emit byte-identical receiver-visible payloads. This thin shim
+keeps the ``render_clubbed_message`` platform dispatcher (uses
+``PlatformType`` enum) backend-side; everything else lives in the shared
+module.
 """
 
 from __future__ import annotations
@@ -35,8 +35,8 @@ def render_clubbed_message(
 ) -> dict[str, Any]:
     """Top-level entry — returns the dispatch body for ``platform``.
 
-    Used by every dispatch site (BATCHED flush, IMMEDIATE backend providers)
-    so the receiver-visible payload is identical regardless of mode.
+    Used by every dispatch site so the receiver-visible payload is
+    identical regardless of caller.
     """
     envelope = build_envelope(payloads)
     if platform == PlatformType.SLACK.value:
diff --git a/backend/notification_v2/enums.py b/backend/notification_v2/enums.py
index 9e694e128f..8ebced2a2e 100644
--- a/backend/notification_v2/enums.py
+++ b/backend/notification_v2/enums.py
@@ -48,10 +48,14 @@ def choices(cls):
 class DeliveryMode(Enum):
     """Per-notification dispatch mode.
 
-    IMMEDIATE fires on every workflow completion (pre-existing behavior).
-    BATCHED buffers events into NotificationBuffer and flushes them as one
-    clubbed message per (org, webhook_url, auth_sig) every
-    NOTIFICATION_CLUB_INTERVAL seconds.
+    Product ships every notification as BATCHED — events buffer into
+    ``NotificationBuffer`` and flush as one clubbed message per
+    (org, webhook_url, auth_sig) every ``NOTIFICATION_CLUB_INTERVAL`` seconds.
+
+    The ``IMMEDIATE`` value is purely a historical DB value — no code reads
+    it anymore (the legacy synchronous-dispatch path was removed). The
+    column and enum value remain so existing rows don't break; both will be
+    dropped in a follow-up schema migration.
     """
 
     IMMEDIATE = "IMMEDIATE"
diff --git a/backend/notification_v2/helper.py b/backend/notification_v2/helper.py
index 4a6c5cc907..9e99335ce8 100644
--- a/backend/notification_v2/helper.py
+++ b/backend/notification_v2/helper.py
@@ -11,13 +11,9 @@
 from notification_v2.enums import (
     AuthorizationType,
     BufferStatus,
-    DeliveryMode,
-    NotificationType,
     PlatformType,
 )
 from notification_v2.models import Notification, NotificationBuffer
-from notification_v2.provider.notification_provider import NotificationProvider
-from notification_v2.provider.registry import get_notification_provider
 
 logger = logging.getLogger(__name__)
 
@@ -75,9 +71,8 @@ def get_org_club_interval_seconds(organization: Organization) -> int:
 def build_webhook_headers(notification: Notification) -> dict[str, str]:
     """Build HTTP headers for a webhook dispatch from the notification's auth.
 
-    Mirrors the logic in ``provider/webhook/webhook.py`` and the worker-side
-    ``get_webhook_headers`` so the clubbed dispatcher and the immediate path
-    produce identical headers for the same auth config.
+    Used by the buffer flush in ``internal_api_views._dispatch_group`` to
+    pass live auth headers through to the Celery task.
     """
     headers = {"Content-Type": "application/json"}
     auth_type_raw = (notification.authorization_type or "").upper()
@@ -107,51 +102,35 @@ def _resolve_organization(notification: Notification) -> Organization | None:
     return None
 
 
-def split_by_delivery_mode(
-    notifications: "Iterable[Notification]",
-) -> tuple[list[Notification], list[Notification]]:
-    """Partition into (IMMEDIATE, BATCHED). Unknown modes default to IMMEDIATE."""
-    immediate: list[Notification] = []
-    batched: list[Notification] = []
-    for n in notifications:
-        if n.delivery_mode == DeliveryMode.BATCHED.value:
-            batched.append(n)
-        else:
-            immediate.append(n)
-    return immediate, batched
-
-
 def dispatch_with_delivery_mode(
     notifications: "Iterable[Notification]",
     payload: dict[str, Any],
     *,
     error_context: str = "",
 ) -> None:
-    """Single-call entry point that splits IMMEDIATE / BATCHED and dispatches.
+    """Enqueue every active notification into ``NotificationBuffer``.
 
-    IMMEDIATE rows fire synchronously via NotificationHelper. BATCHED rows
-    enqueue into NotificationBuffer; an enqueue failure is logged but does
-    not abort the loop — other notifications still get their chance.
+    Single dispatch path: each notification produces a buffer row that the
+    periodic flush ships as part of a clubbed message. An enqueue failure
+    on one row is logged but does not abort the loop — sibling notifications
+    still get their chance.
 
     ``error_context`` lets callers tag failures with their dispatch source
     (pipeline id, api id) for easier triage.
     """
-    immediate, batched = split_by_delivery_mode(notifications)
-    if immediate:
-        NotificationHelper.send_notification(notifications=immediate, payload=payload)
-    for notification in batched:
+    for notification in notifications:
         try:
             enqueue(notification, payload)
         except Exception:
             logger.exception(
-                "Failed to enqueue BATCHED notification %s%s",
+                "Failed to enqueue notification %s%s",
                 notification.id,
                 f" ({error_context})" if error_context else "",
             )
 
 
 def enqueue(notification: Notification, payload: dict[str, Any]) -> NotificationBuffer:
-    """Buffer a single execution event for a BATCHED notification.
+    """Buffer a single execution event for a notification.
 
     Computes auth_sig and flush_after at write time so existing PENDING rows
     keep their original cadence even if NOTIFICATION_CLUB_INTERVAL or the
@@ -172,9 +151,9 @@ def enqueue(notification: Notification, payload: dict[str, Any]) -> Notification
     auth_sig = compute_auth_sig(notification)
     platform = notification.platform or PlatformType.API.value
 
-    # Stamp a buffered-at timestamp so renderers can surface it consistently
-    # alongside IMMEDIATE. Worker callers already supply one; backend
-    # dispatchers (PipelineStatusPayload.to_dict) don't, so default here.
+    # Stamp a buffered-at timestamp so renderers always have one to humanize.
+    # Worker callers already supply one; backend dispatchers
+    # (PipelineStatusPayload.to_dict) don't, so default here.
     payload = {
         **payload,
         "timestamp": payload.get("timestamp") or timezone.now().isoformat(),
@@ -204,49 +183,3 @@ def enqueue(notification: Notification, payload: dict[str, Any]) -> Notification
         flush_after.isoformat(),
     )
     return buffer_row
-
-
-class NotificationHelper:
-    @classmethod
-    def send_notification(cls, notifications: list[Notification], payload: Any) -> None:
-        """Dispatch IMMEDIATE notifications via the registered provider.
-
-        Iterates over notifications, resolves the provider for each
-        (notification_type, platform) pair, and fires the webhook task. BATCHED
-        notifications must be routed to ``enqueue()`` instead — callers branch
-        on ``notification.delivery_mode`` before reaching this method.
-
-        Args:
-            notifications: Active Notification rows to dispatch synchronously.
-            payload: Provider-specific payload (typically a dict).
-        """
-        for notification in notifications:
-            if notification.delivery_mode == DeliveryMode.BATCHED.value:
-                # Callers should not reach here for BATCHED — log loudly so
-                # routing regressions are visible without breaking dispatch.
-                logger.warning(
-                    "BATCHED notification %s reached IMMEDIATE dispatch path; "
-                    "skipping. Caller must branch on delivery_mode.",
-                    notification.id,
-                )
-                continue
-            notification_type = NotificationType(notification.notification_type)
-            platform_type = PlatformType(notification.platform)
-            try:
-                notification_provider = get_notification_provider(
-                    notification_type, platform_type
-                )
-                notifier: NotificationProvider = notification_provider(
-                    notification=notification, payload=payload
-                )
-                notifier.send()
-                logger.info("Sending notification to %s", notification)
-            except ValueError as e:
-                logger.error(
-                    "Error in notification type %s and platform %s for "
-                    "notification %s: %s",
-                    notification_type,
-                    platform_type,
-                    notification,
-                    e,
-                )
diff --git a/backend/notification_v2/internal_api_views.py b/backend/notification_v2/internal_api_views.py
index 492ce42cbf..6409f6bdf6 100644
--- a/backend/notification_v2/internal_api_views.py
+++ b/backend/notification_v2/internal_api_views.py
@@ -29,7 +29,7 @@
 
 from backend.celery_service import app as celery_app
 from notification_v2.clubbed_renderer import render_clubbed_message
-from notification_v2.enums import FAILURE_STATUSES, BufferStatus, DeliveryMode
+from notification_v2.enums import FAILURE_STATUSES, BufferStatus
 from notification_v2.helper import (
     build_webhook_headers,
     enqueue,
@@ -99,9 +99,6 @@ def _serialize_notification(n: Notification) -> dict[str, Any]:
         "max_retries": n.max_retries,
         "is_active": n.is_active,
         "notify_on_failures": n.notify_on_failures,
-        # Drives the worker-side IMMEDIATE-vs-BATCHED branch in
-        # workers/shared/patterns/notification/helper.py.
-        "delivery_mode": n.delivery_mode,
     }
 
 
@@ -309,7 +306,7 @@ def enqueue_notification_buffer(request: HttpRequest) -> JsonResponse:
     Worker code is model-free: it forwards a notification_id + structured
     payload here and lets the backend write the NotificationBuffer row.
     Rejects rows whose source notification is not BATCHED so a worker
-    routing bug cannot silently divert IMMEDIATE traffic into the buffer.
+    routing bug cannot silently divert non-BATCHED traffic into the buffer.
     """
     try:
         body = json.loads(request.body.decode("utf-8") or "{}")
@@ -342,19 +339,6 @@ def enqueue_notification_buffer(request: HttpRequest) -> JsonResponse:
             {"status": "error", "message": "Notification not found"}, status=404
         )
 
-    if notification.delivery_mode != DeliveryMode.BATCHED.value:
-        # Hard-fail rather than silently auto-correcting — surfaces worker
-        # routing regressions instead of letting them drain into the buffer.
-        return JsonResponse(
-            {
-                "status": "error",
-                "message": (
-                    "Notification delivery_mode is not BATCHED; refuse to enqueue"
-                ),
-            },
-            status=409,
-        )
-
     # type / timestamp / additional_data stay optional during rollout — older
     # worker builds that don't forward them still produce a usable row
     # (renderer falls back to "Type: —" / no Additional Data line).
diff --git a/backend/notification_v2/provider/__init__.py b/backend/notification_v2/provider/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/backend/notification_v2/provider/notification_provider.py b/backend/notification_v2/provider/notification_provider.py
deleted file mode 100644
index 10492aaf3c..0000000000
--- a/backend/notification_v2/provider/notification_provider.py
+++ /dev/null
@@ -1,30 +0,0 @@
-from abc import ABC, abstractmethod
-
-from django.conf import settings
-
-from notification_v2.models import Notification
-
-
-class NotificationProvider(ABC):
-    NOTIFICATION_TIMEOUT = settings.NOTIFICATION_TIMEOUT
-    RETRY_DELAY = 10  # Seconds
-
-    def __init__(self, notification: Notification, payload):
-        self.payload = payload
-        self.notification = notification
-
-    @abstractmethod
-    def send(self):
-        """Method to be overridden in child classes for sending the
-        notification.
-        """
-        raise NotImplementedError("Subclasses should implement this method.")
-
-    def validate(self):
-        """Method to validate the notification data."""
-        pass
-
-    @abstractmethod
-    def get_headers(self):
-        """Method to get the headers for the notification."""
-        raise NotImplementedError("Subclasses should implement this method.")
diff --git a/backend/notification_v2/provider/registry.py b/backend/notification_v2/provider/registry.py
deleted file mode 100644
index 909ad58b4c..0000000000
--- a/backend/notification_v2/provider/registry.py
+++ /dev/null
@@ -1,54 +0,0 @@
-from notification_v2.enums import NotificationType, PlatformType
-from notification_v2.provider.notification_provider import NotificationProvider
-from notification_v2.provider.webhook.api_webhook import APIWebhook
-from notification_v2.provider.webhook.slack_webhook import SlackWebhook
-
-REGISTRY = {
-    NotificationType.WEBHOOK: {
-        PlatformType.SLACK: SlackWebhook,
-        PlatformType.API: APIWebhook,
-        # Add other platform-specific classes here
-    },
-    # Add other notification types and classes here
-}
-
-
-def get_notification_provider(
-    notification_type: NotificationType, platform_type: PlatformType
-) -> NotificationProvider:
-    """Get Notification provider based on notification type and platform type
-    It uses the REGISTRY to map the combination of notification type and
-    platform type to the corresponding NotificationProvider class.
-
-    If the provided combination is not found in the REGISTRY, a ValueError is raised.
-
-    Note:
-        This function assumes that the REGISTRY dictionary is correctly populated
-        with the appropriate NotificationProvider classes for each combination of
-        notification type and platform type.
-
-    See Also:
-        - NotificationType
-        - PlatformType
-        - NotificationProvider
-        - REGISTRY
-
-    Parameters:
-        notification_type (NotificationType): The type of notification.
-        platform_type (PlatformType): The platform/provider type for the notification.
-
-    Returns:
-        NotificationProvider: The appropriate NotificationProvider class for
-        the given combination.
-
-    Raises:
-        ValueError: If the provided combination is not found in the REGISTRY.
-    """
-    if notification_type not in REGISTRY:
-        raise ValueError(f"Unsupported notification type: {notification_type}")
-
-    platform_registry = REGISTRY[notification_type]
-    if platform_type not in platform_registry:
-        raise ValueError(f"Unsupported platform type: {platform_type}")
-
-    return platform_registry[platform_type]
diff --git a/backend/notification_v2/provider/webhook/__init__.py b/backend/notification_v2/provider/webhook/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/backend/notification_v2/provider/webhook/api_webhook.py b/backend/notification_v2/provider/webhook/api_webhook.py
deleted file mode 100644
index 9864d84a4a..0000000000
--- a/backend/notification_v2/provider/webhook/api_webhook.py
+++ /dev/null
@@ -1,30 +0,0 @@
-from typing import Any
-
-from notification_v2.clubbed_renderer import build_envelope
-from notification_v2.provider.webhook.webhook import Webhook
-
-
-class APIWebhook(Webhook):
-    def send(self) -> None:
-        """Send the API webhook notification.
-
-        Wraps the IMMEDIATE event in the canonical envelope before queueing
-        so the receiver-visible JSON shape matches BATCHED dispatches —
-        `{"summary": {...}, "events": [{...}]}`.
-        """
-        self.payload = self.format_payload()
-        super().send()
-
-    def get_headers(self) -> dict[str, str]:
-        """API-specific headers."""
-        headers = super().get_headers()
-        headers["Content-Type"] = "application/json"
-        return headers
-
-    def format_payload(self) -> dict[str, Any]:
-        """Wrap a single IMMEDIATE event in the canonical envelope.
-
-        Receivers parse the same `{summary, events}` shape regardless of
-        whether the dispatch was IMMEDIATE or BATCHED.
-        """
-        return build_envelope(payloads=[self.payload])
diff --git a/backend/notification_v2/provider/webhook/slack_webhook.py b/backend/notification_v2/provider/webhook/slack_webhook.py
deleted file mode 100644
index 0fda635d74..0000000000
--- a/backend/notification_v2/provider/webhook/slack_webhook.py
+++ /dev/null
@@ -1,33 +0,0 @@
-import logging
-from typing import Any
-
-from notification_v2.clubbed_renderer import render_clubbed_message
-from notification_v2.enums import PlatformType
-from notification_v2.provider.webhook.webhook import Webhook
-
-logger = logging.getLogger(__name__)
-
-
-class SlackWebhook(Webhook):
-    def send(self) -> None:
-        """Send the Slack webhook notification."""
-        formatted_payload = self.format_payload()
-        self.payload = formatted_payload
-        super().send()
-
-    def get_headers(self) -> dict[str, str]:
-        """Slack-specific headers."""
-        headers = super().get_headers()
-        headers["Content-Type"] = "application/json"
-        return headers
-
-    def format_payload(self) -> dict[str, Any]:
-        """Render the IMMEDIATE event through the canonical envelope.
-
-        Single shared renderer for IMMEDIATE and BATCHED so receivers see the
-        same Slack body shape regardless of delivery mode.
-        """
-        return render_clubbed_message(
-            payloads=[self.payload],
-            platform=PlatformType.SLACK.value,
-        )
diff --git a/backend/notification_v2/provider/webhook/webhook.py b/backend/notification_v2/provider/webhook/webhook.py
deleted file mode 100644
index 40ddc53e61..0000000000
--- a/backend/notification_v2/provider/webhook/webhook.py
+++ /dev/null
@@ -1,103 +0,0 @@
-import logging
-
-from backend.celery_service import app as celery_app
-from notification_v2.enums import AuthorizationType
-from notification_v2.provider.notification_provider import NotificationProvider
-
-logger = logging.getLogger(__name__)
-
-
-class WebhookNotificationArg:
-    MAX_RETRIES = "max_retries"
-    RETRY_DELAY = "retry_delay"
-
-
-class HeaderConstants:
-    APPLICATION_JSON = "application/json"
-
-
-class Webhook(NotificationProvider):
-    def send(self) -> None:
-        """Send the webhook notification."""
-        try:
-            headers = self.get_headers()
-            self.validate()
-        except ValueError as e:
-            logger.error(f"Error validating notification {self.notification} :: {e}")
-            return
-        celery_app.send_task(
-            "send_webhook_notification",
-            args=[
-                self.notification.url,
-                self.payload,
-                headers,
-                self.NOTIFICATION_TIMEOUT,
-            ],
-            kwargs={
-                WebhookNotificationArg.MAX_RETRIES: self.notification.max_retries,
-                WebhookNotificationArg.RETRY_DELAY: self.RETRY_DELAY,
-            },
-        )
-
-    def validate(self):
-        """Validate notification.
-
-        Returns:
-            _type_: None
-        """
-        if not self.notification.url:
-            raise ValueError("Webhook URL is required.")
-        if not self.payload:
-            raise ValueError("Payload is required.")
-        return super().validate()
-
-    def get_headers(self) -> dict[str, str]:
-        """Get the headers for the notification based on the authorization type and key.
-
-        Raises:
-            ValueError: _description_
-
-        Returns:
-            dict[str, str]: A dictionary containing the headers.
-        """
-        headers: dict[str, str] = {}
-        try:
-            authorization_type = AuthorizationType(
-                self.notification.authorization_type.upper()
-            )
-        except ValueError:
-            raise ValueError(
-                "Unsupported authorization type: "
-                f"{self.notification.authorization_type}"
-            )
-        authorization_key = self.notification.authorization_key
-        authorization_header = self.notification.authorization_header
-
-        header_formats = {
-            AuthorizationType.BEARER: lambda key: {
-                "Authorization": f"Bearer {key}",
-                "Content-Type": HeaderConstants.APPLICATION_JSON,
-            },
-            AuthorizationType.API_KEY: lambda key: {
-                "Authorization": key,
-                "Content-Type": HeaderConstants.APPLICATION_JSON,
-            },
-            AuthorizationType.CUSTOM_HEADER: lambda key: {
-                authorization_header: key,
-                "Content-Type": HeaderConstants.APPLICATION_JSON,
-            },
-            AuthorizationType.NONE: lambda _: {
-                "Content-Type": HeaderConstants.APPLICATION_JSON,
-            },
-        }
-
-        if authorization_type not in header_formats:
-            raise ValueError(f"Unsupported authorization type: {authorization_type}")
-
-        headers = header_formats[authorization_type](authorization_key)
-
-        # Check if custom header type has required details
-        if authorization_type == AuthorizationType.CUSTOM_HEADER:
-            if not authorization_header or not authorization_key:
-                raise ValueError("Custom header or key missing for custom authorization.")
-        return headers
diff --git a/unstract/core/src/unstract/core/notification_clubbed_renderer.py b/unstract/core/src/unstract/core/notification_clubbed_renderer.py
index 5a21bc65cb..9d8ce709a9 100644
--- a/unstract/core/src/unstract/core/notification_clubbed_renderer.py
+++ b/unstract/core/src/unstract/core/notification_clubbed_renderer.py
@@ -134,8 +134,8 @@ def _format_event_line(event: dict[str, Any]) -> str:
 def _event_from_payload(payload: dict[str, Any]) -> dict[str, Any]:
     """Project a buffered payload into the canonical per-event dict.
 
-    Unified shape across Slack/API and IMMEDIATE/BATCHED. `pipeline_id` is
-    intentionally dropped — neither channel surfaces it. Timestamps are
+    Unified shape across Slack/API and every dispatch path. `pipeline_id`
+    is intentionally dropped — neither channel surfaces it. Timestamps are
     humanized once at projection so Slack and API consumers see the same
     string (implicit UTC, no timezone suffix).
     """
@@ -156,8 +156,8 @@ def _event_from_payload(payload: dict[str, Any]) -> dict[str, Any]:
 def build_envelope(payloads: list[dict[str, Any]]) -> dict[str, Any]:
     """Build the canonical envelope used by every dispatch path.
 
-    Summary carries only `{total, succeeded, failed}` — same shape for
-    IMMEDIATE and BATCHED so receivers parse one envelope, not two.
+    Summary carries only `{total, succeeded, failed}` — one envelope shape
+    so receivers parse a single schema, not two.
     """
     capped = payloads[:MAX_BATCH_SIZE]
     succeeded = sum(
@@ -179,9 +179,9 @@ def build_envelope(payloads: list[dict[str, Any]]) -> dict[str, Any]:
 def render_slack_text(envelope: dict[str, Any]) -> str:
     """Render the envelope as Slack mrkdwn body text.
 
-    Header + divider are emitted for every dispatch — IMMEDIATE, BATCHED N=1,
-    and BATCHED N>1 all share the same shape. Visible events are capped at
-    SLACK_MAX_DISPLAY_EVENTS with an `_… and K more_` overflow footer.
+    Header + divider are emitted for every dispatch — single-event and
+    multi-event batches share the same shape. Visible events are capped at
+    ``SLACK_MAX_DISPLAY_EVENTS`` with an `_… and K more_` overflow footer.
     """
     summary = envelope["summary"]
     events: list[dict[str, Any]] = envelope["events"]
diff --git a/workers/notification/providers/api_webhook.py b/workers/notification/providers/api_webhook.py
index cbffc0a1d4..c6961e7227 100644
--- a/workers/notification/providers/api_webhook.py
+++ b/workers/notification/providers/api_webhook.py
@@ -1,9 +1,9 @@
 """API Webhook Notification Provider
 
-Wraps worker-callback IMMEDIATE payloads (flat per-event dict) in the
-canonical envelope so API webhook receivers always see the same
-``{"summary": {...}, "events": [...]}`` shape — IMMEDIATE or BATCHED.
-Backend dispatches already arrive in envelope form and pass through.
+Wraps worker-callback payloads (flat per-event dict) in the canonical
+envelope so API webhook receivers always see the same
+``{"summary": {...}, "events": [...]}`` shape. Backend dispatches already
+arrive in envelope form and pass through.
 """
 
 from typing import Any
diff --git a/workers/notification/providers/slack_webhook.py b/workers/notification/providers/slack_webhook.py
index 2bb757662c..1028aef289 100644
--- a/workers/notification/providers/slack_webhook.py
+++ b/workers/notification/providers/slack_webhook.py
@@ -1,9 +1,8 @@
 """Slack Webhook Notification Provider
 
-Renders worker-callback IMMEDIATE payloads (flat per-event dict) into the
-same single-line Slack body the backend produces for IMMEDIATE/BATCHED via
-clubbed_renderer. Backend-rendered payloads (`{"text": "<mrkdwn>"}`) pass
-through unchanged.
+Renders worker-callback payloads (flat per-event dict) into the same
+single-line Slack body the backend produces via ``clubbed_renderer``.
+Backend-rendered payloads (`{"text": "<mrkdwn>"}`) pass through unchanged.
 """
 
 from typing import Any
@@ -22,8 +21,9 @@
 class SlackWebhook(WebhookProvider):
     """Slack-specific webhook provider.
 
-    Renders flat IMMEDIATE payloads via the worker-side mirror of the backend
-    clubbed renderer, then sends them as Slack-native ``text`` mrkdwn.
+    Renders flat per-event payloads via the worker-side mirror of the
+    backend clubbed renderer, then sends them as Slack-native ``text``
+    mrkdwn.
     """
 
     def __init__(self) -> None:
@@ -51,11 +51,11 @@ def format_payload(self, payload: dict[str, Any]) -> dict[str, Any]:
         """Format the payload to match Slack's expected structure.
 
         Two input shapes are accepted:
-        - Backend-rendered ``{"text": "<mrkdwn>"}`` (BATCHED dispatch and
-          backend IMMEDIATE through ``clubbed_renderer``) — passed through.
-        - Flat per-event dict from the worker-callback IMMEDIATE path —
-          wrapped in a single-event envelope and rendered to the canonical
-          single-line mrkdwn body.
+        - Backend-rendered ``{"text": "<mrkdwn>"}`` (any backend dispatch
+          through ``clubbed_renderer``) — passed through.
+        - Flat per-event dict from a worker callback — wrapped in a
+          single-event envelope and rendered to the canonical single-line
+          mrkdwn body.
         """
         if "text" in payload and "events" not in payload:
             return {"text": payload["text"]}
diff --git a/workers/shared/patterns/notification/helper.py b/workers/shared/patterns/notification/helper.py
index 460c308146..79009a71a3 100644
--- a/workers/shared/patterns/notification/helper.py
+++ b/workers/shared/patterns/notification/helper.py
@@ -7,8 +7,6 @@
 import logging
 from typing import Any
 
-from celery import current_app
-
 # Import shared data models from @unstract/core
 from unstract.core.data_models import (
     ExecutionStatus,
@@ -19,9 +17,6 @@
 
 logger = logging.getLogger(__name__)
 
-# Mirrors notification_v2.enums.DeliveryMode.BATCHED. Worker stays string-only
-# so it does not import Django enums.
-DELIVERY_MODE_BATCHED = "BATCHED"
 ENQUEUE_BUFFER_ENDPOINT = "v1/webhook/buffer/enqueue/"
 
 
@@ -37,7 +32,7 @@ def _enqueue_to_buffer(
     logs the drop instead of silently treating BATCHED delivery as successful.
     """
     # Forward the full per-event shape so the backend renderer can match
-    # IMMEDIATE's KV layout per event (Type / Pipeline Id / Pipeline Name /
+    # the canonical KV layout per event (Type / Pipeline Id / Pipeline Name /
     # Status / Execution Id / Timestamp / Additional Data). Older backend
     # builds that ignore the extra fields stay unaffected.
     payload_type = payload.type.value if hasattr(payload.type, "value") else payload.type
@@ -83,10 +78,13 @@ def _route_notification(
     notification: dict[str, Any],
     payload: NotificationPayload,
 ) -> None:
-    """IMMEDIATE -> existing worker queue; BATCHED -> backend enqueue endpoint.
+    """Forward webhook notifications to the backend buffer-enqueue endpoint.
 
-    Defaults to IMMEDIATE when delivery_mode is missing so older backend
-    builds (pre-UNS-611) keep working unchanged.
+    Single dispatch path: the backend owns the buffer and the periodic
+    flush ships clubbed messages. Non-webhook notification types are
+    skipped at this layer. An enqueue failure is logged but doesn't abort
+    the outer trigger_* loop so sibling notifications still get their
+    chance.
     """
     if notification.get("notification_type") != "WEBHOOK":
         logger.debug(
@@ -95,107 +93,13 @@ def _route_notification(
         )
         return
 
-    if notification.get("delivery_mode") == DELIVERY_MODE_BATCHED:
-        try:
-            _enqueue_to_buffer(api_client, notification, payload)
-        except Exception:  # noqa: BLE001 — already logged with stack inside
-            # Surface but don't abort the outer trigger_* loop — sibling
-            # BATCHED notifications still deserve their enqueue attempt.
-            logger.warning(
-                "BATCHED enqueue failed for notification %s; continuing with others",
-                notification.get("id"),
-            )
-        return
-
-    send_notification_to_worker(
-        url=notification["url"],
-        payload=payload,
-        auth_type=notification.get("authorization_type", "NONE"),
-        auth_key=notification.get("authorization_key"),
-        auth_header=notification.get("authorization_header"),
-        max_retries=notification.get("max_retries", 0),
-        platform=notification.get("platform"),
-    )
-
-
-def get_webhook_headers(
-    auth_type: str, auth_key: str | None, auth_header: str | None
-) -> dict[str, str]:
-    """Generate webhook headers based on authorization configuration."""
-    headers = {"Content-Type": "application/json"}
-
     try:
-        if auth_type and auth_key:
-            auth_type_upper = auth_type.upper()
-
-            if auth_type_upper == "BEARER":
-                headers["Authorization"] = f"Bearer {auth_key}"
-            elif auth_type_upper == "API_KEY":
-                headers["Authorization"] = auth_key
-            elif auth_type_upper == "CUSTOM_HEADER" and auth_header:
-                headers[auth_header] = auth_key
-            # NONE type just uses Content-Type header
-    except Exception as e:
-        logger.warning(f"Error generating webhook headers: {e}")
-        # Use default headers if auth config is invalid
-
-    return headers
-
-
-def send_notification_to_worker(
-    url: str,
-    payload: NotificationPayload,
-    auth_type: str,
-    auth_key: str | None,
-    auth_header: str | None,
-    max_retries: int = 0,
-    platform: str | None = None,
-) -> bool:
-    """Send a single notification to the notification worker queue.
-
-    Args:
-        url: Webhook URL to send notification to
-        payload: Structured notification payload
-        auth_type: Authorization type (NONE, BEARER, API_KEY, CUSTOM_HEADER)
-        auth_key: Authorization key/token
-        auth_header: Custom header name for CUSTOM_HEADER auth type
-        max_retries: Maximum number of retry attempts
-        platform: Platform type from notification config (SLACK, API, etc.)
-
-    Returns:
-        True if task was successfully queued, False otherwise
-    """
-    try:
-        headers = get_webhook_headers(auth_type, auth_key, auth_header)
-
-        # Convert payload to webhook format (excludes internal fields)
-        payload_dict = payload.to_webhook_payload()
-
-        # Send task to notification worker
-        current_app.send_task(
-            "send_webhook_notification",
-            args=[
-                url,
-                payload_dict,
-                headers,
-                10,  # timeout
-            ],
-            kwargs={
-                "max_retries": max_retries,
-                "retry_delay": 10,
-                "platform": platform,
-            },
-            queue="notifications",
-        )
-
-        logger.info(
-            f"Sent webhook notification to worker queue for {url} (pipeline: {payload.pipeline_id})"
+        _enqueue_to_buffer(api_client, notification, payload)
+    except Exception:  # noqa: BLE001 — already logged with stack inside
+        logger.warning(
+            "Buffer enqueue failed for notification %s; continuing with others",
+            notification.get("id"),
         )
-        return True
-
-    except Exception as e:
-        logger.error(f"Failed to send notification to {url}: {e}")
-        return False
 
 
 def trigger_notification(

From 743e9a99829cc514a6c95be6c4cbf9306ad9ccc7 Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 19:40:53 +0530
Subject: [PATCH 23/27] add legacy code

---
 backend/notification_v2/provider/__init__.py  |   0
 .../provider/notification_provider.py         |  30 +++++
 backend/notification_v2/provider/registry.py  |  54 +++++++++
 .../provider/webhook/__init__.py              |   0
 .../provider/webhook/api_webhook.py           |  30 +++++
 .../provider/webhook/slack_webhook.py         |  33 ++++++
 .../provider/webhook/webhook.py               | 103 ++++++++++++++++++
 7 files changed, 250 insertions(+)
 create mode 100644 backend/notification_v2/provider/__init__.py
 create mode 100644 backend/notification_v2/provider/notification_provider.py
 create mode 100644 backend/notification_v2/provider/registry.py
 create mode 100644 backend/notification_v2/provider/webhook/__init__.py
 create mode 100644 backend/notification_v2/provider/webhook/api_webhook.py
 create mode 100644 backend/notification_v2/provider/webhook/slack_webhook.py
 create mode 100644 backend/notification_v2/provider/webhook/webhook.py

diff --git a/backend/notification_v2/provider/__init__.py b/backend/notification_v2/provider/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/backend/notification_v2/provider/notification_provider.py b/backend/notification_v2/provider/notification_provider.py
new file mode 100644
index 0000000000..10492aaf3c
--- /dev/null
+++ b/backend/notification_v2/provider/notification_provider.py
@@ -0,0 +1,30 @@
+from abc import ABC, abstractmethod
+
+from django.conf import settings
+
+from notification_v2.models import Notification
+
+
+class NotificationProvider(ABC):
+    NOTIFICATION_TIMEOUT = settings.NOTIFICATION_TIMEOUT
+    RETRY_DELAY = 10  # Seconds
+
+    def __init__(self, notification: Notification, payload):
+        self.payload = payload
+        self.notification = notification
+
+    @abstractmethod
+    def send(self):
+        """Method to be overridden in child classes for sending the
+        notification.
+        """
+        raise NotImplementedError("Subclasses should implement this method.")
+
+    def validate(self):
+        """Method to validate the notification data."""
+        pass
+
+    @abstractmethod
+    def get_headers(self):
+        """Method to get the headers for the notification."""
+        raise NotImplementedError("Subclasses should implement this method.")
diff --git a/backend/notification_v2/provider/registry.py b/backend/notification_v2/provider/registry.py
new file mode 100644
index 0000000000..909ad58b4c
--- /dev/null
+++ b/backend/notification_v2/provider/registry.py
@@ -0,0 +1,54 @@
+from notification_v2.enums import NotificationType, PlatformType
+from notification_v2.provider.notification_provider import NotificationProvider
+from notification_v2.provider.webhook.api_webhook import APIWebhook
+from notification_v2.provider.webhook.slack_webhook import SlackWebhook
+
+REGISTRY = {
+    NotificationType.WEBHOOK: {
+        PlatformType.SLACK: SlackWebhook,
+        PlatformType.API: APIWebhook,
+        # Add other platform-specific classes here
+    },
+    # Add other notification types and classes here
+}
+
+
+def get_notification_provider(
+    notification_type: NotificationType, platform_type: PlatformType
+) -> NotificationProvider:
+    """Get Notification provider based on notification type and platform type
+    It uses the REGISTRY to map the combination of notification type and
+    platform type to the corresponding NotificationProvider class.
+
+    If the provided combination is not found in the REGISTRY, a ValueError is raised.
+
+    Note:
+        This function assumes that the REGISTRY dictionary is correctly populated
+        with the appropriate NotificationProvider classes for each combination of
+        notification type and platform type.
+
+    See Also:
+        - NotificationType
+        - PlatformType
+        - NotificationProvider
+        - REGISTRY
+
+    Parameters:
+        notification_type (NotificationType): The type of notification.
+        platform_type (PlatformType): The platform/provider type for the notification.
+
+    Returns:
+        NotificationProvider: The appropriate NotificationProvider class for
+        the given combination.
+
+    Raises:
+        ValueError: If the provided combination is not found in the REGISTRY.
+    """
+    if notification_type not in REGISTRY:
+        raise ValueError(f"Unsupported notification type: {notification_type}")
+
+    platform_registry = REGISTRY[notification_type]
+    if platform_type not in platform_registry:
+        raise ValueError(f"Unsupported platform type: {platform_type}")
+
+    return platform_registry[platform_type]
diff --git a/backend/notification_v2/provider/webhook/__init__.py b/backend/notification_v2/provider/webhook/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/backend/notification_v2/provider/webhook/api_webhook.py b/backend/notification_v2/provider/webhook/api_webhook.py
new file mode 100644
index 0000000000..9864d84a4a
--- /dev/null
+++ b/backend/notification_v2/provider/webhook/api_webhook.py
@@ -0,0 +1,30 @@
+from typing import Any
+
+from notification_v2.clubbed_renderer import build_envelope
+from notification_v2.provider.webhook.webhook import Webhook
+
+
+class APIWebhook(Webhook):
+    def send(self) -> None:
+        """Send the API webhook notification.
+
+        Wraps the IMMEDIATE event in the canonical envelope before queueing
+        so the receiver-visible JSON shape matches BATCHED dispatches —
+        `{"summary": {...}, "events": [{...}]}`.
+        """
+        self.payload = self.format_payload()
+        super().send()
+
+    def get_headers(self) -> dict[str, str]:
+        """API-specific headers."""
+        headers = super().get_headers()
+        headers["Content-Type"] = "application/json"
+        return headers
+
+    def format_payload(self) -> dict[str, Any]:
+        """Wrap a single IMMEDIATE event in the canonical envelope.
+
+        Receivers parse the same `{summary, events}` shape regardless of
+        whether the dispatch was IMMEDIATE or BATCHED.
+        """
+        return build_envelope(payloads=[self.payload])
diff --git a/backend/notification_v2/provider/webhook/slack_webhook.py b/backend/notification_v2/provider/webhook/slack_webhook.py
new file mode 100644
index 0000000000..0fda635d74
--- /dev/null
+++ b/backend/notification_v2/provider/webhook/slack_webhook.py
@@ -0,0 +1,33 @@
+import logging
+from typing import Any
+
+from notification_v2.clubbed_renderer import render_clubbed_message
+from notification_v2.enums import PlatformType
+from notification_v2.provider.webhook.webhook import Webhook
+
+logger = logging.getLogger(__name__)
+
+
+class SlackWebhook(Webhook):
+    def send(self) -> None:
+        """Send the Slack webhook notification."""
+        formatted_payload = self.format_payload()
+        self.payload = formatted_payload
+        super().send()
+
+    def get_headers(self) -> dict[str, str]:
+        """Slack-specific headers."""
+        headers = super().get_headers()
+        headers["Content-Type"] = "application/json"
+        return headers
+
+    def format_payload(self) -> dict[str, Any]:
+        """Render the IMMEDIATE event through the canonical envelope.
+
+        Single shared renderer for IMMEDIATE and BATCHED so receivers see the
+        same Slack body shape regardless of delivery mode.
+        """
+        return render_clubbed_message(
+            payloads=[self.payload],
+            platform=PlatformType.SLACK.value,
+        )
diff --git a/backend/notification_v2/provider/webhook/webhook.py b/backend/notification_v2/provider/webhook/webhook.py
new file mode 100644
index 0000000000..40ddc53e61
--- /dev/null
+++ b/backend/notification_v2/provider/webhook/webhook.py
@@ -0,0 +1,103 @@
+import logging
+
+from backend.celery_service import app as celery_app
+from notification_v2.enums import AuthorizationType
+from notification_v2.provider.notification_provider import NotificationProvider
+
+logger = logging.getLogger(__name__)
+
+
+class WebhookNotificationArg:
+    MAX_RETRIES = "max_retries"
+    RETRY_DELAY = "retry_delay"
+
+
+class HeaderConstants:
+    APPLICATION_JSON = "application/json"
+
+
+class Webhook(NotificationProvider):
+    def send(self) -> None:
+        """Send the webhook notification."""
+        try:
+            headers = self.get_headers()
+            self.validate()
+        except ValueError as e:
+            logger.error(f"Error validating notification {self.notification} :: {e}")
+            return
+        celery_app.send_task(
+            "send_webhook_notification",
+            args=[
+                self.notification.url,
+                self.payload,
+                headers,
+                self.NOTIFICATION_TIMEOUT,
+            ],
+            kwargs={
+                WebhookNotificationArg.MAX_RETRIES: self.notification.max_retries,
+                WebhookNotificationArg.RETRY_DELAY: self.RETRY_DELAY,
+            },
+        )
+
+    def validate(self):
+        """Validate notification.
+
+        Raises:
+            ValueError: If the webhook URL or the payload is missing.
+        """
+        if not self.notification.url:
+            raise ValueError("Webhook URL is required.")
+        if not self.payload:
+            raise ValueError("Payload is required.")
+        return super().validate()
+
+    def get_headers(self) -> dict[str, str]:
+        """Get the headers for the notification based on the authorization type and key.
+
+        Raises:
+            ValueError: If the authorization settings are unsupported or incomplete.
+
+        Returns:
+            dict[str, str]: A dictionary containing the headers.
+        """
+        headers: dict[str, str] = {}
+        try:
+            authorization_type = AuthorizationType(
+                self.notification.authorization_type.upper()
+            )
+        except ValueError:
+            raise ValueError(
+                "Unsupported authorization type: "
+                f"{self.notification.authorization_type}"
+            )
+        authorization_key = self.notification.authorization_key
+        authorization_header = self.notification.authorization_header
+
+        header_formats = {
+            AuthorizationType.BEARER: lambda key: {
+                "Authorization": f"Bearer {key}",
+                "Content-Type": HeaderConstants.APPLICATION_JSON,
+            },
+            AuthorizationType.API_KEY: lambda key: {
+                "Authorization": key,
+                "Content-Type": HeaderConstants.APPLICATION_JSON,
+            },
+            AuthorizationType.CUSTOM_HEADER: lambda key: {
+                authorization_header: key,
+                "Content-Type": HeaderConstants.APPLICATION_JSON,
+            },
+            AuthorizationType.NONE: lambda _: {
+                "Content-Type": HeaderConstants.APPLICATION_JSON,
+            },
+        }
+
+        if authorization_type not in header_formats:
+            raise ValueError(f"Unsupported authorization type: {authorization_type}")
+
+        headers = header_formats[authorization_type](authorization_key)
+
+        # Check if custom header type has required details
+        if authorization_type == AuthorizationType.CUSTOM_HEADER:
+            if not authorization_header or not authorization_key:
+                raise ValueError("Custom header or key missing for custom authorization.")
+        return headers

From ba04d587fb380e5dc36bd2a7689dad82d3539772 Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 19:45:52 +0530
Subject: [PATCH 24/27] add legacy code

---
 backend/notification_v2/internal_serializers.py | 1 -
 backend/notification_v2/serializers.py          | 7 +------
 2 files changed, 1 insertion(+), 7 deletions(-)

diff --git a/backend/notification_v2/internal_serializers.py b/backend/notification_v2/internal_serializers.py
index db7a35ab32..94669d64a4 100644
--- a/backend/notification_v2/internal_serializers.py
+++ b/backend/notification_v2/internal_serializers.py
@@ -23,7 +23,6 @@ class Meta:
             "platform",
             "max_retries",
             "is_active",
-            "delivery_mode",
             "created_at",
             "modified_at",
             "pipeline",
diff --git a/backend/notification_v2/serializers.py b/backend/notification_v2/serializers.py
index 956a25b86e..79802be90b 100644
--- a/backend/notification_v2/serializers.py
+++ b/backend/notification_v2/serializers.py
@@ -1,7 +1,7 @@
 from rest_framework import serializers
 from utils.input_sanitizer import validate_name_field
 
-from .enums import AuthorizationType, DeliveryMode, NotificationType, PlatformType
+from .enums import AuthorizationType, NotificationType, PlatformType
 from .models import Notification
 
 
@@ -21,11 +21,6 @@ class NotificationSerializer(serializers.ModelSerializer):
         max_value=4, min_value=0, default=0, required=False
     )
     notify_on_failures = serializers.BooleanField(default=False, required=False)
-    delivery_mode = serializers.ChoiceField(
-        choices=DeliveryMode.choices(),
-        default=DeliveryMode.BATCHED.value,
-        required=False,
-    )
 
     class Meta:
         model = Notification

From b1fd243c347cfb5c3696e6fec7a1cc79d2a3685f Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Wed, 13 May 2026 19:57:08 +0530
Subject: [PATCH 25/27] greptile review

---
 backend/notification_v2/internal_api_views.py  | 10 ++++++++++
 workers/shared/patterns/notification/helper.py |  7 +++++--
 2 files changed, 15 insertions(+), 2 deletions(-)

diff --git a/backend/notification_v2/internal_api_views.py b/backend/notification_v2/internal_api_views.py
index 6409f6bdf6..27d701bc0f 100644
--- a/backend/notification_v2/internal_api_views.py
+++ b/backend/notification_v2/internal_api_views.py
@@ -339,6 +339,16 @@ def enqueue_notification_buffer(request: HttpRequest) -> JsonResponse:
             {"status": "error", "message": "Notification not found"}, status=404
         )
 
+    # INPROGRESS fires from the scheduler before a WorkflowExecution exists,
+    # so the GET-side `_apply_failure_filter` cannot run (no execution → no
+    # filter applied) and returns notify_on_failures=True rows too. Drop the
+    # event here so failure-only subscribers never receive a run-start.
+    if (
+        notification.notify_on_failures
+        and body.get("status") == Pipeline.PipelineStatus.INPROGRESS
+    ):
+        return JsonResponse({"status": "ok", "buffer_row_id": None})
+
     # type / timestamp / additional_data stay optional during rollout — older
     # worker builds that don't forward them still produce a usable row
     # (renderer falls back to "Type: —" / no Additional Data line).
diff --git a/workers/shared/patterns/notification/helper.py b/workers/shared/patterns/notification/helper.py
index 79009a71a3..ed00475ea0 100644
--- a/workers/shared/patterns/notification/helper.py
+++ b/workers/shared/patterns/notification/helper.py
@@ -58,7 +58,8 @@ def _enqueue_to_buffer(
             },
             timeout=10,
         )
-    except Exception:  # noqa: BLE001 — propagate any failure, don't classify
+    # Propagate any failure; caller decides whether to continue iteration.
+    except Exception:  # noqa: BLE001
         logger.exception(
             "Failed to enqueue BATCHED notification %s for pipeline %s",
             notification["id"],
@@ -95,7 +96,9 @@ def _route_notification(
 
     try:
         _enqueue_to_buffer(api_client, notification, payload)
-    except Exception:  # noqa: BLE001 — already logged with stack inside
+    # Already logged with stack inside _enqueue_to_buffer; broad catch keeps
+    # sibling notifications going.
+    except Exception:  # noqa: BLE001
         logger.warning(
             "Buffer enqueue failed for notification %s; continuing with others",
             notification.get("id"),

From fb47c4fe22d2e2a1a5c7dd66904925258f937f2c Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Thu, 14 May 2026 17:22:57 +0530
Subject: [PATCH 26/27] greptile review

---
 backend/notification_v2/internal_api_views.py | 27 ++++++++++++++-----
 1 file changed, 21 insertions(+), 6 deletions(-)

diff --git a/backend/notification_v2/internal_api_views.py b/backend/notification_v2/internal_api_views.py
index 27d701bc0f..d823da302f 100644
--- a/backend/notification_v2/internal_api_views.py
+++ b/backend/notification_v2/internal_api_views.py
@@ -374,17 +374,32 @@ def enqueue_notification_buffer(request: HttpRequest) -> JsonResponse:
 
 
 def _gc_terminal_rows() -> int:
-    """Delete DISPATCHED / DEAD_LETTER rows older than the retention window.
-
-    PENDING rows are intentionally untouched regardless of age — they
-    represent live work the flush job still owns.
+    """Delete buffer rows past the retention window.
+
+    Two sweeps:
+    - Terminal rows (DISPATCHED / DEAD_LETTER) older than the retention
+      window: hygiene for completed work.
+    - PENDING rows whose source notification has been deactivated and
+      whose ``flush_after`` has aged past the same window: ``_dispatch_group``
+      filters ``notification__is_active=True``, so without this sweep
+      these rows are unreachable from both dispatch and GC and would
+      accumulate forever in the partial PENDING index.
+
+    PENDING rows attached to active notifications are intentionally
+    untouched regardless of age — they represent live work the flush
+    job still owns.
     """
     cutoff = timezone.now() - timedelta(days=settings.NOTIFICATION_BUFFER_RETENTION_DAYS)
-    deleted_count, _ = NotificationBuffer.objects.filter(
+    terminal_deleted, _ = NotificationBuffer.objects.filter(
         status__in=[BufferStatus.DISPATCHED.value, BufferStatus.DEAD_LETTER.value],
         created_at__lt=cutoff,
     ).delete()
-    return int(deleted_count)
+    inactive_deleted, _ = NotificationBuffer.objects.filter(
+        status=BufferStatus.PENDING.value,
+        notification__is_active=False,
+        flush_after__lt=cutoff,
+    ).delete()
+    return int(terminal_deleted) + int(inactive_deleted)
 
 
 def _send_clubbed(

From b8699f4eefe026cfccb94f5c41a3c7840c3ef016 Mon Sep 17 00:00:00 2001
From: kirtimanmishrazipstack <kirtiman.mishra@zipstack.com>
Date: Fri, 22 May 2026 17:11:39 +0530
Subject: [PATCH 27/27] UI as per new designs

---
 .../DisplayNotifications.jsx                  |   2 +-
 .../settings/platform/PlatformSettings.css    |  51 ++++-
 .../settings/platform/PlatformSettings.jsx    | 188 ++++++++++--------
 3 files changed, 150 insertions(+), 91 deletions(-)

diff --git a/frontend/src/components/pipelines-or-deployments/notification-modal/DisplayNotifications.jsx b/frontend/src/components/pipelines-or-deployments/notification-modal/DisplayNotifications.jsx
index 9754dd20ab..6860bf0258 100644
--- a/frontend/src/components/pipelines-or-deployments/notification-modal/DisplayNotifications.jsx
+++ b/frontend/src/components/pipelines-or-deployments/notification-modal/DisplayNotifications.jsx
@@ -91,7 +91,7 @@ function DisplayNotifications({
           indicator: <SpinnerLoader />,
           spinning: isLoading,
         }}
-        pagination={{ pageSize: 5 }}
+        pagination={false}
       />
     </SpaceWrapper>
   );
diff --git a/frontend/src/components/settings/platform/PlatformSettings.css b/frontend/src/components/settings/platform/PlatformSettings.css
index 4ad6f4bf8e..da0da79318 100644
--- a/frontend/src/components/settings/platform/PlatformSettings.css
+++ b/frontend/src/components/settings/platform/PlatformSettings.css
@@ -2,7 +2,7 @@
 
 .plt-set-layout {
   height: calc(100vh - 60px);
-  background-color: #ffffff;
+  background-color: var(--page-bg-3);
 }
 
 .plt-set-layout-2 {
@@ -10,9 +10,10 @@
 }
 
 .plt-set-head {
-  background-color: #f5f7f9;
+  background-color: var(--white);
   padding: 14px;
   height: 60px;
+  border-bottom: 1px solid var(--border-color-1);
 }
 
 .plt-set-head-typo {
@@ -20,14 +21,56 @@
   font-weight: 600;
 }
 
+.plt-set-section {
+  margin-bottom: 16px;
+}
+
+.plt-set-section > .ant-typography {
+  margin-top: 0;
+}
+
+.plt-set-section-subtitle {
+  display: block;
+  margin-bottom: 8px;
+  font-size: 12px;
+}
+
+.plt-set-inner-card {
+  background-color: #f5f7f9;
+  border: 1px solid #e5e7eb;
+  border-radius: 8px;
+  padding: 16px;
+}
+
 .plt-set-key-head {
+  display: flex;
+  align-items: center;
+  gap: 8px;
   margin-bottom: 8px;
 }
 
-.plt-set-key-head-col-1 {
-  padding-right: 16px;
+.plt-set-key-pill-clickable {
+  cursor: pointer;
 }
 
 .plt-set-key-display {
   width: 300px;
 }
+
+.plt-set-notif-field-label {
+  display: block;
+  margin-bottom: 8px;
+  font-size: 13px;
+}
+
+.plt-set-notif-field-row {
+  display: flex;
+  align-items: center;
+  gap: 8px;
+}
+
+.plt-set-notif-helper {
+  display: block;
+  margin-top: 6px;
+  font-size: 12px;
+}
diff --git a/frontend/src/components/settings/platform/PlatformSettings.jsx b/frontend/src/components/settings/platform/PlatformSettings.jsx
index f2eee087b0..88a4613e78 100644
--- a/frontend/src/components/settings/platform/PlatformSettings.jsx
+++ b/frontend/src/components/settings/platform/PlatformSettings.jsx
@@ -9,9 +9,8 @@ import {
   Divider,
   Input,
   InputNumber,
-  Radio,
   Row,
-  Space,
+  Tag,
   Typography,
 } from "antd";
 import { useEffect, useState } from "react";
@@ -326,94 +325,110 @@ function PlatformSettings() {
         <div className="plt-set-layout">
           <IslandLayout>
             <div className="plt-set-layout-2">
-              <div>
+              <div className="plt-set-section">
                 <Typography.Title level={5}>Internal API Keys</Typography.Title>
-                {keys.map((keyDetails, keyIndex) => {
-                  return (
-                    <div key={keyDetails?.keyName}>
-                      <div>
-                        <div className="plt-set-key-head">
-                          <Row>
-                            <Col>
-                              <div className="plt-set-key-head-col-1">
-                                <Typography.Text>
-                                  {keyDetails?.keyName}
-                                </Typography.Text>
-                              </div>
-                            </Col>
-                            <Col>
-                              <div className="plt-set-key-head-col-2">
-                                <Radio
-                                  checked={
-                                    keyDetails?.id && activeKey === keyIndex
-                                  }
-                                  disabled={keyDetails?.id === null}
-                                  onClick={() => handleToggle(keyIndex)}
-                                >
-                                  Active Key
-                                </Radio>
-                              </div>
-                            </Col>
-                          </Row>
-                        </div>
+                <Typography.Text
+                  type="secondary"
+                  className="plt-set-section-subtitle"
+                >
+                  Authenticate platform-to-platform requests. Keep these values
+                  secret.
+                </Typography.Text>
+                <div className="plt-set-inner-card">
+                  {keys.map((keyDetails, keyIndex) => {
+                    const isActive =
+                      Boolean(keyDetails?.id) && activeKey === keyIndex;
+                    const canActivate = keyDetails?.id !== null;
+                    return (
+                      <div key={keyDetails?.keyName}>
                         <div>
-                          <Row gutter={10}>
-                            <Col>
-                              <div className="plt-set-key-display">
-                                <Input
-                                  size="small"
-                                  value={keys[keyIndex].key}
-                                  suffix={
-                                    <CopyOutlined
-                                      onClick={() =>
-                                        copyText(keys[keyIndex].key)
-                                      }
-                                    />
-                                  }
-                                />
-                              </div>
-                            </Col>
-                            <Col>
-                              <Button
-                                size="small"
-                                loading={isLoadingIndex === keyIndex}
-                                onClick={() => handleGenerate(keyIndex)}
-                              >
-                                {keyDetails?.id?.length > 0
-                                  ? "Refresh"
-                                  : "Generate"}
-                              </Button>
-                            </Col>
-                            <Col>
-                              <ConfirmModal
-                                handleConfirm={() => handleDelete(keyIndex)}
-                                content="Want to delete this platform key? This action cannot be undone."
-                                okText="Delete"
+                          <div className="plt-set-key-head">
+                            <Typography.Text>
+                              {keyDetails?.keyName}
+                            </Typography.Text>
+                            {isActive ? (
+                              <Tag color="success">Active</Tag>
+                            ) : (
+                              <Tag
+                                className={
+                                  canActivate
+                                    ? "plt-set-key-pill-clickable"
+                                    : undefined
+                                }
+                                onClick={
+                                  canActivate
+                                    ? () => handleToggle(keyIndex)
+                                    : undefined
+                                }
                               >
+                                Inactive
+                              </Tag>
+                            )}
+                          </div>
+                          <div>
+                            <Row gutter={10}>
+                              <Col>
+                                <div className="plt-set-key-display">
+                                  <Input
+                                    size="small"
+                                    value={keys[keyIndex].key}
+                                    suffix={
+                                      <CopyOutlined
+                                        onClick={() =>
+                                          copyText(keys[keyIndex].key)
+                                        }
+                                      />
+                                    }
+                                  />
+                                </div>
+                              </Col>
+                              <Col>
                                 <Button
                                   size="small"
-                                  icon={<DeleteOutlined />}
-                                  disabled={keyDetails?.id === null}
-                                  loading={isDeletingIndex === keyIndex}
-                                />
-                              </ConfirmModal>
-                            </Col>
-                          </Row>
+                                  loading={isLoadingIndex === keyIndex}
+                                  onClick={() => handleGenerate(keyIndex)}
+                                >
+                                  {keyDetails?.id?.length > 0
+                                    ? "Refresh"
+                                    : "Generate"}
+                                </Button>
+                              </Col>
+                              <Col>
+                                <ConfirmModal
+                                  handleConfirm={() => handleDelete(keyIndex)}
+                                  content="Want to delete this platform key? This action cannot be undone."
+                                  okText="Delete"
+                                >
+                                  <Button
+                                    size="small"
+                                    icon={<DeleteOutlined />}
+                                    disabled={keyDetails?.id === null}
+                                    loading={isDeletingIndex === keyIndex}
+                                  />
+                                </ConfirmModal>
+                              </Col>
+                            </Row>
+                          </div>
                         </div>
+                        {keyIndex < keys?.length - 1 && <Divider />}
                       </div>
-                      {keyIndex < keys?.length - 1 && <Divider />}
-                    </div>
-                  );
-                })}
+                    );
+                  })}
+                </div>
               </div>
-              <Divider />
-              <div className="plt-set-batch-interval">
+              <div className="plt-set-section">
                 <Typography.Title level={5}>Notifications</Typography.Title>
-                <div style={{ marginTop: 12 }}>
-                  <Space>
-                    <Typography.Text>
-                      Notification interval (minutes, 1–120)
-                    </Typography.Text>
+                <Typography.Text
+                  type="secondary"
+                  className="plt-set-section-subtitle"
+                >
+                  Control how often the platform notifies you about activity.
+                </Typography.Text>
+                <div className="plt-set-inner-card">
+                  <Typography.Text className="plt-set-notif-field-label">
+                    Notification interval
+                  </Typography.Text>
+                  <div className="plt-set-notif-field-row">
                     <InputNumber
                       min={1}
                       max={120}
@@ -429,12 +444,13 @@ function PlatformSettings() {
                     >
                       Save
                     </Button>
-                  </Space>
-                  <div style={{ marginTop: 4 }}>
-                    <Typography.Text type="secondary">
-                      Allowed: 1–120 minutes. Default: 5 minutes.
-                    </Typography.Text>
                   </div>
+                  <Typography.Text
+                    type="secondary"
+                    className="plt-set-notif-helper"
+                  >
+                    Allowed: 1 to 120 minutes. Default: 5 minutes.
+                  </Typography.Text>
                 </div>
               </div>
             </div>