From 36463bb9b68314995ac451db33d1f345855416a6 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Thu, 2 Apr 2026 01:57:01 +0530
Subject: [PATCH 01/57] UN-2946 [FEAT] Add lightweight list serializer for
 Prompt Studio and prompt list endpoint

- Add CustomToolListSerializer for the list action to avoid N+1 queries
  (profile lookups, prompt fetching, coverage calculation per tool)
- Add ToolStudioPromptListSerializer with only prompt_id, prompt_key,
  enforce_type, sequence_number
- Add GET /prompt-studio/prompt/?tool_id={uuid} list endpoint
- List action uses select_related and Subquery annotation for prompt_count
- Detail endpoint unchanged (still uses full CustomToolSerializer)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 .../prompt_studio_v2/serializers.py             | 17 +++++++++++++++++
 backend/prompt_studio/prompt_studio_v2/urls.py  | 13 ++++++++++---
 backend/prompt_studio/prompt_studio_v2/views.py | 11 ++++++++++-
 3 files changed, 37 insertions(+), 4 deletions(-)

diff --git a/backend/prompt_studio/prompt_studio_v2/serializers.py b/backend/prompt_studio/prompt_studio_v2/serializers.py
index e1adddc33c..6a4d28032d 100644
--- a/backend/prompt_studio/prompt_studio_v2/serializers.py
+++ b/backend/prompt_studio/prompt_studio_v2/serializers.py
@@ -5,6 +5,23 @@
 from .models import ToolStudioPrompt
 
 
+class ToolStudioPromptListSerializer(serializers.ModelSerializer):
+    """Lightweight serializer for listing prompts by tool.
+
+    Returns only the fields needed for linking/display without
+    output data or coverage calculation.
+    """
+
+    class Meta:
+        model = ToolStudioPrompt
+        fields = [
+            "prompt_id",
+            "prompt_key",
+            "enforce_type",
+            "sequence_number",
+        ]
+
+
 class ToolStudioPromptSerializer(AuditSerializer):
     class Meta:
         model = ToolStudioPrompt
diff --git a/backend/prompt_studio/prompt_studio_v2/urls.py b/backend/prompt_studio/prompt_studio_v2/urls.py
index 23e5f02438..0ce3d03545 100644
--- a/backend/prompt_studio/prompt_studio_v2/urls.py
+++ b/backend/prompt_studio/prompt_studio_v2/urls.py
@@ -3,6 +3,8 @@
 
 from .views import ToolStudioPromptView
 
+prompt_studio_prompt_list = ToolStudioPromptView.as_view({"get": "list"})
+
 prompt_studio_prompt_detail = ToolStudioPromptView.as_view(
     {
         "get": "retrieve",
@@ -16,15 +18,20 @@
 
 urlpatterns = format_suffix_patterns(
     [
+        path(
+            "prompt/reorder/",
+            reorder_prompts,
+            name="reorder_prompts",
+        ),
         path(
             "prompt/<uuid:pk>/",
             prompt_studio_prompt_detail,
             name="tool-studio-prompt-detail",
         ),
         path(
-            "prompt/reorder/",
-            reorder_prompts,
-            name="reorder_prompts",
+            "prompt/",
+            prompt_studio_prompt_list,
+            name="tool-studio-prompt-list",
         ),
     ]
 )
diff --git a/backend/prompt_studio/prompt_studio_v2/views.py b/backend/prompt_studio/prompt_studio_v2/views.py
index f120baf15f..a540480274 100644
--- a/backend/prompt_studio/prompt_studio_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_v2/views.py
@@ -10,7 +10,10 @@
 from prompt_studio.prompt_studio_v2.constants import ToolStudioPromptKeys
 from prompt_studio.prompt_studio_v2.controller import PromptStudioController
 from prompt_studio.prompt_studio_v2.models import ToolStudioPrompt
-from prompt_studio.prompt_studio_v2.serializers import ToolStudioPromptSerializer
+from prompt_studio.prompt_studio_v2.serializers import (
+    ToolStudioPromptListSerializer,
+    ToolStudioPromptSerializer,
+)
 
 
 class ToolStudioPromptView(viewsets.ModelViewSet):
@@ -28,8 +31,14 @@ class ToolStudioPromptView(viewsets.ModelViewSet):
 
     versioning_class = URLPathVersioning
     serializer_class = ToolStudioPromptSerializer
+
     permission_classes: list[type[PromptAcesssToUser]] = [PromptAcesssToUser]
 
+    def get_serializer_class(self):
+        if self.action == "list":
+            return ToolStudioPromptListSerializer
+        return ToolStudioPromptSerializer
+
     def get_queryset(self) -> QuerySet | None:
         filter_args = FilterHelper.build_filter_args(
             self.request,

From 9300a4d67db47bf78818fd5d06f0541bb0ba9238 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Thu, 2 Apr 2026 01:57:29 +0530
Subject: [PATCH 02/57] UN-2946 [FEAT] Add Look-Ups plugin integration in
 sidebar nav and routes

- Add lookup-studio plugin detection with dynamic import
- Add PromptStudioPopoverContent for hover submenu (Projects / Look-Ups)
  following the same Popover pattern as HITL and Platform Settings
- Register lookups/* route in useMainAppRoutes.js

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 .../navigations/side-nav-bar/SideNavBar.jsx   | 118 ++++++++++++++++++
 frontend/src/routes/useMainAppRoutes.js       |   9 ++
 2 files changed, 127 insertions(+)

diff --git a/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx b/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
index bb328b1a98..3f6f43733f 100644
--- a/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
+++ b/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
@@ -89,6 +89,14 @@ try {
   // Plugin unavailable
 }
 
+let lookupStudioEnabled = false;
+try {
+  await import("../../../plugins/lookup-studio");
+  lookupStudioEnabled = true;
+} catch {
+  // Plugin unavailable
+}
+
 let manualReviewSettingsEnabled = false;
 try {
   await import("../../../plugins/manual-review/settings/Settings.jsx");
@@ -258,6 +266,45 @@ HITLPopoverContent.propTypes = {
   navigate: PropTypes.func.isRequired,
 };
 
+const PROMPT_STUDIO_MENU_ITEMS = [
+  { key: "projects", label: "Projects", subPath: "/tools" },
+  { key: "lookups", label: "Look-Ups", subPath: "/lookups" },
+];
+
+const getActivePromptStudioKey = (orgName) => {
+  const currentPath = globalThis.location.pathname;
+  if (currentPath.startsWith(`/${orgName}/lookups`)) {
+    return "lookups";
+  }
+  return "projects";
+};
+
+const PromptStudioPopoverContent = ({ orgName, navigate }) => {
+  const activeKey = getActivePromptStudioKey(orgName);
+
+  return (
+    <nav className="settings-sidebar-popover">
+      {PROMPT_STUDIO_MENU_ITEMS.map((menuItem) => (
+        <button
+          key={menuItem.key}
+          type="button"
+          className={`settings-menu-item ${
+            activeKey === menuItem.key ? "active" : ""
+          }`}
+          onClick={() => navigate(`/${orgName}${menuItem.subPath}`)}
+        >
+          {menuItem.label}
+        </button>
+      ))}
+    </nav>
+  );
+};
+
+PromptStudioPopoverContent.propTypes = {
+  orgName: PropTypes.string.isRequired,
+  navigate: PropTypes.func.isRequired,
+};
+
 const SideNavBar = ({ collapsed, setCollapsed }) => {
   const navigate = useNavigate();
   const { sessionDetails } = useSessionStore();
@@ -506,6 +553,14 @@ const SideNavBar = ({ collapsed, setCollapsed }) => {
     });
   }
 
+  // Mark Prompt Studio item for popover rendering when lookups plugin is available
+  if (lookupStudioEnabled && isUnstract) {
+    const psItem = data[0]?.subMenu?.find((el) => el.id === 1.1);
+    if (psItem) {
+      psItem.hasLookupPopover = true;
+    }
+  }
+
   // Add HITL Review section if plugin is available and user has HITL role
   const isHITLRole = [
     "unstract_reviewer",
@@ -700,6 +755,69 @@ const SideNavBar = ({ collapsed, setCollapsed }) => {
                       );
                     }
 
+                    // Prompt Studio with Look-Ups popover
+                    if (el.hasLookupPopover) {
+                      const psContent = (
+                        <Tooltip title={collapsed ? el.title : ""}>
+                          <Space
+                            className={`space-styles ${
+                              el.active ||
+                              globalThis.location.pathname.startsWith(
+                                `/${orgName}/lookups`,
+                              )
+                                ? "space-styles-active"
+                                : ""
+                            } ${el.disable ? "space-styles-disable" : ""}`}
+                            onClick={() => {
+                              if (!el.disable) {
+                                navigate(el.path);
+                              }
+                            }}
+                            data-testid="sidebar-prompt-studio"
+                          >
+                            <Image
+                              src={el.image}
+                              alt="side_icon"
+                              className="menu-item-icon"
+                              preview={false}
+                            />
+                            {!collapsed && (
+                              <div>
+                                <Typography className="sidebar-item-text fs-14">
+                                  {el.title}
+                                </Typography>
+                                <Typography className="sidebar-item-text fs-11">
+                                  {el.description}
+                                </Typography>
+                              </div>
+                            )}
+                          </Space>
+                        </Tooltip>
+                      );
+
+                      if (el.disable) {
+                        return <div key={el.id}>{psContent}</div>;
+                      }
+
+                      return (
+                        <Popover
+                          key={el.id}
+                          content={
+                            <PromptStudioPopoverContent
+                              orgName={orgName}
+                              navigate={navigate}
+                            />
+                          }
+                          trigger="hover"
+                          placement="rightTop"
+                          arrow={false}
+                          overlayClassName="settings-popover-overlay"
+                        >
+                          {psContent}
+                        </Popover>
+                      );
+                    }
+
                     return (
                       <Tooltip key={el.id} title={collapsed ? el.title : ""}>
                         <Space
diff --git a/frontend/src/routes/useMainAppRoutes.js b/frontend/src/routes/useMainAppRoutes.js
index 1d5849b103..768dfee976 100644
--- a/frontend/src/routes/useMainAppRoutes.js
+++ b/frontend/src/routes/useMainAppRoutes.js
@@ -61,6 +61,14 @@ try {
   // Do nothing, Not-found Page will be triggered.
 }
 
+let LookupStudio;
+try {
+  const mod = await import("../plugins/lookup-studio");
+  LookupStudio = mod.LookupStudio;
+} catch {
+  // Do nothing, Not-found Page will be triggered.
+}
+
 try {
   const mod1 = await import("../plugins/app-deployment/AppDeployments.jsx");
   AppDeployments = mod1.AppDeployments;
@@ -180,6 +188,7 @@ function useMainAppRoutes() {
             element={<AgenticPromptStudio />}
           />
         )}
+        {LookupStudio && <Route path="lookups/*" element={<LookupStudio />} />}
         <Route path="logs" element={<LogsPage />} />
         <Route path="logs/:type/:id/" element={<LogsPage />} />
         <Route

From e36562d617deb73b5742f67fc4c9a00f0de34c23 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Thu, 2 Apr 2026 14:11:02 +0530
Subject: [PATCH 03/57] UN-2946 [FIX] Use .get() fallback for
 prompt_studio_tool in create_profile_manager

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 backend/prompt_studio/prompt_studio_core_v2/views.py | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/backend/prompt_studio/prompt_studio_core_v2/views.py b/backend/prompt_studio/prompt_studio_core_v2/views.py
index 22c1a378bb..e936e3dcae 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/views.py
@@ -824,9 +824,10 @@ def create_profile_manager(self, request: HttpRequest, pk: Any = None) -> Respon
         serializer = ProfileManagerSerializer(data=request.data, context=context)
         serializer.is_valid(raise_exception=True)
         # Check for the maximum number of profiles constraint
-        prompt_studio_tool = serializer.validated_data[
-            ProfileManagerKeys.PROMPT_STUDIO_TOOL
-        ]
+        prompt_studio_tool = (
+            serializer.validated_data.get(ProfileManagerKeys.PROMPT_STUDIO_TOOL)
+            or self.get_object()
+        )
         profile_count = ProfileManager.objects.filter(
             prompt_studio_tool=prompt_studio_tool
         ).count()

From 4765e99bc5a3d1bd17360795b7e17d468e00a5b9 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Sat, 4 Apr 2026 03:40:14 +0530
Subject: [PATCH 04/57] UN-2946 [FEAT] Add Lookups V2 OSS integration hooks for
 post-extraction enrichment
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Add lookup_config export in prompt_studio_helper and registry_helper
  via cloud plugin guard (try/except ImportError)
- Store the raw LLM output in PromptStudioOutputManager and the enriched
  value in the cloud-only LookupOutputResult — preserving both for the
  UI tab display
- Add LookupEnrichmentProtocol and plugin call in post-extraction
  pipeline using ExecutorPluginLoader (no-op in OSS)
- Track lookup LLM usage via standard metrics pipeline
  (usage_kwargs with run_id/execution_id, capture_metrics)
- Move webhook postprocessing from answer_prompt to pipeline
- Frontend: dynamic plugin imports for LookupMenuItem, LookupIndicator,
  LookupOutputTabs in prompt cards; fetch lookup outputs on page load
- Add scroll-to-prompt support via query param in DocumentParser

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 .gitignore                                    |   1 +
 .../prompt_studio_helper.py                   |  35 ++++++
 .../output_manager_helper.py                  |  35 ++++++
 .../prompt_studio_registry_helper.py          |  11 ++
 .../document-parser/DocumentParser.jsx        |  23 +++-
 .../custom-tools/prompt-card/Header.jsx       |  24 ++++
 .../prompt-card/PromptCardItems.jsx           |  13 ++
 .../custom-tools/prompt-card/PromptOutput.jsx | 116 +++++++++++++-----
 .../helpers/custom-tools/CustomToolsHelper.js |  26 ++++
 frontend/src/hooks/usePromptOutput.js         |  14 +++
 workers/executor/executors/answer_prompt.py   |  25 +---
 workers/executor/executors/legacy_executor.py |  89 ++++++++++++++
 .../executor/executors/plugins/protocols.py   |   7 ++
 13 files changed, 366 insertions(+), 53 deletions(-)

diff --git a/.gitignore b/.gitignore
index f6837ce079..cd4084ecdd 100644
--- a/.gitignore
+++ b/.gitignore
@@ -703,3 +703,4 @@ CONTRIBUTION_GUIDE.md
 
 # MCP servers
 .serena
+.gstack/
diff --git a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
index d0ffef3114..9b76a86782 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
@@ -387,6 +387,18 @@ def _build_prompt_output(
         if webhook_enabled:
             output[TSPKeys.POSTPROCESSING_WEBHOOK_URL] = webhook_url
 
+        # Lookup config (cloud plugin hook)
+        try:
+            from pluggable_apps.lookup_v1.execution import (
+                build_lookup_config_for_prompt,
+            )
+
+            lookup_config = build_lookup_config_for_prompt(prompt)
+            if lookup_config:
+                output["lookup_config"] = lookup_config
+        except ImportError:
+            pass
+
         output[TSPKeys.EVAL_SETTINGS] = {}
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_EVALUATE] = prompt.evaluate
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_MONITOR_LLM] = [monitor_llm]
@@ -798,6 +810,18 @@ def build_fetch_response_payload(
         if webhook_enabled:
             output[TSPKeys.POSTPROCESSING_WEBHOOK_URL] = webhook_url
 
+        # Lookup config (cloud plugin hook)
+        try:
+            from pluggable_apps.lookup_v1.execution import (
+                build_lookup_config_for_prompt,
+            )
+
+            lookup_config = build_lookup_config_for_prompt(prompt)
+            if lookup_config:
+                output["lookup_config"] = lookup_config
+        except ImportError:
+            pass
+
         output[TSPKeys.EVAL_SETTINGS] = {}
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_EVALUATE] = prompt.evaluate
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_MONITOR_LLM] = [monitor_llm]
@@ -1893,6 +1917,17 @@ def _fetch_response(
         output[TSPKeys.ENABLE_POSTPROCESSING_WEBHOOK] = webhook_enabled
         if webhook_enabled:
             output[TSPKeys.POSTPROCESSING_WEBHOOK_URL] = webhook_url
+        # Lookup config (cloud plugin hook)
+        try:
+            from pluggable_apps.lookup_v1.execution import (
+                build_lookup_config_for_prompt,
+            )
+
+            lookup_config = build_lookup_config_for_prompt(prompt)
+            if lookup_config:
+                output["lookup_config"] = lookup_config
+        except ImportError:
+            pass
         # Eval settings for the prompt
         output[TSPKeys.EVAL_SETTINGS] = {}
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_EVALUATE] = prompt.evaluate
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
index 405b91e00f..d0197e128f 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
@@ -170,6 +170,15 @@ def update_or_create_prompt_output(
 
             # TODO: use enums here
             output = outputs.get(prompt.prompt_key)
+
+            # If lookup enrichment ran, structured_output contains the enriched
+            # value. Restore the original raw LLM output for the prompt output
+            # table — the enriched value lives in LookupOutputResult instead.
+            lookup_outputs = metadata.get("lookup_outputs", {})
+            prompt_lookup = lookup_outputs.get(prompt.prompt_key)
+            if prompt_lookup and "original" in prompt_lookup:
+                output = prompt_lookup["original"]
+
             if prompt.enforce_type in {"json", "table", "record", "line-item"}:
                 output = json.dumps(output)
             eval_metrics = outputs.get(f"{prompt.prompt_key}__evaluation", [])
@@ -189,6 +198,32 @@ def update_or_create_prompt_output(
                 word_confidence_data=prompt_word_confidence_data,
             )
 
+            # Persist lookup outputs if present (cloud plugin)
+            if prompt_lookup:
+                try:
+                    from pluggable_apps.lookup_v1.models import (
+                        LookupOutputResult,
+                    )
+
+                    lookup_meta = prompt_lookup.get("meta", {})
+                    lookup_id = lookup_meta.get("lookup_id")
+                    if lookup_id:
+                        LookupOutputResult.objects.update_or_create(
+                            prompt_output=prompt_output,
+                            defaults={
+                                "lookup_definition_id": lookup_id,
+                                "output": prompt_lookup.get("enriched", ""),
+                            },
+                        )
+                except ImportError:
+                    pass
+                except Exception:
+                    logger.warning(
+                        "Failed to persist lookup output for prompt %s",
+                        prompt.prompt_key,
+                        exc_info=True,
+                    )
+
             # Serialize the instance
             serializer = PromptStudioOutputSerializer(prompt_output)
             serialized_data.append(serializer.data)
diff --git a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
index 6ce1f72095..87d4fa0def 100644
--- a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
+++ b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
@@ -355,6 +355,17 @@ def frame_export_json(
             output[JsonSchemaKey.POSTPROCESSING_WEBHOOK_URL] = (
                 prompt.postprocessing_webhook_url
             )
+            # Lookup config (cloud plugin hook)
+            try:
+                from pluggable_apps.lookup_v1.execution import (
+                    build_lookup_config_for_prompt,
+                )
+
+                lookup_config = build_lookup_config_for_prompt(prompt)
+                if lookup_config:
+                    output["lookup_config"] = lookup_config
+            except ImportError:
+                pass
             # Retaining the old fields in condition
             # for backward compatibility. To be removed in future.
             if (
diff --git a/frontend/src/components/custom-tools/document-parser/DocumentParser.jsx b/frontend/src/components/custom-tools/document-parser/DocumentParser.jsx
index 3d5c891e13..c5e60a2c93 100644
--- a/frontend/src/components/custom-tools/document-parser/DocumentParser.jsx
+++ b/frontend/src/components/custom-tools/document-parser/DocumentParser.jsx
@@ -1,5 +1,6 @@
 import PropTypes from "prop-types";
 import { useEffect, useRef, useState } from "react";
+import { useSearchParams } from "react-router-dom";
 
 import "./DocumentParser.css";
 import { promptType } from "../../../helpers/GetStaticData";
@@ -42,6 +43,7 @@ function DocumentParser({
   const [isChallenge, setIsChallenge] = useState(false);
   const [allTableSettings, setAllTableSettings] = useState([]);
   const bottomRef = useRef(null);
+  const [searchParams, setSearchParams] = useSearchParams();
   const {
     details,
     isSimplePromptStudio,
@@ -108,6 +110,25 @@ function DocumentParser({
     }
   }, [scrollToBottom]);
 
+  // Handle scrollTo query param for cross-linking from Lookup Studio
+  useEffect(() => {
+    const scrollToPromptId = searchParams.get("scrollTo");
+    if (!scrollToPromptId || !details?.prompts?.length) {
+      return;
+    }
+
+    const el = document.querySelector(`[data-prompt-id="${scrollToPromptId}"]`);
+    if (el) {
+      el.scrollIntoView({ behavior: "smooth", block: "center" });
+      el.classList.add("highlighted-prompt");
+      setTimeout(() => el.classList.remove("highlighted-prompt"), 2000);
+    }
+
+    // Clear the param so it doesn't re-trigger
+    searchParams.delete("scrollTo");
+    setSearchParams(searchParams, { replace: true });
+  }, [details?.prompts]);
+
   const promptUrl = (urlPath) => {
     return `/api/v1/unstract/${sessionDetails?.orgId}/prompt-studio/prompt/${urlPath}`;
   };
@@ -242,7 +263,7 @@ function DocumentParser({
     <div className="doc-parser-layout">
       {details?.prompts?.map((item) => {
         return (
-          <div key={item.prompt_id}>
+          <div key={item.prompt_id} data-prompt-id={item.prompt_id}>
             <div className="doc-parser-pad-top" />
             <PromptCardWrapper
               item={item}
diff --git a/frontend/src/components/custom-tools/prompt-card/Header.jsx b/frontend/src/components/custom-tools/prompt-card/Header.jsx
index 2b6d6b99c1..b8d7a1707e 100644
--- a/frontend/src/components/custom-tools/prompt-card/Header.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/Header.jsx
@@ -41,6 +41,16 @@ try {
   // The component will remain 'undefined' it is not available
 }
 
+let LookupMenuItem;
+try {
+  const mod = await import(
+    "../../../plugins/lookup-studio/prompt-card/LookupMenuItem"
+  );
+  LookupMenuItem = mod.LookupMenuItem;
+} catch {
+  // Not available in OSS
+}
+
 function Header({
   promptDetails,
   promptKey,
@@ -267,6 +277,20 @@ function Header({
           isPublicSource,
       },
     ];
+    if (LookupMenuItem && !isSimplePromptStudio) {
+      dropdownItems.splice(
+        dropdownItems.length - 1,
+        0,
+        {
+          type: "divider",
+        },
+        {
+          label: <LookupMenuItem promptDetails={promptDetails} />,
+          key: "lookup",
+        },
+      );
+    }
+
     if (isSimplePromptStudio) {
       dropdownItems.splice(0, 1);
     }
diff --git a/frontend/src/components/custom-tools/prompt-card/PromptCardItems.jsx b/frontend/src/components/custom-tools/prompt-card/PromptCardItems.jsx
index 90f4936a3a..40439bce55 100644
--- a/frontend/src/components/custom-tools/prompt-card/PromptCardItems.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/PromptCardItems.jsx
@@ -30,6 +30,16 @@ try {
   // The component will remain null of it is not available
 }
 
+let LookupIndicator;
+try {
+  const mod = await import(
+    "../../../plugins/lookup-studio/prompt-card/LookupIndicator"
+  );
+  LookupIndicator = mod.LookupIndicator;
+} catch {
+  // Not available in OSS
+}
+
 function PromptCardItems({
   promptDetails,
   enforceTypeList,
@@ -260,6 +270,9 @@ function PromptCardItems({
                           </Typography.Link>
                         </Space>
                       </Button>
+                      {LookupIndicator && (
+                        <LookupIndicator promptDetails={promptDetails} />
+                      )}
                     </Space>
                     <Space>
                       {details?.enable_highlight &&
diff --git a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
index 88df329744..02e552ae44 100644
--- a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
@@ -51,6 +51,16 @@ try {
   // The component will remain null of it is not available
 }
 
+let LookupOutputTabs;
+try {
+  const mod = await import(
+    "../../../plugins/lookup-studio/prompt-card/LookupOutputTabs"
+  );
+  LookupOutputTabs = mod.LookupOutputTabs;
+} catch {
+  // Not available in OSS
+}
+
 function PromptOutput({
   promptDetails,
   handleRun,
@@ -193,20 +203,46 @@ function PromptOutput({
             "highlighted-prompt-cell"
           }`}
         >
-          <DisplayPromptResult
-            output={promptOutput}
-            highlightData={
-              promptOutputData?.highlightData?.[promptDetails.prompt_key]
-            }
-            handleSelectHighlight={handleSelectHighlight}
-            confidenceData={
-              promptOutputData?.confidenceData?.[promptDetails.prompt_key]
-            }
-            wordConfidenceData={
-              promptOutputData?.wordConfidenceData?.[promptDetails.prompt_key]
-            }
-            progressMsg={progressMsg}
-          />
+          {LookupOutputTabs ? (
+            <LookupOutputTabs
+              promptId={promptId}
+              profileManagerId={defaultLlmProfile}
+              defaultLlmProfile={defaultLlmProfile}
+              promptOutputId={promptOutputData?.promptOutputId}
+            >
+              <DisplayPromptResult
+                output={promptOutput}
+                highlightData={
+                  promptOutputData?.highlightData?.[promptDetails.prompt_key]
+                }
+                handleSelectHighlight={handleSelectHighlight}
+                confidenceData={
+                  promptOutputData?.confidenceData?.[promptDetails.prompt_key]
+                }
+                wordConfidenceData={
+                  promptOutputData?.wordConfidenceData?.[
+                    promptDetails.prompt_key
+                  ]
+                }
+                progressMsg={progressMsg}
+              />
+            </LookupOutputTabs>
+          ) : (
+            <DisplayPromptResult
+              output={promptOutput}
+              highlightData={
+                promptOutputData?.highlightData?.[promptDetails.prompt_key]
+              }
+              handleSelectHighlight={handleSelectHighlight}
+              confidenceData={
+                promptOutputData?.confidenceData?.[promptDetails.prompt_key]
+              }
+              wordConfidenceData={
+                promptOutputData?.wordConfidenceData?.[promptDetails.prompt_key]
+              }
+              progressMsg={progressMsg}
+            />
+          )}
           <div className="prompt-profile-run">
             <CopyPromptOutputBtn
               isDisabled={isTableExtraction}
@@ -429,20 +465,44 @@ function PromptOutput({
                       handleTable(profileId, promptOutputData)
                     ) : (
                       <>
-                        <DisplayPromptResult
-                          output={promptOutputData?.output}
-                          profileId={profileId}
-                          docId={selectedDoc?.document_id}
-                          promptRunStatus={promptRunStatus}
-                          handleSelectHighlight={handleSelectHighlight}
-                          highlightData={promptOutputData?.highlightData}
-                          confidenceData={promptOutputData?.confidenceData}
-                          wordConfidenceData={
-                            promptOutputData?.wordConfidenceData
-                          }
-                          promptDetails={promptDetails}
-                          progressMsg={progressMsg}
-                        />
+                        {LookupOutputTabs ? (
+                          <LookupOutputTabs
+                            promptId={promptId}
+                            profileManagerId={profileId}
+                            defaultLlmProfile={defaultLlmProfile}
+                            promptOutputId={promptOutputData?.promptOutputId}
+                          >
+                            <DisplayPromptResult
+                              output={promptOutputData?.output}
+                              profileId={profileId}
+                              docId={selectedDoc?.document_id}
+                              promptRunStatus={promptRunStatus}
+                              handleSelectHighlight={handleSelectHighlight}
+                              highlightData={promptOutputData?.highlightData}
+                              confidenceData={promptOutputData?.confidenceData}
+                              wordConfidenceData={
+                                promptOutputData?.wordConfidenceData
+                              }
+                              promptDetails={promptDetails}
+                              progressMsg={progressMsg}
+                            />
+                          </LookupOutputTabs>
+                        ) : (
+                          <DisplayPromptResult
+                            output={promptOutputData?.output}
+                            profileId={profileId}
+                            docId={selectedDoc?.document_id}
+                            promptRunStatus={promptRunStatus}
+                            handleSelectHighlight={handleSelectHighlight}
+                            highlightData={promptOutputData?.highlightData}
+                            confidenceData={promptOutputData?.confidenceData}
+                            wordConfidenceData={
+                              promptOutputData?.wordConfidenceData
+                            }
+                            promptDetails={promptDetails}
+                            progressMsg={progressMsg}
+                          />
+                        )}
                         <div className="prompt-profile-run">
                           <CopyPromptOutputBtn
                             isDisabled={isTableExtraction}
diff --git a/frontend/src/components/helpers/custom-tools/CustomToolsHelper.js b/frontend/src/components/helpers/custom-tools/CustomToolsHelper.js
index 543ad9b14b..1c0f8efeab 100644
--- a/frontend/src/components/helpers/custom-tools/CustomToolsHelper.js
+++ b/frontend/src/components/helpers/custom-tools/CustomToolsHelper.js
@@ -19,6 +19,20 @@ try {
 } catch {
   // Do nothing, Not-found Page will be triggered.
 }
+
+let fetchLookupAssignments;
+let fetchLookupOutputs;
+let resetLookupAssignments;
+try {
+  const mod = await import(
+    "../../../plugins/lookup-studio/store/useFetchLookupAssignments"
+  );
+  fetchLookupAssignments = mod.fetchLookupAssignments;
+  fetchLookupOutputs = mod.fetchLookupOutputs;
+  resetLookupAssignments = mod.resetLookupAssignments;
+} catch {
+  // Lookup feature not available in OSS
+}
 function CustomToolsHelper() {
   const [isLoading, setIsLoading] = useState(true);
   const { id } = useParams();
@@ -115,6 +129,15 @@ function CustomToolsHelper() {
       .then((res) => {
         const data = res?.data;
         updatedCusTool["adapters"] = data;
+
+        // Fetch lookup data (cloud only, fire-and-forget)
+        if (fetchLookupAssignments) {
+          const toolId = updatedCusTool["details"]?.tool_id;
+          fetchLookupAssignments(axiosPrivate, sessionDetails?.orgId, toolId);
+          if (fetchLookupOutputs) {
+            fetchLookupOutputs(axiosPrivate, sessionDetails?.orgId, toolId);
+          }
+        }
       })
       .catch((err) => {
         setAlertDetails(handleException(err, "Failed to load the custom tool"));
@@ -131,6 +154,9 @@ function CustomToolsHelper() {
       setDefaultCustomTool();
       emptyCusToolMessages();
       resetTokenUsage();
+      if (resetLookupAssignments) {
+        resetLookupAssignments();
+      }
     };
   }, []);
 
diff --git a/frontend/src/hooks/usePromptOutput.js b/frontend/src/hooks/usePromptOutput.js
index 530cdf2bc7..0e06070b7b 100644
--- a/frontend/src/hooks/usePromptOutput.js
+++ b/frontend/src/hooks/usePromptOutput.js
@@ -23,6 +23,16 @@ try {
   // The component will remain null of it is not available
 }
 
+let handleLookupOutput;
+try {
+  const mod = await import(
+    "../plugins/lookup-studio/prompt-card/handleLookupOutput"
+  );
+  handleLookupOutput = mod.handleLookupOutput;
+} catch {
+  // Not available in OSS
+}
+
 const usePromptOutput = () => {
   const { sessionDetails } = useSessionStore();
   const { setTokenUsage, updateTokenUsage } = useTokenUsageStore();
@@ -125,6 +135,10 @@ const usePromptOutput = () => {
         wordConfidenceData: item?.word_confidence_data,
       };
 
+      if (handleLookupOutput && item?.lookup_outputs) {
+        handleLookupOutput(item.prompt_output_id, item.lookup_outputs);
+      }
+
       if (item?.is_single_pass_extract && isTokenUsageForSinglePassAdded) {
         return;
       }
diff --git a/workers/executor/executors/answer_prompt.py b/workers/executor/executors/answer_prompt.py
index c22c8aaafd..d1eef5b3be 100644
--- a/workers/executor/executors/answer_prompt.py
+++ b/workers/executor/executors/answer_prompt.py
@@ -338,27 +338,4 @@ def handle_json(
             structured_output[prompt_key] = {}
             return
 
-        highlight_data = None
-        if enable_highlight and metadata and PSKeys.HIGHLIGHT_DATA in metadata:
-            highlight_data = metadata[PSKeys.HIGHLIGHT_DATA].get(prompt_key)
-
-        processed_data = parsed_data
-        updated_highlight_data = None
-
-        webhook_enabled = output.get(PSKeys.ENABLE_POSTPROCESSING_WEBHOOK, False)
-        if webhook_enabled:
-            webhook_url = output.get(PSKeys.POSTPROCESSING_WEBHOOK_URL)
-            processed_data, updated_highlight_data = (
-                AnswerPromptService._run_webhook_postprocess(
-                    parsed_data=parsed_data,
-                    webhook_url=webhook_url,
-                    highlight_data=highlight_data,
-                )
-            )
-
-        structured_output[prompt_key] = processed_data
-
-        if enable_highlight and metadata and updated_highlight_data is not None:
-            metadata.setdefault(PSKeys.HIGHLIGHT_DATA, {})[prompt_key] = (
-                updated_highlight_data
-            )
+        structured_output[prompt_key] = parsed_data
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 18e1f47749..0b06b24bc2 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -1654,6 +1654,15 @@ def _execute_single_prompt(
             )
             shim.stream_log(f"Applied type conversion for: {prompt_name}")
 
+            self._run_post_extraction_pipeline(
+                output=output,
+                structured_output=structured_output,
+                metadata=metadata,
+                metrics=metrics,
+                shim=shim,
+                usage_kwargs=usage_kwargs,
+            )
+
             self._run_challenge_if_enabled(
                 tool_settings=tool_settings,
                 output=output,
@@ -1844,6 +1853,86 @@ def _run_line_item_extraction(
                 level=LogLevel.ERROR,
             )
 
+    def _run_post_extraction_pipeline(
+        self,
+        output: dict[str, Any],
+        structured_output: dict[str, Any],
+        metadata: dict[str, Any],
+        metrics: dict[str, Any],
+        shim: Any,
+        usage_kwargs: dict[str, Any] | None = None,
+    ) -> None:
+        """Post-extraction pipeline: lookup enrichment, webhook postprocessing.
+
+        Runs after type conversion, before challenge/evaluation.
+        """
+        from executor.executors.answer_prompt import AnswerPromptService
+        from executor.executors.constants import PromptServiceConstants as PSKeys
+        from executor.executors.plugins import ExecutorPluginLoader
+
+        prompt_name = output[PSKeys.NAME]
+        current_value = structured_output.get(prompt_name)
+
+        # Step 1: Lookup enrichment (cloud plugin)
+        lookup_config = output.get("lookup_config")
+        lookup_cls = ExecutorPluginLoader.get("lookup-enrichment")
+        if lookup_config and current_value is not None and lookup_cls:
+            _, _, _, _, llm_cls, _, _ = self._get_prompt_deps()
+            llm_adapter_id = lookup_config.get("llm_adapter_id", "")
+            llm = llm_cls(
+                adapter_instance_id=llm_adapter_id,
+                tool=shim,
+                usage_kwargs={
+                    **(usage_kwargs or {}),
+                    PSKeys.LLM_USAGE_REASON: "lookup",
+                },
+                capture_metrics=True,
+            )
+
+            enricher = lookup_cls(
+                current_value=current_value,
+                lookup_config=lookup_config,
+                structured_output=structured_output,
+                llm=llm,
+                shim=shim,
+            )
+            lookup_result = enricher.run()
+
+            if lookup_result is not None:
+                metadata.setdefault("lookup_outputs", {})[prompt_name] = {
+                    "original": str(current_value),
+                    "enriched": lookup_result,
+                    "meta": {
+                        "lookup_id": lookup_config.get("lookup_id", ""),
+                        "lookup_name": lookup_config.get("lookup_name", ""),
+                    },
+                }
+                structured_output[prompt_name] = lookup_result
+                shim.stream_log(f"Lookup enrichment complete for: {prompt_name}")
+
+            metrics.setdefault(prompt_name, {})[f"{llm.get_usage_reason()}_llm"] = (
+                llm.get_metrics()
+            )
+
+        # Step 2: Webhook postprocessing (JSON only, moved from handle_json)
+        output_type = output.get(PSKeys.TYPE, "")
+        webhook_enabled = output.get(PSKeys.ENABLE_POSTPROCESSING_WEBHOOK, False)
+        if webhook_enabled and output_type == PSKeys.JSON:
+            webhook_url = output.get(PSKeys.POSTPROCESSING_WEBHOOK_URL)
+            highlight_data = None
+            if metadata and PSKeys.HIGHLIGHT_DATA in metadata:
+                highlight_data = metadata.get(PSKeys.HIGHLIGHT_DATA, {}).get(prompt_name)
+            processed, updated_highlights = AnswerPromptService._run_webhook_postprocess(
+                parsed_data=structured_output.get(prompt_name),
+                webhook_url=webhook_url,
+                highlight_data=highlight_data,
+            )
+            structured_output[prompt_name] = processed
+            if updated_highlights is not None and metadata:
+                metadata.setdefault(PSKeys.HIGHLIGHT_DATA, {})[prompt_name] = (
+                    updated_highlights
+                )
+
     @staticmethod
     def _apply_type_conversion(
         output: dict[str, Any],
diff --git a/workers/executor/executors/plugins/protocols.py b/workers/executor/executors/plugins/protocols.py
index fb4d676b37..a5ed148a5b 100644
--- a/workers/executor/executors/plugins/protocols.py
+++ b/workers/executor/executors/plugins/protocols.py
@@ -49,3 +49,10 @@ class EvaluationProtocol(Protocol):
     """Legacy executor: prompt evaluation."""
 
     def run(self, **kwargs: Any) -> dict: ...
+
+
+@runtime_checkable
+class LookupEnrichmentProtocol(Protocol):
+    """Legacy executor: post-extraction lookup enrichment."""
+
+    def run(self) -> str | None: ...

From 68e394ba6b0a455e6ea9919d7a571eb1abd6fac7 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Sat, 4 Apr 2026 03:51:31 +0530
Subject: [PATCH 05/57] UN-2946 Removed unnecessary .gstack/ entry from .gitignore

---
 .gitignore | 1 -
 1 file changed, 1 deletion(-)

diff --git a/.gitignore b/.gitignore
index cd4084ecdd..f6837ce079 100644
--- a/.gitignore
+++ b/.gitignore
@@ -703,4 +703,3 @@ CONTRIBUTION_GUIDE.md
 
 # MCP servers
 .serena
-.gstack/

From 059ceed1ff028be85cc0a7a86f263685e33f2915 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Sat, 4 Apr 2026 04:37:04 +0530
Subject: [PATCH 06/57] UN-2946 [REFACTOR] Deduplicate lookup config helper and
 add lookup usage reason

- Extract get_lookup_config() to prompt_studio/lookup_utils.py, replacing
  4 identical try/except ImportError blocks across prompt_studio_helper
  and prompt_studio_registry_helper
- Add LOOKUP to LLMUsageReason choices (was missing, causing invalid
  choice on usage records from lookup enrichment LLM calls)
- Migration: usage_v2/0004_add_lookup_usage_reason

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 backend/prompt_studio/lookup_utils.py         | 26 ++++++++++++
 .../prompt_studio_helper.py                   | 40 ++++---------------
 .../prompt_studio_registry_helper.py          | 14 ++-----
 .../0004_add_lookup_usage_reason.py           | 28 +++++++++++++
 backend/usage_v2/models.py                    |  1 +
 5 files changed, 65 insertions(+), 44 deletions(-)
 create mode 100644 backend/prompt_studio/lookup_utils.py
 create mode 100644 backend/usage_v2/migrations/0004_add_lookup_usage_reason.py

diff --git a/backend/prompt_studio/lookup_utils.py b/backend/prompt_studio/lookup_utils.py
new file mode 100644
index 0000000000..f2e889f50f
--- /dev/null
+++ b/backend/prompt_studio/lookup_utils.py
@@ -0,0 +1,26 @@
+"""Shared utility for lookup config resolution.
+
+Wraps the cloud-only build_lookup_config_for_prompt call so that
+OSS callers don't repeat the try/except ImportError guard.
+"""
+
+import logging
+
+logger = logging.getLogger(__name__)
+
+
+def get_lookup_config(prompt) -> dict | None:
+    """Return lookup config for a prompt, or None if lookups are unavailable.
+
+    Thin wrapper around the cloud plugin's build_lookup_config_for_prompt.
+    A failed plugin import (e.g. OSS deployments) returns None silently;
+    errors raised while building the config propagate to the caller.
+    """
+    try:
+        from pluggable_apps.lookup_v1.execution import (
+            build_lookup_config_for_prompt,
+        )
+    except ImportError:
+        return None
+
+    return build_lookup_config_for_prompt(prompt)
diff --git a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
index 9b76a86782..6744171ed4 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
@@ -20,6 +20,7 @@
 from utils.local_context import StateStore
 
 from backend.celery_service import app as celery_app
+from prompt_studio.lookup_utils import get_lookup_config
 from prompt_studio.prompt_profile_manager_v2.models import ProfileManager
 from prompt_studio.prompt_profile_manager_v2.profile_manager_helper import (
     ProfileManagerHelper,
@@ -387,17 +388,8 @@ def _build_prompt_output(
         if webhook_enabled:
             output[TSPKeys.POSTPROCESSING_WEBHOOK_URL] = webhook_url
 
-        # Lookup config (cloud plugin hook)
-        try:
-            from pluggable_apps.lookup_v1.execution import (
-                build_lookup_config_for_prompt,
-            )
-
-            lookup_config = build_lookup_config_for_prompt(prompt)
-            if lookup_config:
-                output["lookup_config"] = lookup_config
-        except ImportError:
-            pass
+        if lookup_config := get_lookup_config(prompt):
+            output["lookup_config"] = lookup_config
 
         output[TSPKeys.EVAL_SETTINGS] = {}
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_EVALUATE] = prompt.evaluate
@@ -810,17 +802,8 @@ def build_fetch_response_payload(
         if webhook_enabled:
             output[TSPKeys.POSTPROCESSING_WEBHOOK_URL] = webhook_url
 
-        # Lookup config (cloud plugin hook)
-        try:
-            from pluggable_apps.lookup_v1.execution import (
-                build_lookup_config_for_prompt,
-            )
-
-            lookup_config = build_lookup_config_for_prompt(prompt)
-            if lookup_config:
-                output["lookup_config"] = lookup_config
-        except ImportError:
-            pass
+        if lookup_config := get_lookup_config(prompt):
+            output["lookup_config"] = lookup_config
 
         output[TSPKeys.EVAL_SETTINGS] = {}
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_EVALUATE] = prompt.evaluate
@@ -1917,17 +1900,8 @@ def _fetch_response(
         output[TSPKeys.ENABLE_POSTPROCESSING_WEBHOOK] = webhook_enabled
         if webhook_enabled:
             output[TSPKeys.POSTPROCESSING_WEBHOOK_URL] = webhook_url
-        # Lookup config (cloud plugin hook)
-        try:
-            from pluggable_apps.lookup_v1.execution import (
-                build_lookup_config_for_prompt,
-            )
-
-            lookup_config = build_lookup_config_for_prompt(prompt)
-            if lookup_config:
-                output["lookup_config"] = lookup_config
-        except ImportError:
-            pass
+        if lookup_config := get_lookup_config(prompt):
+            output["lookup_config"] = lookup_config
         # Eval settings for the prompt
         output[TSPKeys.EVAL_SETTINGS] = {}
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_EVALUATE] = prompt.evaluate
diff --git a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
index 87d4fa0def..c6cb80bb07 100644
--- a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
+++ b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
@@ -7,6 +7,7 @@
 from django.db import IntegrityError
 from plugins import get_plugin
 
+from prompt_studio.lookup_utils import get_lookup_config
 from prompt_studio.prompt_profile_manager_v2.models import ProfileManager
 from prompt_studio.prompt_studio_core_v2.models import CustomTool
 from prompt_studio.prompt_studio_core_v2.prompt_studio_helper import PromptStudioHelper
@@ -355,17 +356,8 @@ def frame_export_json(
             output[JsonSchemaKey.POSTPROCESSING_WEBHOOK_URL] = (
                 prompt.postprocessing_webhook_url
             )
-            # Lookup config (cloud plugin hook)
-            try:
-                from pluggable_apps.lookup_v1.execution import (
-                    build_lookup_config_for_prompt,
-                )
-
-                lookup_config = build_lookup_config_for_prompt(prompt)
-                if lookup_config:
-                    output["lookup_config"] = lookup_config
-            except ImportError:
-                pass
+            if lookup_config := get_lookup_config(prompt):
+                output["lookup_config"] = lookup_config
             # Retaining the old fields in condition
             # for backward compatibility. To be removed in future.
             if (
diff --git a/backend/usage_v2/migrations/0004_add_lookup_usage_reason.py b/backend/usage_v2/migrations/0004_add_lookup_usage_reason.py
new file mode 100644
index 0000000000..76c628d9ee
--- /dev/null
+++ b/backend/usage_v2/migrations/0004_add_lookup_usage_reason.py
@@ -0,0 +1,28 @@
+# Generated by Django 4.2.1 on 2026-04-03 22:44
+
+from django.db import migrations, models
+
+
+class Migration(migrations.Migration):
+    dependencies = [
+        ("usage_v2", "0003_usage_usage_executi_4deb35_idx"),
+    ]
+
+    operations = [
+        migrations.AlterField(
+            model_name="usage",
+            name="llm_usage_reason",
+            field=models.CharField(
+                blank=True,
+                choices=[
+                    ("extraction", "Extraction"),
+                    ("challenge", "Challenge"),
+                    ("summarize", "Summarize"),
+                    ("lookup", "Lookup"),
+                ],
+                db_comment="Reason for LLM usage. Empty if usage_type is 'embedding'. ",
+                max_length=255,
+                null=True,
+            ),
+        ),
+    ]
diff --git a/backend/usage_v2/models.py b/backend/usage_v2/models.py
index 8da3d751ba..dc983c56b5 100644
--- a/backend/usage_v2/models.py
+++ b/backend/usage_v2/models.py
@@ -17,6 +17,7 @@ class LLMUsageReason(models.TextChoices):
     EXTRACTION = "extraction", "Extraction"
     CHALLENGE = "challenge", "Challenge"
     SUMMARIZE = "summarize", "Summarize"
+    LOOKUP = "lookup", "Lookup"
 
 
 class UsageModelManager(DefaultOrganizationManagerMixin, models.Manager):

From 7699441e45d6b9fb362a2668d7aeca41a43ffe52 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Sun, 5 Apr 2026 22:37:00 +0530
Subject: [PATCH 07/57] UN-2946 [FEAT] Add get_last_usage() to SDK1 LLM for
 token tracking

Store prompt/completion/total token counts from the most recent
complete() call on the LLM object itself, making usage data
queryable without relying on the Audit pipeline roundtrip.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 unstract/sdk1/src/unstract/sdk1/llm.py | 15 +++++++++++++++
 1 file changed, 15 insertions(+)

diff --git a/unstract/sdk1/src/unstract/sdk1/llm.py b/unstract/sdk1/src/unstract/sdk1/llm.py
index c1730e6613..f751e7f87c 100644
--- a/unstract/sdk1/src/unstract/sdk1/llm.py
+++ b/unstract/sdk1/src/unstract/sdk1/llm.py
@@ -211,6 +211,7 @@ def __init__(  # noqa: C901
         if capture_metrics_from_platform is not None:
             self._capture_metrics = capture_metrics_from_platform
         self._metrics: dict[str, object] = {}
+        self._last_usage: Mapping[str, int] = {}
 
     def _get_adapter_info(self) -> str:
         """Build a display string identifying this adapter for errors."""
@@ -552,6 +553,10 @@ def get_model_name(self) -> str:
     def get_metrics(self) -> dict[str, object]:
         return self._metrics
 
+    def get_last_usage(self) -> Mapping[str, int]:
+        """Token usage from the most recent complete() call."""
+        return self._last_usage
+
     def get_usage_reason(self) -> object:
         return self.platform_kwargs.get("llm_usage_reason")
 
@@ -573,6 +578,12 @@ def _record_usage(
         logger.info(f"[sdk1][LLM][{model}][{llm_api}] Prompt Tokens: {prompt_tokens}")
         logger.info(f"[sdk1][LLM][{model}][{llm_api}] LLM Usage: {all_tokens}")
 
+        self._last_usage = {
+            "prompt_tokens": all_tokens.prompt_llm_token_count,
+            "completion_tokens": all_tokens.completion_llm_token_count,
+            "total_tokens": all_tokens.total_llm_token_count,
+        }
+
         Audit().push_usage_data(
             platform_api_key=self._platform_api_key,
             token_counter=all_tokens,
@@ -963,6 +974,10 @@ def get_metrics(self) -> dict[str, object]:
         """Get captured metrics."""
         return self._llm_instance.get_metrics()
 
+    def get_last_usage(self) -> Mapping[str, int]:
+        """Token usage from the most recent complete() call."""
+        return self._llm_instance.get_last_usage()
+
     def get_usage_reason(self) -> object:
         """Get usage reason from platform kwargs."""
         return self._llm_instance.get_usage_reason()

From 6e368961a5ddf821b1c4fc3bc3bdfcfad6cf8cb1 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Mon, 6 Apr 2026 00:16:19 +0530
Subject: [PATCH 08/57] UN-2946 [REFACTOR] Split post-extraction pipeline into
 lookup and webhook methods

Move lookup result-application logic to the cloud plugin, matching
the challenge plugin pattern where the plugin owns metadata mutation.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 workers/executor/executors/legacy_executor.py | 120 +++++++++---------
 1 file changed, 62 insertions(+), 58 deletions(-)

diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 0b06b24bc2..7ccdcb656d 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -1654,7 +1654,7 @@ def _execute_single_prompt(
             )
             shim.stream_log(f"Applied type conversion for: {prompt_name}")
 
-            self._run_post_extraction_pipeline(
+            self._run_lookup_enrichment(
                 output=output,
                 structured_output=structured_output,
                 metadata=metadata,
@@ -1662,6 +1662,11 @@ def _execute_single_prompt(
                 shim=shim,
                 usage_kwargs=usage_kwargs,
             )
+            self._run_webhook_postprocessing(
+                output=output,
+                structured_output=structured_output,
+                metadata=metadata,
+            )
 
             self._run_challenge_if_enabled(
                 tool_settings=tool_settings,
@@ -1853,7 +1858,7 @@ def _run_line_item_extraction(
                 level=LogLevel.ERROR,
             )
 
-    def _run_post_extraction_pipeline(
+    def _run_lookup_enrichment(
         self,
         output: dict[str, Any],
         structured_output: dict[str, Any],
@@ -1862,76 +1867,75 @@ def _run_post_extraction_pipeline(
         shim: Any,
         usage_kwargs: dict[str, Any] | None = None,
     ) -> None:
-        """Post-extraction pipeline: lookup enrichment, webhook postprocessing.
-
-        Runs after type conversion, before challenge/evaluation.
-        """
-        from executor.executors.answer_prompt import AnswerPromptService
+        """Run lookup enrichment plugin if enabled and available."""
         from executor.executors.constants import PromptServiceConstants as PSKeys
         from executor.executors.plugins import ExecutorPluginLoader
 
         prompt_name = output[PSKeys.NAME]
         current_value = structured_output.get(prompt_name)
 
-        # Step 1: Lookup enrichment (cloud plugin)
         lookup_config = output.get("lookup_config")
         lookup_cls = ExecutorPluginLoader.get("lookup-enrichment")
-        if lookup_config and current_value is not None and lookup_cls:
-            _, _, _, _, llm_cls, _, _ = self._get_prompt_deps()
-            llm_adapter_id = lookup_config.get("llm_adapter_id", "")
-            llm = llm_cls(
-                adapter_instance_id=llm_adapter_id,
-                tool=shim,
-                usage_kwargs={
-                    **(usage_kwargs or {}),
-                    PSKeys.LLM_USAGE_REASON: "lookup",
-                },
-                capture_metrics=True,
-            )
+        if not (lookup_config and current_value is not None and lookup_cls):
+            return
 
-            enricher = lookup_cls(
-                current_value=current_value,
-                lookup_config=lookup_config,
-                structured_output=structured_output,
-                llm=llm,
-                shim=shim,
-            )
-            lookup_result = enricher.run()
-
-            if lookup_result is not None:
-                metadata.setdefault("lookup_outputs", {})[prompt_name] = {
-                    "original": str(current_value),
-                    "enriched": lookup_result,
-                    "meta": {
-                        "lookup_id": lookup_config.get("lookup_id", ""),
-                        "lookup_name": lookup_config.get("lookup_name", ""),
-                    },
-                }
-                structured_output[prompt_name] = lookup_result
-                shim.stream_log(f"Lookup enrichment complete for: {prompt_name}")
+        _, _, _, _, llm_cls, _, _ = self._get_prompt_deps()
+        llm_adapter_id = lookup_config.get("llm_adapter_id", "")
+        llm = llm_cls(
+            adapter_instance_id=llm_adapter_id,
+            tool=shim,
+            usage_kwargs={
+                **(usage_kwargs or {}),
+                PSKeys.LLM_USAGE_REASON: "lookup",
+            },
+            capture_metrics=True,
+        )
 
-            metrics.setdefault(prompt_name, {})[f"{llm.get_usage_reason()}_llm"] = (
-                llm.get_metrics()
-            )
+        enricher = lookup_cls(
+            current_value=current_value,
+            lookup_config=lookup_config,
+            structured_output=structured_output,
+            llm=llm,
+            shim=shim,
+            metadata=metadata,
+            prompt_name=prompt_name,
+        )
+        enricher.run()
+
+        metrics.setdefault(prompt_name, {})[f"{llm.get_usage_reason()}_llm"] = (
+            llm.get_metrics()
+        )
 
-        # Step 2: Webhook postprocessing (JSON only, moved from handle_json)
+    @staticmethod
+    def _run_webhook_postprocessing(
+        output: dict[str, Any],
+        structured_output: dict[str, Any],
+        metadata: dict[str, Any],
+    ) -> None:
+        """Run webhook postprocessing if enabled (JSON outputs only)."""
+        from executor.executors.answer_prompt import AnswerPromptService
+        from executor.executors.constants import PromptServiceConstants as PSKeys
+
+        prompt_name = output[PSKeys.NAME]
         output_type = output.get(PSKeys.TYPE, "")
         webhook_enabled = output.get(PSKeys.ENABLE_POSTPROCESSING_WEBHOOK, False)
-        if webhook_enabled and output_type == PSKeys.JSON:
-            webhook_url = output.get(PSKeys.POSTPROCESSING_WEBHOOK_URL)
-            highlight_data = None
-            if metadata and PSKeys.HIGHLIGHT_DATA in metadata:
-                highlight_data = metadata.get(PSKeys.HIGHLIGHT_DATA, {}).get(prompt_name)
-            processed, updated_highlights = AnswerPromptService._run_webhook_postprocess(
-                parsed_data=structured_output.get(prompt_name),
-                webhook_url=webhook_url,
-                highlight_data=highlight_data,
+        if not (webhook_enabled and output_type == PSKeys.JSON):
+            return
+
+        webhook_url = output.get(PSKeys.POSTPROCESSING_WEBHOOK_URL)
+        highlight_data = None
+        if metadata and PSKeys.HIGHLIGHT_DATA in metadata:
+            highlight_data = metadata.get(PSKeys.HIGHLIGHT_DATA, {}).get(prompt_name)
+        processed, updated_highlights = AnswerPromptService._run_webhook_postprocess(
+            parsed_data=structured_output.get(prompt_name),
+            webhook_url=webhook_url,
+            highlight_data=highlight_data,
+        )
+        structured_output[prompt_name] = processed
+        if updated_highlights is not None and metadata:
+            metadata.setdefault(PSKeys.HIGHLIGHT_DATA, {})[prompt_name] = (
+                updated_highlights
             )
-            structured_output[prompt_name] = processed
-            if updated_highlights is not None and metadata:
-                metadata.setdefault(PSKeys.HIGHLIGHT_DATA, {})[prompt_name] = (
-                    updated_highlights
-                )
 
     @staticmethod
     def _apply_type_conversion(

From 5b8c06dfa6db8f737fea7ae44c460e7673f4e4e9 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Mon, 6 Apr 2026 02:46:32 +0530
Subject: [PATCH 09/57] UN-2946 [FEAT] Generic async extraction callbacks and
 WebSocket transport fallback

Add reusable extraction_complete/extraction_error callback tasks to the
ide_callback worker, replacing the need for Django-based celery workers
for text extraction. Add ExtractionAPIClient for internal API calls.
Add polling fallback to WebSocket transport for local dev reliability.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 backend/utils/websocket_views.py            |   2 +-
 frontend/src/helpers/SocketContext.js       |   2 +-
 workers/ide_callback/tasks.py               | 159 ++++++++++++++++++++
 workers/shared/clients/extraction_client.py |  63 ++++++++
 4 files changed, 224 insertions(+), 2 deletions(-)
 create mode 100644 workers/shared/clients/extraction_client.py

diff --git a/backend/utils/websocket_views.py b/backend/utils/websocket_views.py
index a57521ca43..51998399c4 100644
--- a/backend/utils/websocket_views.py
+++ b/backend/utils/websocket_views.py
@@ -63,7 +63,7 @@ def emit_websocket(request):
         # Emit the WebSocket event
         _emit_websocket_event(room=room, event=event, data=message_data)
 
-        logger.debug(f"WebSocket event emitted: room={room}, event={event}")
+        logger.info(f"WebSocket event emitted: room={room}, event={event}")
 
         return JsonResponse(
             {
diff --git a/frontend/src/helpers/SocketContext.js b/frontend/src/helpers/SocketContext.js
index 6e6ace9a63..ec6a274e9e 100644
--- a/frontend/src/helpers/SocketContext.js
+++ b/frontend/src/helpers/SocketContext.js
@@ -16,7 +16,7 @@ const SocketProvider = ({ children }) => {
     // This ensures session cookies are sent (same-origin) and avoids
     // cross-origin WebSocket issues.
     const newSocket = io(getBaseUrl(), {
-      transports: ["websocket"],
+      transports: ["websocket", "polling"],
       path: "/api/v1/socket",
     });
     setSocket(newSocket);
diff --git a/workers/ide_callback/tasks.py b/workers/ide_callback/tasks.py
index cb610678b1..e2b3b4dcf6 100644
--- a/workers/ide_callback/tasks.py
+++ b/workers/ide_callback/tasks.py
@@ -504,3 +504,162 @@ def ide_prompt_error(
         )
     except Exception:
         logger.exception("ide_prompt_error callback failed")
+
+
+# ------------------------------------------------------------------
+# Generic Text Extraction Callbacks
+#
+# Reusable extraction callbacks that route based on ``source`` in
+# callback_kwargs (e.g. "lookup", future "prompt_studio").
+# ------------------------------------------------------------------
+
+
+def _get_extraction_client():
+    from shared.clients.extraction_client import ExtractionAPIClient
+
+    return ExtractionAPIClient()
+
+
+@app.task(name="extraction_complete")
+def extraction_complete(
+    result_dict: dict[str, Any],
+    callback_kwargs: dict[str, Any] | None = None,
+) -> dict[str, Any]:
+    """Celery link callback after successful text extraction.
+
+    Computes token count from extracted text, persists result via
+    internal API, and emits a WebSocket event.
+    """
+    cb = callback_kwargs or {}
+    source = cb.get("source", "")
+    file_id = cb.get("file_id", "")
+    org_id = cb.get("org_id", "")
+    extracted_text_path = cb.get("extracted_text_path", "")
+    ws_room = cb.get("ws_room", "")
+    ws_event = cb.get("ws_event", "")
+
+    api = _get_extraction_client()
+    ps_api = _get_api_client()
+
+    try:
+        # Check executor-level failure
+        if not result_dict.get("success", False):
+            error_msg = result_dict.get("error", "Unknown executor error")
+            logger.error(
+                "extraction executor reported failure: source=%s file=%s error=%s",
+                source,
+                file_id,
+                error_msg,
+            )
+            api.mark_extraction_error(
+                source=source,
+                file_id=file_id,
+                error=error_msg,
+                organization_id=org_id,
+            )
+            if ws_room and ws_event:
+                _emit_websocket(
+                    ps_api,
+                    room=ws_room,
+                    event=ws_event,
+                    data={
+                        "file_id": file_id,
+                        "status": "ERROR",
+                        "error": error_msg[:500],
+                    },
+                )
+            return {"status": "failed", "error": error_msg}
+
+        extracted_text = result_dict.get("data", {}).get("extracted_text", "")
+        token_count = len(extracted_text) // 4
+
+        api.mark_extraction_complete(
+            source=source,
+            file_id=file_id,
+            token_count=token_count,
+            extracted_text_path=extracted_text_path,
+            organization_id=org_id,
+        )
+
+        if ws_room and ws_event:
+            _emit_websocket(
+                ps_api,
+                room=ws_room,
+                event=ws_event,
+                data={
+                    "file_id": file_id,
+                    "status": "COMPLETED",
+                    "token_count": token_count,
+                },
+            )
+
+        logger.info(
+            "Extraction completed: source=%s file=%s tokens=%d",
+            source,
+            file_id,
+            token_count,
+        )
+        return {"status": "completed", "file_id": file_id, "token_count": token_count}
+
+    except Exception as e:
+        logger.exception(
+            "extraction_complete callback failed: source=%s file=%s", source, file_id
+        )
+        if ws_room and ws_event:
+            try:
+                _emit_websocket(
+                    ps_api,
+                    room=ws_room,
+                    event=ws_event,
+                    data={
+                        "file_id": file_id,
+                        "status": "ERROR",
+                        "error": str(e)[:500],
+                    },
+                )
+            except Exception:
+                pass
+        raise
+
+
+@app.task(name="extraction_error")
+def extraction_error(
+    failed_task_id: str,
+    callback_kwargs: dict[str, Any] | None = None,
+) -> None:
+    """Celery link_error callback when an extraction task fails."""
+    cb = callback_kwargs or {}
+    source = cb.get("source", "")
+    file_id = cb.get("file_id", "")
+    org_id = cb.get("org_id", "")
+    ws_room = cb.get("ws_room", "")
+    ws_event = cb.get("ws_event", "")
+
+    api = _get_extraction_client()
+    ps_api = _get_api_client()
+
+    try:
+        error_msg = _get_task_error(failed_task_id, default="Text extraction failed")
+
+        api.mark_extraction_error(
+            source=source,
+            file_id=file_id,
+            error=error_msg,
+            organization_id=org_id,
+        )
+
+        if ws_room and ws_event:
+            _emit_websocket(
+                ps_api,
+                room=ws_room,
+                event=ws_event,
+                data={
+                    "file_id": file_id,
+                    "status": "ERROR",
+                    "error": error_msg[:500],
+                },
+            )
+    except Exception:
+        logger.exception(
+            "extraction_error callback failed: source=%s file=%s", source, file_id
+        )
diff --git a/workers/shared/clients/extraction_client.py b/workers/shared/clients/extraction_client.py
new file mode 100644
index 0000000000..db6781be62
--- /dev/null
+++ b/workers/shared/clients/extraction_client.py
@@ -0,0 +1,63 @@
+"""Extraction API Client for text extraction callbacks.
+
+Used by the ide_callback worker to persist extraction results
+through the backend's internal API endpoints.
+"""
+
+import logging
+from typing import Any
+
+from .base_client import BaseAPIClient
+
+logger = logging.getLogger(__name__)
+
+_EXTRACTION_COMPLETE_ENDPOINT = "v1/extraction/extraction-complete/"
+_EXTRACTION_ERROR_ENDPOINT = "v1/extraction/extraction-error/"
+
+
+class ExtractionAPIClient(BaseAPIClient):
+    """API client for generic text extraction callback endpoints."""
+
+    def mark_extraction_complete(
+        self,
+        source: str,
+        file_id: str,
+        token_count: int,
+        extracted_text_path: str,
+        organization_id: str | None = None,
+        **extra: Any,
+    ) -> dict[str, Any]:
+        """Notify backend that extraction succeeded."""
+        payload: dict[str, Any] = {
+            "source": source,
+            "file_id": file_id,
+            "token_count": token_count,
+            "extracted_text_path": extracted_text_path,
+            **extra,
+        }
+        return self.post(
+            _EXTRACTION_COMPLETE_ENDPOINT,
+            data=payload,
+            organization_id=organization_id,
+        )
+
+    def mark_extraction_error(
+        self,
+        source: str,
+        file_id: str,
+        error: str,
+        organization_id: str | None = None,
+        **extra: Any,
+    ) -> dict[str, Any]:
+        """Notify backend that extraction failed."""
+        payload: dict[str, Any] = {
+            "source": source,
+            "file_id": file_id,
+            "error": error,
+            **extra,
+        }
+        return self.post(
+            _EXTRACTION_ERROR_ENDPOINT,
+            data=payload,
+            organization_id=organization_id,
+        )

From df4956945ced453861bb540d330f28aa26d96ff4 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Mon, 6 Apr 2026 03:24:17 +0530
Subject: [PATCH 10/57] Reduce success notification duration from 2s to 1s for
 less intrusive UX

---
 frontend/src/store/alert-store.js | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/frontend/src/store/alert-store.js b/frontend/src/store/alert-store.js
index 24549e09ce..5c5cf5c16d 100644
--- a/frontend/src/store/alert-store.js
+++ b/frontend/src/store/alert-store.js
@@ -4,7 +4,7 @@ import { create } from "zustand";
 import { isNonNegativeNumber } from "../helpers/GetStaticData";
 
 const DEFAULT_DURATION = 6;
-const SUCCESS_DURATION = 2;
+const SUCCESS_DURATION = 1;
 
 const STORE_VARIABLES = {
   alertDetails: {

From 5e39f704ba2d13fa33a93814e75d358d1a65763b Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Mon, 6 Apr 2026 03:27:33 +0530
Subject: [PATCH 11/57] Revert "Reduce success notification duration from 2s to
 1s for less intrusive UX"

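This reverts commit df4956945ced453861bb540d330f28aa26d96ff4
(PATCH 10/57 in this series; the original revert message cited
d6e136deefc3a8a5f90dc2007a4ba5c4d7effdf9, presumably the hash of the
same change before the branch was rewritten).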
---
 frontend/src/store/alert-store.js | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/frontend/src/store/alert-store.js b/frontend/src/store/alert-store.js
index 5c5cf5c16d..24549e09ce 100644
--- a/frontend/src/store/alert-store.js
+++ b/frontend/src/store/alert-store.js
@@ -4,7 +4,7 @@ import { create } from "zustand";
 import { isNonNegativeNumber } from "../helpers/GetStaticData";
 
 const DEFAULT_DURATION = 6;
-const SUCCESS_DURATION = 1;
+const SUCCESS_DURATION = 2;
 
 const STORE_VARIABLES = {
   alertDetails: {

From e4c023eb5f9b1c7c96fb8387dc9783163b52c709 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 7 Apr 2026 04:52:27 +0530
Subject: [PATCH 12/57] UN-2946 [REFACTOR] Pluggable lookup export validation
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Replace inline DRAFT lookup check with pluggable cloud-only hook.
Uses try/except ImportError pattern — zero lookup code in OSS.
Collects all DRAFT lookups in one pass with markdown-linked error messages.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 .../prompt_studio_registry_helper.py          | 19 ++++++++++++++++---
 1 file changed, 16 insertions(+), 3 deletions(-)

diff --git a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
index c6cb80bb07..bb7841c108 100644
--- a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
+++ b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
@@ -7,7 +7,6 @@
 from django.db import IntegrityError
 from plugins import get_plugin
 
-from prompt_studio.lookup_utils import get_lookup_config
 from prompt_studio.prompt_profile_manager_v2.models import ProfileManager
 from prompt_studio.prompt_studio_core_v2.models import CustomTool
 from prompt_studio.prompt_studio_core_v2.prompt_studio_helper import PromptStudioHelper
@@ -298,6 +297,19 @@ def frame_export_json(
             settings, JsonSchemaKey.WORD_CONFIDENCE_POSTAMBLE.upper(), ""
         )
 
+        # Validate lookup assignments (cloud-only, no-op in OSS)
+        lookup_configs = {}
+        try:
+            from pluggable_apps.lookup_v1.validation import (
+                validate_lookups_for_export,
+            )
+
+            lookup_configs, lookup_error = validate_lookups_for_export(prompts)
+            if lookup_error:
+                raise InValidCustomToolError(lookup_error)
+        except ImportError:
+            pass
+
         for prompt in prompts:
             if prompt.prompt_type == JsonSchemaKey.NOTES or not prompt.active:
                 continue
@@ -356,8 +368,9 @@ def frame_export_json(
             output[JsonSchemaKey.POSTPROCESSING_WEBHOOK_URL] = (
                 prompt.postprocessing_webhook_url
             )
-            if lookup_config := get_lookup_config(prompt):
-                output["lookup_config"] = lookup_config
+            prompt_id_str = str(prompt.prompt_id)
+            if prompt_id_str in lookup_configs:
+                output["lookup_config"] = lookup_configs[prompt_id_str]
             # Retaining the old fields in condition
             # for backward compatibility. To be removed in future.
             if (

From 9bf072e8e7fb7918cf25ea11a9be19509b4c412c Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 7 Apr 2026 16:52:32 +0530
Subject: [PATCH 13/57] UN-2946 [REFACTOR] Lookups V2 review cleanup

- Consolidate cloud imports into lookup_utils.py with persist_lookup_output() and validate_lookups_for_export() wrappers
- Fix LookupEnrichmentProtocol.run() return type to None matching challenge/evaluation pattern
- Revert logger.info to logger.debug in websocket_views.py
- Eliminate duplicated LookupOutputTabs ternary with renderWithLookupWrapper helper
- Move lookups menu constants from SideNavBar.jsx to cloud plugin
- Harden DocumentParser.jsx scrollTo with UUID validation and fix useEffect dependency
- Revert SocketContext transport to ["websocket"]

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 backend/prompt_studio/lookup_utils.py         | 44 ++++++++---
 .../output_manager_helper.py                  | 20 +----
 .../prompt_studio_registry_helper.py          | 15 +---
 backend/utils/websocket_views.py              |  2 +-
 .../document-parser/DocumentParser.jsx        | 10 ++-
 .../custom-tools/prompt-card/PromptOutput.jsx | 75 +++++++------------
 .../navigations/side-nav-bar/SideNavBar.jsx   | 43 +----------
 frontend/src/helpers/SocketContext.js         |  2 +-
 .../executor/executors/plugins/protocols.py   |  2 +-
 9 files changed, 81 insertions(+), 132 deletions(-)

diff --git a/backend/prompt_studio/lookup_utils.py b/backend/prompt_studio/lookup_utils.py
index f2e889f50f..823d9fc015 100644
--- a/backend/prompt_studio/lookup_utils.py
+++ b/backend/prompt_studio/lookup_utils.py
@@ -1,7 +1,7 @@
-"""Shared utility for lookup config resolution.
+"""Shared utility for lookup operations.
 
-Wraps the cloud-only build_lookup_config_for_prompt call so that
-OSS callers don't repeat the try/except ImportError guard.
+Wraps cloud-only lookup calls so that OSS callers don't repeat
+the try/except ImportError guard. All functions are no-ops in OSS.
 """
 
 import logging
@@ -10,12 +10,7 @@
 
 
 def get_lookup_config(prompt) -> dict | None:
-    """Return lookup config for a prompt, or None if lookups are unavailable.
-
-    This is a thin wrapper around the cloud plugin's
-    build_lookup_config_for_prompt. In OSS deployments where the plugin
-    is absent, it returns None silently.
-    """
+    """Return lookup config for a prompt, or None if lookups are unavailable."""
     try:
         from pluggable_apps.lookup_v1.execution import (
             build_lookup_config_for_prompt,
@@ -24,3 +19,34 @@ def get_lookup_config(prompt) -> dict | None:
         return build_lookup_config_for_prompt(prompt)
     except ImportError:
         return None
+
+
+def persist_lookup_output(prompt_output, prompt_lookup: dict) -> None:
+    """Persist lookup enrichment result. No-op in OSS."""
+    try:
+        from pluggable_apps.lookup_v1.models import LookupOutputResult
+
+        lookup_meta = prompt_lookup.get("meta", {})
+        lookup_id = lookup_meta.get("lookup_id")
+        if lookup_id:
+            LookupOutputResult.objects.update_or_create(
+                prompt_output=prompt_output,
+                defaults={
+                    "lookup_definition_id": lookup_id,
+                    "output": prompt_lookup.get("enriched", ""),
+                },
+            )
+    except ImportError:
+        pass
+
+
+def validate_lookups_for_export(prompts) -> tuple[dict, str | None]:
+    """Validate lookup assignments before export. Returns ({}, None) in OSS."""
+    try:
+        from pluggable_apps.lookup_v1.validation import (
+            validate_lookups_for_export as _validate,
+        )
+
+        return _validate(prompts)
+    except ImportError:
+        return {}, None
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
index d0197e128f..0fb92c126d 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
@@ -4,6 +4,7 @@
 
 from django.core.exceptions import ObjectDoesNotExist
 
+from prompt_studio.lookup_utils import persist_lookup_output
 from prompt_studio.prompt_profile_manager_v2.models import ProfileManager
 from prompt_studio.prompt_studio_core_v2.exceptions import (
     AnswerFetchError,
@@ -198,25 +199,10 @@ def update_or_create_prompt_output(
                 word_confidence_data=prompt_word_confidence_data,
             )
 
-            # Persist lookup outputs if present (cloud plugin)
+            # Persist lookup outputs if present (cloud plugin, no-op in OSS)
             if prompt_lookup:
                 try:
-                    from pluggable_apps.lookup_v1.models import (
-                        LookupOutputResult,
-                    )
-
-                    lookup_meta = prompt_lookup.get("meta", {})
-                    lookup_id = lookup_meta.get("lookup_id")
-                    if lookup_id:
-                        LookupOutputResult.objects.update_or_create(
-                            prompt_output=prompt_output,
-                            defaults={
-                                "lookup_definition_id": lookup_id,
-                                "output": prompt_lookup.get("enriched", ""),
-                            },
-                        )
-                except ImportError:
-                    pass
+                    persist_lookup_output(prompt_output, prompt_lookup)
                 except Exception:
                     logger.warning(
                         "Failed to persist lookup output for prompt %s",
diff --git a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
index bb7841c108..92cfb6e160 100644
--- a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
+++ b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
@@ -7,6 +7,7 @@
 from django.db import IntegrityError
 from plugins import get_plugin
 
+from prompt_studio.lookup_utils import validate_lookups_for_export
 from prompt_studio.prompt_profile_manager_v2.models import ProfileManager
 from prompt_studio.prompt_studio_core_v2.models import CustomTool
 from prompt_studio.prompt_studio_core_v2.prompt_studio_helper import PromptStudioHelper
@@ -298,17 +299,9 @@ def frame_export_json(
         )
 
         # Validate lookup assignments (cloud-only, no-op in OSS)
-        lookup_configs = {}
-        try:
-            from pluggable_apps.lookup_v1.validation import (
-                validate_lookups_for_export,
-            )
-
-            lookup_configs, lookup_error = validate_lookups_for_export(prompts)
-            if lookup_error:
-                raise InValidCustomToolError(lookup_error)
-        except ImportError:
-            pass
+        lookup_configs, lookup_error = validate_lookups_for_export(prompts)
+        if lookup_error:
+            raise InValidCustomToolError(lookup_error)
 
         for prompt in prompts:
             if prompt.prompt_type == JsonSchemaKey.NOTES or not prompt.active:
diff --git a/backend/utils/websocket_views.py b/backend/utils/websocket_views.py
index 51998399c4..a57521ca43 100644
--- a/backend/utils/websocket_views.py
+++ b/backend/utils/websocket_views.py
@@ -63,7 +63,7 @@ def emit_websocket(request):
         # Emit the WebSocket event
         _emit_websocket_event(room=room, event=event, data=message_data)
 
-        logger.info(f"WebSocket event emitted: room={room}, event={event}")
+        logger.debug(f"WebSocket event emitted: room={room}, event={event}")
 
         return JsonResponse(
             {
diff --git a/frontend/src/components/custom-tools/document-parser/DocumentParser.jsx b/frontend/src/components/custom-tools/document-parser/DocumentParser.jsx
index c5e60a2c93..2b55e26807 100644
--- a/frontend/src/components/custom-tools/document-parser/DocumentParser.jsx
+++ b/frontend/src/components/custom-tools/document-parser/DocumentParser.jsx
@@ -111,9 +111,15 @@ function DocumentParser({
   }, [scrollToBottom]);
 
   // Handle scrollTo query param for cross-linking from Lookup Studio
+  const UUID_RE =
+    /^[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$/i;
   useEffect(() => {
     const scrollToPromptId = searchParams.get("scrollTo");
-    if (!scrollToPromptId || !details?.prompts?.length) {
+    if (
+      !scrollToPromptId ||
+      !UUID_RE.test(scrollToPromptId) ||
+      !details?.prompts?.length
+    ) {
       return;
     }
 
@@ -127,7 +133,7 @@ function DocumentParser({
     // Clear the param so it doesn't re-trigger
     searchParams.delete("scrollTo");
     setSearchParams(searchParams, { replace: true });
-  }, [details?.prompts]);
+  }, [details?.prompts, searchParams]);
 
   const promptUrl = (urlPath) => {
     return `/api/v1/unstract/${sessionDetails?.orgId}/prompt-studio/prompt/${urlPath}`;
diff --git a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
index 02e552ae44..872c657b2d 100644
--- a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
@@ -61,6 +61,15 @@ try {
   // Not available in OSS
 }
 
+// Wraps children in LookupOutputTabs when available (cloud),
+// passes through children directly in OSS.
+const renderWithLookupWrapper = (lookupProps, children) =>
+  LookupOutputTabs ? (
+    <LookupOutputTabs {...lookupProps}>{children}</LookupOutputTabs>
+  ) : (
+    children
+  );
+
 function PromptOutput({
   promptDetails,
   handleRun,
@@ -203,31 +212,13 @@ function PromptOutput({
             "highlighted-prompt-cell"
           }`}
         >
-          {LookupOutputTabs ? (
-            <LookupOutputTabs
-              promptId={promptId}
-              profileManagerId={defaultLlmProfile}
-              defaultLlmProfile={defaultLlmProfile}
-              promptOutputId={promptOutputData?.promptOutputId}
-            >
-              <DisplayPromptResult
-                output={promptOutput}
-                highlightData={
-                  promptOutputData?.highlightData?.[promptDetails.prompt_key]
-                }
-                handleSelectHighlight={handleSelectHighlight}
-                confidenceData={
-                  promptOutputData?.confidenceData?.[promptDetails.prompt_key]
-                }
-                wordConfidenceData={
-                  promptOutputData?.wordConfidenceData?.[
-                    promptDetails.prompt_key
-                  ]
-                }
-                progressMsg={progressMsg}
-              />
-            </LookupOutputTabs>
-          ) : (
+          {renderWithLookupWrapper(
+            {
+              promptId,
+              profileManagerId: defaultLlmProfile,
+              defaultLlmProfile,
+              promptOutputId: promptOutputData?.promptOutputId,
+            },
             <DisplayPromptResult
               output={promptOutput}
               highlightData={
@@ -241,7 +232,7 @@ function PromptOutput({
                 promptOutputData?.wordConfidenceData?.[promptDetails.prompt_key]
               }
               progressMsg={progressMsg}
-            />
+            />,
           )}
           <div className="prompt-profile-run">
             <CopyPromptOutputBtn
@@ -465,29 +456,13 @@ function PromptOutput({
                       handleTable(profileId, promptOutputData)
                     ) : (
                       <>
-                        {LookupOutputTabs ? (
-                          <LookupOutputTabs
-                            promptId={promptId}
-                            profileManagerId={profileId}
-                            defaultLlmProfile={defaultLlmProfile}
-                            promptOutputId={promptOutputData?.promptOutputId}
-                          >
-                            <DisplayPromptResult
-                              output={promptOutputData?.output}
-                              profileId={profileId}
-                              docId={selectedDoc?.document_id}
-                              promptRunStatus={promptRunStatus}
-                              handleSelectHighlight={handleSelectHighlight}
-                              highlightData={promptOutputData?.highlightData}
-                              confidenceData={promptOutputData?.confidenceData}
-                              wordConfidenceData={
-                                promptOutputData?.wordConfidenceData
-                              }
-                              promptDetails={promptDetails}
-                              progressMsg={progressMsg}
-                            />
-                          </LookupOutputTabs>
-                        ) : (
+                        {renderWithLookupWrapper(
+                          {
+                            promptId,
+                            profileManagerId: profileId,
+                            defaultLlmProfile,
+                            promptOutputId: promptOutputData?.promptOutputId,
+                          },
                           <DisplayPromptResult
                             output={promptOutputData?.output}
                             profileId={profileId}
@@ -501,7 +476,7 @@ function PromptOutput({
                             }
                             promptDetails={promptDetails}
                             progressMsg={progressMsg}
-                          />
+                          />,
                         )}
                         <div className="prompt-profile-run">
                           <CopyPromptOutputBtn
diff --git a/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx b/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
index 3f6f43733f..b3b1d0a014 100644
--- a/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
+++ b/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
@@ -90,9 +90,11 @@ try {
 }
 
 let lookupStudioEnabled = false;
+let PromptStudioPopoverContent = null;
 try {
-  await import("../../../plugins/lookup-studio");
+  const mod = await import("../../../plugins/lookup-studio");
   lookupStudioEnabled = true;
+  PromptStudioPopoverContent = mod.PromptStudioPopoverContent;
 } catch {
   // Plugin unavailable
 }
@@ -266,45 +268,6 @@ HITLPopoverContent.propTypes = {
   navigate: PropTypes.func.isRequired,
 };
 
-const PROMPT_STUDIO_MENU_ITEMS = [
-  { key: "projects", label: "Projects", subPath: "/tools" },
-  { key: "lookups", label: "Look-Ups", subPath: "/lookups" },
-];
-
-const getActivePromptStudioKey = (orgName) => {
-  const currentPath = globalThis.location.pathname;
-  if (currentPath.startsWith(`/${orgName}/lookups`)) {
-    return "lookups";
-  }
-  return "projects";
-};
-
-const PromptStudioPopoverContent = ({ orgName, navigate }) => {
-  const activeKey = getActivePromptStudioKey(orgName);
-
-  return (
-    <nav className="settings-sidebar-popover">
-      {PROMPT_STUDIO_MENU_ITEMS.map((menuItem) => (
-        <button
-          key={menuItem.key}
-          type="button"
-          className={`settings-menu-item ${
-            activeKey === menuItem.key ? "active" : ""
-          }`}
-          onClick={() => navigate(`/${orgName}${menuItem.subPath}`)}
-        >
-          {menuItem.label}
-        </button>
-      ))}
-    </nav>
-  );
-};
-
-PromptStudioPopoverContent.propTypes = {
-  orgName: PropTypes.string.isRequired,
-  navigate: PropTypes.func.isRequired,
-};
-
 const SideNavBar = ({ collapsed, setCollapsed }) => {
   const navigate = useNavigate();
   const { sessionDetails } = useSessionStore();
diff --git a/frontend/src/helpers/SocketContext.js b/frontend/src/helpers/SocketContext.js
index ec6a274e9e..6e6ace9a63 100644
--- a/frontend/src/helpers/SocketContext.js
+++ b/frontend/src/helpers/SocketContext.js
@@ -16,7 +16,7 @@ const SocketProvider = ({ children }) => {
     // This ensures session cookies are sent (same-origin) and avoids
     // cross-origin WebSocket issues.
     const newSocket = io(getBaseUrl(), {
-      transports: ["websocket", "polling"],
+      transports: ["websocket"],
       path: "/api/v1/socket",
     });
     setSocket(newSocket);
diff --git a/workers/executor/executors/plugins/protocols.py b/workers/executor/executors/plugins/protocols.py
index a5ed148a5b..9ce1c5eb9e 100644
--- a/workers/executor/executors/plugins/protocols.py
+++ b/workers/executor/executors/plugins/protocols.py
@@ -55,4 +55,4 @@ def run(self, **kwargs: Any) -> dict: ...
 class LookupEnrichmentProtocol(Protocol):
     """Legacy executor: post-extraction lookup enrichment."""
 
-    def run(self) -> str | None: ...
+    def run(self) -> None: ...

From ae4ba0a130d1aee7914750d7f7a7773590a7e8fe Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 7 Apr 2026 19:45:01 +0530
Subject: [PATCH 14/57] UN-2946 [UI] Replace sidebar popover with in-page tabs
 for Lookups

Move Prompt Studio / Look-Ups navigation from a hover popover on the
sidebar into a Segmented control within the ToolNavBar. CustomTools
dynamically imports LookupList from the plugin and renders tabs when
available, falling back to projects-only view in OSS mode.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 .../list-of-tools/ListOfTools.jsx             | 13 +++-
 .../navigations/side-nav-bar/SideNavBar.jsx   | 73 ++-----------------
 .../navigations/tool-nav-bar/ToolNavBar.jsx   |  3 +
 frontend/src/pages/CustomTools.jsx            | 30 +++++++-
 4 files changed, 48 insertions(+), 71 deletions(-)

diff --git a/frontend/src/components/custom-tools/list-of-tools/ListOfTools.jsx b/frontend/src/components/custom-tools/list-of-tools/ListOfTools.jsx
index dd1e55853b..86ab15ab16 100644
--- a/frontend/src/components/custom-tools/list-of-tools/ListOfTools.jsx
+++ b/frontend/src/components/custom-tools/list-of-tools/ListOfTools.jsx
@@ -48,7 +48,7 @@ DefaultCustomButtons.propTypes = {
   handleNewProjectBtnClick: PropTypes.func.isRequired,
 };
 
-function ListOfTools() {
+function ListOfTools({ segmentOptions, segmentValue, onSegmentChange }) {
   const [isListLoading, setIsListLoading] = useState(false);
   const [openAddTool, setOpenAddTool] = useState(false);
   const [openImportTool, setOpenImportTool] = useState(false);
@@ -373,12 +373,15 @@ function ListOfTools() {
   return (
     <>
       <ToolNavBar
-        title={"Prompt Studio"}
+        title="Prompt Studio"
         enableSearch
         onSearch={onSearch}
         searchList={listOfTools}
         setSearchList={setFilteredListOfTools}
         customButtons={customButtonsElement}
+        segmentOptions={segmentOptions}
+        segmentValue={segmentValue}
+        segmentFilter={onSegmentChange}
       />
       <div className="list-of-tools-layout">
         <div className="list-of-tools-island">{defaultContent}</div>
@@ -412,4 +415,10 @@ function ListOfTools() {
   );
 }
 
+ListOfTools.propTypes = {
+  segmentOptions: PropTypes.arrayOf(PropTypes.string),
+  segmentValue: PropTypes.string,
+  onSegmentChange: PropTypes.func,
+};
+
 export { ListOfTools };
diff --git a/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx b/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
index b3b1d0a014..7cecc20333 100644
--- a/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
+++ b/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
@@ -90,11 +90,9 @@ try {
 }
 
 let lookupStudioEnabled = false;
-let PromptStudioPopoverContent = null;
 try {
-  const mod = await import("../../../plugins/lookup-studio");
+  await import("../../../plugins/lookup-studio");
   lookupStudioEnabled = true;
-  PromptStudioPopoverContent = mod.PromptStudioPopoverContent;
 } catch {
   // Plugin unavailable
 }
@@ -516,11 +514,13 @@ const SideNavBar = ({ collapsed, setCollapsed }) => {
     });
   }
 
-  // Mark Prompt Studio item for popover rendering when lookups plugin is available
+  // Extend Prompt Studio active state to include /lookups paths
   if (lookupStudioEnabled && isUnstract) {
     const psItem = data[0]?.subMenu?.find((el) => el.id === 1.1);
     if (psItem) {
-      psItem.hasLookupPopover = true;
+      psItem.active =
+        psItem.active ||
+        globalThis.location.pathname.startsWith(`/${orgName}/lookups`);
     }
   }
 
@@ -718,69 +718,6 @@ const SideNavBar = ({ collapsed, setCollapsed }) => {
                       );
                     }
 
-                    // Prompt Studio with Look-Ups popover
-                    if (el.hasLookupPopover) {
-                      const psContent = (
-                        <Tooltip title={collapsed ? el.title : ""}>
-                          <Space
-                            className={`space-styles ${
-                              el.active ||
-                              globalThis.location.pathname.startsWith(
-                                `/${orgName}/lookups`,
-                              )
-                                ? "space-styles-active"
-                                : ""
-                            } ${el.disable ? "space-styles-disable" : ""}`}
-                            onClick={() => {
-                              if (!el.disable) {
-                                navigate(el.path);
-                              }
-                            }}
-                            data-testid="sidebar-prompt-studio"
-                          >
-                            <Image
-                              src={el.image}
-                              alt="side_icon"
-                              className="menu-item-icon"
-                              preview={false}
-                            />
-                            {!collapsed && (
-                              <div>
-                                <Typography className="sidebar-item-text fs-14">
-                                  {el.title}
-                                </Typography>
-                                <Typography className="sidebar-item-text fs-11">
-                                  {el.description}
-                                </Typography>
-                              </div>
-                            )}
-                          </Space>
-                        </Tooltip>
-                      );
-
-                      if (el.disable) {
-                        return <div key={el.id}>{psContent}</div>;
-                      }
-
-                      return (
-                        <Popover
-                          key={el.id}
-                          content={
-                            <PromptStudioPopoverContent
-                              orgName={orgName}
-                              navigate={navigate}
-                            />
-                          }
-                          trigger="hover"
-                          placement="rightTop"
-                          arrow={false}
-                          overlayClassName="settings-popover-overlay"
-                        >
-                          {psContent}
-                        </Popover>
-                      );
-                    }
-
                     return (
                       <Tooltip key={el.id} title={collapsed ? el.title : ""}>
                         <Space
diff --git a/frontend/src/components/navigations/tool-nav-bar/ToolNavBar.jsx b/frontend/src/components/navigations/tool-nav-bar/ToolNavBar.jsx
index 999630d596..677fba8a1e 100644
--- a/frontend/src/components/navigations/tool-nav-bar/ToolNavBar.jsx
+++ b/frontend/src/components/navigations/tool-nav-bar/ToolNavBar.jsx
@@ -19,6 +19,7 @@ function ToolNavBar({
   onNavigateBack,
   segmentFilter,
   segmentOptions,
+  segmentValue,
   onSearch,
   searchKey,
 }) {
@@ -79,6 +80,7 @@ function ToolNavBar({
         {segmentFilter && segmentOptions && (
           <Segmented
             options={segmentOptions}
+            value={segmentValue}
             onChange={segmentFilter}
             className="tool-nav-bar__segment"
           />
@@ -111,6 +113,7 @@ ToolNavBar.propTypes = {
   previousRouteState: PropTypes.object,
   onNavigateBack: PropTypes.func,
   segmentOptions: PropTypes.array,
+  segmentValue: PropTypes.string,
   segmentFilter: PropTypes.func,
   onSearch: PropTypes.func,
   searchKey: PropTypes.string,
diff --git a/frontend/src/pages/CustomTools.jsx b/frontend/src/pages/CustomTools.jsx
index bd177301c7..1f6c2d3934 100644
--- a/frontend/src/pages/CustomTools.jsx
+++ b/frontend/src/pages/CustomTools.jsx
@@ -1,7 +1,56 @@
+import { useEffect, useState } from "react";
+
 import { ListOfTools } from "../components/custom-tools/list-of-tools/ListOfTools";
 
+// Segment labels; the first entry is the default tab.
+const TAB_OPTIONS = ["Projects", "Look-Ups"];
+
+/**
+ * Prompt Studio landing page.
+ *
+ * Shows the projects list on its own until the optional lookup-studio
+ * plugin has loaded (or when it is unavailable), and a Projects /
+ * Look-Ups segmented view once it has.
+ */
 function CustomTools() {
-  return <ListOfTools />;
+  const [LookupListComp, setLookupListComp] = useState(null);
+  const [activeTab, setActiveTab] = useState(TAB_OPTIONS[0]);
+
+  useEffect(() => {
+    // Ignore a late import result if the page has already unmounted.
+    let isMounted = true;
+    import("../plugins/lookup-studio")
+      .then((mod) => {
+        if (isMounted) {
+          // Wrap in a function: React would otherwise invoke the component
+          // itself as a state updater.
+          setLookupListComp(() => mod.LookupList);
+        }
+      })
+      .catch(() => {
+        // Plugin unavailable (OSS mode): keep the projects-only view.
+      });
+    return () => {
+      isMounted = false;
+    };
+  }, []);
+
+  // No lookup plugin = just render projects list (OSS mode)
+  if (!LookupListComp) {
+    return <ListOfTools />;
+  }
+
+  const tabProps = {
+    segmentOptions: TAB_OPTIONS,
+    segmentValue: activeTab,
+    onSegmentChange: setActiveTab,
+  };
+
+  return activeTab === TAB_OPTIONS[0] ? (
+    <ListOfTools {...tabProps} />
+  ) : (
+    <LookupListComp {...tabProps} />
+  );
 }
 
 export { CustomTools };

From 8aa675884b51ca610f3e2f64acd416f1848e4724 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Wed, 8 Apr 2026 16:42:08 +0530
Subject: [PATCH 15/57] UN-2946 [FEAT] Deferred batch usage tracking with
 operation metrics

Switch from eager per-call Audit HTTP push to a deferred batch write
pattern for adapter usage. LLM/embedding calls stash records in-memory;
the executor flushes them into ExecutionResult metadata; the Celery task
batch-writes via a new internal endpoint.

Adds 5 nullable columns to Usage (reference_id, reference_type,
execution_time_ms, status, error_message) and a composite index for
lookup dashboard queries. Extensible choice lists allow cloud plugins
to register additional usage reasons and reference types.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 backend/usage_v2/internal_urls.py             |  5 +
 backend/usage_v2/internal_views.py            | 41 +++++++++
 .../0004_add_lookup_usage_reason.py           | 28 ------
 .../migrations/0004_usage_metrics_fields.py   | 90 ++++++++++++++++++
 backend/usage_v2/models.py                    | 86 ++++++++++++++++--
 unstract/sdk1/src/unstract/sdk1/llm.py        | 91 ++++++++++++++-----
 .../sdk1/src/unstract/sdk1/usage_handler.py   | 46 ++++++++--
 .../sdk1/src/unstract/sdk1/utils/common.py    |  7 ++
 workers/executor/executors/legacy_executor.py | 18 ++++
 workers/executor/executors/usage.py           | 81 -----------------
 workers/executor/tasks.py                     | 21 +++++
 workers/shared/clients/usage_client.py        | 25 +++++
 12 files changed, 390 insertions(+), 149 deletions(-)
 delete mode 100644 backend/usage_v2/migrations/0004_add_lookup_usage_reason.py
 create mode 100644 backend/usage_v2/migrations/0004_usage_metrics_fields.py
 delete mode 100644 workers/executor/executors/usage.py

diff --git a/backend/usage_v2/internal_urls.py b/backend/usage_v2/internal_urls.py
index b5a8675554..e7e0082e99 100644
--- a/backend/usage_v2/internal_urls.py
+++ b/backend/usage_v2/internal_urls.py
@@ -17,4 +17,9 @@
         internal_views.PagesProcessedInternalView.as_view(),
         name="aggregated-pages-processed",
     ),
+    path(
+        "batch/",
+        internal_views.UsageBatchCreateView.as_view(),
+        name="usage-batch-create",
+    ),
 ]
diff --git a/backend/usage_v2/internal_views.py b/backend/usage_v2/internal_views.py
index 3c28779c56..ca6642b443 100644
--- a/backend/usage_v2/internal_views.py
+++ b/backend/usage_v2/internal_views.py
@@ -6,10 +6,12 @@
 from rest_framework import status
 from rest_framework.request import Request
 from rest_framework.views import APIView
+from utils.user_context import UserContext
 
 from unstract.core.data_models import UsageResponseData
 
 from .helper import UsageHelper
+from .models import Usage
 
 logger = logging.getLogger(__name__)
 
@@ -133,3 +135,76 @@ def get(self, request: Request, file_execution_id: str) -> JsonResponse:
                 },
                 status=status.HTTP_500_INTERNAL_SERVER_ERROR,
             )
+
+
+class UsageBatchCreateView(APIView):
+    """Bulk create usage records from worker finalization.
+
+    Accepts a JSON object shaped like ``{"records": [{...}, ...]}`` and stores
+    every record against the organization resolved for the request.
+    """
+
+    @staticmethod
+    def _blank_to_none(value: object) -> object:
+        """Map ``""`` to ``None``; return any other value unchanged."""
+        return None if value == "" else value
+
+    def post(self, request: Request) -> JsonResponse:
+        """Insert the posted usage records with one ``bulk_create`` call.
+
+        Returns:
+            ``{"created": 0}`` (200) when no records are supplied,
+            ``{"created": <count>}`` (201) after the insert, or
+            ``{"error": ...}`` (400) when the body is not an object holding
+            a list of record objects.
+        """
+        payload = request.data
+        if not isinstance(payload, dict):
+            return JsonResponse(
+                {"error": "Request body must be a JSON object"},
+                status=status.HTTP_400_BAD_REQUEST,
+            )
+
+        records = payload.get("records", [])
+        if not records:
+            return JsonResponse({"created": 0}, status=200)
+        if not isinstance(records, list) or not all(
+            isinstance(record, dict) for record in records
+        ):
+            return JsonResponse(
+                {"error": "'records' must be a list of objects"},
+                status=status.HTTP_400_BAD_REQUEST,
+            )
+
+        # Resolved by InternalAPIAuthMiddleware via StateStore
+        organization = UserContext.get_organization()
+
+        # Workers may send "" for an absent identifier (the SDK defaults run_id
+        # to ""). reference_id is a UUIDField and cannot store that, so blank
+        # identifiers are written as NULL.
+        to_none = self._blank_to_none
+        usage_objects = [
+            Usage(
+                organization=organization,
+                workflow_id=record.get("workflow_id", ""),
+                execution_id=record.get("execution_id", ""),
+                adapter_instance_id=record.get("adapter_instance_id", ""),
+                run_id=to_none(record.get("run_id")),
+                usage_type=record.get("usage_type", "llm"),
+                llm_usage_reason=record.get("llm_usage_reason", ""),
+                model_name=record.get("model_name", ""),
+                embedding_tokens=record.get("embedding_tokens", 0),
+                prompt_tokens=record.get("prompt_tokens", 0),
+                completion_tokens=record.get("completion_tokens", 0),
+                total_tokens=record.get("total_tokens", 0),
+                cost_in_dollars=record.get("cost_in_dollars", 0.0),
+                reference_id=to_none(record.get("reference_id")),
+                reference_type=to_none(record.get("reference_type")),
+                execution_time_ms=record.get("execution_time_ms"),
+                status=record.get("status"),
+                error_message=record.get("error_message"),
+            )
+            for record in records
+        ]
+        created = Usage.objects.bulk_create(usage_objects)
+        return JsonResponse({"created": len(created)}, status=201)
diff --git a/backend/usage_v2/migrations/0004_add_lookup_usage_reason.py b/backend/usage_v2/migrations/0004_add_lookup_usage_reason.py
deleted file mode 100644
index 76c628d9ee..0000000000
--- a/backend/usage_v2/migrations/0004_add_lookup_usage_reason.py
+++ /dev/null
@@ -1,28 +0,0 @@
-# Generated by Django 4.2.1 on 2026-04-03 22:44
-
-from django.db import migrations, models
-
-
-class Migration(migrations.Migration):
-    dependencies = [
-        ("usage_v2", "0003_usage_usage_executi_4deb35_idx"),
-    ]
-
-    operations = [
-        migrations.AlterField(
-            model_name="usage",
-            name="llm_usage_reason",
-            field=models.CharField(
-                blank=True,
-                choices=[
-                    ("extraction", "Extraction"),
-                    ("challenge", "Challenge"),
-                    ("summarize", "Summarize"),
-                    ("lookup", "Lookup"),
-                ],
-                db_comment="Reason for LLM usage. Empty if usage_type is 'embedding'. ",
-                max_length=255,
-                null=True,
-            ),
-        ),
-    ]
diff --git a/backend/usage_v2/migrations/0004_usage_metrics_fields.py b/backend/usage_v2/migrations/0004_usage_metrics_fields.py
new file mode 100644
index 0000000000..03174f0677
--- /dev/null
+++ b/backend/usage_v2/migrations/0004_usage_metrics_fields.py
@@ -0,0 +1,104 @@
+from django.db import migrations, models
+
+
+class Migration(migrations.Migration):
+    """Add operation-metric columns and a lookup index to ``usage``.
+
+    Re-declares ``llm_usage_reason`` with the three base choices, adds the
+    nullable ``reference_id``, ``reference_type``, ``execution_time_ms``,
+    ``status`` and ``error_message`` columns, and creates the
+    ``idx_usage_reason_ref_created`` composite index.
+    """
+
+    # NOTE(review): this file takes the 0004 slot previously used by the removed
+    # 0004_add_lookup_usage_reason migration; confirm that no database has that
+    # migration recorded as applied.
+    dependencies = [
+        ("usage_v2", "0003_usage_usage_executi_4deb35_idx"),
+    ]
+
+    operations = [
+        # Only the base llm_usage_reason choices are recorded here; plugins
+        # append theirs to the model's choice list when it is imported.
+        # NOTE(review): with a plugin installed, makemigrations may therefore
+        # see a choices difference on this field - confirm how that is handled.
+        migrations.AlterField(
+            model_name="usage",
+            name="llm_usage_reason",
+            field=models.CharField(
+                blank=True,
+                choices=[
+                    ("extraction", "Extraction"),
+                    ("challenge", "Challenge"),
+                    ("summarize", "Summarize"),
+                ],
+                db_comment="Reason for LLM usage. Empty if usage_type is 'embedding'. ",
+                max_length=255,
+                null=True,
+            ),
+        ),
+        migrations.AddField(
+            model_name="usage",
+            name="reference_id",
+            field=models.UUIDField(
+                blank=True,
+                db_comment=(
+                    "Polymorphic correlation ID (no FK constraint) linking to the "
+                    "entity that triggered this usage. Interpret via reference_type. "
+                    "OSS values: prompt_key UUID. "
+                    "NULL for most operations; survives entity deletion."
+                ),
+                null=True,
+            ),
+        ),
+        migrations.AddField(
+            model_name="usage",
+            name="reference_type",
+            field=models.CharField(
+                blank=True,
+                choices=[("prompt_key", "Prompt Key")],
+                db_comment=(
+                    "Discriminator for reference_id. "
+                    "OSS values: 'prompt_key'. "
+                    "NULL when reference_id is NULL."
+                ),
+                max_length=64,
+                null=True,
+            ),
+        ),
+        migrations.AddField(
+            model_name="usage",
+            name="execution_time_ms",
+            field=models.IntegerField(
+                blank=True,
+                db_comment="Wall-clock time for the operation in milliseconds",
+                null=True,
+            ),
+        ),
+        migrations.AddField(
+            model_name="usage",
+            name="status",
+            field=models.CharField(
+                blank=True,
+                db_comment="Operation outcome: SUCCESS, ERROR, or SKIPPED",
+                max_length=16,
+                null=True,
+            ),
+        ),
+        migrations.AddField(
+            model_name="usage",
+            name="error_message",
+            field=models.TextField(
+                blank=True,
+                db_comment="Error details when status is ERROR",
+                null=True,
+            ),
+        ),
+        migrations.AddIndex(
+            model_name="usage",
+            index=models.Index(
+                fields=["llm_usage_reason", "reference_id", "-created_at"],
+                name="idx_usage_reason_ref_created",
+            ),
+        ),
+    ]
diff --git a/backend/usage_v2/models.py b/backend/usage_v2/models.py
index dc983c56b5..365fdc956b 100644
--- a/backend/usage_v2/models.py
+++ b/backend/usage_v2/models.py
@@ -1,3 +1,4 @@
+import logging
 import uuid
 
 from django.db import models
@@ -7,17 +8,48 @@
     DefaultOrganizationMixin,
 )
 
+logger = logging.getLogger(__name__)
+
 
 class UsageType(models.TextChoices):
     LLM = "llm", "LLM Usage"
     EMBEDDING = "embedding", "Embedding Usage"
 
 
-class LLMUsageReason(models.TextChoices):
-    EXTRACTION = "extraction", "Extraction"
-    CHALLENGE = "challenge", "Challenge"
-    SUMMARIZE = "summarize", "Summarize"
-    LOOKUP = "lookup", "Lookup"
+# ── Extensible choice lists ─────────────────────────────────────────
+# OSS defines base values. Cloud plugins append via try-import so that
+# Django validation accepts cloud-specific values when the plugin is
+# installed, without leaking cloud details into OSS code.
+
+_LLM_USAGE_REASON_CHOICES: list[tuple[str, str]] = [
+    ("extraction", "Extraction"),
+    ("challenge", "Challenge"),
+    ("summarize", "Summarize"),
+]
+
+_REFERENCE_TYPE_CHOICES: list[tuple[str, str]] = [
+    ("prompt_key", "Prompt Key"),
+]
+
+try:
+    from pluggable_apps.lookup_v1.constants import (
+        CLOUD_LLM_USAGE_REASON_CHOICES,
+        CLOUD_REFERENCE_TYPE_CHOICES,
+    )
+
+    _LLM_USAGE_REASON_CHOICES.extend(CLOUD_LLM_USAGE_REASON_CHOICES)
+    _REFERENCE_TYPE_CHOICES.extend(CLOUD_REFERENCE_TYPE_CHOICES)
+except ImportError:
+    # Plugin not importable: keep the base choices only.
+    pass
+except Exception:
+    # Any other failure is logged and the lists are left as they stand.
+    logger.warning("Failed to load cloud usage choices", exc_info=True)
+
+# Public names used for the ``choices=`` of Usage.llm_usage_reason and
+# Usage.reference_type; they are the same list objects as above, not copies.
+LLM_USAGE_REASON_CHOICES = _LLM_USAGE_REASON_CHOICES
+REFERENCE_TYPE_CHOICES = _REFERENCE_TYPE_CHOICES
 
 
 class UsageModelManager(DefaultOrganizationManagerMixin, models.Manager):
@@ -25,6 +53,11 @@ class UsageModelManager(DefaultOrganizationManagerMixin, models.Manager):
 
 
 class Usage(DefaultOrganizationMixin, BaseModel):
+    # reference_type → reference_id mapping (no FK constraint):
+    #   "prompt_key"  → ToolStudioPrompt UUID (OSS)
+    #   Cloud plugins register additional types via CLOUD_REFERENCE_TYPE_CHOICES.
+    # Usage records survive entity deletion.
+
     id = models.UUIDField(
         primary_key=True,
         default=uuid.uuid4,
@@ -53,7 +86,7 @@ class Usage(DefaultOrganizationMixin, BaseModel):
     )
     llm_usage_reason = models.CharField(
         max_length=255,
-        choices=LLMUsageReason.choices,
+        choices=LLM_USAGE_REASON_CHOICES,
         null=True,
         blank=True,
         db_comment="Reason for LLM usage. Empty if usage_type is 'embedding'. ",
@@ -68,6 +101,43 @@ class Usage(DefaultOrganizationMixin, BaseModel):
     )
     total_tokens = models.IntegerField(db_comment="Total number of tokens used")
     cost_in_dollars = models.FloatField(db_comment="Total number of tokens used")
+    reference_id = models.UUIDField(
+        null=True,
+        blank=True,
+        db_comment=(
+            "Polymorphic correlation ID (no FK constraint) linking to the "
+            "entity that triggered this usage. Interpret via reference_type. "
+            "OSS values: prompt_key UUID. "
+            "NULL for most operations; survives entity deletion."
+        ),
+    )
+    reference_type = models.CharField(
+        max_length=64,
+        choices=REFERENCE_TYPE_CHOICES,
+        null=True,
+        blank=True,
+        db_comment=(
+            "Discriminator for reference_id. "
+            "OSS values: 'prompt_key'. "
+            "NULL when reference_id is NULL."
+        ),
+    )
+    execution_time_ms = models.IntegerField(
+        null=True,
+        blank=True,
+        db_comment="Wall-clock time for the operation in milliseconds",
+    )
+    status = models.CharField(
+        max_length=16,
+        null=True,
+        blank=True,
+        db_comment="Operation outcome: SUCCESS, ERROR, or SKIPPED",
+    )
+    error_message = models.TextField(
+        null=True,
+        blank=True,
+        db_comment="Error details when status is ERROR",
+    )
     # Manager
     objects = UsageModelManager()
 
@@ -79,4 +149,8 @@ class Meta:
         indexes = [
             models.Index(fields=["run_id"]),
             models.Index(fields=["execution_id"]),
+            models.Index(
+                fields=["llm_usage_reason", "reference_id", "-created_at"],
+                name="idx_usage_reason_ref_created",
+            ),
         ]
diff --git a/unstract/sdk1/src/unstract/sdk1/llm.py b/unstract/sdk1/src/unstract/sdk1/llm.py
index f751e7f87c..56b27dc163 100644
--- a/unstract/sdk1/src/unstract/sdk1/llm.py
+++ b/unstract/sdk1/src/unstract/sdk1/llm.py
@@ -9,11 +9,10 @@
 import litellm
 
 # from litellm import get_supported_openai_params
-from litellm import get_max_tokens, token_counter
+from litellm import get_max_tokens
 from pydantic import ValidationError
 from unstract.sdk1.adapters.constants import Common
 from unstract.sdk1.adapters.llm1 import adapters
-from unstract.sdk1.audit import Audit
 from unstract.sdk1.constants import Common as SdkCommon
 from unstract.sdk1.constants import ToolEnv
 from unstract.sdk1.exceptions import LLMError, SdkError, strip_litellm_prefix
@@ -21,7 +20,6 @@
 from unstract.sdk1.tool.base import BaseTool
 from unstract.sdk1.utils.common import (
     LLMResponseCompat,
-    TokenCounterCompat,
     capture_metrics,
 )
 from unstract.sdk1.utils.retry_utils import (
@@ -211,7 +209,7 @@ def __init__(  # noqa: C901
         if capture_metrics_from_platform is not None:
             self._capture_metrics = capture_metrics_from_platform
         self._metrics: dict[str, object] = {}
-        self._last_usage: Mapping[str, int] = {}
+        self._pending_usage: list[dict] = []
 
     def _get_adapter_info(self) -> str:
         """Build a display string identifying this adapter for errors."""
@@ -555,11 +553,42 @@ def get_metrics(self) -> dict[str, object]:
 
     def get_last_usage(self) -> Mapping[str, int]:
-        """Token usage from the most recent complete() call."""
-        return self._last_usage
+        """Token usage from the most recent complete() call.
+
+        Returns:
+            A mapping with ``prompt_tokens``, ``completion_tokens`` and
+            ``total_tokens``; empty when no call has been recorded. The
+            counts remain available after flush_pending_usage().
+        """
+        if self._pending_usage:
+            return self._token_counts(self._pending_usage[-1])
+        # Nothing pending: use the snapshot kept by flush_pending_usage().
+        return getattr(self, "_last_usage", {})
+
+    @staticmethod
+    def _token_counts(record: Mapping[str, int]) -> dict[str, int]:
+        """Pick the three token counters out of a usage record."""
+        return {
+            "prompt_tokens": record["prompt_tokens"],
+            "completion_tokens": record["completion_tokens"],
+            "total_tokens": record["total_tokens"],
+        }
 
     def get_usage_reason(self) -> object:
         return self.platform_kwargs.get("llm_usage_reason")
 
+    def flush_pending_usage(self) -> list[dict]:
+        """Return and clear all pending usage records.
+
+        Called by the executor at finalization to collect records for batch write.
+        The token counts of the newest record are kept so get_last_usage() can
+        still report them afterwards.
+        """
+        records = self._pending_usage
+        if records:
+            self._last_usage = self._token_counts(records[-1])
+        self._pending_usage = []
+        return records
+
     def _record_usage(
         self,
         model: str,
@@ -567,29 +581,52 @@ def _record_usage(
         usage: Mapping[str, int] | None,
         llm_api: str,
     ) -> None:
-        prompt_tokens = token_counter(model=model, messages=messages)
         usage_data: Mapping[str, int] = usage or {}
-        all_tokens = TokenCounterCompat(
-            prompt_tokens=usage_data.get("prompt_tokens", 0),
-            completion_tokens=usage_data.get("completion_tokens", 0),
-            total_tokens=usage_data.get("total_tokens", 0),
+        prompt_tokens = usage_data.get("prompt_tokens", 0)
+        completion_tokens = usage_data.get("completion_tokens", 0)
+        total_tokens = usage_data.get("total_tokens", 0)
+
+        logger.info(
+            "[sdk1][LLM][%s][%s] Usage: prompt=%d completion=%d total=%d",
+            model,
+            llm_api,
+            prompt_tokens,
+            completion_tokens,
+            total_tokens,
         )
 
-        logger.info(f"[sdk1][LLM][{model}][{llm_api}] Prompt Tokens: {prompt_tokens}")
-        logger.info(f"[sdk1][LLM][{model}][{llm_api}] LLM Usage: {all_tokens}")
-
-        self._last_usage = {
-            "prompt_tokens": all_tokens.prompt_llm_token_count,
-            "completion_tokens": all_tokens.completion_llm_token_count,
-            "total_tokens": all_tokens.total_llm_token_count,
-        }
-
-        Audit().push_usage_data(
-            platform_api_key=self._platform_api_key,
-            token_counter=all_tokens,
-            event_type="llm",
-            model_name=model,
-            kwargs={"provider": self.adapter.get_provider(), **self.platform_kwargs},
+        try:
+            prompt_cost, compl_cost = litellm.cost_per_token(
+                model=model,
+                prompt_tokens=prompt_tokens,
+                completion_tokens=completion_tokens,
+            )
+            cost = prompt_cost + compl_cost
+        except Exception:
+            cost = 0.0
+
+        # Strip provider prefix (e.g. "azure/gpt-4o" → "gpt-4o") for storage,
+        # matching the old Audit.push_usage_data() behavior.
+        display_model = model.split("/", 1)[-1] if model else model
+
+        self._pending_usage.append(
+            {
+                "usage_type": "llm",
+                "model_name": display_model,
+                "provider": self.adapter.get_provider(),
+                "adapter_instance_id": self.platform_kwargs.get(
+                    "adapter_instance_id", ""
+                ),
+                "run_id": self.platform_kwargs.get("run_id", ""),
+                "execution_id": self.platform_kwargs.get("execution_id", ""),
+                "llm_usage_reason": self.platform_kwargs.get("llm_usage_reason", ""),
+                "prompt_tokens": prompt_tokens,
+                "completion_tokens": completion_tokens,
+                "total_tokens": total_tokens,
+                "embedding_tokens": 0,
+                "cost_in_dollars": cost,
+                "status": "SUCCESS",
+            }
         )
 
     # Finish reasons indicating a safety/policy refusal across providers:
@@ -982,6 +1019,10 @@ def get_usage_reason(self) -> object:
         """Get usage reason from platform kwargs."""
         return self._llm_instance.get_usage_reason()
 
+    def flush_pending_usage(self) -> list[dict]:
+        """Return and clear the pending usage records of the wrapped LLM."""
+        return self._llm_instance.flush_pending_usage()
+
     def test_connection(self) -> bool:
         """Test connection to the LLM provider."""
         return self._llm_instance.test_connection()
diff --git a/unstract/sdk1/src/unstract/sdk1/usage_handler.py b/unstract/sdk1/src/unstract/sdk1/usage_handler.py
index 0ffa7c43e2..44a819b44c 100644
--- a/unstract/sdk1/src/unstract/sdk1/usage_handler.py
+++ b/unstract/sdk1/src/unstract/sdk1/usage_handler.py
@@ -1,9 +1,9 @@
 from typing import Any
 
+import litellm
 from llama_index.core.callbacks import CBEventType, TokenCountingHandler
 from llama_index.core.callbacks.base_handler import BaseCallbackHandler
 from llama_index.core.embeddings import BaseEmbedding
-from unstract.sdk1.audit import Audit
 from unstract.sdk1.constants import LogLevel
 from unstract.sdk1.tool.stream import StreamMixin
 
@@ -57,6 +57,7 @@ def __init__(
         self._verbose = verbose
         self.token_counter = token_counter
         self.embed_model = embed_model
+        self._pending_usage: list[dict] = []
         self.platform_api_key = platform_api_key
         super().__init__(
             log_level=log_level,  # StreamMixin's args
@@ -102,16 +103,43 @@ def on_event_end(
             and payload is not None
         ):
             model_name = self.embed_model.model_name
-            # Need to push the data to via platform service
+            embedding_tokens = self.token_counter.total_embedding_token_count
             self.stream_log(
-                log=f"Pushing embedding usage for model {model_name}",
+                log=f"Recording embedding usage for model {model_name}",
                 level=LogLevel.DEBUG,
             )
-            Audit(log_level=self.log_level).push_usage_data(
-                platform_api_key=self.platform_api_key,
-                token_counter=self.token_counter,
-                event_type=event_type,
-                model_name=self.embed_model.model_name,
-                kwargs=self.kwargs,
+
+            try:
+                prompt_cost, _ = litellm.cost_per_token(
+                    model=model_name,
+                    prompt_tokens=embedding_tokens,
+                    completion_tokens=0,
+                )
+                cost = prompt_cost
+            except Exception:
+                cost = 0.0
+
+            display_model = model_name.split("/", 1)[-1] if model_name else model_name
+
+            self._pending_usage.append(
+                {
+                    "usage_type": "embedding",
+                    "model_name": display_model,
+                    "adapter_instance_id": self.kwargs.get("adapter_instance_id", ""),
+                    "run_id": self.kwargs.get("run_id", ""),
+                    "execution_id": self.kwargs.get("execution_id", ""),
+                    "embedding_tokens": embedding_tokens,
+                    "prompt_tokens": 0,
+                    "completion_tokens": 0,
+                    "total_tokens": 0,
+                    "cost_in_dollars": cost,
+                    "status": "SUCCESS",
+                }
             )
             self.token_counter.reset_counts()
+
+    def flush_pending_usage(self) -> list[dict]:
+        """Hand over the buffered usage records and start a fresh buffer."""
+        # Swap in a new list so the returned one is no longer appended to.
+        drained, self._pending_usage = self._pending_usage, []
+        return drained
diff --git a/unstract/sdk1/src/unstract/sdk1/utils/common.py b/unstract/sdk1/src/unstract/sdk1/utils/common.py
index 86b0f173b6..c2c3fdbca5 100644
--- a/unstract/sdk1/src/unstract/sdk1/utils/common.py
+++ b/unstract/sdk1/src/unstract/sdk1/utils/common.py
@@ -250,6 +250,13 @@ def wrapper(self: object, *args: object, **kwargs: object) -> object:
                     # If the key isn't in self._metrics, set it to new_metrics
                     self._metrics = new_metrics
 
+                # Stamp timing onto the most recent pending usage record
+                pending = getattr(self, "_pending_usage", [])
+                if pending:
+                    time_taken = new_metrics.get(time_taken_key)
+                    if time_taken is not None:
+                        pending[-1]["execution_time_ms"] = int(time_taken * 1000)
+
         return result
 
     return wrapper
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 7ccdcb656d..7a0a41a424 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -79,6 +79,7 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
         # Extract log streaming info (set by tasks.py for IDE sessions).
         self._log_events_id: str = context.log_events_id or ""
         self._log_component: dict[str, str] = getattr(context, "_log_component", {})
+        self._usage_records: list[dict[str, Any]] = []
 
         handler_name = self._OPERATION_MAP.get(context.operation)
         if handler_name is None:
@@ -107,6 +108,11 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
                 context.run_id,
                 result.success,
             )
+            # Attach collected usage records to the result metadata
+            if self._usage_records:
+                result.metadata.setdefault("usage_records", []).extend(
+                    self._usage_records
+                )
             return result
         except LegacyExecutorError as exc:
             elapsed = time.monotonic() - start
@@ -1390,6 +1396,7 @@ def _run_challenge_if_enabled(
             metadata=metadata,
         )
         challenger.run()
+        self._usage_records.extend(challenge_llm.flush_pending_usage())
         shim.stream_log(f"Challenge verification completed for: {prompt_name}")
         logger.info("Challenge completed: prompt=%s", prompt_name)
 
@@ -1702,6 +1709,15 @@ def _execute_single_prompt(
                     f"{llm.get_usage_reason()}_llm": llm.get_metrics(),
                 }
             )
+            self._usage_records.extend(llm.flush_pending_usage())
+            # Flush embedding usage from callback handlers
+            if chunk_size > 0:
+                try:
+                    for handler in embedding.callback_manager.handlers:
+                        if hasattr(handler, "flush_pending_usage"):
+                            self._usage_records.extend(handler.flush_pending_usage())
+                except Exception:
+                    pass
             if vector_db:
                 vector_db.close()
 
@@ -1901,6 +1917,7 @@ def _run_lookup_enrichment(
             prompt_name=prompt_name,
         )
         enricher.run()
+        self._usage_records.extend(llm.flush_pending_usage())
 
         metrics.setdefault(prompt_name, {})[f"{llm.get_usage_reason()}_llm"] = (
             llm.get_metrics()
@@ -2150,6 +2167,7 @@ def _handle_summarize(self, context: ExecutionContext) -> ExecutionResult:
 
             shim.stream_log("Running document summarization...")
             summary = answer_prompt_svc.run_completion(llm=llm, prompt=prompt)
+            self._usage_records.extend(llm.flush_pending_usage())
             logger.info("Summarization completed: run_id=%s", context.run_id)
             shim.stream_log("Summarization completed")
             return ExecutionResult(
diff --git a/workers/executor/executors/usage.py b/workers/executor/executors/usage.py
deleted file mode 100644
index ab6296eaeb..0000000000
--- a/workers/executor/executors/usage.py
+++ /dev/null
@@ -1,81 +0,0 @@
-"""Usage tracking helper for the executor worker.
-
-Ported from prompt-service/.../helpers/usage.py.
-Flask/DB dependencies removed — usage data is pushed via the SDK1
-``Audit`` class (HTTP to platform API) and returned directly in
-``ExecutionResult.metadata`` instead of querying the DB.
-
-Note: The SDK1 adapters (LLM, EmbeddingCompat) already call
-``Audit().push_usage_data()`` internally.  This helper is for
-explicit push calls outside of adapter operations (e.g. rent rolls).
-"""
-
-import logging
-from typing import Any
-
-logger = logging.getLogger(__name__)
-
-
-class UsageHelper:
-    @staticmethod
-    def push_usage_data(
-        event_type: str,
-        kwargs: dict[str, Any],
-        platform_api_key: str,
-        token_counter: Any = None,
-        model_name: str = "",
-    ) -> bool:
-        """Push usage data to the audit service.
-
-        Wraps ``Audit().push_usage_data()`` with validation and
-        error handling.
-
-        Args:
-            event_type: Type of usage event (e.g. "llm", "embedding").
-            kwargs: Context dict (run_id, execution_id, etc.).
-            platform_api_key: API key for platform service auth.
-            token_counter: Token counter with usage metrics.
-            model_name: Name of the model used.
-
-        Returns:
-            True if successful, False otherwise.
-        """
-        if not kwargs or not isinstance(kwargs, dict):
-            logger.error("Invalid kwargs provided to push_usage_data")
-            return False
-
-        if not platform_api_key or not isinstance(platform_api_key, str):
-            logger.error("Invalid platform_api_key provided to push_usage_data")
-            return False
-
-        try:
-            from unstract.sdk1.audit import Audit
-
-            logger.debug(
-                "Pushing usage data for event_type=%s model=%s",
-                event_type,
-                model_name,
-            )
-
-            Audit().push_usage_data(
-                platform_api_key=platform_api_key,
-                token_counter=token_counter,
-                model_name=model_name,
-                event_type=event_type,
-                kwargs=kwargs,
-            )
-
-            logger.info("Successfully pushed usage data for %s", model_name)
-            return True
-        except Exception:
-            logger.exception("Error pushing usage data")
-            return False
-
-    @staticmethod
-    def format_float_positional(value: float, precision: int = 10) -> str:
-        """Format a float without scientific notation.
-
-        Removes trailing zeros for clean display of cost values.
-        """
-        formatted: str = f"{value:.{precision}f}"
-        return formatted.rstrip("0").rstrip(".") if "." in formatted else formatted
diff --git a/workers/executor/tasks.py b/workers/executor/tasks.py
index 77d5ecaebd..ea02b7c353 100644
--- a/workers/executor/tasks.py
+++ b/workers/executor/tasks.py
@@ -6,7 +6,9 @@
 """
 
 from celery import shared_task
+from shared.clients import UsageAPIClient
 from shared.enums.task_enums import TaskName
+from shared.infrastructure.config import WorkerConfig
 from shared.infrastructure.logging import WorkerLogger
 
 from unstract.sdk1.execution.context import ExecutionContext
@@ -97,6 +99,25 @@ def execute_extraction(self, execution_context_dict: dict) -> dict:
     orchestrator = ExecutionOrchestrator()
     result = orchestrator.execute(context)
 
+    # Batch write usage records collected during execution
+    usage_records = result.metadata.get("usage_records", [])
+    if usage_records:
+        try:
+            config = WorkerConfig()
+            with UsageAPIClient(config) as usage_client:
+                usage_client.set_organization_context(context.organization_id)
+                usage_client.bulk_create_usage(
+                    usage_records,
+                    organization_id=context.organization_id,
+                )
+        except Exception:
+            logger.warning(
+                "Failed to flush %d usage records for run_id=%s",
+                len(usage_records),
+                context.run_id,
+                exc_info=True,
+            )
+
     logger.info(
         "execute_extraction complete: celery_task_id=%s request_id=%s success=%s",
         self.request.id,
diff --git a/workers/shared/clients/usage_client.py b/workers/shared/clients/usage_client.py
index a7ba8c7013..f61f65e27a 100644
--- a/workers/shared/clients/usage_client.py
+++ b/workers/shared/clients/usage_client.py
@@ -171,6 +171,31 @@ def get_aggregated_token_count(
                 message="Failed to retrieve usage data",
             )
 
+    def bulk_create_usage(
+        self, records: list[dict], organization_id: str | None = None
+    ) -> bool:
+        """Bulk create usage records at execution finalization.
+
+        Args:
+            records: List of usage record dicts to create.
+            organization_id: Optional organization ID override.
+
+        Returns:
+            True if records were created successfully.
+        """
+        if not records:
+            return True
+        try:
+            response = self.post(
+                "v1/usage/batch/",
+                data={"records": records},
+                organization_id=organization_id,
+            )
+            return response.get("success", False) or "created" in response
+        except Exception as e:
+            logger.error("Failed to bulk create usage records: %s", e)
+            return False
+
     def get_aggregated_pages_processed(
         self, file_execution_id: str | uuid.UUID, organization_id: str | None = None
     ) -> int | None:

From 0d29c9d631594c1acf19dec3f248264fd34cc80f Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Fri, 10 Apr 2026 14:15:22 +0530
Subject: [PATCH 16/57] UN-2946 [FEAT] Add plugin hook for lookup output
 enrichment in serializer

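Add an enrich_prompt_output() bridge function in lookup_utils.py that lets
cloud plugins enrich PromptStudioOutputSerializer output with lookup data
(enriched output, lookup name); it is a no-op in OSS. This enables real-time
lookup results via WebSocket without a page refresh.

persist_lookup_output() now also stores the lookup version_id when the
lookup metadata provides one.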

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 backend/prompt_studio/lookup_utils.py         | 27 ++++++++++++++++---
 .../serializers.py                            |  3 +++
 2 files changed, 26 insertions(+), 4 deletions(-)

diff --git a/backend/prompt_studio/lookup_utils.py b/backend/prompt_studio/lookup_utils.py
index 823d9fc015..10783e405c 100644
--- a/backend/prompt_studio/lookup_utils.py
+++ b/backend/prompt_studio/lookup_utils.py
@@ -29,17 +29,36 @@ def persist_lookup_output(prompt_output, prompt_lookup: dict) -> None:
         lookup_meta = prompt_lookup.get("meta", {})
         lookup_id = lookup_meta.get("lookup_id")
         if lookup_id:
+            defaults = {
+                "lookup_definition_id": lookup_id,
+                "output": prompt_lookup.get("enriched", ""),
+            }
+            version_id = lookup_meta.get("version_id")
+            if version_id:
+                defaults["version_id"] = version_id
             LookupOutputResult.objects.update_or_create(
                 prompt_output=prompt_output,
-                defaults={
-                    "lookup_definition_id": lookup_id,
-                    "output": prompt_lookup.get("enriched", ""),
-                },
+                defaults=defaults,
             )
     except ImportError:
         pass
 
 
+def enrich_prompt_output(prompt_output, data: dict) -> dict:
+    """Let cloud plugins enrich serialized prompt output with lookup data.
+
+    No-op in OSS.
+    """
+    try:
+        from pluggable_apps.lookup_v1.output_enrichment import (
+            enrich_with_lookup_output,
+        )
+
+        return enrich_with_lookup_output(prompt_output, data)
+    except ImportError:
+        return data
+
+
 def validate_lookups_for_export(prompts) -> tuple[dict, str | None]:
     """Validate lookup assignments before export. Returns ({}, None) in OSS."""
     try:
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/serializers.py b/backend/prompt_studio/prompt_studio_output_manager_v2/serializers.py
index 275e4a0956..e4276dbb23 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/serializers.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/serializers.py
@@ -4,6 +4,7 @@
 from usage_v2.helper import UsageHelper
 
 from backend.serializers import AuditSerializer
+from prompt_studio.lookup_utils import enrich_prompt_output
 
 from .models import PromptStudioOutputManager
 from .output_manager_util import OutputManagerUtils
@@ -47,6 +48,8 @@ def to_representation(self, instance):
                 " | Process continued"
             )
             data["coverage"] = {}
+        data = enrich_prompt_output(instance, data)
+
         # Convert string to list
         try:
             context = data["context"]

From 17ffe3802f3c4bacef9e51e861d6ff8e0e53ed79 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Sun, 12 Apr 2026 11:22:19 +0530
Subject: [PATCH 17/57] UN-2946 [FEAT] Add lookup usage observability with
 error handling and metadata passthrough

- Wire usage_kwargs_extra from lookup config into LLM usage_kwargs for execution observability
- Add error handling around enricher.run() with explicit ERROR usage records
- Generic passthrough of _usage_kwargs into usage records for arbitrary metadata (e.g. reference_id)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 unstract/sdk1/src/unstract/sdk1/llm.py        |  1 +
 workers/executor/executors/legacy_executor.py | 31 +++++++++++++++----
 2 files changed, 26 insertions(+), 6 deletions(-)

diff --git a/unstract/sdk1/src/unstract/sdk1/llm.py b/unstract/sdk1/src/unstract/sdk1/llm.py
index 56b27dc163..eb31c52ad6 100644
--- a/unstract/sdk1/src/unstract/sdk1/llm.py
+++ b/unstract/sdk1/src/unstract/sdk1/llm.py
@@ -626,6 +626,7 @@ def _record_usage(
                 "embedding_tokens": 0,
                 "cost_in_dollars": cost,
                 "status": "SUCCESS",
+                **self._usage_kwargs,
             }
         )
 
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 7a0a41a424..42210210ef 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -1903,6 +1903,7 @@ def _run_lookup_enrichment(
             usage_kwargs={
                 **(usage_kwargs or {}),
                 PSKeys.LLM_USAGE_REASON: "lookup",
+                **lookup_config.get("usage_kwargs_extra", {}),
             },
             capture_metrics=True,
         )
@@ -1916,12 +1917,30 @@ def _run_lookup_enrichment(
             metadata=metadata,
             prompt_name=prompt_name,
         )
-        enricher.run()
-        self._usage_records.extend(llm.flush_pending_usage())
-
-        metrics.setdefault(prompt_name, {})[f"{llm.get_usage_reason()}_llm"] = (
-            llm.get_metrics()
-        )
+        try:
+            enricher.run()
+        except Exception as e:
+            logger.warning("Lookup enrichment failed for %s: %s", prompt_name, e)
+            error_record = {
+                "usage_type": "llm",
+                "llm_usage_reason": "lookup",
+                "model_name": lookup_config.get("llm_adapter_id", "unknown"),
+                "status": "ERROR",
+                "error_message": str(e)[:2000],
+                "prompt_tokens": 0,
+                "completion_tokens": 0,
+                "total_tokens": 0,
+                "embedding_tokens": 0,
+                "cost_in_dollars": 0.0,
+                **(usage_kwargs or {}),
+                **lookup_config.get("usage_kwargs_extra", {}),
+            }
+            self._usage_records.append(error_record)
+        finally:
+            self._usage_records.extend(llm.flush_pending_usage())
+            metrics.setdefault(prompt_name, {})[f"{llm.get_usage_reason()}_llm"] = (
+                llm.get_metrics()
+            )
 
     @staticmethod
     def _run_webhook_postprocessing(

From 6aad216f5c57feb87adf0090d1559adcee7674cf Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Wed, 15 Apr 2026 15:22:22 +0530
Subject: [PATCH 18/57] UN-2946 [FEAT] Support enriched output copy and lookup
 drawer plugin hooks

Add dynamic import of getEnrichedCopyText so the copy button copies
enriched lookup output when the Enriched tab is active. Applied to
both single-pass and multi-profile output paths.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 .../custom-tools/prompt-card/PromptOutput.jsx | 48 +++++++++++++------
 1 file changed, 33 insertions(+), 15 deletions(-)

diff --git a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
index 872c657b2d..a1e492bb29 100644
--- a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
@@ -61,6 +61,16 @@ try {
   // Not available in OSS
 }
 
+let getEnrichedCopyText;
+try {
+  const mod = await import(
+    "../../../plugins/lookup-studio/prompt-card/getEnrichedCopyText"
+  );
+  getEnrichedCopyText = mod.getEnrichedCopyText;
+} catch {
+  // Not available in OSS
+}
+
 // Wraps children in LookupOutputTabs when available (cloud),
 // passes through children directly in OSS.
 const renderWithLookupWrapper = (lookupProps, children) =>
@@ -237,15 +247,19 @@ function PromptOutput({
           <div className="prompt-profile-run">
             <CopyPromptOutputBtn
               isDisabled={isTableExtraction}
-              copyToClipboard={() =>
+              copyToClipboard={() => {
+                const enrichedText = getEnrichedCopyText?.(
+                  promptOutputData?.promptOutputId,
+                );
                 copyOutputToClipboard(
-                  displayPromptResult(
-                    promptOutput,
-                    true,
-                    promptDetails?.enable_highlight,
-                  ),
-                )
-              }
+                  enrichedText ||
+                    displayPromptResult(
+                      promptOutput,
+                      true,
+                      promptDetails?.enable_highlight,
+                    ),
+                );
+              }}
             />
             <PromptOutputExpandBtn
               promptId={promptDetails?.prompt_id}
@@ -481,14 +495,18 @@ function PromptOutput({
                         <div className="prompt-profile-run">
                           <CopyPromptOutputBtn
                             isDisabled={isTableExtraction}
-                            copyToClipboard={() =>
+                            copyToClipboard={() => {
+                              const enrichedText = getEnrichedCopyText?.(
+                                promptOutputData?.promptOutputId,
+                              );
                               copyOutputToClipboard(
-                                displayPromptResult(
-                                  promptOutputData?.output,
-                                  true,
-                                ),
-                              )
-                            }
+                                enrichedText ||
+                                  displayPromptResult(
+                                    promptOutputData?.output,
+                                    true,
+                                  ),
+                              );
+                            }}
                           />
                         </div>
                       </>

From dafefa9d82cb72cde00ad9334b210f960af4a745 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 21 Apr 2026 23:44:10 +0530
Subject: [PATCH 19/57] UN-2946 [FEAT] Lookup export validation gate,
 raw-latest helper, and modified_at fix

- Add /prompt-studio/<pk>/lookup-validation/ endpoint backing the FE
  Export/Deploy gate; multi-var block check accepts prompt_ids so a single
  prompt run isn't blocked by an unrelated multi-var lookup.
- Add /prompt-output/latest-by-keys/ endpoint that returns the most recent
  raw output per prompt_key for the test panel's "Use Latest Outputs"
  helper.
- Fix prompt output modified_at not refreshing on re-runs (QuerySet.update
  bypasses auto_now); set timezone.now() explicitly in the update args.
- lookup_utils: bridge get_lookup_validation_for_tool,
  get_multi_var_lookups_for_tool (with prompt_ids scoping), and
  get_lookup_configs_for_tool, which injects lookup_configs into the
  single-pass payload.
- Header wires useLookupExportGate via try-import (no-op stub in OSS).
- TokenUsage treats all-null Usage rows as empty.
- CombinedOutput / JsonView build enriched dict from
  metadata.lookup_outputs to back the Raw|Enriched output toggle.
- .gitignore: widen docker/compose.*.yaml.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .gitignore                                    |  2 +-
 backend/prompt_studio/lookup_utils.py         | 50 +++++++++++++++
 .../prompt_studio_helper.py                   |  7 ++-
 .../prompt_studio_core_v2/urls.py             |  9 +++
 .../prompt_studio_core_v2/views.py            | 47 ++++++++++++++
 .../output_manager_helper.py                  | 21 ++++++-
 .../prompt_studio_output_manager_v2/urls.py   |  6 ++
 .../prompt_studio_output_manager_v2/views.py  | 49 +++++++++++++++
 .../combined-output/CombinedOutput.jsx        | 61 ++++++++++++++-----
 .../custom-tools/combined-output/JsonView.jsx | 46 ++++++++++++--
 .../components/custom-tools/header/Header.jsx | 24 +++++++-
 .../profile-info-bar/ProfileInfoBar.css       |  2 +
 .../custom-tools/token-usage/TokenUsage.jsx   |  9 ++-
 13 files changed, 306 insertions(+), 27 deletions(-)

diff --git a/.gitignore b/.gitignore
index f6837ce079..f0c0cb8438 100644
--- a/.gitignore
+++ b/.gitignore
@@ -653,7 +653,7 @@ docker/*.env
 !docker/sample*.env
 docker/public_tools.json
 docker/proxy_overrides.yaml
-docker/compose.override.yaml
+docker/compose.*.yaml
 docker/workflow_data/
 
 # Tool development
diff --git a/backend/prompt_studio/lookup_utils.py b/backend/prompt_studio/lookup_utils.py
index 10783e405c..5625c33878 100644
--- a/backend/prompt_studio/lookup_utils.py
+++ b/backend/prompt_studio/lookup_utils.py
@@ -21,6 +21,34 @@ def get_lookup_config(prompt) -> dict | None:
         return None
 
 
+def get_lookup_configs_for_tool(tool) -> list[dict] | None:
+    """Return lookup configs for a tool (single pass), or None in OSS."""
+    try:
+        from pluggable_apps.lookup_v1.execution import (
+            build_lookup_configs_for_tool,
+        )
+
+        return build_lookup_configs_for_tool(tool)
+    except ImportError:
+        return None
+
+
+def get_multi_var_lookups_for_tool(tool, prompt_ids=None) -> list[str]:
+    """Return names of multi-variable lookups linked to the tool, [] in OSS.
+
+    ``prompt_ids`` scopes the check to a specific subset of linked prompts
+    so single / bulk runs only block when a lookup the run actually uses
+    is multi-variable.
+    """
+    try:
+        from pluggable_apps.lookup_v1.execution import has_multi_var_lookups
+
+        _, names = has_multi_var_lookups(tool, prompt_ids=prompt_ids)
+        return names
+    except ImportError:
+        return []
+
+
 def persist_lookup_output(prompt_output, prompt_lookup: dict) -> None:
     """Persist lookup enrichment result. No-op in OSS."""
     try:
@@ -69,3 +97,25 @@ def validate_lookups_for_export(prompts) -> tuple[dict, str | None]:
         return _validate(prompts)
     except ImportError:
         return {}, None
+
+
+def get_lookup_validation_for_tool(tool) -> dict:
+    """Pre-emptive lookup validation for FE Export / Deploy gating.
+
+    Returns an "always ok" payload in OSS so the FE gate is a no-op.
+    """
+    try:
+        from pluggable_apps.lookup_v1.validation import (
+            get_lookup_validation_for_tool as _validate,
+        )
+
+        return _validate(tool)
+    except ImportError:
+        return {
+            "ok": True,
+            "draft_lookups": [],
+            "multi_var_lookups": [],
+            "single_pass_enabled": bool(
+                getattr(tool, "single_pass_extraction_mode", False)
+            ),
+        }
diff --git a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
index 6744171ed4..ee8f1a4c8b 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
@@ -20,7 +20,7 @@
 from utils.local_context import StateStore
 
 from backend.celery_service import app as celery_app
-from prompt_studio.lookup_utils import get_lookup_config
+from prompt_studio.lookup_utils import get_lookup_config, get_lookup_configs_for_tool
 from prompt_studio.prompt_profile_manager_v2.models import ProfileManager
 from prompt_studio.prompt_profile_manager_v2.profile_manager_helper import (
     ProfileManagerHelper,
@@ -1173,6 +1173,11 @@ def build_single_pass_payload(
             TSPKeys.SIMILARITY_TOP_K: default_profile.similarity_top_k,
         }
 
+        # Inject lookup configs for single pass enrichment
+        lookup_configs = get_lookup_configs_for_tool(tool)
+        if lookup_configs:
+            tool_settings["lookup_configs"] = lookup_configs
+
         for p in prompts:
             if not p.prompt:
                 raise EmptyPromptError()
diff --git a/backend/prompt_studio/prompt_studio_core_v2/urls.py b/backend/prompt_studio/prompt_studio_core_v2/urls.py
index 86cbb97dd3..9163e8736e 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/urls.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/urls.py
@@ -66,6 +66,10 @@
 
 prompt_studio_task_status = PromptStudioCoreView.as_view({"get": "task_status"})
 
+prompt_studio_lookup_validation = PromptStudioCoreView.as_view(
+    {"get": "lookup_validation"}
+)
+
 
 urlpatterns = format_suffix_patterns(
     [
@@ -165,5 +169,10 @@
             prompt_studio_task_status,
             name="prompt-studio-task-status",
         ),
+        path(
+            "prompt-studio/<uuid:pk>/lookup-validation/",
+            prompt_studio_lookup_validation,
+            name="prompt-studio-lookup-validation",
+        ),
     ]
 )
diff --git a/backend/prompt_studio/prompt_studio_core_v2/views.py b/backend/prompt_studio/prompt_studio_core_v2/views.py
index e936e3dcae..96fd4c8702 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/views.py
@@ -32,6 +32,10 @@
 from workflow_manager.endpoint_v2.models import WorkflowEndpoint
 
 from backend.celery_service import app as celery_app
+from prompt_studio.lookup_utils import (
+    get_lookup_validation_for_tool,
+    get_multi_var_lookups_for_tool,
+)
 from prompt_studio.prompt_profile_manager_v2.constants import (
     ProfileManagerErrors,
     ProfileManagerKeys,
@@ -89,6 +93,34 @@
 logger = logging.getLogger(__name__)
 
 
+def _multi_var_lookup_block_response(custom_tool, prompt_ids=None):
+    """Block non-SP runs when a linked lookup has >1 input variable.
+
+    ``prompt_ids`` scopes the check to the prompt(s) being run so a
+    multi-var lookup attached to an unrelated prompt in the same project
+    doesn't block a single-var lookup's run.
+
+    Returns a Response object (HTTP 400) when a block applies, or None
+    to let the caller proceed.
+    """
+    if getattr(custom_tool, "single_pass_extraction_mode", False):
+        return None
+    names = get_multi_var_lookups_for_tool(custom_tool, prompt_ids=prompt_ids)
+    if not names:
+        return None
+    return Response(
+        {
+            "error": (
+                "Multi-variable lookup(s) "
+                f"{', '.join(names)} are linked to prompts in this project. "
+                "These can only run in single pass extraction mode. "
+                "Enable single pass or unlink the lookup before running."
+            )
+        },
+        status=status.HTTP_400_BAD_REQUEST,
+    )
+
+
 class PromptStudioCoreView(viewsets.ModelViewSet):
     """Viewset to handle all Custom tool related operations."""
 
@@ -476,6 +508,10 @@ def fetch_response(self, request: HttpRequest, pk: Any = None) -> Response:
         document_id: str = request.data.get(ToolStudioPromptKeys.DOCUMENT_ID)
         prompt_id: str = request.data.get(ToolStudioPromptKeys.ID)
         run_id: str = request.data.get(ToolStudioPromptKeys.RUN_ID)
+        if err := _multi_var_lookup_block_response(
+            custom_tool, prompt_ids=[prompt_id] if prompt_id else None
+        ):
+            return err
         profile_manager_id: str = request.data.get(
             ToolStudioPromptKeys.PROFILE_MANAGER_ID
         )
@@ -577,6 +613,8 @@ def bulk_fetch_response(self, request: HttpRequest, pk: Any = None) -> Response:
                 {"error": "prompt_ids is required and must be non-empty."},
                 status=status.HTTP_400_BAD_REQUEST,
             )
+        if err := _multi_var_lookup_block_response(custom_tool, prompt_ids=prompt_ids):
+            return err
         document_id: str = request.data.get(ToolStudioPromptKeys.DOCUMENT_ID)
         run_id: str = request.data.get(ToolStudioPromptKeys.RUN_ID)
         profile_manager_id: str = request.data.get(
@@ -1060,6 +1098,15 @@ def export_tool(self, request: Request, pk: Any = None) -> Response:
             status=status.HTTP_200_OK,
         )
 
+    @action(detail=True, methods=["get"], url_path="lookup-validation")
+    def lookup_validation(self, request: Request, pk: Any = None) -> Response:
+        """Pre-emptive lookup gating for Export / API Deployment buttons.
+
+        Cloud-only check; OSS returns ``ok: True`` so the FE proceeds.
+        """
+        custom_tool = self.get_object()
+        return Response(get_lookup_validation_for_tool(custom_tool))
+
     @action(detail=True, methods=["get"])
     def export_tool_info(self, request: Request, pk: Any = None) -> Response:
         custom_tool = self.get_object()
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
index 0fb92c126d..056e7feb5d 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
@@ -3,6 +3,7 @@
 from typing import Any
 
 from django.core.exceptions import ObjectDoesNotExist
+from django.utils import timezone
 
 from prompt_studio.lookup_utils import persist_lookup_output
 from prompt_studio.prompt_profile_manager_v2.models import ProfileManager
@@ -107,6 +108,8 @@ def update_or_create_prompt_output(
                     "highlight_data": highlight_data,
                     "confidence_data": confidence_data,
                     "word_confidence_data": word_confidence_data,
+                    # QuerySet.update() bypasses auto_now on modified_at.
+                    "modified_at": timezone.now(),
                 }
                 PromptStudioOutputManager.objects.filter(
                     document_manager=document_manager,
@@ -257,17 +260,20 @@ def fetch_default_output_response(
 
         Returns:
             dict[str, Any]: Formatted JSON response for combined output.
+                Includes a reserved ``_lookup_outputs`` key with per-prompt
+                enriched data when lookups are configured.
         """
-        # Initialize the result dictionary
+        from prompt_studio.lookup_utils import enrich_prompt_output
+
         result: dict[str, Any] = {}
-        # Iterate over ToolStudioPrompt records
+        lookup_outputs: dict[str, Any] = {}
+
         for tool_prompt in tool_studio_prompts:
             if tool_prompt.prompt_type == PSOMKeys.NOTES:
                 continue
             prompt_id = str(tool_prompt.prompt_id)
             profile_manager_id = tool_prompt.profile_manager_id
 
-            # If profile_manager is not set, skip this record
             if not profile_manager_id and not use_default_profile:
                 result[tool_prompt.prompt_key] = ""
                 continue
@@ -292,6 +298,15 @@ def fetch_default_output_response(
 
                 for output in queryset:
                     result[tool_prompt.prompt_key] = output.output
+                    # Check for lookup enrichment
+                    enriched = enrich_prompt_output(output, {})
+                    if "lookup_outputs" in enriched:
+                        lookup_outputs[tool_prompt.prompt_key] = enriched[
+                            "lookup_outputs"
+                        ]
             except ObjectDoesNotExist:
                 result[tool_prompt.prompt_key] = ""
+
+        if lookup_outputs:
+            result["_lookup_outputs"] = lookup_outputs
         return result
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/urls.py b/backend/prompt_studio/prompt_studio_output_manager_v2/urls.py
index 61ec8540fa..77270c22fe 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/urls.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/urls.py
@@ -7,6 +7,7 @@
 get_output_for_tool_default = PromptStudioOutputView.as_view(
     {"get": "get_output_for_tool_default"}
 )
+latest_outputs_by_keys = PromptStudioOutputView.as_view({"get": "latest_outputs_by_keys"})
 
 urlpatterns = format_suffix_patterns(
     [
@@ -16,5 +17,10 @@
             get_output_for_tool_default,
             name="prompt-default-profile-outputs",
         ),
+        path(
+            "prompt-output/latest-by-keys/",
+            latest_outputs_by_keys,
+            name="prompt-output-latest-by-keys",
+        ),
     ]
 )
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/views.py b/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
index c0c002d803..5a31c481dc 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
@@ -61,6 +61,55 @@ def get_queryset(self) -> QuerySet | None:
 
         return queryset
 
+    def latest_outputs_by_keys(self, request: HttpRequest) -> Response:
+        """Return the most recent raw output value per source prompt key.
+
+        Used by the lookup Test panel's "Use Latest Outputs" button to
+        pre-fill {{input.X}} fields from prior prompt runs in the linked
+        tool. Always returns the raw extraction — the enriched value would
+        already include lookup post-processing, which would defeat the
+        purpose of testing the lookup with sample inputs.
+        """
+        tool_id = request.GET.get("tool_id")
+        keys_param = request.GET.get("prompt_keys", "")
+        if not tool_id:
+            raise APIException(
+                detail=PromptOutputManagerErrorMessage.TOOL_VALIDATION,
+                code=400,
+            )
+
+        prompt_keys = [k.strip() for k in keys_param.split(",") if k.strip()]
+        if not prompt_keys:
+            return Response({}, status=status.HTTP_200_OK)
+
+        prompt_id_to_key = dict(
+            ToolStudioPrompt.objects.filter(
+                tool_id=tool_id, prompt_key__in=prompt_keys
+            ).values_list("prompt_id", "prompt_key")
+        )
+        if not prompt_id_to_key:
+            return Response({}, status=status.HTTP_200_OK)
+
+        outputs = (
+            PromptStudioOutputManager.objects.filter(
+                prompt_id__in=prompt_id_to_key.keys()
+            )
+            .exclude(output__isnull=True)
+            .exclude(output__exact="")
+            .order_by("-modified_at")
+            .values("prompt_id", "output")
+        )
+
+        result: dict[str, str] = {}
+        for row in outputs:
+            key = prompt_id_to_key.get(row["prompt_id"])
+            if key and key not in result:
+                result[key] = row["output"]
+            if len(result) == len(prompt_id_to_key):
+                break
+
+        return Response(result, status=status.HTTP_200_OK)
+
     def get_output_for_tool_default(self, request: HttpRequest) -> Response:
         # Get the tool_id from request parameters
         # TODO: Setup Serializer here
diff --git a/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx b/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
index 3036e7b9d6..20993ffc4b 100644
--- a/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
+++ b/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
@@ -59,6 +59,7 @@ function CombinedOutput({ docId, setFilledFields, selectedPrompts }) {
   } = useCustomToolStore();
 
   const [combinedOutput, setCombinedOutput] = useState({});
+  const [enrichedOutput, setEnrichedOutput] = useState({});
   const [isOutputLoading, setIsOutputLoading] = useState(false);
   const [adapterData, setAdapterData] = useState([]);
   const [activeKey, setActiveKey] = useState(
@@ -117,29 +118,60 @@ function CombinedOutput({ docId, setFilledFields, selectedPrompts }) {
         const prompts = details?.prompts || [];
 
         if (activeKey === "0" && !isSimplePromptStudio) {
+          const lookupOutputs = data?._lookup_outputs || {};
           const output = Object.entries(data).reduce((acc, [key, value]) => {
+            if (key === "_lookup_outputs") return acc;
             acc[key] = displayPromptResult(value, false);
             return acc;
           }, {});
           setCombinedOutput(output);
+
+          if (Object.keys(lookupOutputs).length > 0) {
+            const enriched = {};
+            for (const [key, val] of Object.entries(output)) {
+              const lookupData = lookupOutputs[key];
+              enriched[key] = lookupData?.output
+                ? displayPromptResult(lookupData.output, false)
+                : val;
+            }
+            setEnrichedOutput(enriched);
+          } else {
+            setEnrichedOutput({});
+          }
         } else {
-          const output = prompts.reduce((acc, item) => {
-            if (item?.prompt_type !== promptType.notes) {
-              const profileManager = selectedProfile || item?.profile_manager;
-              const outputDetails = data.find(
-                (outputValue) =>
-                  outputValue?.prompt_id === item?.prompt_id &&
-                  outputValue?.profile_manager === profileManager,
-              );
+          const output = {};
+          const enriched = {};
+          let hasEnriched = false;
+
+          for (const item of prompts) {
+            if (item?.prompt_type === promptType.notes) continue;
+            const profileManager = selectedProfile || item?.profile_manager;
+            const outputDetails = data.find(
+              (outputValue) =>
+                outputValue?.prompt_id === item?.prompt_id &&
+                outputValue?.profile_manager === profileManager,
+            );
+
+            output[item?.prompt_key] =
+              outputDetails?.output?.length > 0
+                ? displayPromptResult(outputDetails?.output, false)
+                : "";
 
-              acc[item?.prompt_key] =
-                outputDetails?.output?.length > 0
-                  ? displayPromptResult(outputDetails?.output, false)
-                  : "";
+            // Build enriched output from lookup_outputs
+            const lookupData = outputDetails?.lookup_outputs;
+            if (lookupData?.output) {
+              enriched[item?.prompt_key] = displayPromptResult(
+                lookupData.output,
+                false,
+              );
+              hasEnriched = true;
+            } else {
+              enriched[item?.prompt_key] = output[item?.prompt_key];
             }
-            return acc;
-          }, {});
+          }
+
           setCombinedOutput(output);
+          setEnrichedOutput(hasEnriched ? enriched : {});
         }
       } catch (err) {
         setAlertDetails(
@@ -229,6 +261,7 @@ function CombinedOutput({ docId, setFilledFields, selectedPrompts }) {
   return (
     <JsonView
       combinedOutput={filteredCombinedOutput}
+      enrichedOutput={enrichedOutput}
       handleTabChange={handleTabChange}
       selectedProfile={selectedProfile}
       llmProfiles={llmProfiles}
diff --git a/frontend/src/components/custom-tools/combined-output/JsonView.jsx b/frontend/src/components/custom-tools/combined-output/JsonView.jsx
index f9d6a86a83..dfc82f92e1 100644
--- a/frontend/src/components/custom-tools/combined-output/JsonView.jsx
+++ b/frontend/src/components/custom-tools/combined-output/JsonView.jsx
@@ -2,12 +2,23 @@ import { Tabs } from "antd";
 import TabPane from "antd/es/tabs/TabPane";
 import Prism from "prismjs";
 import PropTypes from "prop-types";
-import { useEffect } from "react";
+import { useEffect, useState } from "react";
 
 import { JsonViewBody } from "./JsonViewBody";
 
+let EnrichedOutputToggle;
+try {
+  const mod = await import(
+    "../../../plugins/lookup-enriched-toggle/EnrichedOutputToggle"
+  );
+  EnrichedOutputToggle = mod.EnrichedOutputToggle;
+} catch {
+  // The component will remain undefined if it is not available
+}
+
 function JsonView({
   combinedOutput,
+  enrichedOutput,
   handleTabChange,
   adapterData,
   activeKey,
@@ -16,9 +27,25 @@ function JsonView({
   isSinglePass,
   isLoading,
 }) {
+  const [activeView, setActiveView] = useState("Raw");
+
   useEffect(() => {
     Prism.highlightAll();
-  }, [combinedOutput]);
+  }, [combinedOutput, enrichedOutput, activeView]);
+
+  // Reset to Raw when enriched data is not available
+  useEffect(() => {
+    if (!enrichedOutput || Object.keys(enrichedOutput).length === 0) {
+      setActiveView("Raw");
+    }
+  }, [enrichedOutput]);
+
+  const displayOutput =
+    activeView === "Enriched" &&
+    enrichedOutput &&
+    Object.keys(enrichedOutput).length > 0
+      ? enrichedOutput
+      : combinedOutput;
 
   return (
     <div className="combined-op-layout">
@@ -34,14 +61,24 @@ function JsonView({
             />
           ))}
         </Tabs>
-        <div className="combined-op-segment"></div>
+        <div className="combined-op-segment">
+          {EnrichedOutputToggle && (
+            <EnrichedOutputToggle
+              activeView={activeView}
+              onChange={setActiveView}
+              hasEnrichedData={
+                !!(enrichedOutput && Object.keys(enrichedOutput).length > 0)
+              }
+            />
+          )}
+        </div>
       </div>
       <div className="combined-op-divider" />
       <JsonViewBody
         activeKey={activeKey}
         selectedProfile={selectedProfile}
         llmProfiles={llmProfiles}
-        combinedOutput={combinedOutput}
+        combinedOutput={displayOutput}
         isLoading={isLoading}
       />
       <div className="gap" />
@@ -51,6 +88,7 @@ function JsonView({
 
 JsonView.propTypes = {
   combinedOutput: PropTypes.object.isRequired,
+  enrichedOutput: PropTypes.object,
   handleTabChange: PropTypes.func,
   adapterData: PropTypes.array,
   selectedProfile: PropTypes.string,
diff --git a/frontend/src/components/custom-tools/header/Header.jsx b/frontend/src/components/custom-tools/header/Header.jsx
index 15e41c8a0a..5421f299b6 100644
--- a/frontend/src/components/custom-tools/header/Header.jsx
+++ b/frontend/src/components/custom-tools/header/Header.jsx
@@ -18,6 +18,10 @@ import "./Header.css";
 let SinglePassToggleSwitch;
 let CloneButton;
 let PromptShareButton;
+let useLookupExportGate = () => ({
+  checkLookups: () => Promise.resolve(true),
+  modalEl: null,
+});
 try {
   const mod = await import(
     "../../../plugins/single-pass-toggle-switch/SinglePassToggleSwitch"
@@ -26,6 +30,14 @@ try {
 } catch {
   // The variable will remain undefined if the component is not available.
 }
+try {
+  const mod = await import(
+    "../../../plugins/lookup-studio/hooks/useLookupExportGate"
+  );
+  useLookupExportGate = mod.useLookupExportGate;
+} catch {
+  // OSS — gate stays a no-op resolving true.
+}
 try {
   const mod = await import(
     "../../../plugins/prompt-studio-public-share/public-share-btn/PromptShareButton.jsx"
@@ -72,6 +84,7 @@ function Header({
   const [isApiDeploymentLoading, setIsApiDeploymentLoading] = useState(false);
   const [editModalOpen, setEditModalOpen] = useState(false);
   const [editForm] = Form.useForm();
+  const { checkLookups, modalEl: lookupGateModalEl } = useLookupExportGate();
 
   const handleExport = (
     selectedUsers,
@@ -129,7 +142,7 @@ function Header({
     setConfirmModalVisible(false);
   }, [lastExportParams, handleExport]);
 
-  const handleShare = (isEdit) => {
+  const handleShare = async (isEdit) => {
     try {
       setPostHogCustomEvent("ps_exported_tool", {
         info: `Clicked on the 'Export' button`,
@@ -139,6 +152,9 @@ function Header({
       // If an error occurs while setting custom posthog event, ignore it and continue
     }
 
+    const ok = await checkLookups(details?.tool_id, "export");
+    if (!ok) return;
+
     const requestOptions = {
       method: "GET",
       url: `/api/v1/unstract/${sessionDetails?.orgId}/prompt-studio/export/${details?.tool_id}`,
@@ -255,7 +271,7 @@ function Header({
       });
   };
 
-  const handleCreateApiDeployment = () => {
+  const handleCreateApiDeployment = async () => {
     try {
       setPostHogCustomEvent("intent_create_api_deployment_from_prompt_studio", {
         info: "Clicked Create API Deployment in tool IDE",
@@ -266,6 +282,9 @@ function Header({
       // If an error occurs while setting custom posthog event, ignore it and continue
     }
 
+    const ok = await checkLookups(details?.tool_id, "API deployment");
+    if (!ok) return;
+
     // Check for existing API deployments before proceeding
     setIsApiDeploymentLoading(true);
     const path = `/api/v1/unstract/${sessionDetails.orgId}`;
@@ -422,6 +441,7 @@ function Header({
 
   return (
     <>
+      {lookupGateModalEl}
       <ToolNavBar
         title={details?.tool_name || ""}
         subtitle={isPublicSource ? undefined : details?.description}
diff --git a/frontend/src/components/custom-tools/profile-info-bar/ProfileInfoBar.css b/frontend/src/components/custom-tools/profile-info-bar/ProfileInfoBar.css
index 8346c26d71..f9f89d03a9 100644
--- a/frontend/src/components/custom-tools/profile-info-bar/ProfileInfoBar.css
+++ b/frontend/src/components/custom-tools/profile-info-bar/ProfileInfoBar.css
@@ -1,3 +1,5 @@
 .profile-info-bar {
   margin-bottom: 10px;
+  flex-wrap: wrap;
+  gap: 4px 0;
 }
diff --git a/frontend/src/components/custom-tools/token-usage/TokenUsage.jsx b/frontend/src/components/custom-tools/token-usage/TokenUsage.jsx
index 846c11f0a2..3c52a40058 100644
--- a/frontend/src/components/custom-tools/token-usage/TokenUsage.jsx
+++ b/frontend/src/components/custom-tools/token-usage/TokenUsage.jsx
@@ -23,8 +23,13 @@ function TokenUsage({ tokenUsageId, isLoading }) {
     setTokens(tokenUsage[tokenUsageId]); // Update tokens state with the token usage data for the given tokenUsageId
   }, [tokenUsage, tokenUsageId]);
 
-  // If no tokens data is available, render nothing
-  if (!tokens || !Object.keys(tokens)?.length || isLoading) {
+  // Backend returns all-null fields when no Usage rows match; treat as empty.
+  if (
+    !tokens ||
+    !Object.keys(tokens)?.length ||
+    isLoading ||
+    tokens?.total_tokens == null
+  ) {
     return "NA";
   }
 

From 3cf18c9b1e7f7fdd87a847e365c077a78531db27 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Wed, 22 Apr 2026 01:19:15 +0530
Subject: [PATCH 20/57] UN-2946 [UI] Fix combined output pill overlap and
 preserve Look-Ups tab on back
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- ProfileInfoBar: swap Row/Col for plain flex-wrap div — kills Ant Row
  negative-margin quirk that overlapped wrapped pills in combined output.
- CustomTools: honor location.state.activeTab so back navigation from
  lookup detail lands on the Look-Ups tab instead of defaulting to Projects.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .../profile-info-bar/ProfileInfoBar.css       |  9 ++-
 .../profile-info-bar/ProfileInfoBar.jsx       | 62 +++++++------------
 frontend/src/pages/CustomTools.jsx            | 13 +++-
 3 files changed, 43 insertions(+), 41 deletions(-)

diff --git a/frontend/src/components/custom-tools/profile-info-bar/ProfileInfoBar.css b/frontend/src/components/custom-tools/profile-info-bar/ProfileInfoBar.css
index f9f89d03a9..da866a895f 100644
--- a/frontend/src/components/custom-tools/profile-info-bar/ProfileInfoBar.css
+++ b/frontend/src/components/custom-tools/profile-info-bar/ProfileInfoBar.css
@@ -1,5 +1,10 @@
 .profile-info-bar {
-  margin-bottom: 10px;
+  display: flex;
   flex-wrap: wrap;
-  gap: 4px 0;
+  gap: 6px 8px;
+  margin-bottom: 10px;
+}
+
+.profile-info-bar .ant-tag {
+  margin: 0;
 }
diff --git a/frontend/src/components/custom-tools/profile-info-bar/ProfileInfoBar.jsx b/frontend/src/components/custom-tools/profile-info-bar/ProfileInfoBar.jsx
index 8f52a68a49..9341753987 100644
--- a/frontend/src/components/custom-tools/profile-info-bar/ProfileInfoBar.jsx
+++ b/frontend/src/components/custom-tools/profile-info-bar/ProfileInfoBar.jsx
@@ -1,4 +1,4 @@
-import { Col, Row, Tag } from "antd";
+import { Tag } from "antd";
 import PropTypes from "prop-types";
 import "./ProfileInfoBar.css";
 
@@ -10,43 +10,29 @@ const ProfileInfoBar = ({ profiles, profileId }) => {
   }
 
   return (
-    <Row className="profile-info-bar">
-      <Col>
-        <Tag>
-          <strong>Profile Name:</strong> {profile?.profile_name}
-        </Tag>
-      </Col>
-      <Col>
-        <Tag>
-          <strong>Chunk Size:</strong> {profile?.chunk_size}
-        </Tag>
-      </Col>
-      <Col>
-        <Tag>
-          <strong>Vector Store:</strong> {profile?.vector_store}
-        </Tag>
-      </Col>
-      <Col>
-        <Tag>
-          <strong>Embedding Model:</strong> {profile?.embedding_model}
-        </Tag>
-      </Col>
-      <Col>
-        <Tag>
-          <strong>LLM:</strong> {profile?.llm}
-        </Tag>
-      </Col>
-      <Col>
-        <Tag>
-          <strong>X2Text:</strong> {profile?.x2text}
-        </Tag>
-      </Col>
-      <Col>
-        <Tag>
-          <strong>Reindex:</strong> {profile?.reindex ? "Yes" : "No"}
-        </Tag>
-      </Col>
-    </Row>
+    <div className="profile-info-bar">
+      <Tag>
+        <strong>Profile Name:</strong> {profile?.profile_name}
+      </Tag>
+      <Tag>
+        <strong>Chunk Size:</strong> {profile?.chunk_size}
+      </Tag>
+      <Tag>
+        <strong>Vector Store:</strong> {profile?.vector_store}
+      </Tag>
+      <Tag>
+        <strong>Embedding Model:</strong> {profile?.embedding_model}
+      </Tag>
+      <Tag>
+        <strong>LLM:</strong> {profile?.llm}
+      </Tag>
+      <Tag>
+        <strong>X2Text:</strong> {profile?.x2text}
+      </Tag>
+      <Tag>
+        <strong>Reindex:</strong> {profile?.reindex ? "Yes" : "No"}
+      </Tag>
+    </div>
   );
 };
 
diff --git a/frontend/src/pages/CustomTools.jsx b/frontend/src/pages/CustomTools.jsx
index 1f6c2d3934..9543fb5c16 100644
--- a/frontend/src/pages/CustomTools.jsx
+++ b/frontend/src/pages/CustomTools.jsx
@@ -1,12 +1,16 @@
 import { useEffect, useState } from "react";
+import { useLocation } from "react-router-dom";
 
 import { ListOfTools } from "../components/custom-tools/list-of-tools/ListOfTools";
 
 const TAB_OPTIONS = ["Projects", "Look-Ups"];
 
 function CustomTools() {
+  const location = useLocation();
   const [LookupListComp, setLookupListComp] = useState(null);
-  const [activeTab, setActiveTab] = useState("Projects");
+  const [activeTab, setActiveTab] = useState(
+    location.state?.activeTab || "Projects",
+  );
 
   useEffect(() => {
     import("../plugins/lookup-studio")
@@ -14,6 +18,13 @@ function CustomTools() {
       .catch(() => {});
   }, []);
 
+  // Honor tab from navigation state on subsequent entries
+  useEffect(() => {
+    if (location.state?.activeTab) {
+      setActiveTab(location.state.activeTab);
+    }
+  }, [location.state?.activeTab]);
+
   // No lookup plugin = just render projects list (OSS mode)
   if (!LookupListComp) {
     return <ListOfTools />;

From d63767b514aff77142654203dfd5d3ef420aa5ea Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Wed, 22 Apr 2026 04:07:35 +0530
Subject: [PATCH 21/57] UN-2946 [FEAT] Add last_exported_at and wire lookup
 staleness bridge

Introduces nullable last_exported_at on CustomTool (stamped on every
successful export, so it stays NULL until the first one) so staleness
checks can compare against downstream mutations without a data backfill.
NULL is treated as "unknown" and suppresses the lookup-dirty flag to
avoid false alarms on pre-feature projects. Adds the
get_latest_lookup_mutation_for_tool bridge in lookup_utils so OSS stays
decoupled from the cloud plugin.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 backend/prompt_studio/lookup_utils.py         | 16 ++++++++++++++
 .../0007_customtool_last_exported_at.py       | 21 +++++++++++++++++++
 .../prompt_studio_core_v2/models.py           |  9 ++++++++
 .../prompt_studio_core_v2/views.py            | 17 +++++++++++++++
 4 files changed, 63 insertions(+)
 create mode 100644 backend/prompt_studio/prompt_studio_core_v2/migrations/0007_customtool_last_exported_at.py

diff --git a/backend/prompt_studio/lookup_utils.py b/backend/prompt_studio/lookup_utils.py
index 5625c33878..474f9a5d52 100644
--- a/backend/prompt_studio/lookup_utils.py
+++ b/backend/prompt_studio/lookup_utils.py
@@ -99,6 +99,22 @@ def validate_lookups_for_export(prompts) -> tuple[dict, str | None]:
         return {}, None
 
 
+def get_latest_lookup_mutation_for_tool(tool):
+    """Return the max modified_at across all lookup-related records linked to
+    the tool (version, reference file, assignment). Used for banner staleness.
+
+    Returns None if lookups are unavailable or nothing is linked.
+    """
+    try:
+        from pluggable_apps.lookup_v1.staleness import (
+            get_latest_lookup_mutation_for_tool as _get,
+        )
+
+        return _get(tool)
+    except ImportError:
+        return None
+
+
 def get_lookup_validation_for_tool(tool) -> dict:
     """Pre-emptive lookup validation for FE Export / Deploy gating.
 
diff --git a/backend/prompt_studio/prompt_studio_core_v2/migrations/0007_customtool_last_exported_at.py b/backend/prompt_studio/prompt_studio_core_v2/migrations/0007_customtool_last_exported_at.py
new file mode 100644
index 0000000000..91539c9cf9
--- /dev/null
+++ b/backend/prompt_studio/prompt_studio_core_v2/migrations/0007_customtool_last_exported_at.py
@@ -0,0 +1,21 @@
+# Generated by Django 4.2.1 on 2026-04-21 20:20
+
+from django.db import migrations, models
+
+
+class Migration(migrations.Migration):
+    dependencies = [
+        ("prompt_studio_core_v2", "0006_add_custom_data_to_customtool"),
+    ]
+
+    operations = [
+        migrations.AddField(
+            model_name="customtool",
+            name="last_exported_at",
+            field=models.DateTimeField(
+                blank=True,
+                db_comment="Timestamp of the last successful export; NULL if never exported since the field was introduced.",
+                null=True,
+            ),
+        ),
+    ]
diff --git a/backend/prompt_studio/prompt_studio_core_v2/models.py b/backend/prompt_studio/prompt_studio_core_v2/models.py
index 406c157efc..f7d1d2b9e5 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/models.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/models.py
@@ -161,6 +161,15 @@ class CustomTool(DefaultOrganizationMixin, BaseModel):
         db_comment="Flag to share this custom tool with all users in the organization",
     )
 
+    # NULL until the first successful export; re-stamped on every export after.
+    # Drives staleness checks (e.g. lookup-change banner) without requiring
+    # a data backfill.
+    last_exported_at = models.DateTimeField(
+        null=True,
+        blank=True,
+        db_comment="Timestamp of the last successful export; NULL if never exported since the field was introduced.",
+    )
+
     objects = CustomToolModelManager()
 
     def delete(self, organization_id=None, *args, **kwargs):
diff --git a/backend/prompt_studio/prompt_studio_core_v2/views.py b/backend/prompt_studio/prompt_studio_core_v2/views.py
index 96fd4c8702..a41a40017f 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/views.py
@@ -14,6 +14,7 @@
 from django.db import IntegrityError
 from django.db.models import Count, OuterRef, QuerySet, Subquery
 from django.http import HttpRequest, HttpResponse
+from django.utils import timezone
 from file_management.constants import FileInformationKey as FileKey
 from file_management.exceptions import FileNotFound
 from permissions.permission import IsOwner, IsOwnerOrSharedUserOrSharedToOrg
@@ -33,6 +34,7 @@
 
 from backend.celery_service import app as celery_app
 from prompt_studio.lookup_utils import (
+    get_latest_lookup_mutation_for_tool,
     get_lookup_validation_for_tool,
     get_multi_var_lookups_for_tool,
 )
@@ -1085,6 +1087,11 @@ def export_tool(self, request: Request, pk: Any = None) -> Response:
             force_export=force_export,
         )
 
+        # Record export timestamp so staleness checks (e.g. lookup-change
+        # banner) can compare against mutations that happened afterwards.
+        custom_tool.last_exported_at = timezone.now()
+        custom_tool.save(update_fields=["last_exported_at"])
+
         # Notify HubSpot about first tool export
         notify_hubspot_event(
             user=request.user,
@@ -1285,10 +1292,20 @@ def check_deployment_usage(self, request: Request, pk: Any = None) -> Response:
             instance: CustomTool = self.get_object()
             is_used, workflow_ids = self._check_tool_usage_in_workflows(instance)
 
+            # Lookup staleness: NULL last_exported_at means we can't compare,
+            # so treat as clean (don't false-alarm pre-feature projects).
+            is_lookup_dirty = False
+            if instance.last_exported_at is not None:
+                latest = get_latest_lookup_mutation_for_tool(instance)
+                is_lookup_dirty = (
+                    latest is not None and latest > instance.last_exported_at
+                )
+
             deployment_info: dict = {
                 "is_used": is_used,
                 "deployment_types": [],
                 "message": "",
+                "is_lookup_dirty": is_lookup_dirty,
             }
 
             if is_used and workflow_ids:

From eced338dd159148e1be54a52259204f828e8a875 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Wed, 22 Apr 2026 04:07:41 +0530
Subject: [PATCH 22/57] UN-2946 [FEAT] Stream lookup enrichment failures to
 workflow logs

When enricher.run() raises, surface a user-visible ERROR log line in
the workflow execution log alongside the existing usage record. Keeps
lookup failures observable next to the other pre/post lookup lines we
already emit.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 workers/executor/executors/legacy_executor.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 42210210ef..f66e6d9fa0 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -1921,6 +1921,11 @@ def _run_lookup_enrichment(
             enricher.run()
         except Exception as e:
             logger.warning("Lookup enrichment failed for %s: %s", prompt_name, e)
+            lookup_label = lookup_config.get("lookup_name") or prompt_name
+            shim.stream_log(
+                f"Lookup `{lookup_label}` failed: {str(e)[:200]}",
+                level=LogLevel.ERROR,
+            )
             error_record = {
                 "usage_type": "llm",
                 "llm_usage_reason": "lookup",

From 58f2dbd162e25279e86ec48f0313c59a45b37a52 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Wed, 22 Apr 2026 04:08:09 +0530
Subject: [PATCH 23/57] UN-2946 [UI] Wire lookup dirty-seed and export gate
 into ToolIde

Loads useLookupDirtySeed (server-side is_lookup_dirty) and
useLookupExportGate from the cloud plugin via dynamic imports so the
reminder banner reflects lookup changes across page reloads and the
banner's Export flow goes through the same validation modal as the
main buttons. Also adds a titleAdornment slot on ToolNavBar for
rendering the onboarding tooltip and relaxes EmptyState.text to accept
nodes for the tagline + link composition.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .../custom-tools/tool-ide/ToolIde.jsx         | 42 +++++++++++++++++++
 .../navigations/tool-nav-bar/ToolNavBar.jsx   |  3 ++
 .../widgets/empty-state/EmptyState.jsx        |  2 +-
 3 files changed, 46 insertions(+), 1 deletion(-)

diff --git a/frontend/src/components/custom-tools/tool-ide/ToolIde.jsx b/frontend/src/components/custom-tools/tool-ide/ToolIde.jsx
index 93c8198593..ab87f6f19c 100644
--- a/frontend/src/components/custom-tools/tool-ide/ToolIde.jsx
+++ b/frontend/src/components/custom-tools/tool-ide/ToolIde.jsx
@@ -44,6 +44,36 @@ try {
 } catch {
   // Do nothing if plugins are not loaded.
 }
+
+// Cloud-only hook that seeds hasUnsavedChanges from server-side
+// lookup-staleness. No-op stub in OSS.
+let useLookupDirtySeed = () => {
+  // no-op
+};
+try {
+  const mod = await import(
+    "../../../plugins/lookup-studio/hooks/useLookupDirtySeed.js"
+  );
+  useLookupDirtySeed = mod.useLookupDirtySeed;
+} catch {
+  // Do nothing if plugin is not loaded.
+}
+
+// Cloud-only lookup export validation gate. OSS stub resolves true so
+// the reminder bar's "Export" button proceeds directly.
+let useLookupExportGate = () => ({
+  checkLookups: () => Promise.resolve(true),
+  modalEl: null,
+});
+try {
+  const mod = await import(
+    "../../../plugins/lookup-studio/hooks/useLookupExportGate"
+  );
+  useLookupExportGate = mod.useLookupExportGate;
+} catch {
+  // OSS — gate stays a no-op resolving true.
+}
+
 function ToolIde() {
   const [openSettings, setOpenSettings] = useState(false);
   const customToolStore = useCustomToolStore();
@@ -76,6 +106,7 @@ function ToolIde() {
   const isCheckingUsageRef = useRef(false);
   const hasCheckedForCurrentSessionRef = useRef(false);
   const abortControllerRef = useRef(null);
+  const { checkLookups, modalEl: lookupGateModalEl } = useLookupExportGate();
 
   useEffect(() => {
     if (openShareModal) {
@@ -178,6 +209,11 @@ function ToolIde() {
     }
   }, [details?.tool_id]);
 
+  // Cloud plugin seeds hasUnsavedChanges when a linked lookup has been
+  // edited since the tool's last export — surfaces the re-export banner
+  // for mutations made on the standalone /lookups page. No-op in OSS.
+  useLookupDirtySeed(details?.tool_id);
+
   // Cleanup abort controller on unmount
   useEffect(() => {
     return () => {
@@ -189,6 +225,10 @@ function ToolIde() {
 
   // Handle export from reminder bar
   const handleExportFromReminder = useCallback(async () => {
+    const ok = await checkLookups(details?.tool_id, "export");
+    if (!ok) {
+      return;
+    }
     setIsExporting(true);
     try {
       const requestOptions = {
@@ -237,6 +277,7 @@ function ToolIde() {
     handleException,
     markChangesAsExported,
     setPostHogCustomEvent,
+    checkLookups,
   ]);
 
   const generateIndex = async (doc) => {
@@ -340,6 +381,7 @@ function ToolIde() {
           isExporting={isExporting}
         />
       )}
+      {lookupGateModalEl}
       <Header
         handleUpdateTool={handleUpdateTool}
         setOpenSettings={setOpenSettings}
diff --git a/frontend/src/components/navigations/tool-nav-bar/ToolNavBar.jsx b/frontend/src/components/navigations/tool-nav-bar/ToolNavBar.jsx
index 677fba8a1e..e39c50ff1e 100644
--- a/frontend/src/components/navigations/tool-nav-bar/ToolNavBar.jsx
+++ b/frontend/src/components/navigations/tool-nav-bar/ToolNavBar.jsx
@@ -9,6 +9,7 @@ import "./ToolNavBar.css";
 
 function ToolNavBar({
   title,
+  titleAdornment,
   subtitle,
   onEditTitle,
   enableSearch,
@@ -54,6 +55,7 @@ function ToolNavBar({
                 <Typography.Text strong className="tool-nav-bar__title">
                   {title}
                 </Typography.Text>
+                {titleAdornment}
                 {onEditTitle && (
                   <Button
                     type="text"
@@ -104,6 +106,7 @@ function ToolNavBar({
 
 ToolNavBar.propTypes = {
   title: PropTypes.string,
+  titleAdornment: PropTypes.node,
   subtitle: PropTypes.string,
   onEditTitle: PropTypes.func,
   enableSearch: PropTypes.bool,
diff --git a/frontend/src/components/widgets/empty-state/EmptyState.jsx b/frontend/src/components/widgets/empty-state/EmptyState.jsx
index d221c25449..0c9c8537d0 100644
--- a/frontend/src/components/widgets/empty-state/EmptyState.jsx
+++ b/frontend/src/components/widgets/empty-state/EmptyState.jsx
@@ -27,7 +27,7 @@ function EmptyState({ text, btnText, handleClick }) {
 }
 
 EmptyState.propTypes = {
-  text: PropTypes.string.isRequired,
+  text: PropTypes.node.isRequired,
   btnText: PropTypes.string,
   handleClick: PropTypes.func,
 };

From 3bddd7cbfae0ba29d531aa1c5f90e5cb9cc66607 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Thu, 23 Apr 2026 15:39:12 +0530
Subject: [PATCH 24/57] UN-2946 [FEAT] Share lookup test wrapper + generic
 ExecutionLogs back state

- Delegate production lookup enrichment to LookupEnrichment.run_with_metrics
  so the executor and the IDE test path share LLM construction, error
  handling, and usage-record emission.
- Let ExecutionLogs callers pass an arbitrary backRouteState via location
  state so nested UI restore (e.g. a sub-tab) no longer needs special
  casing in this component.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .../logging/execution-logs/ExecutionLogs.jsx  |  5 +-
 workers/executor/executors/legacy_executor.py | 52 +++----------------
 2 files changed, 10 insertions(+), 47 deletions(-)

diff --git a/frontend/src/components/logging/execution-logs/ExecutionLogs.jsx b/frontend/src/components/logging/execution-logs/ExecutionLogs.jsx
index a9c72a0efb..1b0b6ea208 100644
--- a/frontend/src/components/logging/execution-logs/ExecutionLogs.jsx
+++ b/frontend/src/components/logging/execution-logs/ExecutionLogs.jsx
@@ -54,14 +54,15 @@ function ExecutionLogs() {
     ? location.state?.from || `/${sessionDetails?.orgName}/logs`
     : null;
 
-  // State to pass back for scroll restoration
+  // Scroll-restoration takes precedence; fall back to caller-provided
+  // backRouteState so callers can restore arbitrary upstream UI state.
   const backRouteState =
     id && location.state?.scrollToCardId
       ? {
           scrollToCardId: location.state.scrollToCardId,
           cardExpanded: location.state.cardExpanded,
         }
-      : null;
+      : location.state?.backRouteState || null;
 
   const items = [
     {
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index f66e6d9fa0..185e99e06d 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -1896,56 +1896,18 @@ def _run_lookup_enrichment(
             return
 
         _, _, _, _, llm_cls, _, _ = self._get_prompt_deps()
-        llm_adapter_id = lookup_config.get("llm_adapter_id", "")
-        llm = llm_cls(
-            adapter_instance_id=llm_adapter_id,
-            tool=shim,
-            usage_kwargs={
-                **(usage_kwargs or {}),
-                PSKeys.LLM_USAGE_REASON: "lookup",
-                **lookup_config.get("usage_kwargs_extra", {}),
-            },
-            capture_metrics=True,
-        )
-
-        enricher = lookup_cls(
-            current_value=current_value,
+        outcome = lookup_cls.run_with_metrics(
+            llm_cls=llm_cls,
             lookup_config=lookup_config,
             structured_output=structured_output,
-            llm=llm,
-            shim=shim,
+            current_value=current_value,
             metadata=metadata,
             prompt_name=prompt_name,
+            shim=shim,
+            usage_kwargs=usage_kwargs,
         )
-        try:
-            enricher.run()
-        except Exception as e:
-            logger.warning("Lookup enrichment failed for %s: %s", prompt_name, e)
-            lookup_label = lookup_config.get("lookup_name") or prompt_name
-            shim.stream_log(
-                f"Lookup `{lookup_label}` failed: {str(e)[:200]}",
-                level=LogLevel.ERROR,
-            )
-            error_record = {
-                "usage_type": "llm",
-                "llm_usage_reason": "lookup",
-                "model_name": lookup_config.get("llm_adapter_id", "unknown"),
-                "status": "ERROR",
-                "error_message": str(e)[:2000],
-                "prompt_tokens": 0,
-                "completion_tokens": 0,
-                "total_tokens": 0,
-                "embedding_tokens": 0,
-                "cost_in_dollars": 0.0,
-                **(usage_kwargs or {}),
-                **lookup_config.get("usage_kwargs_extra", {}),
-            }
-            self._usage_records.append(error_record)
-        finally:
-            self._usage_records.extend(llm.flush_pending_usage())
-            metrics.setdefault(prompt_name, {})[f"{llm.get_usage_reason()}_llm"] = (
-                llm.get_metrics()
-            )
+        self._usage_records.extend(outcome.usage_records)
+        metrics.setdefault(prompt_name, {})["lookup_llm"] = outcome.llm_metrics
 
     @staticmethod
     def _run_webhook_postprocessing(

From 1bf0b0396411afbd21eecd2b4a6e360869a3d865 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Fri, 24 Apr 2026 01:19:53 +0530
Subject: [PATCH 25/57] =?UTF-8?q?UN-2946=20[REFACTOR]=20Round-2=20review?=
 =?UTF-8?q?=20fixes=20=E2=80=94=20OSS=20side?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bucket of hardening fixes driven by a staff-level PR re-review:

- Org-scope latest_outputs_by_keys (was cross-tenant readable via raw
  .objects.filter() that bypassed OrganizationFilterBackend).
- Hide lookup payload shape from OSS: three new opaque bridge helpers
  (get_original_value_if_enriched, attach_combined_output_enrichment,
  extract_prompt_output_enrichment) replace direct reads of
  metadata["lookup_outputs"] / _lookup_outputs / lookup_outputs in
  output_manager_helper, CombinedOutput.jsx, and usePromptOutput.js.
- Split usage_v2 index into a new 0005 migration that uses
  AddIndexConcurrently + atomic=False so prod doesn't lock the billing
  table during build.
- Delete stale workers/tests/test_usage.py that imported the removed
  UsageHelper module.
- SDK1 LLM gains public get_last_usage_record() so downstream code
  stops reaching into _pending_usage across plugin boundaries.
- legacy_executor stamps metadata["lookup_errors"][prompt] on a failed
  lookup outcome for dashboards that surface partial-failure runs.
- extraction_client docstring notes the cloud-only endpoint contract.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 backend/prompt_studio/lookup_utils.py         |  49 +++
 .../output_manager_helper.py                  |  41 ++-
 .../prompt_studio_output_manager_v2/views.py  |  12 +-
 .../migrations/0004_usage_metrics_fields.py   |  10 +-
 .../0005_usage_reason_ref_created_idx.py      |  26 ++
 .../combined-output/CombinedOutput.jsx        |  42 +--
 frontend/src/hooks/usePromptOutput.js         |  15 +-
 unstract/sdk1/src/unstract/sdk1/llm.py        |  11 +
 workers/executor/executors/legacy_executor.py |   8 +
 workers/shared/clients/extraction_client.py   |  18 +-
 workers/tests/test_usage.py                   | 312 ------------------
 11 files changed, 180 insertions(+), 364 deletions(-)
 create mode 100644 backend/usage_v2/migrations/0005_usage_reason_ref_created_idx.py
 delete mode 100644 workers/tests/test_usage.py

diff --git a/backend/prompt_studio/lookup_utils.py b/backend/prompt_studio/lookup_utils.py
index 474f9a5d52..1628384b98 100644
--- a/backend/prompt_studio/lookup_utils.py
+++ b/backend/prompt_studio/lookup_utils.py
@@ -115,6 +115,55 @@ def get_latest_lookup_mutation_for_tool(tool):
         return None
 
 
+def get_original_value_if_enriched(metadata: dict, prompt_key: str):
+    """Return ``(original, lookup_entry)`` for ``prompt_key`` if enriched.
+
+    Opaque wrapper around the cloud plugin's ``lookup_outputs`` metadata
+    shape so OSS callers don't need to know the key names. Returns None
+    when ``metadata`` is not a dict or holds no enrichment for the prompt.
+    """
+    if not isinstance(metadata, dict):
+        return None
+    lookup_outputs = metadata.get("lookup_outputs") or {}
+    prompt_lookup = lookup_outputs.get(prompt_key)
+    if isinstance(prompt_lookup, dict) and "original" in prompt_lookup:
+        return prompt_lookup.get("original"), prompt_lookup
+    return None
+
+
+def attach_combined_output_enrichment(result: dict, enriched_by_key: dict) -> None:
+    """Stamp the combined-output payload with enriched-output metadata.
+
+    OSS ships a stub that ignores the call; cloud reroutes into the payload
+    key its FE plugin expects. Keeping the key name out of OSS lets cloud
+    evolve the shape without OSS-side coordination.
+    """
+    try:
+        from pluggable_apps.lookup_v1.output_enrichment import (
+            attach_combined_output_enrichment as _attach,
+        )
+
+        _attach(result, enriched_by_key)
+    except ImportError:
+        return
+
+
+def extract_prompt_output_enrichment(item) -> dict | None:
+    """Pick enriched-output data off a serialized prompt-output row.
+
+    Returns a plugin-opaque dict (the FE treats it as a black box) or None
+    when no enrichment is present / plugin missing.
+    """
+    try:
+        from pluggable_apps.lookup_v1.output_enrichment import (
+            extract_prompt_output_enrichment as _extract,
+        )
+
+        return _extract(item)
+    except ImportError:
+        return None
+
+
 def get_lookup_validation_for_tool(tool) -> dict:
     """Pre-emptive lookup validation for FE Export / Deploy gating.
 
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
index 056e7feb5d..72805bd1ba 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
@@ -5,7 +5,12 @@
 from django.core.exceptions import ObjectDoesNotExist
 from django.utils import timezone
 
-from prompt_studio.lookup_utils import persist_lookup_output
+from prompt_studio.lookup_utils import (
+    attach_combined_output_enrichment,
+    extract_prompt_output_enrichment,
+    get_original_value_if_enriched,
+    persist_lookup_output,
+)
 from prompt_studio.prompt_profile_manager_v2.models import ProfileManager
 from prompt_studio.prompt_studio_core_v2.exceptions import (
     AnswerFetchError,
@@ -175,13 +180,16 @@ def update_or_create_prompt_output(
             # TODO: use enums here
             output = outputs.get(prompt.prompt_key)
 
-            # If lookup enrichment ran, structured_output contains the enriched
-            # value. Restore the original raw LLM output for the prompt output
-            # table — the enriched value lives in LookupOutputResult instead.
-            lookup_outputs = metadata.get("lookup_outputs", {})
-            prompt_lookup = lookup_outputs.get(prompt.prompt_key)
-            if prompt_lookup and "original" in prompt_lookup:
-                output = prompt_lookup["original"]
+            # If lookup enrichment ran, structured_output contains the
+            # enriched value. Restore the original raw LLM output for the
+            # prompt output table — the enriched value is persisted by the
+            # cloud plugin via persist_lookup_output. Cloud owns the
+            # metadata shape; OSS queries through the bridge.
+            enrichment = get_original_value_if_enriched(metadata, prompt.prompt_key)
+            if enrichment is not None:
+                output, prompt_lookup = enrichment
+            else:
+                prompt_lookup = None
 
             if prompt.enforce_type in {"json", "table", "record", "line-item"}:
                 output = json.dumps(output)
@@ -260,13 +268,13 @@ def fetch_default_output_response(
 
         Returns:
             dict[str, Any]: Formatted JSON response for combined output.
-                Includes a reserved ``_lookup_outputs`` key with per-prompt
-                enriched data when lookups are configured.
+                When lookups are configured, the cloud plugin adds an
+                opaque enrichment payload via ``attach_combined_output_enrichment``.
         """
         from prompt_studio.lookup_utils import enrich_prompt_output
 
         result: dict[str, Any] = {}
-        lookup_outputs: dict[str, Any] = {}
+        enrichment_by_key: dict[str, Any] = {}
 
         for tool_prompt in tool_studio_prompts:
             if tool_prompt.prompt_type == PSOMKeys.NOTES:
@@ -298,15 +306,12 @@ def fetch_default_output_response(
 
                 for output in queryset:
                     result[tool_prompt.prompt_key] = output.output
-                    # Check for lookup enrichment
                     enriched = enrich_prompt_output(output, {})
-                    if "lookup_outputs" in enriched:
-                        lookup_outputs[tool_prompt.prompt_key] = enriched[
-                            "lookup_outputs"
-                        ]
+                    bundle = extract_prompt_output_enrichment(enriched)
+                    if bundle is not None:
+                        enrichment_by_key[tool_prompt.prompt_key] = bundle
             except ObjectDoesNotExist:
                 result[tool_prompt.prompt_key] = ""
 
-        if lookup_outputs:
-            result["_lookup_outputs"] = lookup_outputs
+        attach_combined_output_enrichment(result, enrichment_by_key)
         return result
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/views.py b/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
index 5a31c481dc..ff9818962d 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
@@ -10,6 +10,7 @@
 from rest_framework.versioning import URLPathVersioning
 from utils.common_utils import CommonUtils
 from utils.filtering import FilterHelper
+from utils.user_context import UserContext
 
 from prompt_studio.prompt_studio_output_manager_v2.constants import (
     PromptOutputManagerErrorMessage,
@@ -82,9 +83,15 @@ def latest_outputs_by_keys(self, request: HttpRequest) -> Response:
         if not prompt_keys:
             return Response({}, status=status.HTTP_200_OK)
 
+        # Custom actions don't go through self.filter_queryset(), so
+        # OrganizationFilterBackend does not run. Scope explicitly here via
+        # the tool's organization FK to prevent cross-tenant reads.
+        organization = UserContext.get_organization()
         prompt_id_to_key = dict(
             ToolStudioPrompt.objects.filter(
-                tool_id=tool_id, prompt_key__in=prompt_keys
+                tool_id=tool_id,
+                tool_id__organization=organization,
+                prompt_key__in=prompt_keys,
             ).values_list("prompt_id", "prompt_key")
         )
         if not prompt_id_to_key:
@@ -92,7 +99,8 @@ def latest_outputs_by_keys(self, request: HttpRequest) -> Response:
 
         outputs = (
             PromptStudioOutputManager.objects.filter(
-                prompt_id__in=prompt_id_to_key.keys()
+                prompt_id__in=prompt_id_to_key.keys(),
+                tool_id__organization=organization,
             )
             .exclude(output__isnull=True)
             .exclude(output__exact="")
diff --git a/backend/usage_v2/migrations/0004_usage_metrics_fields.py b/backend/usage_v2/migrations/0004_usage_metrics_fields.py
index 03174f0677..89cf1feb3c 100644
--- a/backend/usage_v2/migrations/0004_usage_metrics_fields.py
+++ b/backend/usage_v2/migrations/0004_usage_metrics_fields.py
@@ -80,11 +80,7 @@ class Migration(migrations.Migration):
                 null=True,
             ),
         ),
-        migrations.AddIndex(
-            model_name="usage",
-            index=models.Index(
-                fields=["llm_usage_reason", "reference_id", "-created_at"],
-                name="idx_usage_reason_ref_created",
-            ),
-        ),
+        # Index creation moved to 0005 so it can run CONCURRENTLY — the usage
+        # table is billing-critical and a plain AddIndex takes a SHARE lock
+        # that blocks writes for the duration of the build on large tables.
     ]
diff --git a/backend/usage_v2/migrations/0005_usage_reason_ref_created_idx.py b/backend/usage_v2/migrations/0005_usage_reason_ref_created_idx.py
new file mode 100644
index 0000000000..043dfa6693
--- /dev/null
+++ b/backend/usage_v2/migrations/0005_usage_reason_ref_created_idx.py
@@ -0,0 +1,26 @@
+from django.contrib.postgres.operations import AddIndexConcurrently
+from django.db import migrations, models
+
+
+class Migration(migrations.Migration):
+    """Build the lookup-usage dashboard index without blocking table writes.
+
+    CONCURRENTLY requires that the migration itself runs outside a
+    transaction, hence atomic = False.
+    """
+
+    atomic = False
+
+    dependencies = [
+        ("usage_v2", "0004_usage_metrics_fields"),
+    ]
+
+    operations = [
+        AddIndexConcurrently(
+            model_name="usage",
+            index=models.Index(
+                fields=["llm_usage_reason", "reference_id", "-created_at"],
+                name="idx_usage_reason_ref_created",
+            ),
+        ),
+    ]
diff --git a/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx b/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
index 20993ffc4b..cb3f8ec1e2 100644
--- a/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
+++ b/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
@@ -47,6 +47,20 @@ try {
   // The component will remain null if it is not available
 }
 
+// Cloud plugin hook — OSS falls back to passthrough helpers that leave
+// the payload untouched and report "no enrichment".
+let splitCombinedData = (data) => ({ combined: data, bundle: null });
+let buildEnrichedFromBundle = () => ({});
+let getEnrichmentFromItem = () => null;
+try {
+  const mod = await import("../../../plugins/lookup-enriched-toggle/helpers");
+  splitCombinedData = mod.splitCombinedData;
+  buildEnrichedFromBundle = mod.buildEnrichedFromBundle;
+  getEnrichmentFromItem = mod.getEnrichmentFromItem;
+} catch {
+  // Plugin unavailable — passthroughs above retain OSS behavior.
+}
+
 function CombinedOutput({ docId, setFilledFields, selectedPrompts }) {
   const {
     details,
@@ -118,26 +132,15 @@ function CombinedOutput({ docId, setFilledFields, selectedPrompts }) {
         const prompts = details?.prompts || [];
 
         if (activeKey === "0" && !isSimplePromptStudio) {
-          const lookupOutputs = data?._lookup_outputs || {};
-          const output = Object.entries(data).reduce((acc, [key, value]) => {
-            if (key === "_lookup_outputs") return acc;
+          const { combined: payload, bundle } = splitCombinedData(data);
+          const output = Object.entries(payload).reduce((acc, [key, value]) => {
             acc[key] = displayPromptResult(value, false);
             return acc;
           }, {});
           setCombinedOutput(output);
-
-          if (Object.keys(lookupOutputs).length > 0) {
-            const enriched = {};
-            for (const [key, val] of Object.entries(output)) {
-              const lookupData = lookupOutputs[key];
-              enriched[key] = lookupData?.output
-                ? displayPromptResult(lookupData.output, false)
-                : val;
-            }
-            setEnrichedOutput(enriched);
-          } else {
-            setEnrichedOutput({});
-          }
+          setEnrichedOutput(
+            buildEnrichedFromBundle(output, bundle, displayPromptResult),
+          );
         } else {
           const output = {};
           const enriched = {};
@@ -157,11 +160,10 @@ function CombinedOutput({ docId, setFilledFields, selectedPrompts }) {
                 ? displayPromptResult(outputDetails?.output, false)
                 : "";
 
-            // Build enriched output from lookup_outputs
-            const lookupData = outputDetails?.lookup_outputs;
-            if (lookupData?.output) {
+            const enrichment = getEnrichmentFromItem(outputDetails);
+            if (enrichment?.output) {
               enriched[item?.prompt_key] = displayPromptResult(
-                lookupData.output,
+                enrichment.output,
                 false,
               );
               hasEnriched = true;
diff --git a/frontend/src/hooks/usePromptOutput.js b/frontend/src/hooks/usePromptOutput.js
index 0e06070b7b..98727a1c1c 100644
--- a/frontend/src/hooks/usePromptOutput.js
+++ b/frontend/src/hooks/usePromptOutput.js
@@ -33,6 +33,16 @@ try {
   // Not available in OSS
 }
 
+// Opaque extractor so the per-item enrichment payload key name lives in
+// the plugin, not OSS. OSS falls back to a no-op.
+let getEnrichmentFromItem = () => null;
+try {
+  const mod = await import("../plugins/lookup-enriched-toggle/helpers");
+  getEnrichmentFromItem = mod.getEnrichmentFromItem;
+} catch {
+  // Plugin unavailable — no-op.
+}
+
 const usePromptOutput = () => {
   const { sessionDetails } = useSessionStore();
   const { setTokenUsage, updateTokenUsage } = useTokenUsageStore();
@@ -135,8 +145,9 @@ const usePromptOutput = () => {
         wordConfidenceData: item?.word_confidence_data,
       };
 
-      if (handleLookupOutput && item?.lookup_outputs) {
-        handleLookupOutput(item.prompt_output_id, item.lookup_outputs);
+      const enrichment = getEnrichmentFromItem(item);
+      if (handleLookupOutput && enrichment) {
+        handleLookupOutput(item.prompt_output_id, enrichment);
       }
 
       if (item?.is_single_pass_extract && isTokenUsageForSinglePassAdded) {
diff --git a/unstract/sdk1/src/unstract/sdk1/llm.py b/unstract/sdk1/src/unstract/sdk1/llm.py
index eb31c52ad6..2b85548cb0 100644
--- a/unstract/sdk1/src/unstract/sdk1/llm.py
+++ b/unstract/sdk1/src/unstract/sdk1/llm.py
@@ -562,6 +562,17 @@ def get_last_usage(self) -> Mapping[str, int]:
             "total_tokens": last["total_tokens"],
         }
 
+    def get_last_usage_record(self) -> dict | None:
+        """Full usage record for the most recent complete() call.
+
+        Returns the complete record (tokens + cost + model + reason
+        metadata) so callers don't have to reach into ``_pending_usage``
+        directly. ``None`` when there are no pending usage records.
+        """
+        if not self._pending_usage:
+            return None
+        return self._pending_usage[-1]
+
     def get_usage_reason(self) -> object:
         return self.platform_kwargs.get("llm_usage_reason")
 
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 185e99e06d..134331a599 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -1907,7 +1907,15 @@ def _run_lookup_enrichment(
             usage_kwargs=usage_kwargs,
         )
         self._usage_records.extend(outcome.usage_records)
+        # Key stays in sync with llm_usage_reason="lookup" set inside
+        # run_with_metrics; metrics are grouped by reason elsewhere.
         metrics.setdefault(prompt_name, {})["lookup_llm"] = outcome.llm_metrics
+        # Surface a prompt-level degraded flag for dashboards that group
+        # partial-failure runs without forcing the executor to error out.
+        if not outcome.success:
+            metadata.setdefault("lookup_errors", {})[prompt_name] = (outcome.error or "")[
+                :2000
+            ]
 
     @staticmethod
     def _run_webhook_postprocessing(
diff --git a/workers/shared/clients/extraction_client.py b/workers/shared/clients/extraction_client.py
index db6781be62..07b839eb32 100644
--- a/workers/shared/clients/extraction_client.py
+++ b/workers/shared/clients/extraction_client.py
@@ -1,7 +1,16 @@
 """Extraction API Client for text extraction callbacks.
 
-Used by the ide_callback worker to persist extraction results
-through the backend's internal API endpoints.
+Used by the ide_callback worker to persist extraction results through
+the backend's internal API endpoints.
+
+NOTE on scope: the callback endpoints ``v1/extraction/extraction-{complete,error}/``
+are currently registered **only** by the cloud ``lookup_v1`` plugin
+(see ``pluggable_apps/lookup_v1/internal_urls.py``). The interface is
+``source``-dispatched and designed to serve other extraction flows
+(prompt-studio docs, connectors) in the future, but in OSS-only builds
+the endpoints are absent. Callers from OSS paths should expect a 404
+response and treat it as a no-op; the worker's error handling covers
+this via a 404-terminal pattern.
 """
 
 import logging
@@ -16,7 +25,10 @@
 
 
 class ExtractionAPIClient(BaseAPIClient):
-    """API client for generic text extraction callback endpoints."""
+    """API client for the extraction-callback endpoints registered by
+    cloud-side plugins (today: lookup_v1). See module docstring for the
+    OSS-absence contract.
+    """
 
     def mark_extraction_complete(
         self,
diff --git a/workers/tests/test_usage.py b/workers/tests/test_usage.py
deleted file mode 100644
index fc08ac825b..0000000000
--- a/workers/tests/test_usage.py
+++ /dev/null
@@ -1,312 +0,0 @@
-"""Phase 2G — Usage tracking tests.
-
-Verifies:
-1. UsageHelper.push_usage_data wraps Audit correctly
-2. Invalid kwargs returns False
-3. Invalid platform_api_key returns False
-4. Audit exceptions are caught and return False
-5. format_float_positional formats correctly
-6. SDK1 adapters already push usage (integration check)
-7. answer_prompt handler returns metrics in ExecutionResult
-"""
-
-from unittest.mock import MagicMock, patch
-
-
-from executor.executors.usage import UsageHelper
-
-
-# ---------------------------------------------------------------------------
-# 1. push_usage_data success
-# ---------------------------------------------------------------------------
-
-
-class TestPushUsageData:
-    @patch("unstract.sdk1.audit.Audit")
-    def test_push_success(self, mock_audit_cls):
-        """Successful push returns True and calls Audit."""
-        mock_audit = MagicMock()
-        mock_audit_cls.return_value = mock_audit
-
-        result = UsageHelper.push_usage_data(
-            event_type="llm",
-            kwargs={"run_id": "run-001", "execution_id": "exec-001"},
-            platform_api_key="test-key",
-            token_counter=MagicMock(),
-            model_name="gpt-4",
-        )
-
-        assert result is True
-        mock_audit.push_usage_data.assert_called_once()
-        call_kwargs = mock_audit.push_usage_data.call_args
-        assert call_kwargs.kwargs["platform_api_key"] == "test-key"
-        assert call_kwargs.kwargs["model_name"] == "gpt-4"
-        assert call_kwargs.kwargs["event_type"] == "llm"
-
-    @patch("unstract.sdk1.audit.Audit")
-    def test_push_passes_token_counter(self, mock_audit_cls):
-        """Token counter is passed through to Audit."""
-        mock_audit = MagicMock()
-        mock_audit_cls.return_value = mock_audit
-        mock_counter = MagicMock()
-
-        UsageHelper.push_usage_data(
-            event_type="embedding",
-            kwargs={"run_id": "run-002"},
-            platform_api_key="key-2",
-            token_counter=mock_counter,
-        )
-
-        call_kwargs = mock_audit.push_usage_data.call_args
-        assert call_kwargs.kwargs["token_counter"] is mock_counter
-
-
-# ---------------------------------------------------------------------------
-# 2. Invalid kwargs
-# ---------------------------------------------------------------------------
-
-
-class TestPushValidation:
-    def test_none_kwargs_returns_false(self):
-        result = UsageHelper.push_usage_data(
-            event_type="llm",
-            kwargs=None,
-            platform_api_key="key",
-        )
-        assert result is False
-
-    def test_empty_kwargs_returns_false(self):
-        result = UsageHelper.push_usage_data(
-            event_type="llm",
-            kwargs={},
-            platform_api_key="key",
-        )
-        assert result is False
-
-    def test_non_dict_kwargs_returns_false(self):
-        result = UsageHelper.push_usage_data(
-            event_type="llm",
-            kwargs="not a dict",
-            platform_api_key="key",
-        )
-        assert result is False
-
-
-# ---------------------------------------------------------------------------
-# 3. Invalid platform_api_key
-# ---------------------------------------------------------------------------
-
-
-class TestPushApiKeyValidation:
-    def test_none_key_returns_false(self):
-        result = UsageHelper.push_usage_data(
-            event_type="llm",
-            kwargs={"run_id": "r1"},
-            platform_api_key=None,
-        )
-        assert result is False
-
-    def test_empty_key_returns_false(self):
-        result = UsageHelper.push_usage_data(
-            event_type="llm",
-            kwargs={"run_id": "r1"},
-            platform_api_key="",
-        )
-        assert result is False
-
-    def test_non_string_key_returns_false(self):
-        result = UsageHelper.push_usage_data(
-            event_type="llm",
-            kwargs={"run_id": "r1"},
-            platform_api_key=12345,
-        )
-        assert result is False
-
-
-# ---------------------------------------------------------------------------
-# 4. Audit exceptions are caught
-# ---------------------------------------------------------------------------
-
-
-class TestPushErrorHandling:
-    @patch("unstract.sdk1.audit.Audit")
-    def test_audit_exception_returns_false(self, mock_audit_cls):
-        """Audit errors are caught and return False."""
-        mock_audit = MagicMock()
-        mock_audit.push_usage_data.side_effect = Exception("Network error")
-        mock_audit_cls.return_value = mock_audit
-
-        result = UsageHelper.push_usage_data(
-            event_type="llm",
-            kwargs={"run_id": "r1"},
-            platform_api_key="key",
-            token_counter=MagicMock(),
-        )
-
-        assert result is False
-
-    @patch("unstract.sdk1.audit.Audit")
-    def test_import_error_returns_false(self, mock_audit_cls):
-        """Import errors are caught gracefully."""
-        mock_audit_cls.side_effect = ImportError("no module")
-
-        result = UsageHelper.push_usage_data(
-            event_type="llm",
-            kwargs={"run_id": "r1"},
-            platform_api_key="key",
-        )
-
-        assert result is False
-
-
-# ---------------------------------------------------------------------------
-# 5. format_float_positional
-# ---------------------------------------------------------------------------
-
-
-class TestFormatFloat:
-    def test_normal_float(self):
-        assert UsageHelper.format_float_positional(0.0001234) == "0.0001234"
-
-    def test_trailing_zeros_removed(self):
-        assert UsageHelper.format_float_positional(1.50) == "1.5"
-
-    def test_integer_value(self):
-        assert UsageHelper.format_float_positional(42.0) == "42"
-
-    def test_zero(self):
-        assert UsageHelper.format_float_positional(0.0) == "0"
-
-    def test_small_value(self):
-        result = UsageHelper.format_float_positional(0.00000001)
-        assert "0.00000001" == result
-
-    def test_custom_precision(self):
-        result = UsageHelper.format_float_positional(1.123456789, precision=3)
-        assert result == "1.123"
-
-
-# ---------------------------------------------------------------------------
-# 6. SDK1 adapters already push usage
-# ---------------------------------------------------------------------------
-
-
-class TestAdapterUsageTracking:
-    def test_llm_calls_audit_push(self):
-        """Verify the LLM adapter imports and calls Audit.push_usage_data.
-
-        This is a static analysis check — we verify the SDK1 LLM module
-        references Audit.push_usage_data, confirming adapters handle
-        usage tracking internally.
-        """
-        import inspect
-
-        from unstract.sdk1.llm import LLM
-
-        source = inspect.getsource(LLM)
-        assert "push_usage_data" in source
-        assert "Audit" in source
-
-
-# ---------------------------------------------------------------------------
-# 7. answer_prompt handler returns metrics
-# ---------------------------------------------------------------------------
-
-
-class TestMetricsInResult:
-    @patch(
-        "unstract.sdk1.utils.indexing.IndexingUtils.generate_index_key",
-        return_value="doc-id-test",
-    )
-    @patch(
-        "executor.executors.legacy_executor.LegacyExecutor._get_prompt_deps"
-    )
-    @patch("executor.executors.legacy_executor.ExecutorToolShim")
-    def test_answer_prompt_returns_metrics(
-        self, mock_shim_cls, mock_get_deps, _mock_idx, tmp_path
-    ):
-        """answer_prompt result includes metrics dict."""
-        from unstract.sdk1.execution.context import ExecutionContext
-        from unstract.sdk1.execution.registry import ExecutorRegistry
-
-        ExecutorRegistry.clear()
-        from executor.executors.legacy_executor import LegacyExecutor
-
-        if "legacy" not in ExecutorRegistry.list_executors():
-            ExecutorRegistry.register(LegacyExecutor)
-
-        executor = ExecutorRegistry.get("legacy")
-
-        # Mock all dependencies
-        mock_llm = MagicMock()
-        mock_llm.get_metrics.return_value = {"total_tokens": 100}
-        mock_llm.get_usage_reason.return_value = "extraction"
-        mock_llm.complete.return_value = {
-            "response": MagicMock(text="test answer"),
-            "highlight_data": [],
-            "confidence_data": None,
-            "word_confidence_data": None,
-            "line_numbers": [],
-            "whisper_hash": "",
-        }
-
-        mock_llm_cls = MagicMock(return_value=mock_llm)
-        mock_index = MagicMock()
-        mock_index.return_value.generate_index_key.return_value = "doc-123"
-
-        mock_get_deps.return_value = (
-            MagicMock(),   # AnswerPromptService — use real for construct
-            MagicMock(),   # RetrievalService
-            MagicMock(),   # VariableReplacementService
-            mock_index,    # Index
-            mock_llm_cls,  # LLM
-            MagicMock(),   # EmbeddingCompat
-            MagicMock(),   # VectorDB
-        )
-
-        # Patch AnswerPromptService methods at their real location
-        with patch(
-            "executor.executors.answer_prompt.AnswerPromptService.extract_variable",
-            return_value="test prompt",
-        ), patch(
-            "executor.executors.answer_prompt.AnswerPromptService.construct_and_run_prompt",
-            return_value="test answer",
-        ):
-            ctx = ExecutionContext(
-                executor_name="legacy",
-                operation="answer_prompt",
-                run_id="run-metrics-001",
-                execution_source="tool",
-                organization_id="org-test",
-                request_id="req-metrics-001",
-                executor_params={
-                    "tool_settings": {},
-                    "outputs": [
-                        {
-                            "name": "field1",
-                            "prompt": "What is X?",
-                            "chunk-size": 512,
-                            "chunk-overlap": 64,
-                            "vector-db": "vdb-1",
-                            "embedding": "emb-1",
-                            "x2text_adapter": "x2t-1",
-                            "llm": "llm-1",
-                            "type": "text",
-                            "retrieval-strategy": "simple",
-                            "similarity-top-k": 5,
-                        },
-                    ],
-                    "tool_id": "tool-1",
-                    "file_hash": "hash123",
-                    "file_path": str(tmp_path / "test.txt"),
-                    "file_name": "test.txt",
-                    "PLATFORM_SERVICE_API_KEY": "test-key",
-                },
-            )
-            result = executor.execute(ctx)
-
-        assert result.success is True
-        assert "metrics" in result.data
-        assert "field1" in result.data["metrics"]
-
-        ExecutorRegistry.clear()

From baaf2039a64b3eccaf44bbb946c82bfdb2cda052 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Fri, 24 Apr 2026 14:26:19 +0530
Subject: [PATCH 26/57] =?UTF-8?q?UN-2946=20[REFACTOR]=20Round-3=20review?=
 =?UTF-8?q?=20fixes=20=E2=80=94=20OSS=20side?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Module-level probe in prompt_studio/lookup_utils.py — swap per-function
  try/except ImportError for a single LOOKUPS_AVAILABLE flag. Add
  attach_lookup_config / attach_lookup_configs_to_tool_settings /
  get_lookup_config_from_output helpers so the lookup_config and
  lookup_configs key stamping routes through the bridge instead of being
  hardcoded at each OSS call site (the direct metadata["lookup_errors"]
  write is removed from OSS separately; see the legacy_executor.py item).
- Reject org=None in UsageBatchCreateView (usage_v2/internal_views.py).
- Lift useLookupExportGate to a single mount in ToolIde.jsx; thread
  checkLookups down into custom-tools/header/Header.jsx (eliminates
  the double modal-portal risk).
- Delete the direct metadata["lookup_errors"] write from
  workers/executor/executors/legacy_executor.py — flat summary is now
  stamped by LookupEnrichment.write_lookup_error in the cloud plugin.
  Replace hardcoded "lookup_llm" metrics key with lookup_cls.METRICS_KEY.
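- Trim boilerplate comments across CombinedOutput, PromptCardItems,
  PromptOutput, usePromptOutput, prompt-card/Header, CustomToolsHelper,
  SideNavBar — keep the why-comments, drop the what-comments.
- Stop swallowing failures silently: log a warning (with traceback) when
  cost computation fails in sdk1/llm.py and when the embedding usage
  flush fails in legacy_executor.py; log the record count and traceback
  in usage_client.bulk_create_usage. Also make is_success in
  usage_client.py read self.success instead of self.success_response.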
---
 backend/prompt_studio/lookup_utils.py         | 155 ++++++++----------
 .../prompt_studio_helper.py                   |  16 +-
 .../prompt_studio_registry_helper.py          |   7 +-
 backend/usage_v2/internal_views.py            |  15 +-
 .../combined-output/CombinedOutput.jsx        |   4 +-
 .../components/custom-tools/header/Header.jsx |  31 +---
 .../custom-tools/prompt-card/Header.jsx       |   4 +-
 .../prompt-card/PromptCardItems.jsx           |   4 +-
 .../custom-tools/prompt-card/PromptOutput.jsx |   8 +-
 .../custom-tools/tool-ide/ToolIde.jsx         |  13 +-
 .../helpers/custom-tools/CustomToolsHelper.js |   4 +-
 .../navigations/side-nav-bar/SideNavBar.jsx   |   4 +-
 frontend/src/hooks/usePromptOutput.js         |   8 +-
 unstract/sdk1/src/unstract/sdk1/llm.py        |   5 +
 workers/executor/executors/legacy_executor.py |  16 +-
 workers/shared/clients/usage_client.py        |   8 +-
 16 files changed, 137 insertions(+), 165 deletions(-)

diff --git a/backend/prompt_studio/lookup_utils.py b/backend/prompt_studio/lookup_utils.py
index 1628384b98..7a1d6b4850 100644
--- a/backend/prompt_studio/lookup_utils.py
+++ b/backend/prompt_studio/lookup_utils.py
@@ -1,36 +1,39 @@
 """Shared utility for lookup operations.
 
-Wraps cloud-only lookup calls so that OSS callers don't repeat
-the try/except ImportError guard. All functions are no-ops in OSS.
+Wraps cloud-only lookup calls so that OSS callers don't repeat the
+try/except ImportError guard. All functions are no-ops in OSS. A single
+module-level probe decides availability so downstream errors inside the
+cloud plugin surface instead of being silently swallowed as ImportError.
 """
 
 import logging
 
 logger = logging.getLogger(__name__)
 
+try:
+    from pluggable_apps.lookup_v1 import execution as _execution
+    from pluggable_apps.lookup_v1 import output_enrichment as _output_enrichment
+    from pluggable_apps.lookup_v1 import staleness as _staleness
+    from pluggable_apps.lookup_v1 import validation as _validation
+    from pluggable_apps.lookup_v1.models import LookupOutputResult as _LookupOutputResult
+
+    LOOKUPS_AVAILABLE = True
+except ImportError:
+    LOOKUPS_AVAILABLE = False
+
 
 def get_lookup_config(prompt) -> dict | None:
     """Return lookup config for a prompt, or None if lookups are unavailable."""
-    try:
-        from pluggable_apps.lookup_v1.execution import (
-            build_lookup_config_for_prompt,
-        )
-
-        return build_lookup_config_for_prompt(prompt)
-    except ImportError:
+    if not LOOKUPS_AVAILABLE:
         return None
+    return _execution.build_lookup_config_for_prompt(prompt)
 
 
 def get_lookup_configs_for_tool(tool) -> list[dict] | None:
     """Return lookup configs for a tool (single pass), or None in OSS."""
-    try:
-        from pluggable_apps.lookup_v1.execution import (
-            build_lookup_configs_for_tool,
-        )
-
-        return build_lookup_configs_for_tool(tool)
-    except ImportError:
+    if not LOOKUPS_AVAILABLE:
         return None
+    return _execution.build_lookup_configs_for_tool(tool)
 
 
 def get_multi_var_lookups_for_tool(tool, prompt_ids=None) -> list[str]:
@@ -40,36 +43,31 @@ def get_multi_var_lookups_for_tool(tool, prompt_ids=None) -> list[str]:
     so single / bulk runs only block when a lookup the run actually uses
     is multi-variable.
     """
-    try:
-        from pluggable_apps.lookup_v1.execution import has_multi_var_lookups
-
-        _, names = has_multi_var_lookups(tool, prompt_ids=prompt_ids)
-        return names
-    except ImportError:
+    if not LOOKUPS_AVAILABLE:
         return []
+    _, names = _execution.has_multi_var_lookups(tool, prompt_ids=prompt_ids)
+    return names
 
 
 def persist_lookup_output(prompt_output, prompt_lookup: dict) -> None:
     """Persist lookup enrichment result. No-op in OSS."""
-    try:
-        from pluggable_apps.lookup_v1.models import LookupOutputResult
-
-        lookup_meta = prompt_lookup.get("meta", {})
-        lookup_id = lookup_meta.get("lookup_id")
-        if lookup_id:
-            defaults = {
-                "lookup_definition_id": lookup_id,
-                "output": prompt_lookup.get("enriched", ""),
-            }
-            version_id = lookup_meta.get("version_id")
-            if version_id:
-                defaults["version_id"] = version_id
-            LookupOutputResult.objects.update_or_create(
-                prompt_output=prompt_output,
-                defaults=defaults,
-            )
-    except ImportError:
-        pass
+    if not LOOKUPS_AVAILABLE:
+        return
+    lookup_meta = prompt_lookup.get("meta", {})
+    lookup_id = lookup_meta.get("lookup_id")
+    if not lookup_id:
+        return
+    defaults = {
+        "lookup_definition_id": lookup_id,
+        "output": prompt_lookup.get("enriched", ""),
+    }
+    version_id = lookup_meta.get("version_id")
+    if version_id:
+        defaults["version_id"] = version_id
+    _LookupOutputResult.objects.update_or_create(
+        prompt_output=prompt_output,
+        defaults=defaults,
+    )
 
 
 def enrich_prompt_output(prompt_output, data: dict) -> dict:
@@ -77,26 +75,16 @@ def enrich_prompt_output(prompt_output, data: dict) -> dict:
 
     No-op in OSS.
     """
-    try:
-        from pluggable_apps.lookup_v1.output_enrichment import (
-            enrich_with_lookup_output,
-        )
-
-        return enrich_with_lookup_output(prompt_output, data)
-    except ImportError:
+    if not LOOKUPS_AVAILABLE:
         return data
+    return _output_enrichment.enrich_with_lookup_output(prompt_output, data)
 
 
 def validate_lookups_for_export(prompts) -> tuple[dict, str | None]:
     """Validate lookup assignments before export. Returns ({}, None) in OSS."""
-    try:
-        from pluggable_apps.lookup_v1.validation import (
-            validate_lookups_for_export as _validate,
-        )
-
-        return _validate(prompts)
-    except ImportError:
+    if not LOOKUPS_AVAILABLE:
         return {}, None
+    return _validation.validate_lookups_for_export(prompts)
 
 
 def get_latest_lookup_mutation_for_tool(tool):
@@ -105,14 +93,9 @@ def get_latest_lookup_mutation_for_tool(tool):
 
     Returns None if lookups are unavailable or nothing is linked.
     """
-    try:
-        from pluggable_apps.lookup_v1.staleness import (
-            get_latest_lookup_mutation_for_tool as _get,
-        )
-
-        return _get(tool)
-    except ImportError:
+    if not LOOKUPS_AVAILABLE:
         return None
+    return _staleness.get_latest_lookup_mutation_for_tool(tool)
 
 
 def get_original_value_if_enriched(metadata: dict, prompt_key: str):
@@ -138,14 +121,9 @@ def attach_combined_output_enrichment(result: dict, enriched_by_key: dict) -> No
     key its FE plugin expects. Keeping the key name out of OSS lets cloud
     evolve the shape without OSS-side coordination.
     """
-    try:
-        from pluggable_apps.lookup_v1.output_enrichment import (
-            attach_combined_output_enrichment as _attach,
-        )
-
-        _attach(result, enriched_by_key)
-    except ImportError:
+    if not LOOKUPS_AVAILABLE:
         return
+    _output_enrichment.attach_combined_output_enrichment(result, enriched_by_key)
 
 
 def extract_prompt_output_enrichment(item) -> dict | None:
@@ -154,14 +132,9 @@ def extract_prompt_output_enrichment(item) -> dict | None:
     Returns a plugin-opaque dict (the FE treats it as a black box) or None
     when no enrichment is present / plugin missing.
     """
-    try:
-        from pluggable_apps.lookup_v1.output_enrichment import (
-            extract_prompt_output_enrichment as _extract,
-        )
-
-        return _extract(item)
-    except ImportError:
+    if not LOOKUPS_AVAILABLE:
         return None
+    return _output_enrichment.extract_prompt_output_enrichment(item)
 
 
 def get_lookup_validation_for_tool(tool) -> dict:
@@ -169,13 +142,7 @@ def get_lookup_validation_for_tool(tool) -> dict:
 
     Returns an "always ok" payload in OSS so the FE gate is a no-op.
     """
-    try:
-        from pluggable_apps.lookup_v1.validation import (
-            get_lookup_validation_for_tool as _validate,
-        )
-
-        return _validate(tool)
-    except ImportError:
+    if not LOOKUPS_AVAILABLE:
         return {
             "ok": True,
             "draft_lookups": [],
@@ -184,3 +151,25 @@ def get_lookup_validation_for_tool(tool) -> dict:
                 getattr(tool, "single_pass_extraction_mode", False)
             ),
         }
+    return _validation.get_lookup_validation_for_tool(tool)
+
+
+def attach_lookup_config(output: dict, config: dict) -> None:
+    """Stamp a per-prompt output dict with the lookup config payload.
+
+    Keeps the payload key name owned by the bridge so OSS call sites
+    don't encode the contract.
+    """
+    output["lookup_config"] = config
+
+
+def attach_lookup_configs_to_tool_settings(
+    tool_settings: dict, configs: list[dict]
+) -> None:
+    """Stamp tool_settings with the per-tool lookup configs list."""
+    tool_settings["lookup_configs"] = configs
+
+
+def get_lookup_config_from_output(output: dict) -> dict | None:
+    """Read the lookup config stamped on a prompt output, if any."""
+    return output.get("lookup_config")
diff --git a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
index ee8f1a4c8b..50aacb48cb 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
@@ -20,7 +20,12 @@
 from utils.local_context import StateStore
 
 from backend.celery_service import app as celery_app
-from prompt_studio.lookup_utils import get_lookup_config, get_lookup_configs_for_tool
+from prompt_studio.lookup_utils import (
+    attach_lookup_config,
+    attach_lookup_configs_to_tool_settings,
+    get_lookup_config,
+    get_lookup_configs_for_tool,
+)
 from prompt_studio.prompt_profile_manager_v2.models import ProfileManager
 from prompt_studio.prompt_profile_manager_v2.profile_manager_helper import (
     ProfileManagerHelper,
@@ -389,7 +394,7 @@ def _build_prompt_output(
             output[TSPKeys.POSTPROCESSING_WEBHOOK_URL] = webhook_url
 
         if lookup_config := get_lookup_config(prompt):
-            output["lookup_config"] = lookup_config
+            attach_lookup_config(output, lookup_config)
 
         output[TSPKeys.EVAL_SETTINGS] = {}
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_EVALUATE] = prompt.evaluate
@@ -803,7 +808,7 @@ def build_fetch_response_payload(
             output[TSPKeys.POSTPROCESSING_WEBHOOK_URL] = webhook_url
 
         if lookup_config := get_lookup_config(prompt):
-            output["lookup_config"] = lookup_config
+            attach_lookup_config(output, lookup_config)
 
         output[TSPKeys.EVAL_SETTINGS] = {}
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_EVALUATE] = prompt.evaluate
@@ -1173,10 +1178,9 @@ def build_single_pass_payload(
             TSPKeys.SIMILARITY_TOP_K: default_profile.similarity_top_k,
         }
 
-        # Inject lookup configs for single pass enrichment
         lookup_configs = get_lookup_configs_for_tool(tool)
         if lookup_configs:
-            tool_settings["lookup_configs"] = lookup_configs
+            attach_lookup_configs_to_tool_settings(tool_settings, lookup_configs)
 
         for p in prompts:
             if not p.prompt:
@@ -1906,7 +1910,7 @@ def _fetch_response(
         if webhook_enabled:
             output[TSPKeys.POSTPROCESSING_WEBHOOK_URL] = webhook_url
         if lookup_config := get_lookup_config(prompt):
-            output["lookup_config"] = lookup_config
+            attach_lookup_config(output, lookup_config)
         # Eval settings for the prompt
         output[TSPKeys.EVAL_SETTINGS] = {}
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_EVALUATE] = prompt.evaluate
diff --git a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
index 92cfb6e160..50480493c4 100644
--- a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
+++ b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
@@ -7,7 +7,10 @@
 from django.db import IntegrityError
 from plugins import get_plugin
 
-from prompt_studio.lookup_utils import validate_lookups_for_export
+from prompt_studio.lookup_utils import (
+    attach_lookup_config,
+    validate_lookups_for_export,
+)
 from prompt_studio.prompt_profile_manager_v2.models import ProfileManager
 from prompt_studio.prompt_studio_core_v2.models import CustomTool
 from prompt_studio.prompt_studio_core_v2.prompt_studio_helper import PromptStudioHelper
@@ -363,7 +366,7 @@ def frame_export_json(
             )
             prompt_id_str = str(prompt.prompt_id)
             if prompt_id_str in lookup_configs:
-                output["lookup_config"] = lookup_configs[prompt_id_str]
+                attach_lookup_config(output, lookup_configs[prompt_id_str])
             # Retaining the old fields in condition
             # for backward compatibility. To be removed in future.
             if (
diff --git a/backend/usage_v2/internal_views.py b/backend/usage_v2/internal_views.py
index ca6642b443..6d840e7e03 100644
--- a/backend/usage_v2/internal_views.py
+++ b/backend/usage_v2/internal_views.py
@@ -145,8 +145,21 @@ def post(self, request: Request) -> JsonResponse:
         if not records:
             return JsonResponse({"created": 0}, status=200)
 
-        # Resolved by InternalAPIAuthMiddleware via StateStore
         organization = UserContext.get_organization()
+        if organization is None:
+            logger.error(
+                "UsageBatchCreateView received %d records with no organization; "
+                "refusing to write rows that would be invisible to tenant dashboards",
+                len(records),
+            )
+            return JsonResponse(
+                {
+                    "success": False,
+                    "error": "Organization context missing. "
+                    "Worker must send X-Organization-ID.",
+                },
+                status=status.HTTP_400_BAD_REQUEST,
+            )
 
         usage_objects = []
         for r in records:
diff --git a/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx b/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
index cb3f8ec1e2..7cd217778f 100644
--- a/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
+++ b/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
@@ -57,9 +57,7 @@ try {
   splitCombinedData = mod.splitCombinedData;
   buildEnrichedFromBundle = mod.buildEnrichedFromBundle;
   getEnrichmentFromItem = mod.getEnrichmentFromItem;
-} catch {
-  // Plugin unavailable — passthroughs above retain OSS behavior.
-}
+} catch {}
 
 function CombinedOutput({ docId, setFilledFields, selectedPrompts }) {
   const {
diff --git a/frontend/src/components/custom-tools/header/Header.jsx b/frontend/src/components/custom-tools/header/Header.jsx
index 5421f299b6..471588a4b2 100644
--- a/frontend/src/components/custom-tools/header/Header.jsx
+++ b/frontend/src/components/custom-tools/header/Header.jsx
@@ -18,47 +18,33 @@ import "./Header.css";
 let SinglePassToggleSwitch;
 let CloneButton;
 let PromptShareButton;
-let useLookupExportGate = () => ({
-  checkLookups: () => Promise.resolve(true),
-  modalEl: null,
-});
 try {
   const mod = await import(
     "../../../plugins/single-pass-toggle-switch/SinglePassToggleSwitch"
   );
   SinglePassToggleSwitch = mod.SinglePassToggleSwitch;
-} catch {
-  // The variable will remain undefined if the component is not available.
-}
-try {
-  const mod = await import(
-    "../../../plugins/lookup-studio/hooks/useLookupExportGate"
-  );
-  useLookupExportGate = mod.useLookupExportGate;
-} catch {
-  // OSS — gate stays a no-op resolving true.
-}
+} catch {}
 try {
   const mod = await import(
     "../../../plugins/prompt-studio-public-share/public-share-btn/PromptShareButton.jsx"
   );
   PromptShareButton = mod.PromptShareButton;
-} catch {
-  // The variable will remain undefined if the component is not available.
-}
+} catch {}
 try {
   const mod = await import(
     "../../../plugins/prompt-studio-clone/clone-btn/CloneButton.jsx"
   );
   CloneButton = mod.CloneButton;
-} catch {
-  // The variable will remain undefined if the component is not available.
-}
+} catch {}
+
+const noopCheckLookups = () => Promise.resolve(true);
+
 function Header({
   setOpenSettings,
   handleUpdateTool,
   setOpenShareModal,
   setOpenCloneModal,
+  checkLookups = noopCheckLookups,
 }) {
   const [isExportLoading, setIsExportLoading] = useState(false);
   const { details, isPublicSource, markChangesAsExported } =
@@ -84,7 +70,6 @@ function Header({
   const [isApiDeploymentLoading, setIsApiDeploymentLoading] = useState(false);
   const [editModalOpen, setEditModalOpen] = useState(false);
   const [editForm] = Form.useForm();
-  const { checkLookups, modalEl: lookupGateModalEl } = useLookupExportGate();
 
   const handleExport = (
     selectedUsers,
@@ -441,7 +426,6 @@ function Header({
 
   return (
     <>
-      {lookupGateModalEl}
       <ToolNavBar
         title={details?.tool_name || ""}
         subtitle={isPublicSource ? undefined : details?.description}
@@ -547,6 +531,7 @@ Header.propTypes = {
   handleUpdateTool: PropTypes.func.isRequired,
   setOpenCloneModal: PropTypes.func.isRequired,
   setOpenShareModal: PropTypes.func.isRequired,
+  checkLookups: PropTypes.func,
 };
 
 export { Header };
diff --git a/frontend/src/components/custom-tools/prompt-card/Header.jsx b/frontend/src/components/custom-tools/prompt-card/Header.jsx
index b8d7a1707e..830b93081e 100644
--- a/frontend/src/components/custom-tools/prompt-card/Header.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/Header.jsx
@@ -47,9 +47,7 @@ try {
     "../../../plugins/lookup-studio/prompt-card/LookupMenuItem"
   );
   LookupMenuItem = mod.LookupMenuItem;
-} catch {
-  // Not available in OSS
-}
+} catch {}
 
 function Header({
   promptDetails,
diff --git a/frontend/src/components/custom-tools/prompt-card/PromptCardItems.jsx b/frontend/src/components/custom-tools/prompt-card/PromptCardItems.jsx
index 40439bce55..c8379a0b1d 100644
--- a/frontend/src/components/custom-tools/prompt-card/PromptCardItems.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/PromptCardItems.jsx
@@ -36,9 +36,7 @@ try {
     "../../../plugins/lookup-studio/prompt-card/LookupIndicator"
   );
   LookupIndicator = mod.LookupIndicator;
-} catch {
-  // Not available in OSS
-}
+} catch {}
 
 function PromptCardItems({
   promptDetails,
diff --git a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
index a1e492bb29..e515767e85 100644
--- a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
@@ -57,9 +57,7 @@ try {
     "../../../plugins/lookup-studio/prompt-card/LookupOutputTabs"
   );
   LookupOutputTabs = mod.LookupOutputTabs;
-} catch {
-  // Not available in OSS
-}
+} catch {}
 
 let getEnrichedCopyText;
 try {
@@ -67,9 +65,7 @@ try {
     "../../../plugins/lookup-studio/prompt-card/getEnrichedCopyText"
   );
   getEnrichedCopyText = mod.getEnrichedCopyText;
-} catch {
-  // Not available in OSS
-}
+} catch {}
 
 // Wraps children in LookupOutputTabs when available (cloud),
 // passes through children directly in OSS.
diff --git a/frontend/src/components/custom-tools/tool-ide/ToolIde.jsx b/frontend/src/components/custom-tools/tool-ide/ToolIde.jsx
index ab87f6f19c..483ebd80f4 100644
--- a/frontend/src/components/custom-tools/tool-ide/ToolIde.jsx
+++ b/frontend/src/components/custom-tools/tool-ide/ToolIde.jsx
@@ -47,17 +47,13 @@ try {
 
 // Cloud-only hook that seeds hasUnsavedChanges from server-side
 // lookup-staleness. No-op stub in OSS.
-let useLookupDirtySeed = () => {
-  // no-op
-};
+let useLookupDirtySeed = () => {};
 try {
   const mod = await import(
     "../../../plugins/lookup-studio/hooks/useLookupDirtySeed.js"
   );
   useLookupDirtySeed = mod.useLookupDirtySeed;
-} catch {
-  // Do nothing if plugin is not loaded.
-}
+} catch {}
 
 // Cloud-only lookup export validation gate. OSS stub resolves true so
 // the reminder bar's "Export" button proceeds directly.
@@ -70,9 +66,7 @@ try {
     "../../../plugins/lookup-studio/hooks/useLookupExportGate"
   );
   useLookupExportGate = mod.useLookupExportGate;
-} catch {
-  // OSS — gate stays a no-op resolving true.
-}
+} catch {}
 
 function ToolIde() {
   const [openSettings, setOpenSettings] = useState(false);
@@ -387,6 +381,7 @@ function ToolIde() {
         setOpenSettings={setOpenSettings}
         setOpenShareModal={setOpenShareModal}
         setOpenCloneModal={setOpenCloneModal}
+        checkLookups={checkLookups}
       />
       <div
         className={isPublicSource ? "public-tool-ide-body" : "tool-ide-body"}
diff --git a/frontend/src/components/helpers/custom-tools/CustomToolsHelper.js b/frontend/src/components/helpers/custom-tools/CustomToolsHelper.js
index 1c0f8efeab..a917c30b77 100644
--- a/frontend/src/components/helpers/custom-tools/CustomToolsHelper.js
+++ b/frontend/src/components/helpers/custom-tools/CustomToolsHelper.js
@@ -30,9 +30,7 @@ try {
   fetchLookupAssignments = mod.fetchLookupAssignments;
   fetchLookupOutputs = mod.fetchLookupOutputs;
   resetLookupAssignments = mod.resetLookupAssignments;
-} catch {
-  // Lookup feature not available in OSS
-}
+} catch {}
 function CustomToolsHelper() {
   const [isLoading, setIsLoading] = useState(true);
   const { id } = useParams();
diff --git a/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx b/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
index 7cecc20333..724c241e7c 100644
--- a/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
+++ b/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
@@ -93,9 +93,7 @@ let lookupStudioEnabled = false;
 try {
   await import("../../../plugins/lookup-studio");
   lookupStudioEnabled = true;
-} catch {
-  // Plugin unavailable
-}
+} catch {}
 
 let manualReviewSettingsEnabled = false;
 try {
diff --git a/frontend/src/hooks/usePromptOutput.js b/frontend/src/hooks/usePromptOutput.js
index 98727a1c1c..b4951dd45a 100644
--- a/frontend/src/hooks/usePromptOutput.js
+++ b/frontend/src/hooks/usePromptOutput.js
@@ -29,9 +29,7 @@ try {
     "../plugins/lookup-studio/prompt-card/handleLookupOutput"
   );
   handleLookupOutput = mod.handleLookupOutput;
-} catch {
-  // Not available in OSS
-}
+} catch {}
 
 // Opaque extractor so the per-item enrichment payload key name lives in
 // the plugin, not OSS. OSS falls back to a no-op.
@@ -39,9 +37,7 @@ let getEnrichmentFromItem = () => null;
 try {
   const mod = await import("../plugins/lookup-enriched-toggle/helpers");
   getEnrichmentFromItem = mod.getEnrichmentFromItem;
-} catch {
-  // Plugin unavailable — no-op.
-}
+} catch {}
 
 const usePromptOutput = () => {
   const { sessionDetails } = useSessionStore();
diff --git a/unstract/sdk1/src/unstract/sdk1/llm.py b/unstract/sdk1/src/unstract/sdk1/llm.py
index 2b85548cb0..3b015b3c54 100644
--- a/unstract/sdk1/src/unstract/sdk1/llm.py
+++ b/unstract/sdk1/src/unstract/sdk1/llm.py
@@ -614,6 +614,11 @@ def _record_usage(
             )
             cost = prompt_cost + compl_cost
         except Exception:
+            logger.warning(
+                "Failed to compute cost for model=%s; recording as 0.0",
+                model,
+                exc_info=True,
+            )
             cost = 0.0
 
         # Strip provider prefix (e.g. "azure/gpt-4o" → "gpt-4o") for storage,
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 134331a599..5966f4bf4a 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -1710,14 +1710,16 @@ def _execute_single_prompt(
                 }
             )
             self._usage_records.extend(llm.flush_pending_usage())
-            # Flush embedding usage from callback handlers
             if chunk_size > 0:
                 try:
                     for handler in embedding.callback_manager.handlers:
                         if hasattr(handler, "flush_pending_usage"):
                             self._usage_records.extend(handler.flush_pending_usage())
                 except Exception:
-                    pass
+                    logger.warning(
+                        "Failed to flush embedding usage from callback handlers",
+                        exc_info=True,
+                    )
             if vector_db:
                 vector_db.close()
 
@@ -1907,15 +1909,7 @@ def _run_lookup_enrichment(
             usage_kwargs=usage_kwargs,
         )
         self._usage_records.extend(outcome.usage_records)
-        # Key stays in sync with llm_usage_reason="lookup" set inside
-        # run_with_metrics; metrics are grouped by reason elsewhere.
-        metrics.setdefault(prompt_name, {})["lookup_llm"] = outcome.llm_metrics
-        # Surface a prompt-level degraded flag for dashboards that group
-        # partial-failure runs without forcing the executor to error out.
-        if not outcome.success:
-            metadata.setdefault("lookup_errors", {})[prompt_name] = (outcome.error or "")[
-                :2000
-            ]
+        metrics.setdefault(prompt_name, {})[lookup_cls.METRICS_KEY] = outcome.llm_metrics
 
     @staticmethod
     def _run_webhook_postprocessing(
diff --git a/workers/shared/clients/usage_client.py b/workers/shared/clients/usage_client.py
index f61f65e27a..1fc87eb0dc 100644
--- a/workers/shared/clients/usage_client.py
+++ b/workers/shared/clients/usage_client.py
@@ -71,7 +71,7 @@ def error_response(
 
     def is_success(self) -> bool:
         """Check if the response indicates success."""
-        return self.success_response and self.status == ResponseStatus.SUCCESS
+        return self.success and self.status == ResponseStatus.SUCCESS
 
 
 @dataclass
@@ -192,8 +192,10 @@ def bulk_create_usage(
                 organization_id=organization_id,
             )
             return response.get("success", False) or "created" in response
-        except Exception as e:
-            logger.error("Failed to bulk create usage records: %s", e)
+        except Exception:
+            logger.error(
+                "Failed to bulk create %d usage records", len(records), exc_info=True
+            )
             return False
 
     def get_aggregated_pages_processed(

From 1ce0d6e480738c43ef47e6aa816c50874d4a3063 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Sat, 25 Apr 2026 03:41:31 +0530
Subject: [PATCH 27/57] =?UTF-8?q?UN-2946=20[FEAT]=20Reference=20prompts=20?=
 =?UTF-8?q?by=20UUID=20+=20missing-file=20gate=20=E2=80=94=20OSS=20side?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

OSS counterpart to the cloud-side data-model change. Wires the prompt
studio runtime to the new wire shape, surfaces lookup runnability state
in the prompt card, and adds the usage_v2 enum entries the cloud side
records against (lookup as an LLM usage reason, lookup_version as a
reference type).

Partially working — known follow-up:
TODO: rework lookup input UX. The current variable-mapping flow is awkward
(separate rows, manual prompt selection per variable); needs a redesign that
mirrors how users actually compose a lookup template.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 backend/prompt_studio/lookup_utils.py         | 11 +++--
 .../prompt_studio_helper.py                   |  9 +++-
 ...6_alter_usage_llm_usage_reason_and_more.py | 42 +++++++++++++++++++
 .../custom-tools/prompt-card/Header.jsx       | 40 ++++++++++++++++--
 .../prompt-card/RunAllPrompts.jsx             |  3 ++
 5 files changed, 97 insertions(+), 8 deletions(-)
 create mode 100644 backend/usage_v2/migrations/0006_alter_usage_llm_usage_reason_and_more.py

diff --git a/backend/prompt_studio/lookup_utils.py b/backend/prompt_studio/lookup_utils.py
index 7a1d6b4850..06145d7e22 100644
--- a/backend/prompt_studio/lookup_utils.py
+++ b/backend/prompt_studio/lookup_utils.py
@@ -29,11 +29,16 @@ def get_lookup_config(prompt) -> dict | None:
     return _execution.build_lookup_config_for_prompt(prompt)
 
 
-def get_lookup_configs_for_tool(tool) -> list[dict] | None:
-    """Return lookup configs for a tool (single pass), or None in OSS."""
+def get_lookup_configs_for_tool(tool, prompts=None) -> list[dict] | None:
+    """Return lookup configs for a tool (single pass), or None in OSS.
+
+    ``prompts`` scopes the build+validation to the prompts actually
+    participating in the run so an unrelated incomplete assignment on
+    the tool doesn't block it.
+    """
     if not LOOKUPS_AVAILABLE:
         return None
-    return _execution.build_lookup_configs_for_tool(tool)
+    return _execution.build_lookup_configs_for_tool(tool, prompts=prompts)
 
 
 def get_multi_var_lookups_for_tool(tool, prompt_ids=None) -> list[str]:
diff --git a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
index 50aacb48cb..1a4130f199 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
@@ -14,6 +14,7 @@
 from django.db import transaction
 from django.db.models.manager import BaseManager
 from plugins import get_plugin
+from rest_framework.exceptions import APIException
 from rest_framework.request import Request
 from utils.file_storage.constants import FileStorageKeys
 from utils.file_storage.helpers.prompt_studio_file_helper import PromptStudioFileHelper
@@ -1178,7 +1179,7 @@ def build_single_pass_payload(
             TSPKeys.SIMILARITY_TOP_K: default_profile.similarity_top_k,
         }
 
-        lookup_configs = get_lookup_configs_for_tool(tool)
+        lookup_configs = get_lookup_configs_for_tool(tool, prompts=prompts)
         if lookup_configs:
             attach_lookup_configs_to_tool_settings(tool_settings, lookup_configs)
 
@@ -1605,6 +1606,9 @@ def _execute_single_prompt(
                 is_single_pass=False,
                 profile_manager_id=profile_manager_id,
             )
+        except APIException:
+            # Validation responses are user-facing; DRF renders them as-is.
+            raise
         except Exception as e:
             logger.error(
                 f"[{tool.tool_id}] Error while fetching response for "
@@ -1670,6 +1674,9 @@ def _execute_prompts_in_single_pass(
                 document_id=document_id,
                 is_single_pass=True,
             )
+        except APIException:
+            # Validation responses are user-facing; DRF renders them as-is.
+            raise
         except Exception as e:
             logger.error(
                 f"[{tool.tool_id}] Error while fetching single pass response: {e}"
diff --git a/backend/usage_v2/migrations/0006_alter_usage_llm_usage_reason_and_more.py b/backend/usage_v2/migrations/0006_alter_usage_llm_usage_reason_and_more.py
new file mode 100644
index 0000000000..0df32ac2b8
--- /dev/null
+++ b/backend/usage_v2/migrations/0006_alter_usage_llm_usage_reason_and_more.py
@@ -0,0 +1,42 @@
+# Generated by Django 4.2.1 on 2026-04-24 20:16
+
+from django.db import migrations, models
+
+
+class Migration(migrations.Migration):
+    dependencies = [
+        ("usage_v2", "0005_usage_reason_ref_created_idx"),
+    ]
+
+    operations = [
+        migrations.AlterField(
+            model_name="usage",
+            name="llm_usage_reason",
+            field=models.CharField(
+                blank=True,
+                choices=[
+                    ("extraction", "Extraction"),
+                    ("challenge", "Challenge"),
+                    ("summarize", "Summarize"),
+                    ("lookup", "Lookup"),
+                ],
+                db_comment="Reason for LLM usage. Empty if usage_type is 'embedding'. ",
+                max_length=255,
+                null=True,
+            ),
+        ),
+        migrations.AlterField(
+            model_name="usage",
+            name="reference_type",
+            field=models.CharField(
+                blank=True,
+                choices=[
+                    ("prompt_key", "Prompt Key"),
+                    ("lookup_version", "Lookup Version"),
+                ],
+                db_comment="Discriminator for reference_id. OSS values: 'prompt_key'. NULL when reference_id is NULL.",
+                max_length=64,
+                null=True,
+            ),
+        ),
+    ]
diff --git a/frontend/src/components/custom-tools/prompt-card/Header.jsx b/frontend/src/components/custom-tools/prompt-card/Header.jsx
index 830b93081e..55ffe6286e 100644
--- a/frontend/src/components/custom-tools/prompt-card/Header.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/Header.jsx
@@ -49,6 +49,31 @@ try {
   LookupMenuItem = mod.LookupMenuItem;
 } catch {}
 
+let usePromptRunGatePlugin;
+let lookupPluginLoadError;
+try {
+  const mod = await import(
+    "../../../plugins/lookup-studio/hooks/usePromptRunGate"
+  );
+  usePromptRunGatePlugin = mod.usePromptRunGate;
+} catch (err) {
+  lookupPluginLoadError = err;
+}
+
+// If the sibling plugin import succeeded, a failure here means the
+// plugin is present but broken — surface it so the no-op fallback
+// doesn't silently disable the run gate.
+if (lookupPluginLoadError && LookupMenuItem) {
+  // eslint-disable-next-line no-console
+  console.warn(
+    "[Header] lookup-studio plugin loaded but usePromptRunGate failed to import",
+    lookupPluginLoadError,
+  );
+}
+
+// Stable identity so React doesn't see a conditional hook call.
+const usePromptRunGate = usePromptRunGatePlugin || (() => null);
+
 function Header({
   promptDetails,
   promptKey,
@@ -77,6 +102,7 @@ function Header({
     isSimplePromptStudio,
     details,
   } = useCustomToolStore();
+  const runGate = usePromptRunGate(promptDetails);
   const [items, setItems] = useState([]);
 
   const [isDisablePrompt, setIsDisablePrompt] = useState(null);
@@ -367,7 +393,9 @@ function Header({
         )}
         {!singlePassExtractMode && !isSimplePromptStudio && (
           <>
-            <Tooltip title="Run all LLMs for current document">
+            <Tooltip
+              title={runGate?.reason || "Run all LLMs for current document"}
+            >
               <Button
                 size="small"
                 type="text"
@@ -385,13 +413,16 @@ function Header({
                   isCoverageLoading ||
                   indexDocs?.includes(selectedDoc?.document_id) ||
                   isPublicSource ||
-                  spsLoading?.[selectedDoc?.document_id]
+                  spsLoading?.[selectedDoc?.document_id] ||
+                  !!runGate?.disabled
                 }
               >
                 <PlayCircleOutlined className="prompt-card-actions-head" />
               </Button>
             </Tooltip>
-            <Tooltip title="Run all LLMs for all documents">
+            <Tooltip
+              title={runGate?.reason || "Run all LLMs for all documents"}
+            >
               <Button
                 size="small"
                 type="text"
@@ -407,7 +438,8 @@ function Header({
                       promptStudioUpdateStatus?.isUpdating) ||
                   isCoverageLoading ||
                   indexDocs?.includes(selectedDoc?.document_id) ||
-                  isPublicSource
+                  isPublicSource ||
+                  !!runGate?.disabled
                 }
               >
                 <PlayCircleFilled className="prompt-card-actions-head" />
diff --git a/frontend/src/components/custom-tools/prompt-card/RunAllPrompts.jsx b/frontend/src/components/custom-tools/prompt-card/RunAllPrompts.jsx
index abf187845e..6a0229f7e8 100644
--- a/frontend/src/components/custom-tools/prompt-card/RunAllPrompts.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/RunAllPrompts.jsx
@@ -4,6 +4,9 @@ import { PROMPT_RUN_TYPES } from "../../../helpers/GetStaticData";
 import usePromptRun from "../../../hooks/usePromptRun";
 import { useCustomToolStore } from "../../../store/custom-tool-store";
 
+// No tool-wide gate here — per-prompt Run buttons + server already
+// block broken prompts, so disabling bulk would only hide valid ones.
+
 function RunAllPrompts() {
   const { selectedDoc, isMultiPassExtractLoading, isPublicSource } =
     useCustomToolStore();

From 07dd8800dd4dfe170a1f9c9175a0445d8daaed03 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Sun, 26 Apr 2026 17:11:28 +0530
Subject: [PATCH 28/57] UN-2946 [FIX] Surface skipped lookups when source
 prompt has no value
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

When a lookup is configured but extraction returned None for the source
prompt, _run_lookup_enrichment used to return early without any signal —
leaving users wondering why enrichment didn't appear. Stream a one-line
workflow log via shim.stream_log so the skip is visible alongside other
tool-run events.
---
 workers/executor/executors/legacy_executor.py | 11 ++++++++++-
 1 file changed, 10 insertions(+), 1 deletion(-)

diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 65a6f19171..5d133ae1a6 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -1935,7 +1935,16 @@ def _run_lookup_enrichment(
 
         lookup_config = output.get("lookup_config")
         lookup_cls = ExecutorPluginLoader.get("lookup-enrichment")
-        if not (lookup_config and current_value is not None and lookup_cls):
+        if not (lookup_config and lookup_cls):
+            return
+        if current_value is None:
+            # Skipping silently here would leave the user wondering why a
+            # configured lookup didn't run — surface it to the workflow log.
+            lookup_name = lookup_config.get("lookup_name") or "lookup"
+            shim.stream_log(
+                f"Skipping lookup `{lookup_name}` for `{prompt_name}` — "
+                f"source prompt produced no value."
+            )
             return
 
         _, _, _, _, llm_cls, _, _ = self._get_prompt_deps()

From 288df588f3f86a14c837309b33aa7de17688966c Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Mon, 27 Apr 2026 02:09:28 +0530
Subject: [PATCH 29/57] UN-2946 [REFACTOR] Address Sonar findings on lookups V2
 PR

- Extract _init_llm_and_retrieval and _flush_per_prompt_metrics from
  LegacyExecutor._execute_single_prompt to drop cognitive complexity
  below the gate
- Extract per-prompt helpers from OutputManagerHelper.fetch_default_output_response
- Extract buildDefaultProfileOutputs / buildPerPromptOutput /
  buildSelectedProfileOutputs from CombinedOutput.fetchCombinedOutput
- Give OSS lookup-plugin stub fns matching parameter lists so static
  analysis stops flagging call sites as arity mismatches
- Define _UNKNOWN_EXECUTOR_ERROR constant in ide_callback.tasks for the
  thrice-duplicated literal
- Use splice(-1, 0, ...) idiom for LookupMenuItem insertion in prompt
  card Header

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .../output_manager_helper.py                  |  86 +++++++----
 .../combined-output/CombinedOutput.jsx        | 104 +++++++------
 .../custom-tools/prompt-card/Header.jsx       |   2 +-
 frontend/src/hooks/usePromptOutput.js         |   5 +-
 workers/executor/executors/legacy_executor.py | 141 ++++++++++++------
 workers/ide_callback/tasks.py                 |   8 +-
 6 files changed, 213 insertions(+), 133 deletions(-)

diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
index b40b7a48a3..171d86fb3a 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
@@ -249,6 +249,49 @@ def fetch_default_llm_profile(tool: CustomTool) -> ProfileManager:
         except DefaultProfileError:
             raise DefaultProfileError("Default ProfileManager does not exist.")
 
+    @staticmethod
+    def _resolve_profile_for_prompt(
+        tool_prompt: ToolStudioPrompt,
+        use_default_profile: bool,
+    ) -> str | None:
+        profile_manager_id = tool_prompt.profile_manager_id
+        if not profile_manager_id and not use_default_profile:
+            return None
+        if not profile_manager_id:
+            default_profile = ProfileManager.get_default_llm_profile(tool_prompt.tool_id)
+            profile_manager_id = default_profile.profile_id
+        return profile_manager_id
+
+    @staticmethod
+    def _collect_default_output_for_prompt(
+        tool_prompt: ToolStudioPrompt,
+        profile_manager_id: str,
+        document_manager_id: str,
+        enrichment_by_key: dict[str, Any],
+    ) -> Any:
+        from prompt_studio.lookup_utils import enrich_prompt_output
+
+        try:
+            queryset = PromptStudioOutputManager.objects.filter(
+                prompt_id=str(tool_prompt.prompt_id),
+                profile_manager=profile_manager_id,
+                is_single_pass_extract=False,
+                document_manager_id=document_manager_id,
+            )
+            if not queryset.exists():
+                return ""
+
+            value: Any = ""
+            for output in queryset:
+                value = output.output
+                enriched = enrich_prompt_output(output, {})
+                bundle = extract_prompt_output_enrichment(enriched)
+                if bundle is not None:
+                    enrichment_by_key[tool_prompt.prompt_key] = bundle
+            return value
+        except ObjectDoesNotExist:
+            return ""
+
     @staticmethod
     def fetch_default_output_response(
         tool_studio_prompts: list[ToolStudioPrompt],
@@ -268,47 +311,26 @@ def fetch_default_output_response(
                 When lookups are configured, the cloud plugin adds an
                 opaque enrichment payload via ``attach_combined_output_enrichment``.
         """
-        from prompt_studio.lookup_utils import enrich_prompt_output
-
         result: dict[str, Any] = {}
         enrichment_by_key: dict[str, Any] = {}
 
         for tool_prompt in tool_studio_prompts:
             if tool_prompt.prompt_type == PSOMKeys.NOTES:
                 continue
-            prompt_id = str(tool_prompt.prompt_id)
-            profile_manager_id = tool_prompt.profile_manager_id
-
-            if not profile_manager_id and not use_default_profile:
+            profile_manager_id = OutputManagerHelper._resolve_profile_for_prompt(
+                tool_prompt, use_default_profile
+            )
+            if profile_manager_id is None:
                 result[tool_prompt.prompt_key] = ""
                 continue
-
-            if not profile_manager_id:
-                default_profile = ProfileManager.get_default_llm_profile(
-                    tool_prompt.tool_id
-                )
-                profile_manager_id = default_profile.profile_id
-
-            try:
-                queryset = PromptStudioOutputManager.objects.filter(
-                    prompt_id=prompt_id,
-                    profile_manager=profile_manager_id,
-                    is_single_pass_extract=False,
-                    document_manager_id=document_manager_id,
+            result[tool_prompt.prompt_key] = (
+                OutputManagerHelper._collect_default_output_for_prompt(
+                    tool_prompt,
+                    profile_manager_id,
+                    document_manager_id,
+                    enrichment_by_key,
                 )
-
-                if not queryset.exists():
-                    result[tool_prompt.prompt_key] = ""
-                    continue
-
-                for output in queryset:
-                    result[tool_prompt.prompt_key] = output.output
-                    enriched = enrich_prompt_output(output, {})
-                    bundle = extract_prompt_output_enrichment(enriched)
-                    if bundle is not None:
-                        enrichment_by_key[tool_prompt.prompt_key] = bundle
-            except ObjectDoesNotExist:
-                result[tool_prompt.prompt_key] = ""
+            )
 
         attach_combined_output_enrichment(result, enrichment_by_key)
         return result
diff --git a/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx b/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
index 7cd217778f..9aeffdff54 100644
--- a/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
+++ b/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
@@ -50,8 +50,8 @@ try {
 // Cloud plugin hook — OSS falls back to passthrough helpers that leave
 // the payload untouched and report "no enrichment".
 let splitCombinedData = (data) => ({ combined: data, bundle: null });
-let buildEnrichedFromBundle = () => ({});
-let getEnrichmentFromItem = () => null;
+let buildEnrichedFromBundle = (_output, _bundle, _formatter) => ({});
+let getEnrichmentFromItem = (_item) => null;
 try {
   const mod = await import("../../../plugins/lookup-enriched-toggle/helpers");
   splitCombinedData = mod.splitCombinedData;
@@ -120,6 +120,55 @@ function CombinedOutput({ docId, setFilledFields, selectedPrompts }) {
       return;
     }
 
+    const buildDefaultProfileOutputs = (data) => {
+      const { combined: payload, bundle } = splitCombinedData(data);
+      const output = Object.entries(payload).reduce((acc, [key, value]) => {
+        acc[key] = displayPromptResult(value, false);
+        return acc;
+      }, {});
+      return {
+        output,
+        enriched: buildEnrichedFromBundle(output, bundle, displayPromptResult),
+        hasEnriched: true,
+      };
+    };
+
+    const buildPerPromptOutput = (item, data) => {
+      const profileManager = selectedProfile || item?.profile_manager;
+      const outputDetails = data.find(
+        (outputValue) =>
+          outputValue?.prompt_id === item?.prompt_id &&
+          outputValue?.profile_manager === profileManager,
+      );
+      const value =
+        outputDetails?.output?.length > 0
+          ? displayPromptResult(outputDetails?.output, false)
+          : "";
+      const enrichment = getEnrichmentFromItem(outputDetails);
+      const enrichedValue = enrichment?.output
+        ? displayPromptResult(enrichment.output, false)
+        : value;
+      return { value, enrichedValue, hasEnriched: !!enrichment?.output };
+    };
+
+    const buildSelectedProfileOutputs = (data, prompts) => {
+      const output = {};
+      const enriched = {};
+      let hasEnriched = false;
+      for (const item of prompts) {
+        if (item?.prompt_type === promptType.notes) continue;
+        const {
+          value,
+          enrichedValue,
+          hasEnriched: enrichedHit,
+        } = buildPerPromptOutput(item, data);
+        output[item?.prompt_key] = value;
+        enriched[item?.prompt_key] = enrichedValue;
+        hasEnriched = hasEnriched || enrichedHit;
+      }
+      return { output, enriched: hasEnriched ? enriched : {}, hasEnriched };
+    };
+
     const fetchCombinedOutput = async () => {
       setIsOutputLoading(true);
       setCombinedOutput({});
@@ -128,51 +177,12 @@ function CombinedOutput({ docId, setFilledFields, selectedPrompts }) {
         const res = await handleOutputApiRequest();
         const data = res?.data || [];
         const prompts = details?.prompts || [];
-
-        if (activeKey === "0" && !isSimplePromptStudio) {
-          const { combined: payload, bundle } = splitCombinedData(data);
-          const output = Object.entries(payload).reduce((acc, [key, value]) => {
-            acc[key] = displayPromptResult(value, false);
-            return acc;
-          }, {});
-          setCombinedOutput(output);
-          setEnrichedOutput(
-            buildEnrichedFromBundle(output, bundle, displayPromptResult),
-          );
-        } else {
-          const output = {};
-          const enriched = {};
-          let hasEnriched = false;
-
-          for (const item of prompts) {
-            if (item?.prompt_type === promptType.notes) continue;
-            const profileManager = selectedProfile || item?.profile_manager;
-            const outputDetails = data.find(
-              (outputValue) =>
-                outputValue?.prompt_id === item?.prompt_id &&
-                outputValue?.profile_manager === profileManager,
-            );
-
-            output[item?.prompt_key] =
-              outputDetails?.output?.length > 0
-                ? displayPromptResult(outputDetails?.output, false)
-                : "";
-
-            const enrichment = getEnrichmentFromItem(outputDetails);
-            if (enrichment?.output) {
-              enriched[item?.prompt_key] = displayPromptResult(
-                enrichment.output,
-                false,
-              );
-              hasEnriched = true;
-            } else {
-              enriched[item?.prompt_key] = output[item?.prompt_key];
-            }
-          }
-
-          setCombinedOutput(output);
-          setEnrichedOutput(hasEnriched ? enriched : {});
-        }
+        const useDefaultProfile = activeKey === "0" && !isSimplePromptStudio;
+        const { output, enriched } = useDefaultProfile
+          ? buildDefaultProfileOutputs(data)
+          : buildSelectedProfileOutputs(data, prompts);
+        setCombinedOutput(output);
+        setEnrichedOutput(enriched);
       } catch (err) {
         setAlertDetails(
           handleException(err, "Failed to generate combined output"),
diff --git a/frontend/src/components/custom-tools/prompt-card/Header.jsx b/frontend/src/components/custom-tools/prompt-card/Header.jsx
index 55ffe6286e..6a15265179 100644
--- a/frontend/src/components/custom-tools/prompt-card/Header.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/Header.jsx
@@ -303,7 +303,7 @@ function Header({
     ];
     if (LookupMenuItem && !isSimplePromptStudio) {
       dropdownItems.splice(
-        dropdownItems.length - 1,
+        -1,
         0,
         {
           type: "divider",
diff --git a/frontend/src/hooks/usePromptOutput.js b/frontend/src/hooks/usePromptOutput.js
index b4951dd45a..12d451315d 100644
--- a/frontend/src/hooks/usePromptOutput.js
+++ b/frontend/src/hooks/usePromptOutput.js
@@ -32,8 +32,9 @@ try {
 } catch {}
 
 // Opaque extractor so the per-item enrichment payload key name lives in
-// the plugin, not OSS. OSS falls back to a no-op.
-let getEnrichmentFromItem = () => null;
+// the plugin, not OSS. OSS falls back to a no-op. Stub signature matches
+// the cloud helper so static analysis doesn't see call sites as arity mismatches.
+let getEnrichmentFromItem = (_item) => null;
 try {
   const mod = await import("../plugins/lookup-enriched-toggle/helpers");
   getEnrichmentFromItem = mod.getEnrichmentFromItem;
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 5d133ae1a6..2c515acdb9 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -452,7 +452,7 @@ def _handle_ide_index(self, context: ExecutionContext) -> ExecutionResult:
         pre_extracted_text = index_params.get(IKeys.EXTRACTED_TEXT, "") or ""
         if pre_extracted_text:
             logger.info(
-                "ide_index: marker hit, skipping extract step " "(len=%d, run_id=%s)",
+                "ide_index: marker hit, skipping extract step (len=%d, run_id=%s)",
                 len(pre_extracted_text),
                 context.run_id,
             )
@@ -1086,8 +1086,7 @@ def _handle_index(self, context: ExecutionContext) -> ExecutionResult:
                     "Document already indexed in vector store; skipping re-index."
                 )
                 logger.info(
-                    "Skipping re-index: doc_id=%s already in vector DB and "
-                    "reindex=False",
+                    "Skipping re-index: doc_id=%s already in vector DB and reindex=False",
                     doc_id,
                 )
                 return ExecutionResult(success=True, data={IKeys.DOC_ID: doc_id})
@@ -1597,34 +1596,16 @@ def _execute_single_prompt(
             return
 
         usage_kwargs = {"run_id": run_id, "execution_id": execution_id}
-        try:
-            llm = llm_cls(
-                adapter_instance_id=output[PSKeys.LLM],
-                tool=shim,
-                usage_kwargs={**usage_kwargs, PSKeys.LLM_USAGE_REASON: PSKeys.EXTRACTION},
-                capture_metrics=True,
-            )
-            vector_db = None
-            if chunk_size > 0:
-                embedding = embedding_compat_cls(
-                    adapter_instance_id=output[PSKeys.EMBEDDING],
-                    tool=shim,
-                    kwargs={**usage_kwargs},
-                )
-                vector_db = vector_db_cls(
-                    tool=shim,
-                    adapter_instance_id=output[PSKeys.VECTOR_DB],
-                    embedding=embedding,
-                )
-            shim.stream_log(
-                f"Initialized LLM and retrieval adapters for: `{prompt_name}`"
-            )
-        except Exception as e:
-            msg = f"Couldn't fetch adapter. {e}"
-            logger.error(msg)
-            raise LegacyExecutorError(
-                message=msg, code=getattr(e, "status_code", None) or 500
-            ) from e
+        llm, embedding, vector_db = self._init_llm_and_retrieval(
+            output=output,
+            shim=shim,
+            chunk_size=chunk_size,
+            llm_cls=llm_cls,
+            embedding_compat_cls=embedding_compat_cls,
+            vector_db_cls=vector_db_cls,
+            usage_kwargs=usage_kwargs,
+            prompt_name=prompt_name,
+        )
 
         context_list: list[str] = []
         try:
@@ -1740,25 +1721,89 @@ def _execute_single_prompt(
             if isinstance(val, str):
                 structured_output[prompt_name] = val.rstrip("\n")
         finally:
-            metrics.setdefault(prompt_name, {}).update(
-                {
-                    "context_retrieval": context_retrieval_metrics.get(prompt_name, {}),
-                    f"{llm.get_usage_reason()}_llm": llm.get_metrics(),
-                }
+            self._flush_per_prompt_metrics(
+                metrics=metrics,
+                context_retrieval_metrics=context_retrieval_metrics,
+                prompt_name=prompt_name,
+                llm=llm,
+                embedding=embedding,
+                vector_db=vector_db,
+                chunk_size=chunk_size,
             )
-            self._usage_records.extend(llm.flush_pending_usage())
+
+    def _init_llm_and_retrieval(
+        self,
+        output: dict[str, Any],
+        shim: Any,
+        chunk_size: int,
+        llm_cls: Any,
+        embedding_compat_cls: Any,
+        vector_db_cls: Any,
+        usage_kwargs: dict[str, Any],
+        prompt_name: str,
+    ) -> tuple[Any, Any, Any]:
+        from executor.executors.constants import PromptServiceConstants as PSKeys
+
+        try:
+            llm = llm_cls(
+                adapter_instance_id=output[PSKeys.LLM],
+                tool=shim,
+                usage_kwargs={**usage_kwargs, PSKeys.LLM_USAGE_REASON: PSKeys.EXTRACTION},
+                capture_metrics=True,
+            )
+            embedding = None
+            vector_db = None
             if chunk_size > 0:
-                try:
-                    for handler in embedding.callback_manager.handlers:
-                        if hasattr(handler, "flush_pending_usage"):
-                            self._usage_records.extend(handler.flush_pending_usage())
-                except Exception:
-                    logger.warning(
-                        "Failed to flush embedding usage from callback handlers",
-                        exc_info=True,
-                    )
-            if vector_db:
-                vector_db.close()
+                embedding = embedding_compat_cls(
+                    adapter_instance_id=output[PSKeys.EMBEDDING],
+                    tool=shim,
+                    kwargs={**usage_kwargs},
+                )
+                vector_db = vector_db_cls(
+                    tool=shim,
+                    adapter_instance_id=output[PSKeys.VECTOR_DB],
+                    embedding=embedding,
+                )
+            shim.stream_log(
+                f"Initialized LLM and retrieval adapters for: `{prompt_name}`"
+            )
+            return llm, embedding, vector_db
+        except Exception as e:
+            msg = f"Couldn't fetch adapter. {e}"
+            logger.error(msg)
+            raise LegacyExecutorError(
+                message=msg, code=getattr(e, "status_code", None) or 500
+            ) from e
+
+    def _flush_per_prompt_metrics(
+        self,
+        metrics: dict[str, Any],
+        context_retrieval_metrics: dict[str, Any],
+        prompt_name: str,
+        llm: Any,
+        embedding: Any,
+        vector_db: Any,
+        chunk_size: int,
+    ) -> None:
+        metrics.setdefault(prompt_name, {}).update(
+            {
+                "context_retrieval": context_retrieval_metrics.get(prompt_name, {}),
+                f"{llm.get_usage_reason()}_llm": llm.get_metrics(),
+            }
+        )
+        self._usage_records.extend(llm.flush_pending_usage())
+        if chunk_size > 0 and embedding is not None:
+            try:
+                for handler in embedding.callback_manager.handlers:
+                    if hasattr(handler, "flush_pending_usage"):
+                        self._usage_records.extend(handler.flush_pending_usage())
+            except Exception:
+                logger.warning(
+                    "Failed to flush embedding usage from callback handlers",
+                    exc_info=True,
+                )
+        if vector_db:
+            vector_db.close()
 
     def _run_table_extraction(
         self,
diff --git a/workers/ide_callback/tasks.py b/workers/ide_callback/tasks.py
index e2b3b4dcf6..b44c541eb6 100644
--- a/workers/ide_callback/tasks.py
+++ b/workers/ide_callback/tasks.py
@@ -24,6 +24,8 @@
 # WebSocket emission endpoint (relative to internal API base)
 _EMIT_WEBSOCKET_ENDPOINT = "emit-websocket/"
 
+_UNKNOWN_EXECUTOR_ERROR = "Unknown executor error"
+
 
 class _SafeEncoder(json.JSONEncoder):
     """JSON encoder that converts uuid.UUID and datetime objects to strings."""
@@ -164,7 +166,7 @@ def ide_index_complete(
     try:
         # Check executor-level failure
         if not result_dict.get("success", False):
-            error_msg = result_dict.get("error", "Unknown executor error")
+            error_msg = result_dict.get("error", _UNKNOWN_EXECUTOR_ERROR)
             logger.error("ide_index executor reported failure: %s", error_msg)
             api.remove_document_indexing(
                 org_id=org_id,
@@ -370,7 +372,7 @@ def ide_prompt_complete(
     try:
         # Check executor-level failure
         if not result_dict.get("success", False):
-            error_msg = result_dict.get("error", "Unknown executor error")
+            error_msg = result_dict.get("error", _UNKNOWN_EXECUTOR_ERROR)
             logger.error("ide_prompt executor reported failure: %s", error_msg)
             _emit_event(
                 api,
@@ -544,7 +546,7 @@ def extraction_complete(
     try:
         # Check executor-level failure
         if not result_dict.get("success", False):
-            error_msg = result_dict.get("error", "Unknown executor error")
+            error_msg = result_dict.get("error", _UNKNOWN_EXECUTOR_ERROR)
             logger.error(
                 "extraction executor reported failure: source=%s file=%s error=%s",
                 source,

From 8e5491c446f9b2a65c706905ce7b7ca3caba8da0 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Mon, 27 Apr 2026 10:36:39 +0530
Subject: [PATCH 30/57] UN-2946 [FIX] Preserve usage records on executor
 failure paths

- LegacyExecutor.execute attaches collected usage_records to failure
  metadata in the LegacyExecutorError branch
- ExecutionOrchestrator broad-except pulls usage_records off the executor
  before wrapping the unhandled exception, so Celery autoretry doesn't
  drop billing rows from a partially-completed run
- lookup_utils.get_lookup_validation_for_tool OSS stub returns
  incomplete_lookups: [] to match the cloud schema

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 backend/prompt_studio/lookup_utils.py                |  1 +
 .../sdk1/src/unstract/sdk1/execution/orchestrator.py | 12 +++++++++---
 workers/executor/executors/legacy_executor.py        |  8 +++++++-
 3 files changed, 17 insertions(+), 4 deletions(-)

diff --git a/backend/prompt_studio/lookup_utils.py b/backend/prompt_studio/lookup_utils.py
index 06145d7e22..213001ef09 100644
--- a/backend/prompt_studio/lookup_utils.py
+++ b/backend/prompt_studio/lookup_utils.py
@@ -152,6 +152,7 @@ def get_lookup_validation_for_tool(tool) -> dict:
             "ok": True,
             "draft_lookups": [],
             "multi_var_lookups": [],
+            "incomplete_lookups": [],
             "single_pass_enabled": bool(
                 getattr(tool, "single_pass_extraction_mode", False)
             ),
diff --git a/unstract/sdk1/src/unstract/sdk1/execution/orchestrator.py b/unstract/sdk1/src/unstract/sdk1/execution/orchestrator.py
index 2c0f66f3bb..af5684fb1f 100644
--- a/unstract/sdk1/src/unstract/sdk1/execution/orchestrator.py
+++ b/unstract/sdk1/src/unstract/sdk1/execution/orchestrator.py
@@ -9,6 +9,7 @@
 
 import logging
 import time
+from typing import Any
 
 from unstract.sdk1.execution.context import ExecutionContext
 from unstract.sdk1.execution.registry import ExecutorRegistry
@@ -37,8 +38,7 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
             exceptions (wrapped as a failure result).
         """
         logger.info(
-            "Orchestrating execution: executor=%s operation=%s "
-            "run_id=%s request_id=%s",
+            "Orchestrating execution: executor=%s operation=%s run_id=%s request_id=%s",
             context.executor_name,
             context.operation,
             context.run_id,
@@ -61,9 +61,15 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
                 context.executor_name,
                 elapsed,
             )
+            metadata: dict[str, Any] = {"elapsed_seconds": round(elapsed, 3)}
+            # Preserve usage records the executor collected before crashing so
+            # the task wrapper still flushes them on retry.
+            collected = getattr(executor, "_usage_records", None) or []
+            if collected:
+                metadata["usage_records"] = list(collected)
             return ExecutionResult.failure(
                 error=f"{type(exc).__name__}: {exc}",
-                metadata={"elapsed_seconds": round(elapsed, 3)},
+                metadata=metadata,
             )
 
         elapsed = time.monotonic() - start
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 2c515acdb9..eb2d564053 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -153,7 +153,13 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
                     )
                 except Exception:
                     pass  # Best-effort — don't mask the original error
-            return ExecutionResult.failure(error=exc.message)
+            # Preserve any usage rows collected before the failure so the task
+            # wrapper still flushes them. Without this, transient errors that
+            # trigger Celery autoretry re-run LLMs and lose billing rows.
+            failure_metadata: dict[str, Any] = {}
+            if self._usage_records:
+                failure_metadata["usage_records"] = list(self._usage_records)
+            return ExecutionResult.failure(error=exc.message, metadata=failure_metadata)
 
     def _build_shim(
         self,

From a23c7a61b4fac1de64a2b6140fc0bcf2a01888dd Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Mon, 27 Apr 2026 12:38:53 +0530
Subject: [PATCH 31/57] =?UTF-8?q?UN-2946=20[REFACTOR]=20Squash=20usage=5Fv?=
 =?UTF-8?q?2=20migrations=203=20=E2=86=92=202=20for=20lookups=20V2?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Folds 0006 (choices-only AlterField, no SQL) into 0004 by baking the
final llm_usage_reason and reference_type choice lists directly. Keeps
0005 separate to preserve CREATE INDEX CONCURRENTLY safety on the
billing-critical usage table. Existing envs that already ran 0006 need
a one-time DELETE on its django_migrations row.
---
 .../migrations/0004_usage_metrics_fields.py   |  6 ++-
 ...6_alter_usage_llm_usage_reason_and_more.py | 42 -------------------
 2 files changed, 5 insertions(+), 43 deletions(-)
 delete mode 100644 backend/usage_v2/migrations/0006_alter_usage_llm_usage_reason_and_more.py

diff --git a/backend/usage_v2/migrations/0004_usage_metrics_fields.py b/backend/usage_v2/migrations/0004_usage_metrics_fields.py
index 89cf1feb3c..182cfb6ca2 100644
--- a/backend/usage_v2/migrations/0004_usage_metrics_fields.py
+++ b/backend/usage_v2/migrations/0004_usage_metrics_fields.py
@@ -17,6 +17,7 @@ class Migration(migrations.Migration):
                     ("extraction", "Extraction"),
                     ("challenge", "Challenge"),
                     ("summarize", "Summarize"),
+                    ("lookup", "Lookup"),
                 ],
                 db_comment="Reason for LLM usage. Empty if usage_type is 'embedding'. ",
                 max_length=255,
@@ -42,7 +43,10 @@ class Migration(migrations.Migration):
             name="reference_type",
             field=models.CharField(
                 blank=True,
-                choices=[("prompt_key", "Prompt Key")],
+                choices=[
+                    ("prompt_key", "Prompt Key"),
+                    ("lookup_version", "Lookup Version"),
+                ],
                 db_comment=(
                     "Discriminator for reference_id. "
                     "OSS values: 'prompt_key'. "
diff --git a/backend/usage_v2/migrations/0006_alter_usage_llm_usage_reason_and_more.py b/backend/usage_v2/migrations/0006_alter_usage_llm_usage_reason_and_more.py
deleted file mode 100644
index 0df32ac2b8..0000000000
--- a/backend/usage_v2/migrations/0006_alter_usage_llm_usage_reason_and_more.py
+++ /dev/null
@@ -1,42 +0,0 @@
-# Generated by Django 4.2.1 on 2026-04-24 20:16
-
-from django.db import migrations, models
-
-
-class Migration(migrations.Migration):
-    dependencies = [
-        ("usage_v2", "0005_usage_reason_ref_created_idx"),
-    ]
-
-    operations = [
-        migrations.AlterField(
-            model_name="usage",
-            name="llm_usage_reason",
-            field=models.CharField(
-                blank=True,
-                choices=[
-                    ("extraction", "Extraction"),
-                    ("challenge", "Challenge"),
-                    ("summarize", "Summarize"),
-                    ("lookup", "Lookup"),
-                ],
-                db_comment="Reason for LLM usage. Empty if usage_type is 'embedding'. ",
-                max_length=255,
-                null=True,
-            ),
-        ),
-        migrations.AlterField(
-            model_name="usage",
-            name="reference_type",
-            field=models.CharField(
-                blank=True,
-                choices=[
-                    ("prompt_key", "Prompt Key"),
-                    ("lookup_version", "Lookup Version"),
-                ],
-                db_comment="Discriminator for reference_id. OSS values: 'prompt_key'. NULL when reference_id is NULL.",
-                max_length=64,
-                null=True,
-            ),
-        ),
-    ]

From 0be7a0f160f53a940b194e53584e8ba6fc57172b Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Mon, 27 Apr 2026 15:10:54 +0530
Subject: [PATCH 32/57] =?UTF-8?q?UN-2946=20[REFACTOR]=20Update=20OSS?=
 =?UTF-8?q?=E2=86=94cloud=20lookup=20bridge=20for=20app=20rename?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Cloud's lookup_v1 plugin is being renamed to lookups; update the OSS
try-import paths (prompt_studio/lookup_utils.py, usage_v2/models.py)
and the related comment in workers/shared/clients/extraction_client.py.
Bridge contract is unchanged — the cloud module just lives at a new
import path.
---
 backend/prompt_studio/lookup_utils.py       | 10 +++++-----
 backend/usage_v2/models.py                  |  2 +-
 workers/shared/clients/extraction_client.py |  6 +++---
 3 files changed, 9 insertions(+), 9 deletions(-)

diff --git a/backend/prompt_studio/lookup_utils.py b/backend/prompt_studio/lookup_utils.py
index 213001ef09..b1bc79a707 100644
--- a/backend/prompt_studio/lookup_utils.py
+++ b/backend/prompt_studio/lookup_utils.py
@@ -11,11 +11,11 @@
 logger = logging.getLogger(__name__)
 
 try:
-    from pluggable_apps.lookup_v1 import execution as _execution
-    from pluggable_apps.lookup_v1 import output_enrichment as _output_enrichment
-    from pluggable_apps.lookup_v1 import staleness as _staleness
-    from pluggable_apps.lookup_v1 import validation as _validation
-    from pluggable_apps.lookup_v1.models import LookupOutputResult as _LookupOutputResult
+    from pluggable_apps.lookups import execution as _execution
+    from pluggable_apps.lookups import output_enrichment as _output_enrichment
+    from pluggable_apps.lookups import staleness as _staleness
+    from pluggable_apps.lookups import validation as _validation
+    from pluggable_apps.lookups.models import LookupOutputResult as _LookupOutputResult
 
     LOOKUPS_AVAILABLE = True
 except ImportError:
diff --git a/backend/usage_v2/models.py b/backend/usage_v2/models.py
index 02f65e1d3d..32356a8192 100644
--- a/backend/usage_v2/models.py
+++ b/backend/usage_v2/models.py
@@ -32,7 +32,7 @@ class UsageType(models.TextChoices):
 ]
 
 try:
-    from pluggable_apps.lookup_v1.constants import (
+    from pluggable_apps.lookups.constants import (
         CLOUD_LLM_USAGE_REASON_CHOICES,
         CLOUD_REFERENCE_TYPE_CHOICES,
     )
diff --git a/workers/shared/clients/extraction_client.py b/workers/shared/clients/extraction_client.py
index 07b839eb32..43f64c712e 100644
--- a/workers/shared/clients/extraction_client.py
+++ b/workers/shared/clients/extraction_client.py
@@ -4,8 +4,8 @@
 the backend's internal API endpoints.
 
 NOTE on scope: the callback endpoints ``v1/extraction/extraction-{complete,error}/``
-are currently registered **only** by the cloud ``lookup_v1`` plugin
-(see ``pluggable_apps/lookup_v1/internal_urls.py``). The interface is
+are currently registered **only** by the cloud ``lookups`` plugin
+(see ``pluggable_apps/lookups/internal_urls.py``). The interface is
 ``source``-dispatched and designed to serve other extraction flows
 (prompt-studio docs, connectors) in the future, but in OSS-only builds
 the endpoints are absent. Callers from OSS paths should expect a 404
@@ -26,7 +26,7 @@
 
 class ExtractionAPIClient(BaseAPIClient):
     """API client for the extraction-callback endpoints registered by
-    cloud-side plugins (today: lookup_v1). See module docstring for the
+    cloud-side plugins (today: lookups). See module docstring for the
     OSS-absence contract.
     """
 

From a4679b11d04eaae2e5e24d8c82f35a9d01ca3c9b Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Mon, 27 Apr 2026 17:40:19 +0530
Subject: [PATCH 33/57] UN-2946 [FIX] Address greptile review on lookups V2 OSS

- usage_v2/internal_views.py: wrap bulk_create in try/except so a flush
  failure logs ERROR with full context and returns an explicit JSON 500
  instead of an unhandled one; pass batch_size=500 to cap the size of
  each INSERT statement on the billing-critical usage table.
- legacy_executor: extend the lookup empty-value guard to also skip on
  empty strings/lists/dicts so a "" extraction doesn't reach the LLM as
  an empty input. Boolean/number 0/False remain valid.
---
 backend/usage_v2/internal_views.py            | 20 ++++++++++++++++++-
 workers/executor/executors/legacy_executor.py |  9 ++++++++-
 2 files changed, 27 insertions(+), 2 deletions(-)

diff --git a/backend/usage_v2/internal_views.py b/backend/usage_v2/internal_views.py
index 6d840e7e03..1ff9b1376f 100644
--- a/backend/usage_v2/internal_views.py
+++ b/backend/usage_v2/internal_views.py
@@ -185,5 +185,23 @@ def post(self, request: Request) -> JsonResponse:
                     error_message=r.get("error_message"),
                 )
             )
-        created = Usage.objects.bulk_create(usage_objects)
+
+        try:
+            # Chunk to bound transaction size on the billing-critical table.
+            created = Usage.objects.bulk_create(usage_objects, batch_size=500)
+        except Exception as e:
+            logger.error(
+                "bulk_create failed for %d usage records (org=%s): %s",
+                len(usage_objects),
+                organization.organization_id if organization else None,
+                e,
+                exc_info=True,
+            )
+            return JsonResponse(
+                {
+                    "success": False,
+                    "error": "Failed to persist usage records",
+                },
+                status=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            )
         return JsonResponse({"created": len(created)}, status=201)
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index eb2d564053..1c010d9f5b 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -1988,7 +1988,14 @@ def _run_lookup_enrichment(
         lookup_cls = ExecutorPluginLoader.get("lookup-enrichment")
         if not (lookup_config and lookup_cls):
             return
-        if current_value is None:
+        # Treat empty strings/containers as "no value" too — for boolean and
+        # number prompts, falsy 0/False are still valid inputs and must run.
+        is_empty = (
+            current_value is None
+            or (isinstance(current_value, str) and not current_value.strip())
+            or (isinstance(current_value, (list, dict)) and not current_value)
+        )
+        if is_empty:
             # Skipping silently here would leave the user wondering why a
             # configured lookup didn't run — surface it to the workflow log.
             lookup_name = lookup_config.get("lookup_name") or "lookup"

From 5e8a22329fcee03534a7510f8638bd8501511cb4 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 28 Apr 2026 11:14:31 +0530
Subject: [PATCH 34/57] UN-2946 [FIX] Static usage choices to fix migration
 drift in OSS CI
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Greptile P1: migration 0004_usage_metrics_fields hard-codes the cloud
values "lookup" / "lookup_version" into the AlterField operations,
but the model resolved its choices via a try-import that only fired
when pluggable_apps.lookups was present. In OSS-only builds the
import raised, the model carried 3 choices, and ``makemigrations
--check`` saw drift against the migration's 4 choices — turning OSS
CI red on every run.

Carry the union of OSS + cloud values statically in usage_v2/models.py
and drop the try-import. Cloud-only entries are unused on OSS but
make migration state and model state agree in both builds. The DB is
unaffected (choices is a Django-validator concern, not DDL).

The now-unused CLOUD_LLM_USAGE_REASON_CHOICES /
CLOUD_REFERENCE_TYPE_CHOICES exports are removed from the cloud
plugin's constants module in a separate commit.
---
 backend/usage_v2/models.py | 41 +++++++++++++-------------------------
 1 file changed, 14 insertions(+), 27 deletions(-)

diff --git a/backend/usage_v2/models.py b/backend/usage_v2/models.py
index 32356a8192..ac0f583aa4 100644
--- a/backend/usage_v2/models.py
+++ b/backend/usage_v2/models.py
@@ -1,4 +1,3 @@
-import logging
 import uuid
 
 from django.db import models
@@ -8,45 +7,33 @@
     DefaultOrganizationMixin,
 )
 
-logger = logging.getLogger(__name__)
-
 
 class UsageType(models.TextChoices):
     LLM = "llm", "LLM Usage"
     EMBEDDING = "embedding", "Embedding Usage"
 
 
-# ── Extensible choice lists ─────────────────────────────────────────
-# OSS defines base values. Cloud plugins append via try-import so that
-# Django validation accepts cloud-specific values when the plugin is
-# installed, without leaking cloud details into OSS code.
+# ── Choice lists (static union of OSS + cloud values) ────────────────
+# Cloud-only entries (e.g. "lookup", "lookup_version") are listed here
+# even on OSS-only builds where they're never written. A previous
+# try-import pattern extended these at runtime when the cloud plugin
+# was importable, but that left model state ≠ migration state in OSS
+# builds and broke ``makemigrations --check`` in CI. Carrying the union
+# statically keeps both sides in lockstep at the cost of a couple of
+# unused choice entries on OSS.
 
-_LLM_USAGE_REASON_CHOICES: list[tuple[str, str]] = [
+LLM_USAGE_REASON_CHOICES: list[tuple[str, str]] = [
     ("extraction", "Extraction"),
     ("challenge", "Challenge"),
     ("summarize", "Summarize"),
+    ("lookup", "Lookup"),
 ]
 
-_REFERENCE_TYPE_CHOICES: list[tuple[str, str]] = [
+REFERENCE_TYPE_CHOICES: list[tuple[str, str]] = [
     ("prompt_key", "Prompt Key"),
+    ("lookup_version", "Lookup Version"),
 ]
 
-try:
-    from pluggable_apps.lookups.constants import (
-        CLOUD_LLM_USAGE_REASON_CHOICES,
-        CLOUD_REFERENCE_TYPE_CHOICES,
-    )
-
-    _LLM_USAGE_REASON_CHOICES.extend(CLOUD_LLM_USAGE_REASON_CHOICES)
-    _REFERENCE_TYPE_CHOICES.extend(CLOUD_REFERENCE_TYPE_CHOICES)
-except ImportError:
-    pass
-except Exception:
-    logger.warning("Failed to load cloud usage choices", exc_info=True)
-
-LLM_USAGE_REASON_CHOICES = _LLM_USAGE_REASON_CHOICES
-REFERENCE_TYPE_CHOICES = _REFERENCE_TYPE_CHOICES
-
 
 class UsageModelManager(DefaultOrganizationManagerMixin, BaseModelManager):
     pass
@@ -54,8 +41,8 @@ class UsageModelManager(DefaultOrganizationManagerMixin, BaseModelManager):
 
 class Usage(DefaultOrganizationMixin, BaseModel):
     # reference_type → reference_id mapping (no FK constraint):
-    #   "prompt_key"  → ToolStudioPrompt UUID (OSS)
-    #   Cloud plugins register additional types via CLOUD_REFERENCE_TYPE_CHOICES.
+    #   "prompt_key"      → ToolStudioPrompt UUID (OSS-only writer)
+    #   "lookup_version"  → LookupVersion UUID (cloud-only writer)
     # Usage records survive entity deletion.
 
     id = models.UUIDField(

From f9d384441f1319a337d2681ef0788ac63b971bb2 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 28 Apr 2026 12:39:49 +0530
Subject: [PATCH 35/57] UN-2946 [FEAT] Block enforce_type switch via lookup
 plugin gate

When a prompt has a lookup configured, switching its enforce_type to a
complex type (table / line-item / agentic_table) is blocked: the cloud
plugin exposes useEnforceTypeSwitchGate, which OSS dynamically imports
with a no-op fallback. Blocked switches surface an alert and keep the
previous enforce_type.
---
 .../custom-tools/prompt-card/PromptCard.jsx   | 19 +++++++++++++++++++
 1 file changed, 19 insertions(+)

diff --git a/frontend/src/components/custom-tools/prompt-card/PromptCard.jsx b/frontend/src/components/custom-tools/prompt-card/PromptCard.jsx
index 2e579108c2..29fda260e2 100644
--- a/frontend/src/components/custom-tools/prompt-card/PromptCard.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/PromptCard.jsx
@@ -14,6 +14,19 @@ import { PromptCardItems } from "./PromptCardItems";
 import "./PromptCard.css";
 import { handleUpdateStatus } from "./constants";
 
+let useEnforceTypeSwitchGatePlugin;
+try {
+  const mod = await import(
+    "../../../plugins/lookup-studio/hooks/useEnforceTypeSwitchGate"
+  );
+  useEnforceTypeSwitchGatePlugin = mod.useEnforceTypeSwitchGate;
+} catch {
+  // Cloud plugin not present; gate falls back to no-op below.
+}
+
+const useEnforceTypeSwitchGate =
+  useEnforceTypeSwitchGatePlugin || (() => () => null);
+
 const PromptCard = memo(
   ({
     promptDetails,
@@ -56,6 +69,7 @@ const PromptCard = memo(
     const { messages } = useSocketCustomToolStore();
     const { setAlertDetails } = useAlertStore();
     const { setPostHogCustomEvent } = usePostHogEvents();
+    const enforceTypeSwitchGate = useEnforceTypeSwitchGate();
 
     useEffect(() => {
       if (
@@ -260,6 +274,11 @@ const PromptCard = memo(
     };
 
     const handleTypeChange = (value) => {
+      const block = enforceTypeSwitchGate(promptDetailsState?.prompt_id, value);
+      if (block) {
+        setAlertDetails({ type: "error", content: block.reason });
+        return;
+      }
       handleChange(value, promptDetailsState?.prompt_id, "enforce_type", true);
     };
 

From d8986974d2246951bf62e7e84009a722aef6e27b Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 28 Apr 2026 13:16:44 +0530
Subject: [PATCH 36/57] UN-2946 [FIX] Harden billing/usage paths against silent
 drops
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Guard the embedding flush with an explicit callback_manager is not
  None check, replacing the broad except that silently swallowed the
  public-adapter case along with any real flush errors.
- Initialise LegacyExecutor._usage_records in __init__ so an
  early-execute crash can't leave the orchestrator's getattr fallback
  reading None.
- Wrap challenge and summarisation completion calls in try/finally so
  flush_pending_usage() runs even on exception — transient errors
  no longer drop those LLMs' billing rows.
- Replace the silent except Exception: pass on the FE error stream with
  logger.debug so the secondary failure is visible in debug logs.
- Tighten UsageAPIClient.bulk_create_usage success heuristic against
  future partial-body contracts; capture and log the bool return at the
  Celery task with run_id + organization_id.
- Drop redundant organization_id kwarg passed alongside
  set_organization_context in tasks.py.
- SDK records: spread _usage_kwargs first so explicit billing fields
  win; write run_id/llm_usage_reason as None instead of "" so
  UUIDField/choice columns don't reject the row.
- Use rsplit('/', 1)[-1] for display_model so multi-segment IDs
  (e.g. bedrock/anthropic/claude) collapse to the trailing segment.
- Log the litellm cost_per_token failure for embeddings (matches the
  LLM path).
---
 unstract/sdk1/src/unstract/sdk1/llm.py        | 25 +++++++----
 .../sdk1/src/unstract/sdk1/usage_handler.py   | 19 +++++++-
 workers/executor/executors/legacy_executor.py | 43 +++++++++++++------
 workers/executor/tasks.py                     | 21 ++++++---
 workers/shared/clients/usage_client.py        | 10 ++++-
 5 files changed, 90 insertions(+), 28 deletions(-)

diff --git a/unstract/sdk1/src/unstract/sdk1/llm.py b/unstract/sdk1/src/unstract/sdk1/llm.py
index 7fb3d8f9be..08a0077768 100644
--- a/unstract/sdk1/src/unstract/sdk1/llm.py
+++ b/unstract/sdk1/src/unstract/sdk1/llm.py
@@ -642,7 +642,7 @@ def get_metrics(self) -> dict[str, object]:
         return self._metrics
 
     def get_last_usage(self) -> Mapping[str, int]:
-        """Token usage from the most recent complete() call."""
+        """Token usage from the most recent LLM call (sync, async, or streaming)."""
         if not self._pending_usage:
             return {}
         last = self._pending_usage[-1]
@@ -653,7 +653,7 @@ def get_last_usage(self) -> Mapping[str, int]:
         }
 
     def get_last_usage_record(self) -> dict | None:
-        """Full usage record for the most recent complete() call.
+        """Full usage record for the most recent LLM call (sync, async, or streaming).
 
         Returns the complete record (tokens + cost + model + reason
         metadata) so callers don't have to reach into ``_pending_usage``
@@ -711,28 +711,37 @@ def _record_usage(
             )
             cost = 0.0
 
-        # Strip provider prefix (e.g. "azure/gpt-4o" → "gpt-4o") for storage,
-        # matching the old Audit.push_usage_data() behavior.
-        display_model = model.split("/", 1)[-1] if model else model
+        # rsplit so multi-segment IDs (e.g. ``bedrock/anthropic/claude``)
+        # collapse to the trailing segment, matching legacy Audit semantics.
+        display_model = model.rsplit("/", 1)[-1] if model else model
 
+        # ``_usage_kwargs`` spread first so explicit fields below win — those
+        # are the canonical billing values (tokens, cost, status); we only
+        # want callers to provide context (reference_id, reference_type),
+        # not override computed numbers.
         self._pending_usage.append(
             {
+                **self._usage_kwargs,
                 "usage_type": "llm",
                 "model_name": display_model,
                 "provider": self.adapter.get_provider(),
                 "adapter_instance_id": self.platform_kwargs.get(
                     "adapter_instance_id", ""
                 ),
-                "run_id": self.platform_kwargs.get("run_id", ""),
+                # ``run_id`` lands in a UUIDField column; "" would fail the
+                # cast — keep absent values as None so the bulk-create view
+                # writes NULL.
+                "run_id": self.platform_kwargs.get("run_id") or None,
                 "execution_id": self.platform_kwargs.get("execution_id", ""),
-                "llm_usage_reason": self.platform_kwargs.get("llm_usage_reason", ""),
+                # ``llm_usage_reason`` has a fixed choice set; "" isn't a
+                # valid choice, so write None when missing.
+                "llm_usage_reason": self.platform_kwargs.get("llm_usage_reason") or None,
                 "prompt_tokens": prompt_tokens,
                 "completion_tokens": completion_tokens,
                 "total_tokens": total_tokens,
                 "embedding_tokens": 0,
                 "cost_in_dollars": cost,
                 "status": "SUCCESS",
-                **self._usage_kwargs,
             }
         )
 
diff --git a/unstract/sdk1/src/unstract/sdk1/usage_handler.py b/unstract/sdk1/src/unstract/sdk1/usage_handler.py
index 44a819b44c..9836bdf87a 100644
--- a/unstract/sdk1/src/unstract/sdk1/usage_handler.py
+++ b/unstract/sdk1/src/unstract/sdk1/usage_handler.py
@@ -1,3 +1,4 @@
+import logging
 from typing import Any
 
 import litellm
@@ -7,6 +8,8 @@
 from unstract.sdk1.constants import LogLevel
 from unstract.sdk1.tool.stream import StreamMixin
 
+logger = logging.getLogger(__name__)
+
 
 class UsageHandler(StreamMixin, BaseCallbackHandler):
     """Handler for usage events in LLM or Embedding models.
@@ -102,6 +105,8 @@ def on_event_end(
             and event_type not in self.event_ends_to_ignore
             and payload is not None
         ):
+            if self.embed_model is None:
+                return
             model_name = self.embed_model.model_name
             embedding_tokens = self.token_counter.total_embedding_token_count
             self.stream_log(
@@ -117,16 +122,26 @@ def on_event_end(
                 )
                 cost = prompt_cost
             except Exception:
+                logger.warning(
+                    "Failed to compute embedding cost for model=%s; recording 0.0",
+                    model_name,
+                    exc_info=True,
+                )
                 cost = 0.0
 
-            display_model = model_name.split("/", 1)[-1] if model_name else model_name
+            # rsplit so multi-segment IDs (e.g. ``bedrock/anthropic/claude``)
+            # collapse to the trailing segment, matching legacy Audit semantics.
+            display_model = model_name.rsplit("/", 1)[-1] if model_name else model_name
 
             self._pending_usage.append(
                 {
                     "usage_type": "embedding",
                     "model_name": display_model,
                     "adapter_instance_id": self.kwargs.get("adapter_instance_id", ""),
-                    "run_id": self.kwargs.get("run_id", ""),
+                    # ``run_id`` lands in a UUIDField column; "" would fail the
+                    # cast — keep absent values as None so the bulk-create view
+                    # writes NULL.
+                    "run_id": self.kwargs.get("run_id") or None,
                     "execution_id": self.kwargs.get("execution_id", ""),
                     "embedding_tokens": embedding_tokens,
                     "prompt_tokens": 0,
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 7bd3b88a47..83e7c76ec0 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -59,11 +59,16 @@ class LegacyExecutor(BaseExecutor):
 
     def __init__(self) -> None:
         # Per-request state — overwritten on every ``execute()`` call.
+        # ``_usage_records`` initialised here too so the orchestrator's
+        # ``getattr(executor, "_usage_records", None)`` always sees a real
+        # list — an early-init crash inside ``execute()`` would otherwise
+        # silently drop billing rows.
         self._log_events_id: str = ""
         self._log_component: dict[str, str] = {}
         self._execution_id: str | None = None
         self._file_execution_id: str | None = None
         self._organization_id: str | None = None
+        self._usage_records: list[dict[str, Any]] = []
 
     @property
     def name(self) -> str:
@@ -85,7 +90,7 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
         self._log_component: dict[str, str] = (
             getattr(context, "_log_component", None) or {}
         )
-        self._usage_records: list[dict[str, Any]] = []
+        self._usage_records = []
         self._execution_id = context.execution_id
         self._file_execution_id = context.file_execution_id
         self._organization_id = context.organization_id
@@ -152,7 +157,14 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
                         level=LogLevel.ERROR,
                     )
                 except Exception:
-                    pass  # Best-effort — don't mask the original error
+                    # Best-effort — don't mask the original error, but log
+                    # so the secondary failure (broker down, serialization
+                    # bug, etc.) is recoverable.
+                    logger.debug(
+                        "Failed to stream error to FE for run_id=%s",
+                        context.run_id,
+                        exc_info=True,
+                    )
             # Preserve any usage rows collected before the failure so the task
             # wrapper still flushes them. Without this, transient errors that
             # trigger Celery autoretry re-run LLMs and lose billing rows.
@@ -1436,8 +1448,12 @@ def _run_challenge_if_enabled(
             platform_key=platform_api_key,
             metadata=metadata,
         )
-        challenger.run()
-        self._usage_records.extend(challenge_llm.flush_pending_usage())
+        try:
+            challenger.run()
+        finally:
+            # Flush even on exception so transient errors don't drop the
+            # challenge LLM's billing rows.
+            self._usage_records.extend(challenge_llm.flush_pending_usage())
         shim.stream_log(f"Challenge verification completed for: `{prompt_name}`")
         logger.info("Challenge completed: prompt=%s", prompt_name)
 
@@ -1799,15 +1815,14 @@ def _flush_per_prompt_metrics(
         )
         self._usage_records.extend(llm.flush_pending_usage())
         if chunk_size > 0 and embedding is not None:
-            try:
+            # Public adapters (``is_public_adapter() is True``) construct
+            # ``EmbeddingCompat`` without a callback_manager, so there's
+            # nothing to flush. Skip silently rather than catching the
+            # AttributeError — the broad catch was masking real bugs.
+            if embedding.callback_manager is not None:
                 for handler in embedding.callback_manager.handlers:
                     if hasattr(handler, "flush_pending_usage"):
                         self._usage_records.extend(handler.flush_pending_usage())
-            except Exception:
-                logger.warning(
-                    "Failed to flush embedding usage from callback handlers",
-                    exc_info=True,
-                )
         if vector_db:
             vector_db.close()
 
@@ -2269,8 +2284,12 @@ def _handle_summarize(self, context: ExecutionContext) -> ExecutionResult:
             )
 
             shim.stream_log("Running document summarization...")
-            summary = answer_prompt_svc.run_completion(llm=llm, prompt=prompt)
-            self._usage_records.extend(llm.flush_pending_usage())
+            try:
+                summary = answer_prompt_svc.run_completion(llm=llm, prompt=prompt)
+            finally:
+                # Flush even on exception so the summarization LLM's
+                # billing rows aren't lost on transient errors.
+                self._usage_records.extend(llm.flush_pending_usage())
             logger.info("Summarization completed: run_id=%s", context.run_id)
             shim.stream_log("Summarization completed")
             return ExecutionResult(
diff --git a/workers/executor/tasks.py b/workers/executor/tasks.py
index ea02b7c353..49fbfe8746 100644
--- a/workers/executor/tasks.py
+++ b/workers/executor/tasks.py
@@ -105,16 +105,27 @@ def execute_extraction(self, execution_context_dict: dict) -> dict:
         try:
             config = WorkerConfig()
             with UsageAPIClient(config) as usage_client:
+                # ``set_organization_context`` covers the org for every
+                # request on this client; passing it again as a kwarg was
+                # redundant.
                 usage_client.set_organization_context(context.organization_id)
-                usage_client.bulk_create_usage(
-                    usage_records,
-                    organization_id=context.organization_id,
+                ok = usage_client.bulk_create_usage(usage_records)
+            if not ok:
+                # Promote to ERROR so on-call has the run_id/org/count to
+                # recover dropped billing rows from logs.
+                logger.error(
+                    "bulk_create_usage returned failure for %d records "
+                    "(run_id=%s organization_id=%s)",
+                    len(usage_records),
+                    context.run_id,
+                    context.organization_id,
                 )
         except Exception:
-            logger.warning(
-                "Failed to flush %d usage records for run_id=%s",
+            logger.error(
+                "Failed to flush %d usage records for run_id=%s organization_id=%s",
                 len(usage_records),
                 context.run_id,
+                context.organization_id,
                 exc_info=True,
             )
 
diff --git a/workers/shared/clients/usage_client.py b/workers/shared/clients/usage_client.py
index 1fc87eb0dc..acd6dd4c4d 100644
--- a/workers/shared/clients/usage_client.py
+++ b/workers/shared/clients/usage_client.py
@@ -191,7 +191,15 @@ def bulk_create_usage(
                 data={"records": records},
                 organization_id=organization_id,
             )
-            return response.get("success", False) or "created" in response
+            # The success path returns ``{"created": N}`` (no ``success``
+            # key); the error path returns ``{"success": False, "error":
+            # ...}``. Accept either an explicit success flag or the
+            # presence of ``created`` *as long as* ``success`` isn't
+            # explicitly False — guards against future contracts that may
+            # report a partial body.
+            if response.get("success") is False:
+                return False
+            return response.get("success") is True or "created" in response
         except Exception:
             logger.error(
                 "Failed to bulk create %d usage records", len(records), exc_info=True

From 9ef8c800f0abc59d56298610afa4f484dd4d072d Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 28 Apr 2026 13:18:50 +0530
Subject: [PATCH 37/57] UN-2946 [FIX] Cross-cutting hygiene around lookup
 enrichment & webhook
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Tighten LookupEnrichmentProtocol to declare run_with_metrics
  and METRICS_KEY so it actually matches the plugin call site —
  run() -> None was structurally identical to the no-op protocols.
- Wrap the cloud run_with_metrics call in _run_lookup_enrichment
  in a defensive try/except that logs + streams a WARN to the IDE log,
  so plugin contract drift degrades the lookup gracefully instead of
  aborting the answer-prompt batch.
- Hoist llm_cls out of the per-prompt hot loop — it was being
  unpacked from a 7-tuple inside _run_lookup_enrichment on every
  prompt; the caller already has it.
- Extract the is_empty ladder into a module-level _is_blank
  helper so the falsy-but-valid 0/False rationale comment lives
  next to the predicate itself, not inside the executor method.
- _run_webhook_postprocessing: when webhook_enabled and output
  is non-JSON, log + shim.stream_log so the user sees the skip in
  the IDE panel instead of silently never receiving the webhook call.
- Narrow persist_lookup_output catch to (IntegrityError,
  ValidationError) and promote to logger.error — broad catches
  were hiding plugin schema drift while reporting success.
- Wrap enrich_prompt_output in the prompt-output serializer's
  to_representation so an enrichment exception no longer 500s the
  list endpoint; matches the surrounding log-and-continue policy.
---
 .../output_manager_helper.py                  | 13 ++-
 .../serializers.py                            | 12 ++-
 workers/executor/executors/legacy_executor.py | 96 ++++++++++++++-----
 .../executor/executors/plugins/protocols.py   | 23 ++++-
 4 files changed, 114 insertions(+), 30 deletions(-)

diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
index 21aad3ed94..672749d4d7 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
@@ -2,7 +2,8 @@
 import logging
 from typing import Any
 
-from django.core.exceptions import ObjectDoesNotExist
+from django.core.exceptions import ObjectDoesNotExist, ValidationError
+from django.db import IntegrityError
 
 from prompt_studio.lookup_utils import (
     attach_combined_output_enrichment,
@@ -213,12 +214,16 @@ def update_or_create_prompt_output(
                 word_confidence_data=prompt_word_confidence_data,
             )
 
-            # Persist lookup outputs if present (cloud plugin, no-op in OSS)
+            # Persist lookup outputs if present (cloud plugin, no-op in OSS).
+            # Narrow to known DB-level errors so unexpected exceptions
+            # (plugin contract drift, KeyError on the lookup payload) bubble
+            # up rather than getting hidden as a warning that masquerades
+            # as a successful save.
             if prompt_lookup:
                 try:
                     persist_lookup_output(prompt_output, prompt_lookup)
-                except Exception:
-                    logger.warning(
+                except (IntegrityError, ValidationError):
+                    logger.error(
                         "Failed to persist lookup output for prompt %s",
                         prompt.prompt_key,
                         exc_info=True,
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/serializers.py b/backend/prompt_studio/prompt_studio_output_manager_v2/serializers.py
index e4276dbb23..dad8d52979 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/serializers.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/serializers.py
@@ -48,7 +48,17 @@ def to_representation(self, instance):
                 " | Process continued"
             )
             data["coverage"] = {}
-        data = enrich_prompt_output(instance, data)
+        # Match the surrounding ``log + continue`` policy used by token-usage
+        # and coverage above — an enrichment failure shouldn't 500 the entire
+        # prompt-output list endpoint and hide the raw output.
+        try:
+            data = enrich_prompt_output(instance, data)
+        except Exception as e:
+            logger.error(
+                "Error occurred while enriching prompt output for "
+                f"prompt_id {instance.prompt_id} (run_id={instance.run_id}): {e}"
+                " | Process continued"
+            )
 
         # Convert string to list
         try:
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 83e7c76ec0..a321e6be07 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -37,6 +37,21 @@
 logger = logging.getLogger(__name__)
 
 
+def _is_blank(value: Any) -> bool:
+    """Treat None / whitespace strings / empty containers as no-value.
+
+    Boolean ``False`` and numeric ``0`` are *not* blank — they're valid
+    inputs for boolean / number prompts whose lookups should still run.
+    """
+    if value is None:
+        return True
+    if isinstance(value, str):
+        return not value.strip()
+    if isinstance(value, (list, dict)):
+        return not value
+    return False
+
+
 @ExecutorRegistry.register
 class LegacyExecutor(BaseExecutor):
     """Executor that wraps the full prompt-service extraction pipeline.
@@ -1708,11 +1723,13 @@ def _execute_single_prompt(
                 metrics=metrics,
                 shim=shim,
                 usage_kwargs=usage_kwargs,
+                llm_cls=llm_cls,
             )
             self._run_webhook_postprocessing(
                 output=output,
                 structured_output=structured_output,
                 metadata=metadata,
+                shim=shim,
             )
 
             self._run_challenge_if_enabled(
@@ -1990,9 +2007,14 @@ def _run_lookup_enrichment(
         metadata: dict[str, Any],
         metrics: dict[str, Any],
         shim: Any,
+        llm_cls: Any,
         usage_kwargs: dict[str, Any] | None = None,
     ) -> None:
-        """Run lookup enrichment plugin if enabled and available."""
+        """Run lookup enrichment plugin if enabled and available.
+
+        ``llm_cls`` is passed in by the caller so we don't re-unpack the
+        7-tuple returned by ``_get_prompt_deps()`` on every prompt.
+        """
         from executor.executors.constants import PromptServiceConstants as PSKeys
         from executor.executors.plugins import ExecutorPluginLoader
 
@@ -2003,16 +2025,9 @@ def _run_lookup_enrichment(
         lookup_cls = ExecutorPluginLoader.get("lookup-enrichment")
         if not (lookup_config and lookup_cls):
             return
-        # Treat empty strings/containers as "no value" too — for boolean and
-        # number prompts, falsy 0/False are still valid inputs and must run.
-        is_empty = (
-            current_value is None
-            or (isinstance(current_value, str) and not current_value.strip())
-            or (isinstance(current_value, (list, dict)) and not current_value)
-        )
-        if is_empty:
-            # Skipping silently here would leave the user wondering why a
-            # configured lookup didn't run — surface it to the workflow log.
+        if _is_blank(current_value):
+            # Surface a skip log instead of silently no-op-ing — the user
+            # configured a lookup and would otherwise wonder why it didn't run.
             lookup_name = lookup_config.get("lookup_name") or "lookup"
             shim.stream_log(
                 f"Skipping lookup `{lookup_name}` for `{prompt_name}` — "
@@ -2020,17 +2035,34 @@ def _run_lookup_enrichment(
             )
             return
 
-        _, _, _, _, llm_cls, _, _ = self._get_prompt_deps()
-        outcome = lookup_cls.run_with_metrics(
-            llm_cls=llm_cls,
-            lookup_config=lookup_config,
-            structured_output=structured_output,
-            current_value=current_value,
-            metadata=metadata,
-            prompt_name=prompt_name,
-            shim=shim,
-            usage_kwargs=usage_kwargs,
-        )
+        try:
+            outcome = lookup_cls.run_with_metrics(
+                llm_cls=llm_cls,
+                lookup_config=lookup_config,
+                structured_output=structured_output,
+                current_value=current_value,
+                metadata=metadata,
+                prompt_name=prompt_name,
+                shim=shim,
+                usage_kwargs=usage_kwargs,
+            )
+        except Exception:
+            # Enrichment is post-extraction — degrade gracefully when the
+            # plugin call itself raises rather than aborting the whole
+            # prompt run and losing the answer-prompt billing rows. Reads
+            # of ``outcome`` / ``METRICS_KEY`` below are not covered.
+            lookup_name = lookup_config.get("lookup_name") or "lookup"
+            logger.exception(
+                "Lookup enrichment failed for prompt=%s lookup=%s",
+                prompt_name,
+                lookup_name,
+            )
+            shim.stream_log(
+                f"Lookup `{lookup_name}` failed for `{prompt_name}`; "
+                f"continuing without enrichment.",
+                level=LogLevel.WARN,
+            )
+            return
         self._usage_records.extend(outcome.usage_records)
         metrics.setdefault(prompt_name, {})[lookup_cls.METRICS_KEY] = outcome.llm_metrics
 
@@ -2039,6 +2071,7 @@ def _run_webhook_postprocessing(
         output: dict[str, Any],
         structured_output: dict[str, Any],
         metadata: dict[str, Any],
+        shim: Any,
     ) -> None:
         """Run webhook postprocessing if enabled (JSON outputs only)."""
         from executor.executors.answer_prompt import AnswerPromptService
@@ -2047,7 +2080,24 @@ def _run_webhook_postprocessing(
         prompt_name = output[PSKeys.NAME]
         output_type = output.get(PSKeys.TYPE, "")
         webhook_enabled = output.get(PSKeys.ENABLE_POSTPROCESSING_WEBHOOK, False)
-        if not (webhook_enabled and output_type == PSKeys.JSON):
+        if not webhook_enabled:
+            return
+        if output_type != PSKeys.JSON:
+            # The pre-refactor behaviour fired the webhook regardless of
+            # output_type. The new restriction is intentional, but the
+            # user enabled a webhook URL and would otherwise see no call
+            # firing — surface the skip in the IDE log panel.
+            logger.warning(
+                "Webhook postprocessing supports JSON outputs only; "
+                "skipping for prompt=%s (output_type=%s)",
+                prompt_name,
+                output_type,
+            )
+            shim.stream_log(
+                f"Webhook postprocessing supports JSON outputs only; "
+                f"skipping for `{prompt_name}`.",
+                level=LogLevel.WARN,
+            )
             return
 
         webhook_url = output.get(PSKeys.POSTPROCESSING_WEBHOOK_URL)
diff --git a/workers/executor/executors/plugins/protocols.py b/workers/executor/executors/plugins/protocols.py
index 9ce1c5eb9e..c59973d734 100644
--- a/workers/executor/executors/plugins/protocols.py
+++ b/workers/executor/executors/plugins/protocols.py
@@ -53,6 +53,25 @@ def run(self, **kwargs: Any) -> dict: ...
 
 @runtime_checkable
 class LookupEnrichmentProtocol(Protocol):
-    """Legacy executor: post-extraction lookup enrichment."""
+    """Legacy executor: post-extraction lookup enrichment.
 
-    def run(self) -> None: ...
+    The executor calls ``run_with_metrics`` (not ``run``) because the
+    plugin returns an outcome object exposing ``usage_records`` and
+    ``llm_metrics`` for the calling executor to flush. ``METRICS_KEY``
+    keys the lookup metrics into the per-prompt metrics dict.
+    """
+
+    METRICS_KEY: str
+
+    def run_with_metrics(
+        self,
+        *,
+        llm_cls: Any,
+        lookup_config: dict,
+        structured_output: dict,
+        current_value: Any,
+        metadata: dict,
+        prompt_name: str,
+        shim: Any,
+        usage_kwargs: dict | None = None,
+    ) -> Any: ...

From 29a7050476132804373b64d1bb9bc1dd386e3a18 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 28 Apr 2026 13:53:41 +0530
Subject: [PATCH 38/57] UN-2946 [FIX] Tighten Usage choices & lookup_utils
 contracts
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- UsageStatus(TextChoices) so the status field has an enforced
  domain instead of free-text — producers (llm.py, usage_handler.py)
  already write the canonical "SUCCESS" string so no producer changes
  needed.
- Add usage_reference_pair_consistent CheckConstraint so a row
  with reference_id set but reference_type NULL (or vice versa)
  is rejected at the DB. Cheap to validate on apply because both fields
  landed together in lookups V2 — legacy rows have both NULL. The
  sibling (usage_type, llm_usage_reason) constraint is deferred to
  a follow-up issue: legacy embedding rows have llm_usage_reason=''
  from the old SDK default, and a full-table backfill or default
  ADD CONSTRAINT scan would lock the billing table for too long in
  prod.
- internal_views.py: write llm_usage_reason as None instead of
  "" when missing so the choice column doesn't store an
  out-of-domain value.
- lookup_utils.py: narrow the ImportError catch to the cloud
  pluggable_apps.lookups package and its submodules so a failing
  transitive import inside the cloud plugin re-raises instead of
  silently degrading the whole feature to a no-op.
  Annotate get_original_value_if_enriched return as
  tuple[Any, dict] | None and rephrase the docstring to match the
  actual shape callers tuple-unpack.
- Drop the attach_lookup_config /
  attach_lookup_configs_to_tool_settings /
  get_lookup_config_from_output wrappers — they were trivial dict
  ops over a hardcoded key already used directly by the executor and
  single-pass plugin, so the "key owned by the bridge" framing was
  misleading. Inline at all five callsites.
- Drop the "future prompt_studio" forward-looking comment in
  ide_callback/tasks.py — only source='lookup' is wired up, and
  the cloud lookups plugin is the only registrant of the underlying
  endpoints.
---
 backend/prompt_studio/lookup_utils.py         | 61 +++++++++----------
 .../prompt_studio_helper.py                   | 10 ++-
 .../prompt_studio_registry_helper.py          |  7 +--
 backend/usage_v2/internal_views.py            |  7 ++-
 .../0006_alter_usage_status_and_more.py       | 42 +++++++++++++
 backend/usage_v2/models.py                    | 32 ++++++++++
 workers/ide_callback/tasks.py                 |  7 ++-
 7 files changed, 120 insertions(+), 46 deletions(-)
 create mode 100644 backend/usage_v2/migrations/0006_alter_usage_status_and_more.py

diff --git a/backend/prompt_studio/lookup_utils.py b/backend/prompt_studio/lookup_utils.py
index b1bc79a707..5bc21bc90e 100644
--- a/backend/prompt_studio/lookup_utils.py
+++ b/backend/prompt_studio/lookup_utils.py
@@ -1,15 +1,29 @@
 """Shared utility for lookup operations.
 
-Wraps cloud-only lookup calls so that OSS callers don't repeat the
-try/except ImportError guard. All functions are no-ops in OSS. A single
-module-level probe decides availability so downstream errors inside the
-cloud plugin surface instead of being silently swallowed as ImportError.
+Wraps cloud-only lookup calls so OSS callers don't repeat the
+``try/except ImportError`` guard. All functions are no-ops in OSS.
+
+The probe below catches *only* the absence of the cloud
+``pluggable_apps.lookups`` package — an ImportError raised transitively
+inside the cloud plugin (e.g. a missing third-party dependency it needs)
+re-raises so the failure surfaces instead of silently degrading the
+whole feature to a no-op.
 """
 
 import logging
+from typing import Any
 
 logger = logging.getLogger(__name__)
 
+_CLOUD_LOOKUP_MODULES = {
+    "pluggable_apps.lookups",
+    "pluggable_apps.lookups.execution",
+    "pluggable_apps.lookups.output_enrichment",
+    "pluggable_apps.lookups.staleness",
+    "pluggable_apps.lookups.validation",
+    "pluggable_apps.lookups.models",
+}
+
 try:
     from pluggable_apps.lookups import execution as _execution
     from pluggable_apps.lookups import output_enrichment as _output_enrichment
@@ -18,7 +32,9 @@
     from pluggable_apps.lookups.models import LookupOutputResult as _LookupOutputResult
 
     LOOKUPS_AVAILABLE = True
-except ImportError:
+except ImportError as e:
+    if e.name not in _CLOUD_LOOKUP_MODULES:
+        raise
     LOOKUPS_AVAILABLE = False
 
 
@@ -103,12 +119,16 @@ def get_latest_lookup_mutation_for_tool(tool):
     return _staleness.get_latest_lookup_mutation_for_tool(tool)
 
 
-def get_original_value_if_enriched(metadata: dict, prompt_key: str):
-    """Return the pre-enrichment value for ``prompt_key`` if present.
+def get_original_value_if_enriched(
+    metadata: dict, prompt_key: str
+) -> tuple[Any, dict] | None:
+    """Return ``(original_value, prompt_lookup_dict)`` if ``prompt_key`` was
+    enriched, or ``None`` otherwise.
 
-    Opaque wrapper around the cloud plugin's ``lookup_outputs`` metadata
-    shape so OSS callers don't need to know the key names. Returns None
-    when no enrichment happened or the plugin is absent.
+    Operates purely on metadata shape — the plugin-availability flag is
+    not consulted, so callers can invoke this even when ``LOOKUPS_AVAILABLE``
+    is False (it still returns ``None`` because the metadata shape won't
+    match).
     """
     if not isinstance(metadata, dict):
         return None
@@ -158,24 +178,3 @@ def get_lookup_validation_for_tool(tool) -> dict:
             ),
         }
     return _validation.get_lookup_validation_for_tool(tool)
-
-
-def attach_lookup_config(output: dict, config: dict) -> None:
-    """Stamp a per-prompt output dict with the lookup config payload.
-
-    Keeps the payload key name owned by the bridge so OSS call sites
-    don't encode the contract.
-    """
-    output["lookup_config"] = config
-
-
-def attach_lookup_configs_to_tool_settings(
-    tool_settings: dict, configs: list[dict]
-) -> None:
-    """Stamp tool_settings with the per-tool lookup configs list."""
-    tool_settings["lookup_configs"] = configs
-
-
-def get_lookup_config_from_output(output: dict) -> dict | None:
-    """Read the lookup config stamped on a prompt output, if any."""
-    return output.get("lookup_config")
diff --git a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
index a706ac366c..62cbf2d9a2 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/prompt_studio_helper.py
@@ -22,8 +22,6 @@
 
 from backend.celery_service import app as celery_app
 from prompt_studio.lookup_utils import (
-    attach_lookup_config,
-    attach_lookup_configs_to_tool_settings,
     get_lookup_config,
     get_lookup_configs_for_tool,
 )
@@ -395,7 +393,7 @@ def _build_prompt_output(
             output[TSPKeys.POSTPROCESSING_WEBHOOK_URL] = webhook_url
 
         if lookup_config := get_lookup_config(prompt):
-            attach_lookup_config(output, lookup_config)
+            output["lookup_config"] = lookup_config
 
         output[TSPKeys.EVAL_SETTINGS] = {}
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_EVALUATE] = prompt.evaluate
@@ -809,7 +807,7 @@ def build_fetch_response_payload(
             output[TSPKeys.POSTPROCESSING_WEBHOOK_URL] = webhook_url
 
         if lookup_config := get_lookup_config(prompt):
-            attach_lookup_config(output, lookup_config)
+            output["lookup_config"] = lookup_config
 
         output[TSPKeys.EVAL_SETTINGS] = {}
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_EVALUATE] = prompt.evaluate
@@ -1181,7 +1179,7 @@ def build_single_pass_payload(
 
         lookup_configs = get_lookup_configs_for_tool(tool, prompts=prompts)
         if lookup_configs:
-            attach_lookup_configs_to_tool_settings(tool_settings, lookup_configs)
+            tool_settings["lookup_configs"] = lookup_configs
 
         for p in prompts:
             if not p.prompt:
@@ -1935,7 +1933,7 @@ def _fetch_response(
         if webhook_enabled:
             output[TSPKeys.POSTPROCESSING_WEBHOOK_URL] = webhook_url
         if lookup_config := get_lookup_config(prompt):
-            attach_lookup_config(output, lookup_config)
+            output["lookup_config"] = lookup_config
         # Eval settings for the prompt
         output[TSPKeys.EVAL_SETTINGS] = {}
         output[TSPKeys.EVAL_SETTINGS][TSPKeys.EVAL_SETTINGS_EVALUATE] = prompt.evaluate
diff --git a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
index 8b29e437e3..998022cbbb 100644
--- a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
+++ b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
@@ -7,10 +7,7 @@
 from django.db import IntegrityError
 from plugins import get_plugin
 
-from prompt_studio.lookup_utils import (
-    attach_lookup_config,
-    validate_lookups_for_export,
-)
+from prompt_studio.lookup_utils import validate_lookups_for_export
 from prompt_studio.prompt_profile_manager_v2.models import ProfileManager
 from prompt_studio.prompt_studio_core_v2.models import CustomTool
 from prompt_studio.prompt_studio_core_v2.prompt_studio_helper import PromptStudioHelper
@@ -366,7 +363,7 @@ def frame_export_json(
             )
             prompt_id_str = str(prompt.prompt_id)
             if prompt_id_str in lookup_configs:
-                attach_lookup_config(output, lookup_configs[prompt_id_str])
+                output["lookup_config"] = lookup_configs[prompt_id_str]
             # Retaining the old fields in condition
             # for backward compatibility. To be removed in future.
             if (
diff --git a/backend/usage_v2/internal_views.py b/backend/usage_v2/internal_views.py
index 1ff9b1376f..9cfa9699c6 100644
--- a/backend/usage_v2/internal_views.py
+++ b/backend/usage_v2/internal_views.py
@@ -171,7 +171,12 @@ def post(self, request: Request) -> JsonResponse:
                     adapter_instance_id=r.get("adapter_instance_id", ""),
                     run_id=r.get("run_id"),
                     usage_type=r.get("usage_type", "llm"),
-                    llm_usage_reason=r.get("llm_usage_reason", ""),
+                    # ``llm_usage_reason`` has a fixed choice set. Coerce
+                    # missing/empty to None so we don't silently store "",
+                    # which isn't a valid choice. The cross-field
+                    # CheckConstraint vs. ``usage_type`` is deferred to a
+                    # follow-up, so nothing at the DB level enforces it yet.
+                    llm_usage_reason=r.get("llm_usage_reason") or None,
                     model_name=r.get("model_name", ""),
                     embedding_tokens=r.get("embedding_tokens", 0),
                     prompt_tokens=r.get("prompt_tokens", 0),
diff --git a/backend/usage_v2/migrations/0006_alter_usage_status_and_more.py b/backend/usage_v2/migrations/0006_alter_usage_status_and_more.py
new file mode 100644
index 0000000000..c15203bb60
--- /dev/null
+++ b/backend/usage_v2/migrations/0006_alter_usage_status_and_more.py
@@ -0,0 +1,42 @@
+# Generated by Django 4.2.1 on 2026-04-28 08:22
+
+from django.db import migrations, models
+
+
+class Migration(migrations.Migration):
+    dependencies = [
+        ("usage_v2", "0005_usage_reason_ref_created_idx"),
+    ]
+
+    operations = [
+        migrations.AlterField(
+            model_name="usage",
+            name="status",
+            field=models.CharField(
+                blank=True,
+                choices=[
+                    ("SUCCESS", "Success"),
+                    ("ERROR", "Error"),
+                    ("SKIPPED", "Skipped"),
+                ],
+                db_comment="Operation outcome: SUCCESS, ERROR, or SKIPPED",
+                max_length=16,
+                null=True,
+            ),
+        ),
+        migrations.AddConstraint(
+            model_name="usage",
+            constraint=models.CheckConstraint(
+                check=models.Q(
+                    models.Q(
+                        ("reference_id__isnull", True), ("reference_type__isnull", True)
+                    ),
+                    models.Q(
+                        ("reference_id__isnull", False), ("reference_type__isnull", False)
+                    ),
+                    _connector="OR",
+                ),
+                name="usage_reference_pair_consistent",
+            ),
+        ),
+    ]
diff --git a/backend/usage_v2/models.py b/backend/usage_v2/models.py
index ac0f583aa4..2d6c7e2144 100644
--- a/backend/usage_v2/models.py
+++ b/backend/usage_v2/models.py
@@ -13,6 +13,12 @@ class UsageType(models.TextChoices):
     EMBEDDING = "embedding", "Embedding Usage"
 
 
+class UsageStatus(models.TextChoices):
+    SUCCESS = "SUCCESS", "Success"
+    ERROR = "ERROR", "Error"
+    SKIPPED = "SKIPPED", "Skipped"
+
+
 # ── Choice lists (static union of OSS + cloud values) ────────────────
 # Cloud-only entries (e.g. "lookup", "lookup_version") are listed here
 # even on OSS-only builds where they're never written. A previous
@@ -116,6 +122,7 @@ class Usage(DefaultOrganizationMixin, BaseModel):
     )
     status = models.CharField(
         max_length=16,
+        choices=UsageStatus.choices,
         null=True,
         blank=True,
         db_comment="Operation outcome: SUCCESS, ERROR, or SKIPPED",
@@ -141,3 +148,28 @@ class Meta:
                 name="idx_usage_reason_ref_created",
             ),
         ]
+        constraints = [
+            # ``reference_type`` is a discriminator for ``reference_id``.
+            # Either both are NULL (no entity attribution) or both are set
+            # (decodable). A row with one but not the other is undecodable
+            # at billing-aggregation time. Cheap to validate on apply
+            # because both fields landed together in lookups V2 — legacy
+            # rows have both NULL.
+            models.CheckConstraint(
+                check=(
+                    models.Q(reference_id__isnull=True, reference_type__isnull=True)
+                    | models.Q(reference_id__isnull=False, reference_type__isnull=False)
+                ),
+                name="usage_reference_pair_consistent",
+            ),
+            # NOTE: a sibling ``(usage_type, llm_usage_reason)`` constraint
+            # would be a natural extension here — embedding rows must have
+            # llm_usage_reason NULL, LLM rows must have it set. Skipped in
+            # this PR because the ``usage`` table is large in prod and
+            # legacy embedding rows have ``llm_usage_reason=''`` from the
+            # old SDK default; both the data backfill and Django's default
+            # ``ADD CONSTRAINT`` (full-table scan) would lock the billing
+            # table for too long. To be added in a follow-up via
+            # ``ADD CONSTRAINT ... NOT VALID`` + batched ``VALIDATE
+            # CONSTRAINT`` during a maintenance window.
+        ]
diff --git a/workers/ide_callback/tasks.py b/workers/ide_callback/tasks.py
index 6f4e62087b..d7c305224f 100644
--- a/workers/ide_callback/tasks.py
+++ b/workers/ide_callback/tasks.py
@@ -519,10 +519,11 @@ def ide_prompt_error(
 
 
 # ------------------------------------------------------------------
-# Generic Text Extraction Callbacks
+# Text Extraction Callbacks
 #
-# Reusable extraction callbacks that route based on ``source`` in
-# callback_kwargs (e.g. "lookup", future "prompt_studio").
+# Today only ``source="lookup"`` is wired up; the cloud lookups plugin
+# is the only registrant of the underlying extraction-complete /
+# extraction-error endpoints (see workers/shared/clients/extraction_client.py).
 # ------------------------------------------------------------------
 
 

From 993ae95d19352b00b10583060f45e9e688c788d1 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 28 Apr 2026 13:56:42 +0530
Subject: [PATCH 39/57] UN-2946 [PERF] Push Combined Output queries into SQL
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- latest_outputs_by_keys: switch the per-prompt latest pick to
  order_by('prompt_id', '-modified_at').distinct('prompt_id') so
  Postgres returns at most one row per prompt instead of materialising
  every historical run + relying on a Python break.
- fetch_default_output_response: collapse the previous N+1
  (exists() + for output in queryset per prompt) into a single
  DISTINCT ON (prompt_id, profile_manager_id) query, plus a
  per-tool cache for the default-profile lookup. Combined Output is a
  hot path — the old shape made every panel switch O(prompts × runs)
  with a plugin invocation per matching row.
- Drop the unused _resolve_profile_for_prompt and
  _collect_default_output_for_prompt helpers, and the dead
  except ObjectDoesNotExist: return '' (neither .exists() nor
  the queryset iteration ever raised that exception).
---
 .../output_manager_helper.py                  | 119 ++++++++++--------
 .../prompt_studio_output_manager_v2/views.py  |  11 +-
 2 files changed, 71 insertions(+), 59 deletions(-)

diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
index 672749d4d7..f5ec54c94e 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
@@ -2,7 +2,7 @@
 import logging
 from typing import Any
 
-from django.core.exceptions import ObjectDoesNotExist, ValidationError
+from django.core.exceptions import ValidationError
 from django.db import IntegrityError
 
 from prompt_studio.lookup_utils import (
@@ -260,49 +260,6 @@ def fetch_default_llm_profile(tool: CustomTool) -> ProfileManager:
         except DefaultProfileError:
             raise DefaultProfileError("Default ProfileManager does not exist.")
 
-    @staticmethod
-    def _resolve_profile_for_prompt(
-        tool_prompt: ToolStudioPrompt,
-        use_default_profile: bool,
-    ) -> str | None:
-        profile_manager_id = tool_prompt.profile_manager_id
-        if not profile_manager_id and not use_default_profile:
-            return None
-        if not profile_manager_id:
-            default_profile = ProfileManager.get_default_llm_profile(tool_prompt.tool_id)
-            profile_manager_id = default_profile.profile_id
-        return profile_manager_id
-
-    @staticmethod
-    def _collect_default_output_for_prompt(
-        tool_prompt: ToolStudioPrompt,
-        profile_manager_id: str,
-        document_manager_id: str,
-        enrichment_by_key: dict[str, Any],
-    ) -> Any:
-        from prompt_studio.lookup_utils import enrich_prompt_output
-
-        try:
-            queryset = PromptStudioOutputManager.objects.filter(
-                prompt_id=str(tool_prompt.prompt_id),
-                profile_manager=profile_manager_id,
-                is_single_pass_extract=False,
-                document_manager_id=document_manager_id,
-            )
-            if not queryset.exists():
-                return ""
-
-            value: Any = ""
-            for output in queryset:
-                value = output.output
-                enriched = enrich_prompt_output(output, {})
-                bundle = extract_prompt_output_enrichment(enriched)
-                if bundle is not None:
-                    enrichment_by_key[tool_prompt.prompt_key] = bundle
-            return value
-        except ObjectDoesNotExist:
-            return ""
-
     @staticmethod
     def fetch_default_output_response(
         tool_studio_prompts: list[ToolStudioPrompt],
@@ -322,26 +279,78 @@ def fetch_default_output_response(
                 When lookups are configured, the cloud plugin adds an
                 opaque enrichment payload via ``attach_combined_output_enrichment``.
         """
-        result: dict[str, Any] = {}
-        enrichment_by_key: dict[str, Any] = {}
+        from prompt_studio.lookup_utils import enrich_prompt_output
 
+        # Pre-resolve (prompt, profile_id) pairs once so the per-prompt
+        # default-profile lookup memoises against the small set of tool IDs
+        # involved. Combined Output is a hot path — the previous N+1 (two
+        # DB calls per prompt + a plugin invocation per matching row)
+        # turned every panel switch into a multi-second wait.
+        default_profile_cache: dict[str, str | None] = {}
+
+        def _resolve(tool_prompt: ToolStudioPrompt) -> str | None:
+            profile_manager_id = tool_prompt.profile_manager_id
+            if profile_manager_id:
+                return profile_manager_id
+            if not use_default_profile:
+                return None
+            tool_id = tool_prompt.tool_id_id
+            if tool_id not in default_profile_cache:
+                try:
+                    default_profile_cache[tool_id] = (
+                        ProfileManager.get_default_llm_profile(
+                            tool_prompt.tool_id
+                        ).profile_id
+                    )
+                except DefaultProfileError:
+                    default_profile_cache[tool_id] = None
+            return default_profile_cache[tool_id]
+
+        prompts_to_query: list[tuple[ToolStudioPrompt, str]] = []
+        result: dict[str, Any] = {}
         for tool_prompt in tool_studio_prompts:
             if tool_prompt.prompt_type == PSOMKeys.NOTES:
                 continue
-            profile_manager_id = OutputManagerHelper._resolve_profile_for_prompt(
-                tool_prompt, use_default_profile
-            )
+            profile_manager_id = _resolve(tool_prompt)
             if profile_manager_id is None:
                 result[tool_prompt.prompt_key] = ""
                 continue
-            result[tool_prompt.prompt_key] = (
-                OutputManagerHelper._collect_default_output_for_prompt(
-                    tool_prompt,
-                    profile_manager_id,
-                    document_manager_id,
-                    enrichment_by_key,
+            prompts_to_query.append((tool_prompt, profile_manager_id))
+
+        # Single batch query keyed on the (prompt_id, profile_manager_id)
+        # pair — ``DISTINCT ON`` (Postgres) gives the latest row per pair
+        # in SQL so we don't materialise every historical run per prompt.
+        outputs_index: dict[tuple[str, str], PromptStudioOutputManager] = {}
+        if prompts_to_query:
+            prompt_ids = [str(p.prompt_id) for p, _ in prompts_to_query]
+            profile_ids = list({pmid for _, pmid in prompts_to_query})
+            outputs = (
+                PromptStudioOutputManager.objects.filter(
+                    prompt_id__in=prompt_ids,
+                    profile_manager_id__in=profile_ids,
+                    is_single_pass_extract=False,
+                    document_manager_id=document_manager_id,
                 )
+                .order_by("prompt_id", "profile_manager_id", "-modified_at")
+                .distinct("prompt_id", "profile_manager_id")
             )
+            outputs_index = {
+                (str(o.prompt_id), str(o.profile_manager_id)): o for o in outputs
+            }
+
+        enrichment_by_key: dict[str, Any] = {}
+        for tool_prompt, profile_manager_id in prompts_to_query:
+            output = outputs_index.get(
+                (str(tool_prompt.prompt_id), str(profile_manager_id))
+            )
+            if output is None:
+                result[tool_prompt.prompt_key] = ""
+                continue
+            result[tool_prompt.prompt_key] = output.output
+            enriched = enrich_prompt_output(output, {})
+            bundle = extract_prompt_output_enrichment(enriched)
+            if bundle is not None:
+                enrichment_by_key[tool_prompt.prompt_key] = bundle
 
         attach_combined_output_enrichment(result, enrichment_by_key)
         return result
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/views.py b/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
index ff9818962d..f7b7aa8582 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
@@ -97,6 +97,10 @@ def latest_outputs_by_keys(self, request: HttpRequest) -> Response:
         if not prompt_id_to_key:
             return Response({}, status=status.HTTP_200_OK)
 
+        # ``DISTINCT ON("prompt_id")`` (Postgres) keeps only the latest row
+        # per prompt at the SQL layer — without it Django materialises the
+        # full ``M docs × N runs × len(prompt_keys)`` result set just to
+        # let the Python loop pick one row per prompt.
         outputs = (
             PromptStudioOutputManager.objects.filter(
                 prompt_id__in=prompt_id_to_key.keys(),
@@ -104,17 +108,16 @@ def latest_outputs_by_keys(self, request: HttpRequest) -> Response:
             )
             .exclude(output__isnull=True)
             .exclude(output__exact="")
-            .order_by("-modified_at")
+            .order_by("prompt_id", "-modified_at")
+            .distinct("prompt_id")
             .values("prompt_id", "output")
         )
 
         result: dict[str, str] = {}
         for row in outputs:
             key = prompt_id_to_key.get(row["prompt_id"])
-            if key and key not in result:
+            if key:
                 result[key] = row["output"]
-            if len(result) == len(prompt_id_to_key):
-                break
 
         return Response(result, status=status.HTTP_200_OK)
 

From cc544e476fa1ad68460bcbe81a0b4e0bfd165bcf Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 28 Apr 2026 13:59:15 +0530
Subject: [PATCH 40/57] UN-2946 [FIX] Frontend & callback hygiene around lookup
 hooks

- PromptOutput.jsx: replace empty catch {} on the lookup
  dynamic-import sites with console.warn so unexpected chunk-load
  failures don't masquerade as OSS-mode behaviour. Add a
  resolveCopyText helper that wraps getEnrichedCopyText in
  try/catch + fallback so a plugin-side throw can't break the Copy
  button at either of the two call sites.
- usePromptOutput.js: same catch (error) -> console.warn for
  the two existing dynamic-import sites; wrap the per-item
  handleLookupOutput call in try/catch so a single bad enrichment
  payload no longer aborts the surrounding forEach and skips the
  prompt-output state update.
- prompt_studio_core_v2/views.py: validate prompt_id before
  the multi-var lookup gate so a missing field returns a clean 400
  instead of a lookup-related error.
- ide_callback/tasks.py: (result_dict.get('data') or {}) so an
  explicit data=None from the executor doesn't AttributeError into
  a generic ERROR callback. Replace the inner except: pass swallow
  with logger.debug so a secondary WS-emit failure during the
  outer extraction_complete fallback is recoverable from logs.
---
 .../prompt_studio_core_v2/views.py            | 19 ++++----
 .../custom-tools/prompt-card/PromptOutput.jsx | 43 ++++++++++++++-----
 frontend/src/hooks/usePromptOutput.js         | 27 +++++++++---
 workers/ide_callback/tasks.py                 | 13 +++++-
 4 files changed, 75 insertions(+), 27 deletions(-)

diff --git a/backend/prompt_studio/prompt_studio_core_v2/views.py b/backend/prompt_studio/prompt_studio_core_v2/views.py
index 0ba0597a4d..9510fb962f 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/views.py
@@ -511,9 +511,15 @@ def fetch_response(self, request: HttpRequest, pk: Any = None) -> Response:
         document_id: str = request.data.get(ToolStudioPromptKeys.DOCUMENT_ID)
         prompt_id: str = request.data.get(ToolStudioPromptKeys.ID)
         run_id: str = request.data.get(ToolStudioPromptKeys.RUN_ID)
-        if err := _multi_var_lookup_block_response(
-            custom_tool, prompt_ids=[prompt_id] if prompt_id else None
-        ):
+        # Validate ``prompt_id`` before the lookup gate so a request
+        # missing the field returns a clear 400 instead of a lookup-related
+        # error.
+        if not prompt_id:
+            return Response(
+                {"error": "prompt id is required."},
+                status=status.HTTP_400_BAD_REQUEST,
+            )
+        if err := _multi_var_lookup_block_response(custom_tool, prompt_ids=[prompt_id]):
             return err
         profile_manager_id: str = request.data.get(
             ToolStudioPromptKeys.PROFILE_MANAGER_ID
@@ -523,13 +529,6 @@ def fetch_response(self, request: HttpRequest, pk: Any = None) -> Response:
 
         org_id = UserSessionUtils.get_organization_id(request)
         user_id = custom_tool.created_by.user_id
-
-        # Resolve prompt — guard against missing / stale prompt_id
-        if not prompt_id:
-            return Response(
-                {"error": "prompt id is required."},
-                status=status.HTTP_400_BAD_REQUEST,
-            )
         try:
             prompt = ToolStudioPrompt.objects.get(pk=prompt_id)
         except ToolStudioPrompt.DoesNotExist:
diff --git a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
index 23246f611f..c9d9c44143 100644
--- a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
@@ -57,7 +57,12 @@ try {
     "../../../plugins/lookup-studio/prompt-card/LookupOutputTabs"
   );
   LookupOutputTabs = mod.LookupOutputTabs;
-} catch {}
+} catch (error) {
+  // OSS: plugin may not exist; cloud: surface unexpected chunk-load
+  // failures so they don't degrade silently to OSS-mode behaviour.
+  // eslint-disable-next-line no-console
+  console.warn("[PromptOutput] LookupOutputTabs unavailable:", error);
+}
 
 let getEnrichedCopyText;
 try {
@@ -65,7 +70,27 @@ try {
     "../../../plugins/lookup-studio/prompt-card/getEnrichedCopyText"
   );
   getEnrichedCopyText = mod.getEnrichedCopyText;
-} catch {}
+} catch (error) {
+  // eslint-disable-next-line no-console
+  console.warn("[PromptOutput] getEnrichedCopyText unavailable:", error);
+}
+
+// Resolve enriched copy text with fallback so a plugin-side throw
+// can't break the Copy button. ``getEnrichedCopyText`` may not exist
+// in OSS (plugin import failed) or may throw on a malformed enrichment.
+const resolveCopyText = (promptOutputId, fallbackText) => {
+  if (!getEnrichedCopyText) {
+    return fallbackText;
+  }
+  try {
+    const enriched = getEnrichedCopyText(promptOutputId);
+    return typeof enriched === "string" && enriched ? enriched : fallbackText;
+  } catch (err) {
+    // eslint-disable-next-line no-console
+    console.warn("[PromptOutput] getEnrichedCopyText threw:", err);
+    return fallbackText;
+  }
+};
 
 // Wraps children in LookupOutputTabs when available (cloud),
 // passes through children directly in OSS.
@@ -245,16 +270,15 @@ function PromptOutput({
             <CopyPromptOutputBtn
               isDisabled={isTableExtraction}
               copyToClipboard={() => {
-                const enrichedText = getEnrichedCopyText?.(
-                  promptOutputData?.promptOutputId,
-                );
                 copyOutputToClipboard(
-                  enrichedText ||
+                  resolveCopyText(
+                    promptOutputData?.promptOutputId,
                     displayPromptResult(
                       promptOutput,
                       true,
                       promptDetails?.enable_highlight,
                     ),
+                  ),
                 );
               }}
             />
@@ -501,15 +525,14 @@ function PromptOutput({
                           <CopyPromptOutputBtn
                             isDisabled={isTableExtraction}
                             copyToClipboard={() => {
-                              const enrichedText = getEnrichedCopyText?.(
-                                promptOutputData?.promptOutputId,
-                              );
                               copyOutputToClipboard(
-                                enrichedText ||
+                                resolveCopyText(
+                                  promptOutputData?.promptOutputId,
                                   displayPromptResult(
                                     promptOutputData?.output,
                                     true,
                                   ),
+                                ),
                               );
                             }}
                           />
diff --git a/frontend/src/hooks/usePromptOutput.js b/frontend/src/hooks/usePromptOutput.js
index 12d451315d..9cf6c27853 100644
--- a/frontend/src/hooks/usePromptOutput.js
+++ b/frontend/src/hooks/usePromptOutput.js
@@ -29,7 +29,12 @@ try {
     "../plugins/lookup-studio/prompt-card/handleLookupOutput"
   );
   handleLookupOutput = mod.handleLookupOutput;
-} catch {}
+} catch (error) {
+  // OSS: plugin may not exist; cloud: surface unexpected chunk-load
+  // failures so they don't degrade silently to OSS-mode behaviour.
+  // eslint-disable-next-line no-console
+  console.warn("[usePromptOutput] handleLookupOutput unavailable:", error);
+}
 
 // Opaque extractor so the per-item enrichment payload key name lives in
 // the plugin, not OSS. OSS falls back to a no-op. Stub signature matches
@@ -38,7 +43,10 @@ let getEnrichmentFromItem = (_item) => null;
 try {
   const mod = await import("../plugins/lookup-enriched-toggle/helpers");
   getEnrichmentFromItem = mod.getEnrichmentFromItem;
-} catch {}
+} catch (error) {
+  // eslint-disable-next-line no-console
+  console.warn("[usePromptOutput] getEnrichmentFromItem unavailable:", error);
+}
 
 const usePromptOutput = () => {
   const { sessionDetails } = useSessionStore();
@@ -142,9 +150,18 @@ const usePromptOutput = () => {
         wordConfidenceData: item?.word_confidence_data,
       };
 
-      const enrichment = getEnrichmentFromItem(item);
-      if (handleLookupOutput && enrichment) {
-        handleLookupOutput(item.prompt_output_id, enrichment);
+      // Guard the lookup hook so a per-item plugin failure can't abort
+      // the surrounding ``forEach`` and skip the whole prompt-output state
+      // update — the user would otherwise see partial / stale outputs
+      // with no error surfaced.
+      try {
+        const enrichment = getEnrichmentFromItem(item);
+        if (handleLookupOutput && enrichment) {
+          handleLookupOutput(item.prompt_output_id, enrichment);
+        }
+      } catch (err) {
+        // eslint-disable-next-line no-console
+        console.warn("[usePromptOutput] lookup enrichment failed:", err);
       }
 
       if (item?.is_single_pass_extract && isTokenUsageForSinglePassAdded) {
diff --git a/workers/ide_callback/tasks.py b/workers/ide_callback/tasks.py
index d7c305224f..345bf06c9e 100644
--- a/workers/ide_callback/tasks.py
+++ b/workers/ide_callback/tasks.py
@@ -583,7 +583,10 @@ def extraction_complete(
                 )
             return {"status": "failed", "error": error_msg}
 
-        extracted_text = result_dict.get("data", {}).get("extracted_text", "")
+        # ``result_dict["data"]`` may be explicitly ``None`` on early-return
+        # paths; guard against AttributeError so a benign empty-data response
+        # doesn't escalate to a generic "ERROR" callback.
+        extracted_text = (result_dict.get("data") or {}).get("extracted_text", "")
         token_count = len(extracted_text) // 4
 
         api.mark_extraction_complete(
@@ -631,7 +634,13 @@ def extraction_complete(
                     },
                 )
             except Exception:
-                pass
+                # ``_emit_websocket`` already swallows-and-logs internally,
+                # but if anything reaches this far we'd rather see the
+                # secondary failure in the log than lose it silently.
+                logger.debug(
+                    "Failed to emit ws ERROR event in extraction_complete fallback",
+                    exc_info=True,
+                )
         raise
 
 

From 301dc9bfc68487f9788eebad7e075acaf98194db Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 28 Apr 2026 14:00:42 +0530
Subject: [PATCH 41/57] UN-2946 [FIX] Skip webhook on JSON parse failure &
 re-include compose.debug
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- _run_webhook_postprocessing: skip when structured_output[prompt_name]
  is empty or not a dict/list. Pre-refactor, the webhook lived inside
  handle_json after its parse-failure early-return (which sets the
  output to {}), so a malformed JSON answer never dispatched the
  webhook — the new explicit gate restores that behaviour. Subscribers
  no longer receive empty-payload calls they didn't see before.
- .gitignore: re-include docker/compose.debug.yaml after the
  broader docker/compose.*.yaml rule so a delete + recreate doesn't
  make the tracked file look untracked, and so teammates can spot the
  checked-in file (other compose.*.yaml files stay ignored).
---
 .gitignore                                    |  4 ++++
 workers/executor/executors/legacy_executor.py | 13 +++++++++++++
 2 files changed, 17 insertions(+)

diff --git a/.gitignore b/.gitignore
index f0c0cb8438..0901e18b4c 100644
--- a/.gitignore
+++ b/.gitignore
@@ -654,6 +654,10 @@ docker/*.env
 docker/public_tools.json
 docker/proxy_overrides.yaml
 docker/compose.*.yaml
+# ``docker/compose.debug.yaml`` is checked-in tooling — keep it out of the
+# broader ``compose.*.yaml`` ignore so a delete + recreate doesn't make it
+# look untracked, and so teammates can spot it.
+!docker/compose.debug.yaml
 docker/workflow_data/
 
 # Tool development
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index a321e6be07..fc4101c575 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -2082,6 +2082,19 @@ def _run_webhook_postprocessing(
         webhook_enabled = output.get(PSKeys.ENABLE_POSTPROCESSING_WEBHOOK, False)
         if not webhook_enabled:
             return
+        # Pre-refactor, the webhook lived inside ``handle_json`` after its
+        # parse-failure early-return, so a malformed JSON answer (which sets
+        # ``structured_output[prompt_name] = {}``) never fired a webhook.
+        # The new explicit gate keeps that contract — empty, None, or
+        # non-dict/list payloads are skipped with a warning, not dispatched.
+        parsed_value = structured_output.get(prompt_name)
+        if not isinstance(parsed_value, (dict, list)) or not parsed_value:
+            logger.warning(
+                "Webhook postprocessing skipped: prompt=%s parsed payload "
+                "is empty or non-JSON (likely a parse failure)",
+                prompt_name,
+            )
+            return
         if output_type != PSKeys.JSON:
             # The pre-refactor behaviour fired the webhook regardless of
             # output_type. The new restriction is intentional, but the

From 2fd9cf5d0605ce340d9f3afaf4a7851a6ee8473d Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 28 Apr 2026 14:04:10 +0530
Subject: [PATCH 42/57] UN-2946 [FIX] Return 400 for missing tool_id (was 500)

`APIException(code=400)` only sets `detail.code` in the JSON body;
`status_code` is hardcoded to HTTP_500_INTERNAL_SERVER_ERROR. Switch to
`ValidationError` so the missing-tool_id and tool-not-found branches in
`latest_outputs_by_keys` and `get_output_for_tool_default` actually
respond with 400 as the comment / docstring imply.
---
 .../prompt_studio_output_manager_v2/views.py       | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/views.py b/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
index f7b7aa8582..2c81c5191a 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
@@ -5,7 +5,7 @@
 from django.db.models import QuerySet
 from django.http import HttpRequest
 from rest_framework import status, viewsets
-from rest_framework.exceptions import APIException
+from rest_framework.exceptions import ValidationError
 from rest_framework.response import Response
 from rest_framework.versioning import URLPathVersioning
 from utils.common_utils import CommonUtils
@@ -74,10 +74,10 @@ def latest_outputs_by_keys(self, request: HttpRequest) -> Response:
         tool_id = request.GET.get("tool_id")
         keys_param = request.GET.get("prompt_keys", "")
         if not tool_id:
-            raise APIException(
-                detail=PromptOutputManagerErrorMessage.TOOL_VALIDATION,
-                code=400,
-            )
+            # ``APIException(code=400)`` only tags ``detail`` with an error
+            # code; ``status_code`` stays at the class default of 500. Use
+            # ``ValidationError`` so callers get the intended 400.
+            raise ValidationError(detail=PromptOutputManagerErrorMessage.TOOL_VALIDATION)
 
         prompt_keys = [k.strip() for k in keys_param.split(",") if k.strip()]
         if not prompt_keys:
@@ -129,7 +129,7 @@ def get_output_for_tool_default(self, request: HttpRequest) -> Response:
         tool_validation_message = PromptOutputManagerErrorMessage.TOOL_VALIDATION
         tool_not_found = PromptOutputManagerErrorMessage.TOOL_NOT_FOUND
         if not tool_id:
-            raise APIException(detail=tool_validation_message, code=400)
+            raise ValidationError(detail=tool_validation_message)
 
         try:
             # Fetch ToolStudioPrompt records based on tool_id
@@ -137,7 +137,7 @@ def get_output_for_tool_default(self, request: HttpRequest) -> Response:
                 tool_id=tool_id
             ).order_by("sequence_number")
         except ObjectDoesNotExist:
-            raise APIException(detail=tool_not_found, code=400)
+            raise ValidationError(detail=tool_not_found)
 
         # Invoke helper method to frame and fetch default response.
         result: dict[str, Any] = OutputManagerHelper.fetch_default_output_response(

From ba6c32ab0658f56ccd889827dcba0b88b0f48f13 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 28 Apr 2026 19:20:22 +0530
Subject: [PATCH 43/57] UN-2946 [FIX] Address remaining post-disposition review
 comments (OSS)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Five threads on PR #1929 raised against the latest disposition push:

* prompt_studio_core_v2/views.py: drop the ``single_pass_extraction_mode``
  bypass from ``_multi_var_lookup_block_response`` — fetch_response /
  bulk_fetch_response are always non-SP, so the tool-setting check just
  let multi-var lookups slip past the gate when the tool happened to be
  configured for SP.

* prompt_studio_registry_helper.py: filter out NOTES + inactive prompts
  *before* calling ``validate_lookups_for_export`` so an incomplete
  lookup on a non-exportable prompt no longer fails the whole export.

* unstract/sdk1/usage_handler.py: guard ``self.token_counter is None``
  in the embedding-end branch — degrade with a warning instead of an
  AttributeError on early callbacks.

* workers/executor/legacy_executor.py: move the ``outcome.usage_records``
  / ``outcome.llm_metrics`` access inside the ``try`` so plugin contract
  drift hits the same graceful-degrade branch as a thrown ``run_with_metrics``.

* backend/prompt_studio/lookup_utils.py: include ``pluggable_apps`` itself
  in ``_CLOUD_LOOKUP_MODULES``. Pure OSS images don't have the parent
  package, so ``ImportError.name`` surfaces as ``"pluggable_apps"`` and
  the previous filter re-raised instead of setting LOOKUPS_AVAILABLE=False.
---
 backend/prompt_studio/lookup_utils.py                    | 3 +++
 backend/prompt_studio/prompt_studio_core_v2/views.py     | 5 +++--
 .../prompt_studio_registry_helper.py                     | 9 +++++++--
 unstract/sdk1/src/unstract/sdk1/usage_handler.py         | 6 ++++++
 workers/executor/executors/legacy_executor.py            | 8 ++++++--
 5 files changed, 25 insertions(+), 6 deletions(-)

diff --git a/backend/prompt_studio/lookup_utils.py b/backend/prompt_studio/lookup_utils.py
index 5bc21bc90e..653cfdf1b5 100644
--- a/backend/prompt_studio/lookup_utils.py
+++ b/backend/prompt_studio/lookup_utils.py
@@ -16,6 +16,9 @@
 logger = logging.getLogger(__name__)
 
 _CLOUD_LOOKUP_MODULES = {
+    # ``e.name`` is the first missing component in the chain — in pure
+    # OSS images the parent ``pluggable_apps`` package itself is absent.
+    "pluggable_apps",
     "pluggable_apps.lookups",
     "pluggable_apps.lookups.execution",
     "pluggable_apps.lookups.output_enrichment",
diff --git a/backend/prompt_studio/prompt_studio_core_v2/views.py b/backend/prompt_studio/prompt_studio_core_v2/views.py
index 9510fb962f..d123175545 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/views.py
@@ -103,11 +103,12 @@ def _multi_var_lookup_block_response(custom_tool, prompt_ids=None):
     multi-var lookup attached to an unrelated prompt in the same project
     doesn't block a single-var lookup's run.
 
+    Callers are responsible for only invoking this on non-SP execution
+    paths — the SP entry point skips the helper entirely.
+
     Returns a Response object (HTTP 400) when a block applies, or None
     to let the caller proceed.
     """
-    if getattr(custom_tool, "single_pass_extraction_mode", False):
-        return None
     names = get_multi_var_lookups_for_tool(custom_tool, prompt_ids=prompt_ids)
     if not names:
         return None
diff --git a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
index 998022cbbb..f2477e73dc 100644
--- a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
+++ b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
@@ -298,8 +298,13 @@ def frame_export_json(
             settings, JsonSchemaKey.WORD_CONFIDENCE_POSTAMBLE.upper(), ""
         )
 
-        # Validate lookup assignments (cloud-only, no-op in OSS)
-        lookup_configs, lookup_error = validate_lookups_for_export(prompts)
+        # Validate lookup assignments (cloud-only, no-op in OSS) on the
+        # subset that will actually be exported — NOTES / inactive prompts
+        # never run, so an incomplete lookup on those shouldn't fail export.
+        exportable_prompts = [
+            p for p in prompts if p.prompt_type != JsonSchemaKey.NOTES and p.active
+        ]
+        lookup_configs, lookup_error = validate_lookups_for_export(exportable_prompts)
         if lookup_error:
             raise InValidCustomToolError(lookup_error)
 
diff --git a/unstract/sdk1/src/unstract/sdk1/usage_handler.py b/unstract/sdk1/src/unstract/sdk1/usage_handler.py
index 9836bdf87a..9819f42ac5 100644
--- a/unstract/sdk1/src/unstract/sdk1/usage_handler.py
+++ b/unstract/sdk1/src/unstract/sdk1/usage_handler.py
@@ -107,6 +107,12 @@ def on_event_end(
         ):
             if self.embed_model is None:
                 return
+            if self.token_counter is None:
+                logger.warning(
+                    "Embedding usage callback invoked without token_counter; "
+                    "skipping usage record."
+                )
+                return
             model_name = self.embed_model.model_name
             embedding_tokens = self.token_counter.total_embedding_token_count
             self.stream_log(
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index fc4101c575..052f349602 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -2046,6 +2046,12 @@ def _run_lookup_enrichment(
                 shim=shim,
                 usage_kwargs=usage_kwargs,
             )
+            # Inside the try so a missing/renamed attribute on the outcome
+            # (plugin contract drift) hits the same graceful-degrade branch.
+            self._usage_records.extend(outcome.usage_records)
+            metrics.setdefault(prompt_name, {})[lookup_cls.METRICS_KEY] = (
+                outcome.llm_metrics
+            )
         except Exception:
             # Enrichment is post-extraction — degrade gracefully on
             # plugin contract drift (missing METRICS_KEY, unexpected
@@ -2063,8 +2069,6 @@ def _run_lookup_enrichment(
                 level=LogLevel.WARN,
             )
             return
-        self._usage_records.extend(outcome.usage_records)
-        metrics.setdefault(prompt_name, {})[lookup_cls.METRICS_KEY] = outcome.llm_metrics
 
     @staticmethod
     def _run_webhook_postprocessing(

From 4aea7e45581aa30ca27c5c0ce02717997498b6e4 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 5 May 2026 10:39:37 +0530
Subject: [PATCH 44/57] UN-2946 [DOCS] Tighten comments across lookups V2 OSS
 surface

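Drop archaeology / "previously / before-X-now-Y" framing; collapse
multi-line WHAT walkthroughs to single-line WHY. Comment-only, with one
exception: ``create_profile_manager`` in prompt_studio_core_v2/views.py
now writes the ``get_object()`` fallback tool back into
``serializer.validated_data`` instead of only using it for the
profile-count check.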
---
 backend/prompt_studio/lookup_utils.py         | 48 +++++++------------
 .../prompt_studio_core_v2/views.py            | 41 ++++++++--------
 .../output_manager_helper.py                  | 29 ++++-------
 .../serializers.py                            |  4 +-
 .../prompt_studio_output_manager_v2/views.py  | 22 +++------
 .../prompt_studio_registry_helper.py          |  5 +-
 backend/usage_v2/models.py                    | 39 +++++----------
 .../custom-tools/combined-output/JsonView.jsx |  1 -
 .../custom-tools/prompt-card/Header.jsx       |  5 +-
 .../prompt-card/RunAllPrompts.jsx             |  3 --
 .../custom-tools/tool-ide/ToolIde.jsx         | 10 ++--
 .../custom-markdown/CustomMarkdown.jsx        |  3 +-
 .../helpers/custom-tools/CustomToolsHelper.js |  1 -
 .../logging/execution-logs/ExecutionLogs.jsx  |  3 +-
 frontend/src/helpers/urlSafety.js             |  7 ++-
 frontend/src/hooks/usePromptOutput.js         | 13 ++---
 frontend/src/hooks/usePromptRun.js            |  5 +-
 frontend/src/pages/CustomTools.jsx            |  2 -
 .../src/unstract/sdk1/execution/context.py    |  3 +-
 .../unstract/sdk1/execution/orchestrator.py   |  3 +-
 .../sdk1/src/unstract/sdk1/usage_handler.py   |  8 ++--
 21 files changed, 87 insertions(+), 168 deletions(-)

diff --git a/backend/prompt_studio/lookup_utils.py b/backend/prompt_studio/lookup_utils.py
index 653cfdf1b5..8cfb0a7286 100644
--- a/backend/prompt_studio/lookup_utils.py
+++ b/backend/prompt_studio/lookup_utils.py
@@ -1,13 +1,8 @@
-"""Shared utility for lookup operations.
+"""Shared utility for lookup operations. No-ops in OSS.
 
-Wraps cloud-only lookup calls so OSS callers don't repeat the
-``try/except ImportError`` guard. All functions are no-ops in OSS.
-
-The probe below catches *only* the absence of the cloud
-``pluggable_apps.lookups`` package — an ImportError raised transitively
-inside the cloud plugin (e.g. a missing third-party dependency it needs)
-re-raises so the failure surfaces instead of silently degrading the
-whole feature to a no-op.
+Only the absence of ``pluggable_apps.lookups`` itself is treated as
+"cloud not installed"; an ImportError from a transitive dependency
+re-raises so we don't silently degrade to a no-op on a real bug.
 """
 
 import logging
@@ -16,8 +11,7 @@
 logger = logging.getLogger(__name__)
 
 _CLOUD_LOOKUP_MODULES = {
-    # ``e.name`` is the first missing component in the chain — in pure
-    # OSS images the parent ``pluggable_apps`` package itself is absent.
+    # OSS images lack the parent ``pluggable_apps`` package, so include it.
     "pluggable_apps",
     "pluggable_apps.lookups",
     "pluggable_apps.lookups.execution",
@@ -51,9 +45,8 @@ def get_lookup_config(prompt) -> dict | None:
 def get_lookup_configs_for_tool(tool, prompts=None) -> list[dict] | None:
     """Return lookup configs for a tool (single pass), or None in OSS.
 
-    ``prompts`` scopes the build+validation to the prompts actually
-    participating in the run so an unrelated incomplete assignment on
-    the tool doesn't block it.
+    ``prompts`` scopes validation to the run's prompts so unrelated
+    incomplete assignments on the tool don't block it.
     """
     if not LOOKUPS_AVAILABLE:
         return None
@@ -63,9 +56,8 @@ def get_lookup_configs_for_tool(tool, prompts=None) -> list[dict] | None:
 def get_multi_var_lookups_for_tool(tool, prompt_ids=None) -> list[str]:
     """Return names of multi-variable lookups linked to the tool, [] in OSS.
 
-    ``prompt_ids`` scopes the check to a specific subset of linked prompts
-    so single / bulk runs only block when a lookup the run actually uses
-    is multi-variable.
+    ``prompt_ids`` scopes the check so a run is only blocked when the
+    multi-var lookup is actually used by it.
     """
     if not LOOKUPS_AVAILABLE:
         return []
@@ -112,10 +104,9 @@ def validate_lookups_for_export(prompts) -> tuple[dict, str | None]:
 
 
 def get_latest_lookup_mutation_for_tool(tool):
-    """Return the max modified_at across all lookup-related records linked to
-    the tool (version, reference file, assignment). Used for banner staleness.
-
-    Returns None if lookups are unavailable or nothing is linked.
+    """Max ``modified_at`` across lookup-related records linked to the tool
+    (version, reference file, assignment) — feeds the staleness banner.
+    None if unavailable or nothing linked.
     """
     if not LOOKUPS_AVAILABLE:
         return None
@@ -128,10 +119,8 @@ def get_original_value_if_enriched(
     """Return ``(original_value, prompt_lookup_dict)`` if ``prompt_key`` was
     enriched, or ``None`` otherwise.
 
-    Operates purely on metadata shape — the plugin-availability flag is
-    not consulted, so callers can invoke this even when ``LOOKUPS_AVAILABLE``
-    is False (it still returns ``None`` because the metadata shape won't
-    match).
+    Pure metadata-shape check — safe to call even when LOOKUPS_AVAILABLE
+    is False (returns None because the shape won't match).
     """
     if not isinstance(metadata, dict):
         return None
@@ -145,9 +134,8 @@ def get_original_value_if_enriched(
 def attach_combined_output_enrichment(result: dict, enriched_by_key: dict) -> None:
     """Stamp the combined-output payload with enriched-output metadata.
 
-    OSS ships a stub that ignores the call; cloud reroutes into the payload
-    key its FE plugin expects. Keeping the key name out of OSS lets cloud
-    evolve the shape without OSS-side coordination.
+    Key name stays cloud-side so the FE-plugin shape can evolve without
+    coordinating with OSS.
     """
     if not LOOKUPS_AVAILABLE:
         return
@@ -157,8 +145,8 @@ def attach_combined_output_enrichment(result: dict, enriched_by_key: dict) -> No
 def extract_prompt_output_enrichment(item) -> dict | None:
     """Pick enriched-output data off a serialized prompt-output row.
 
-    Returns a plugin-opaque dict (the FE treats it as a black box) or None
-    when no enrichment is present / plugin missing.
+    Returns a plugin-opaque dict (FE-only) or None when no enrichment
+    is present / plugin missing.
     """
     if not LOOKUPS_AVAILABLE:
         return None
diff --git a/backend/prompt_studio/prompt_studio_core_v2/views.py b/backend/prompt_studio/prompt_studio_core_v2/views.py
index d123175545..6043d1a57a 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/views.py
@@ -99,15 +99,9 @@
 def _multi_var_lookup_block_response(custom_tool, prompt_ids=None):
     """Block non-SP runs when a linked lookup has >1 input variable.
 
-    ``prompt_ids`` scopes the check to the prompt(s) being run so a
-    multi-var lookup attached to an unrelated prompt in the same project
-    doesn't block a single-var lookup's run.
-
-    Callers are responsible for only invoking this on non-SP execution
-    paths — the SP entry point skips the helper entirely.
-
-    Returns a Response object (HTTP 400) when a block applies, or None
-    to let the caller proceed.
+    Multi-var lookups only resolve correctly under single-pass; ``prompt_ids``
+    scopes the gate so an unrelated multi-var lookup doesn't block runs that
+    don't actually use it. Caller must skip this on the SP path.
     """
     names = get_multi_var_lookups_for_tool(custom_tool, prompt_ids=prompt_ids)
     if not names:
@@ -512,9 +506,7 @@ def fetch_response(self, request: HttpRequest, pk: Any = None) -> Response:
         document_id: str = request.data.get(ToolStudioPromptKeys.DOCUMENT_ID)
         prompt_id: str = request.data.get(ToolStudioPromptKeys.ID)
         run_id: str = request.data.get(ToolStudioPromptKeys.RUN_ID)
-        # Validate ``prompt_id`` before the lookup gate so a request
-        # missing the field returns a clear 400 instead of a lookup-related
-        # error.
+        # Must precede the lookup gate so missing prompt_id returns a clear 400.
         if not prompt_id:
             return Response(
                 {"error": "prompt id is required."},
@@ -548,9 +540,8 @@ def fetch_response(self, request: HttpRequest, pk: Any = None) -> Response:
         document: DocumentManager = DocumentManager.objects.get(pk=document_id)
         doc_path = str(Path(doc_path) / document.document_name)
 
-        # Agentic table prompts have a separate executor worker. Build the
-        # payload via the cloud payload_modifier plugin and dispatch directly
-        # so the legacy answer_prompt path is bypassed.
+        # Agentic table prompts have their own executor — build payload via
+        # the cloud plugin and dispatch directly, bypassing answer_prompt.
         if prompt.enforce_type == ToolStudioPromptKeys.AGENTIC_TABLE:
             payload_modifier_plugin = get_plugin("payload_modifier")
             if not payload_modifier_plugin:
@@ -921,10 +912,17 @@ def create_profile_manager(self, request: HttpRequest, pk: Any = None) -> Respon
         serializer = ProfileManagerSerializer(data=request.data, context=context)
         serializer.is_valid(raise_exception=True)
         # Check for the maximum number of profiles constraint
-        prompt_studio_tool = (
-            serializer.validated_data.get(ProfileManagerKeys.PROMPT_STUDIO_TOOL)
-            or self.get_object()
+        prompt_studio_tool = serializer.validated_data.get(
+            ProfileManagerKeys.PROMPT_STUDIO_TOOL
         )
+        if not prompt_studio_tool:
+            # Write back into validated_data so perform_create() doesn't
+            # persist NULL and orphan the profile from every
+            # ``filter(prompt_studio_tool=...)`` query.
+            prompt_studio_tool = self.get_object()
+            serializer.validated_data[ProfileManagerKeys.PROMPT_STUDIO_TOOL] = (
+                prompt_studio_tool
+            )
         profile_count = ProfileManager.objects.filter(
             prompt_studio_tool=prompt_studio_tool
         ).count()
@@ -1144,8 +1142,7 @@ def export_tool(self, request: Request, pk: Any = None) -> Response:
             force_export=force_export,
         )
 
-        # Record export timestamp so staleness checks (e.g. lookup-change
-        # banner) can compare against mutations that happened afterwards.
+        # Anchor for staleness checks (e.g. lookup-change banner).
         custom_tool.last_exported_at = timezone.now()
         custom_tool.save(update_fields=["last_exported_at"])
 
@@ -1349,8 +1346,8 @@ def check_deployment_usage(self, request: Request, pk: Any = None) -> Response:
             instance: CustomTool = self.get_object()
             is_used, workflow_ids = self._check_tool_usage_in_workflows(instance)
 
-            # Lookup staleness: NULL last_exported_at means we can't compare,
-            # so treat as clean (don't false-alarm pre-feature projects).
+            # NULL last_exported_at → treat as clean to avoid false alarms
+            # on pre-feature projects.
             is_lookup_dirty = False
             if instance.last_exported_at is not None:
                 latest = get_latest_lookup_mutation_for_tool(instance)
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
index f5ec54c94e..9c963cf3f6 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/output_manager_helper.py
@@ -178,11 +178,8 @@ def update_or_create_prompt_output(
             # TODO: use enums here
             output = outputs.get(prompt.prompt_key)
 
-            # If lookup enrichment ran, structured_output contains the
-            # enriched value. Restore the original raw LLM output for the
-            # prompt output table — the enriched value is persisted by the
-            # cloud plugin via persist_lookup_output. Cloud owns the
-            # metadata shape; OSS queries through the bridge.
+            # On enrichment, store the raw LLM output here; the enriched
+            # value is persisted separately via persist_lookup_output.
             enrichment = get_original_value_if_enriched(metadata, prompt.prompt_key)
             if enrichment is not None:
                 output, prompt_lookup = enrichment
@@ -214,11 +211,8 @@ def update_or_create_prompt_output(
                 word_confidence_data=prompt_word_confidence_data,
             )
 
-            # Persist lookup outputs if present (cloud plugin, no-op in OSS).
-            # Narrow to known DB-level errors so unexpected exceptions
-            # (plugin contract drift, KeyError on the lookup payload) bubble
-            # up rather than getting hidden as a warning that masquerades
-            # as a successful save.
+            # Narrow except so plugin contract drift surfaces as a real
+            # error instead of being masked as a successful save.
             if prompt_lookup:
                 try:
                     persist_lookup_output(prompt_output, prompt_lookup)
@@ -276,16 +270,12 @@ def fetch_default_output_response(
 
         Returns:
             dict[str, Any]: Formatted JSON response for combined output.
-                When lookups are configured, the cloud plugin adds an
-                opaque enrichment payload via ``attach_combined_output_enrichment``.
+                Cloud plugins may attach an opaque enrichment payload.
         """
         from prompt_studio.lookup_utils import enrich_prompt_output
 
-        # Pre-resolve (prompt, profile_id) pairs once so the per-prompt
-        # default-profile lookup memoises against the small set of tool IDs
-        # involved. Combined Output is a hot path — the previous N+1 (two
-        # DB calls per prompt + a plugin invocation per matching row)
-        # turned every panel switch into a multi-second wait.
+        # Memoise default-profile resolution per tool to avoid N+1 on this
+        # hot path (panel-switch latency).
         default_profile_cache: dict[str, str | None] = {}
 
         def _resolve(tool_prompt: ToolStudioPrompt) -> str | None:
@@ -317,9 +307,8 @@ def _resolve(tool_prompt: ToolStudioPrompt) -> str | None:
                 continue
             prompts_to_query.append((tool_prompt, profile_manager_id))
 
-        # Single batch query keyed on the (prompt_id, profile_manager_id)
-        # pair — ``DISTINCT ON`` (Postgres) gives the latest row per pair
-        # in SQL so we don't materialise every historical run per prompt.
+        # ``DISTINCT ON`` (Postgres) yields the latest row per
+        # (prompt_id, profile_manager_id) at the SQL layer.
         outputs_index: dict[tuple[str, str], PromptStudioOutputManager] = {}
         if prompts_to_query:
             prompt_ids = [str(p.prompt_id) for p, _ in prompts_to_query]
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/serializers.py b/backend/prompt_studio/prompt_studio_output_manager_v2/serializers.py
index dad8d52979..1c56e2323d 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/serializers.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/serializers.py
@@ -48,9 +48,7 @@ def to_representation(self, instance):
                 " | Process continued"
             )
             data["coverage"] = {}
-        # Match the surrounding ``log + continue`` policy used by token-usage
-        # and coverage above — an enrichment failure shouldn't 500 the entire
-        # prompt-output list endpoint and hide the raw output.
+        # log+continue: enrichment failure shouldn't 500 the list endpoint.
         try:
             data = enrich_prompt_output(instance, data)
         except Exception as e:
diff --git a/backend/prompt_studio/prompt_studio_output_manager_v2/views.py b/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
index 2c81c5191a..44111dc744 100644
--- a/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_output_manager_v2/views.py
@@ -65,27 +65,21 @@ def get_queryset(self) -> QuerySet | None:
     def latest_outputs_by_keys(self, request: HttpRequest) -> Response:
         """Return the most recent raw output value per source prompt key.
 
-        Used by the lookup Test panel's "Use Latest Outputs" button to
-        pre-fill {{input.X}} fields from prior prompt runs in the linked
-        tool. Always returns the raw extraction — the enriched value would
-        already include lookup post-processing, which would defeat the
-        purpose of testing the lookup with sample inputs.
+        Backs the lookup Test panel's "Use Latest Outputs" button. Returns
+        raw extraction (not enriched) so the lookup can be tested fresh.
         """
         tool_id = request.GET.get("tool_id")
         keys_param = request.GET.get("prompt_keys", "")
         if not tool_id:
-            # ``APIException(code=400)`` only sets ``detail.code`` in the body;
-            # ``status_code`` is hardcoded to 500. Use ``ValidationError`` so
-            # callers get the intended 400.
+            # APIException(code=400) returns 500; ValidationError returns 400.
             raise ValidationError(detail=PromptOutputManagerErrorMessage.TOOL_VALIDATION)
 
         prompt_keys = [k.strip() for k in keys_param.split(",") if k.strip()]
         if not prompt_keys:
             return Response({}, status=status.HTTP_200_OK)
 
-        # Custom actions don't go through self.filter_queryset(), so
-        # OrganizationFilterBackend does not run. Scope explicitly here via
-        # the tool's organization FK to prevent cross-tenant reads.
+        # Custom actions skip filter_queryset(), so OrganizationFilterBackend
+        # never runs — scope explicitly to prevent cross-tenant reads.
         organization = UserContext.get_organization()
         prompt_id_to_key = dict(
             ToolStudioPrompt.objects.filter(
@@ -97,10 +91,8 @@ def latest_outputs_by_keys(self, request: HttpRequest) -> Response:
         if not prompt_id_to_key:
             return Response({}, status=status.HTTP_200_OK)
 
-        # ``DISTINCT ON("prompt_id")`` (Postgres) keeps only the latest row
-        # per prompt at the SQL layer — without it Django materialises the
-        # full ``M docs × N runs × len(prompt_keys)`` result set just to
-        # let the Python loop pick one row per prompt.
+        # ``DISTINCT ON("prompt_id")`` keeps the latest row per prompt at
+        # the SQL layer to avoid materialising every doc × run combo.
         outputs = (
             PromptStudioOutputManager.objects.filter(
                 prompt_id__in=prompt_id_to_key.keys(),
diff --git a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
index f2477e73dc..4fee8c10bc 100644
--- a/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
+++ b/backend/prompt_studio/prompt_studio_registry_v2/prompt_studio_registry_helper.py
@@ -298,9 +298,8 @@ def frame_export_json(
             settings, JsonSchemaKey.WORD_CONFIDENCE_POSTAMBLE.upper(), ""
         )
 
-        # Validate lookup assignments (cloud-only, no-op in OSS) on the
-        # subset that will actually be exported — NOTES / inactive prompts
-        # never run, so an incomplete lookup on those shouldn't fail export.
+        # Validate only what will actually be exported — NOTES / inactive
+        # prompts never run, so incomplete lookups on them shouldn't fail export.
         exportable_prompts = [
             p for p in prompts if p.prompt_type != JsonSchemaKey.NOTES and p.active
         ]
diff --git a/backend/usage_v2/models.py b/backend/usage_v2/models.py
index 2d6c7e2144..8b04240aef 100644
--- a/backend/usage_v2/models.py
+++ b/backend/usage_v2/models.py
@@ -19,14 +19,8 @@ class UsageStatus(models.TextChoices):
     SKIPPED = "SKIPPED", "Skipped"
 
 
-# ── Choice lists (static union of OSS + cloud values) ────────────────
-# Cloud-only entries (e.g. "lookup", "lookup_version") are listed here
-# even on OSS-only builds where they're never written. A previous
-# try-import pattern extended these at runtime when the cloud plugin
-# was importable, but that left model state ≠ migration state in OSS
-# builds and broke ``makemigrations --check`` in CI. Carrying the union
-# statically keeps both sides in lockstep at the cost of a couple of
-# unused choice entries on OSS.
+# Static union of OSS + cloud values — keeps OSS model state aligned with
+# migration state so ``makemigrations --check`` doesn't drift in CI.
 
 LLM_USAGE_REASON_CHOICES: list[tuple[str, str]] = [
     ("extraction", "Extraction"),
@@ -46,10 +40,9 @@ class UsageModelManager(DefaultOrganizationManagerMixin, BaseModelManager):
 
 
 class Usage(DefaultOrganizationMixin, BaseModel):
-    # reference_type → reference_id mapping (no FK constraint):
-    #   "prompt_key"      → ToolStudioPrompt UUID (OSS-only writer)
-    #   "lookup_version"  → LookupVersion UUID (cloud-only writer)
-    # Usage records survive entity deletion.
+    # reference_type → reference_id (no FK; survives entity deletion):
+    #   "prompt_key"     → ToolStudioPrompt UUID (OSS)
+    #   "lookup_version" → LookupVersion UUID (cloud)
 
     id = models.UUIDField(
         primary_key=True,
@@ -149,12 +142,8 @@ class Meta:
             ),
         ]
         constraints = [
-            # ``reference_type`` is a discriminator for ``reference_id``.
-            # Either both are NULL (no entity attribution) or both are set
-            # (decodable). A row with one but not the other is undecodable
-            # at billing-aggregation time. Cheap to validate on apply
-            # because both fields landed together in lookups V2 — legacy
-            # rows have both NULL.
+            # Both NULL or both set; a half-populated row is undecodable
+            # at billing-aggregation time.
             models.CheckConstraint(
                 check=(
                     models.Q(reference_id__isnull=True, reference_type__isnull=True)
@@ -162,14 +151,8 @@ class Meta:
                 ),
                 name="usage_reference_pair_consistent",
             ),
-            # NOTE: a sibling ``(usage_type, llm_usage_reason)`` constraint
-            # would be a natural extension here — embedding rows must have
-            # llm_usage_reason NULL, LLM rows must have it set. Skipped in
-            # this PR because the ``usage`` table is large in prod and
-            # legacy embedding rows have ``llm_usage_reason=''`` from the
-            # old SDK default; both the data backfill and Django's default
-            # ``ADD CONSTRAINT`` (full-table scan) would lock the billing
-            # table for too long. To be added in a follow-up via
-            # ``ADD CONSTRAINT ... NOT VALID`` + batched ``VALIDATE
-            # CONSTRAINT`` during a maintenance window.
+            # TODO: add (usage_type, llm_usage_reason) consistency constraint
+            # via ``ADD CONSTRAINT ... NOT VALID`` + batched ``VALIDATE`` —
+            # legacy embedding rows have ``llm_usage_reason=''`` and the
+            # default full-table scan would lock the billing table.
         ]
diff --git a/frontend/src/components/custom-tools/combined-output/JsonView.jsx b/frontend/src/components/custom-tools/combined-output/JsonView.jsx
index dfc82f92e1..34a733598a 100644
--- a/frontend/src/components/custom-tools/combined-output/JsonView.jsx
+++ b/frontend/src/components/custom-tools/combined-output/JsonView.jsx
@@ -33,7 +33,6 @@ function JsonView({
     Prism.highlightAll();
   }, [combinedOutput, enrichedOutput, activeView]);
 
-  // Reset to Raw when enriched data is not available
   useEffect(() => {
     if (!enrichedOutput || Object.keys(enrichedOutput).length === 0) {
       setActiveView("Raw");
diff --git a/frontend/src/components/custom-tools/prompt-card/Header.jsx b/frontend/src/components/custom-tools/prompt-card/Header.jsx
index 551c58c978..30fe75fe54 100644
--- a/frontend/src/components/custom-tools/prompt-card/Header.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/Header.jsx
@@ -60,8 +60,7 @@ try {
   lookupPluginLoadError = err;
 }
 
-// If the sibling plugin import succeeded, a failure here means the
-// plugin is present but broken — surface it so the no-op fallback
+// Sibling plugin loaded but this hook didn't — surface so the no-op fallback
 // doesn't silently disable the run gate.
 if (lookupPluginLoadError && LookupMenuItem) {
   // eslint-disable-next-line no-console
@@ -71,7 +70,7 @@ if (lookupPluginLoadError && LookupMenuItem) {
   );
 }
 
-// Stable identity so React doesn't see a conditional hook call.
+// Stable identity — avoid conditional hook call.
 const usePromptRunGate = usePromptRunGatePlugin || (() => null);
 
 function Header({
diff --git a/frontend/src/components/custom-tools/prompt-card/RunAllPrompts.jsx b/frontend/src/components/custom-tools/prompt-card/RunAllPrompts.jsx
index 6a0229f7e8..abf187845e 100644
--- a/frontend/src/components/custom-tools/prompt-card/RunAllPrompts.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/RunAllPrompts.jsx
@@ -4,9 +4,6 @@ import { PROMPT_RUN_TYPES } from "../../../helpers/GetStaticData";
 import usePromptRun from "../../../hooks/usePromptRun";
 import { useCustomToolStore } from "../../../store/custom-tool-store";
 
-// No tool-wide gate here — per-prompt Run buttons + server already
-// block broken prompts, so disabling bulk would only hide valid ones.
-
 function RunAllPrompts() {
   const { selectedDoc, isMultiPassExtractLoading, isPublicSource } =
     useCustomToolStore();
diff --git a/frontend/src/components/custom-tools/tool-ide/ToolIde.jsx b/frontend/src/components/custom-tools/tool-ide/ToolIde.jsx
index 483ebd80f4..1f7e21c259 100644
--- a/frontend/src/components/custom-tools/tool-ide/ToolIde.jsx
+++ b/frontend/src/components/custom-tools/tool-ide/ToolIde.jsx
@@ -45,8 +45,7 @@ try {
   // Do nothing if plugins are not loaded.
 }
 
-// Cloud-only hook that seeds hasUnsavedChanges from server-side
-// lookup-staleness. No-op stub in OSS.
+// Cloud-only — OSS stub.
 let useLookupDirtySeed = () => {};
 try {
   const mod = await import(
@@ -55,8 +54,7 @@ try {
   useLookupDirtySeed = mod.useLookupDirtySeed;
 } catch {}
 
-// Cloud-only lookup export validation gate. OSS stub resolves true so
-// the reminder bar's "Export" button proceeds directly.
+// Cloud-only — OSS stub resolves true to skip the gate.
 let useLookupExportGate = () => ({
   checkLookups: () => Promise.resolve(true),
   modalEl: null,
@@ -203,9 +201,7 @@ function ToolIde() {
     }
   }, [details?.tool_id]);
 
-  // Cloud plugin seeds hasUnsavedChanges when a linked lookup has been
-  // edited since the tool's last export — surfaces the re-export banner
-  // for mutations made on the standalone /lookups page. No-op in OSS.
+  // Surfaces re-export banner when /lookups page edits made the tool stale.
   useLookupDirtySeed(details?.tool_id);
 
   // Cleanup abort controller on unmount
diff --git a/frontend/src/components/helpers/custom-markdown/CustomMarkdown.jsx b/frontend/src/components/helpers/custom-markdown/CustomMarkdown.jsx
index 458f319557..177299a0f8 100644
--- a/frontend/src/components/helpers/custom-markdown/CustomMarkdown.jsx
+++ b/frontend/src/components/helpers/custom-markdown/CustomMarkdown.jsx
@@ -55,8 +55,7 @@ const CustomMarkdown = ({
           </Text>
         );
       case "link": {
-        // Protocol-relative URLs (`//evil.com/...`) also start with `/`
-        // so exclude them from the internal-route branch.
+        // Exclude protocol-relative `//evil.com` from internal-route branch.
         const isInternal = url?.startsWith("/") && !url.startsWith("//");
         if (isInternal) {
           const resolvedUrl = orgName ? `/${orgName}${url}` : url;
diff --git a/frontend/src/components/helpers/custom-tools/CustomToolsHelper.js b/frontend/src/components/helpers/custom-tools/CustomToolsHelper.js
index a917c30b77..35c2854cb0 100644
--- a/frontend/src/components/helpers/custom-tools/CustomToolsHelper.js
+++ b/frontend/src/components/helpers/custom-tools/CustomToolsHelper.js
@@ -128,7 +128,6 @@ function CustomToolsHelper() {
         const data = res?.data;
         updatedCusTool["adapters"] = data;
 
-        // Fetch lookup data (cloud only, fire-and-forget)
         if (fetchLookupAssignments) {
           const toolId = updatedCusTool["details"]?.tool_id;
           fetchLookupAssignments(axiosPrivate, sessionDetails?.orgId, toolId);
diff --git a/frontend/src/components/logging/execution-logs/ExecutionLogs.jsx b/frontend/src/components/logging/execution-logs/ExecutionLogs.jsx
index 1b0b6ea208..8e44287e2d 100644
--- a/frontend/src/components/logging/execution-logs/ExecutionLogs.jsx
+++ b/frontend/src/components/logging/execution-logs/ExecutionLogs.jsx
@@ -54,8 +54,7 @@ function ExecutionLogs() {
     ? location.state?.from || `/${sessionDetails?.orgName}/logs`
     : null;
 
-  // Scroll-restoration takes precedence; fall back to caller-provided
-  // backRouteState so callers can restore arbitrary upstream UI state.
+  // Scroll-restoration wins; otherwise preserve caller's upstream UI state.
   const backRouteState =
     id && location.state?.scrollToCardId
       ? {
diff --git a/frontend/src/helpers/urlSafety.js b/frontend/src/helpers/urlSafety.js
index b5ca23e795..fede217e22 100644
--- a/frontend/src/helpers/urlSafety.js
+++ b/frontend/src/helpers/urlSafety.js
@@ -1,13 +1,12 @@
 const SAFE_URL_SCHEMES = ["http:", "https:", "mailto:", "tel:"];
 
-// Guards against unsafe schemes (e.g. `javascript:`, `data:`) when
-// rendering links built from user- or tool-derived content.
+// Block unsafe schemes (e.g. `javascript:`, `data:`) in user/tool-derived links.
 const isSafeExternalUrl = (url) => {
   if (typeof url !== "string" || url === "") {
     return false;
   }
-  // Parse without a base so bare strings (e.g. "javascript", "../foo") fail
-  // instead of silently resolving to `https://<origin>/...` and passing.
+  // No base URL — bare strings ("javascript", "../foo") must fail rather than
+  // silently resolve to the current origin.
   try {
     const parsed = new URL(url);
     return SAFE_URL_SCHEMES.includes(parsed.protocol);
diff --git a/frontend/src/hooks/usePromptOutput.js b/frontend/src/hooks/usePromptOutput.js
index 9cf6c27853..c27a0dbf54 100644
--- a/frontend/src/hooks/usePromptOutput.js
+++ b/frontend/src/hooks/usePromptOutput.js
@@ -30,15 +30,12 @@ try {
   );
   handleLookupOutput = mod.handleLookupOutput;
 } catch (error) {
-  // OSS: plugin may not exist; cloud: surface unexpected chunk-load
-  // failures so they don't degrade silently to OSS-mode behaviour.
+  // Plugin is absent in OSS; warn so cloud chunk-load failures aren't silent.
   // eslint-disable-next-line no-console
   console.warn("[usePromptOutput] handleLookupOutput unavailable:", error);
 }
 
-// Opaque extractor so the per-item enrichment payload key name lives in
-// the plugin, not OSS. OSS falls back to a no-op. Stub signature matches
-// the cloud helper so static analysis doesn't see call sites as arity mismatches.
+// Cloud-only extractor; OSS no-op. Signature matches plugin helper.
 let getEnrichmentFromItem = (_item) => null;
 try {
   const mod = await import("../plugins/lookup-enriched-toggle/helpers");
@@ -150,10 +147,8 @@ const usePromptOutput = () => {
         wordConfidenceData: item?.word_confidence_data,
       };
 
-      // Guard the lookup hook so a per-item plugin failure can't abort
-      // the surrounding ``forEach`` and skip the whole prompt-output state
-      // update — the user would otherwise see partial / stale outputs
-      // with no error surfaced.
+      // Per-item plugin failure must not abort the forEach — would leave
+      // partial state with no error surfaced.
       try {
         const enrichment = getEnrichmentFromItem(item);
         if (handleLookupOutput && enrichment) {
diff --git a/frontend/src/hooks/usePromptRun.js b/frontend/src/hooks/usePromptRun.js
index 34fb42e7d7..eb97502d02 100644
--- a/frontend/src/hooks/usePromptRun.js
+++ b/frontend/src/hooks/usePromptRun.js
@@ -16,10 +16,7 @@ import usePromptOutput from "./usePromptOutput";
 // Tracks the latest run nonce per (promptId, statusKey) so stale timeouts
 // from a previous run don't falsely cancel a newer run of the same combo.
 const runNonceMap = new Map();
-// Safety-net timeout for the fire-and-forget prompt run flow. Must trail the
-// server-side LLM adapter timeout (default 900s in
-// unstract/sdk1/src/unstract/sdk1/adapters/llm1/static/openai.json) so the UI
-// never gives up before the backend does. 16 minutes leaves a 1-minute buffer.
+// Must exceed server LLM adapter timeout (default 900s) so UI doesn't bail first.
 const SOCKET_TIMEOUT_MS = 16 * 60 * 1000; // 16 minutes
 
 const usePromptRun = () => {
diff --git a/frontend/src/pages/CustomTools.jsx b/frontend/src/pages/CustomTools.jsx
index 9543fb5c16..0864d9d262 100644
--- a/frontend/src/pages/CustomTools.jsx
+++ b/frontend/src/pages/CustomTools.jsx
@@ -18,14 +18,12 @@ function CustomTools() {
       .catch(() => {});
   }, []);
 
-  // Honor tab from navigation state on subsequent entries
   useEffect(() => {
     if (location.state?.activeTab) {
       setActiveTab(location.state.activeTab);
     }
   }, [location.state?.activeTab]);
 
-  // No lookup plugin = just render projects list (OSS mode)
   if (!LookupListComp) {
     return <ListOfTools />;
   }
diff --git a/unstract/sdk1/src/unstract/sdk1/execution/context.py b/unstract/sdk1/src/unstract/sdk1/execution/context.py
index 83eb650a29..0edb3e40b7 100644
--- a/unstract/sdk1/src/unstract/sdk1/execution/context.py
+++ b/unstract/sdk1/src/unstract/sdk1/execution/context.py
@@ -96,8 +96,7 @@ def __post_init__(self) -> None:
             raise ValueError("run_id is required")
         if not self.execution_source:
             raise ValueError("execution_source is required")
-        # When execution_id is set, organization_id must be too — they
-        # travel together for workflow-level log correlation.
+        # Workflow-level log correlation needs both fields together.
         if self.execution_id and not self.organization_id:
             raise ValueError("organization_id is required when execution_id is set")
 
diff --git a/unstract/sdk1/src/unstract/sdk1/execution/orchestrator.py b/unstract/sdk1/src/unstract/sdk1/execution/orchestrator.py
index af5684fb1f..0f1454a32b 100644
--- a/unstract/sdk1/src/unstract/sdk1/execution/orchestrator.py
+++ b/unstract/sdk1/src/unstract/sdk1/execution/orchestrator.py
@@ -62,8 +62,7 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
                 elapsed,
             )
             metadata: dict[str, Any] = {"elapsed_seconds": round(elapsed, 3)}
-            # Preserve usage records the executor collected before crashing so
-            # the task wrapper still flushes them on retry.
+            # Don't lose pre-crash billing rows on retry.
             collected = getattr(executor, "_usage_records", None) or []
             if collected:
                 metadata["usage_records"] = list(collected)
diff --git a/unstract/sdk1/src/unstract/sdk1/usage_handler.py b/unstract/sdk1/src/unstract/sdk1/usage_handler.py
index 9819f42ac5..0d1abf8aeb 100644
--- a/unstract/sdk1/src/unstract/sdk1/usage_handler.py
+++ b/unstract/sdk1/src/unstract/sdk1/usage_handler.py
@@ -135,8 +135,8 @@ def on_event_end(
                 )
                 cost = 0.0
 
-            # rsplit so multi-segment IDs (e.g. ``bedrock/anthropic/claude``)
-            # collapse to the trailing segment, matching legacy Audit semantics.
+            # Collapse multi-segment IDs (``bedrock/anthropic/claude``) to
+            # the trailing segment to match legacy Audit semantics.
             display_model = model_name.rsplit("/", 1)[-1] if model_name else model_name
 
             self._pending_usage.append(
@@ -144,9 +144,7 @@ def on_event_end(
                     "usage_type": "embedding",
                     "model_name": display_model,
                     "adapter_instance_id": self.kwargs.get("adapter_instance_id", ""),
-                    # ``run_id`` lands in a UUIDField column; "" would fail the
-                    # cast — keep absent values as None so the bulk-create view
-                    # writes NULL.
+                    # run_id lands in a UUIDField — "" fails the cast; keep None.
                     "run_id": self.kwargs.get("run_id") or None,
                     "execution_id": self.kwargs.get("execution_id", ""),
                     "embedding_tokens": embedding_tokens,

From 21caca202caa1c4e0b7447da4cdf38010bc3c2b2 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 5 May 2026 10:52:29 +0530
Subject: [PATCH 45/57] UN-2946 [REFACTOR] Drop unused token_count param from
 ExtractionAPIClient
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Pairs with the cloud-side removal of the lookup token_count /
estimated_tokens fields — the worker no longer computes a value to send.
---
 workers/shared/clients/extraction_client.py | 2 --
 1 file changed, 2 deletions(-)

diff --git a/workers/shared/clients/extraction_client.py b/workers/shared/clients/extraction_client.py
index 43f64c712e..72400f62e8 100644
--- a/workers/shared/clients/extraction_client.py
+++ b/workers/shared/clients/extraction_client.py
@@ -34,7 +34,6 @@ def mark_extraction_complete(
         self,
         source: str,
         file_id: str,
-        token_count: int,
         extracted_text_path: str,
         organization_id: str | None = None,
         **extra: Any,
@@ -43,7 +42,6 @@ def mark_extraction_complete(
         payload: dict[str, Any] = {
             "source": source,
             "file_id": file_id,
-            "token_count": token_count,
             "extracted_text_path": extracted_text_path,
             **extra,
         }

From 7b4438a9d02bef2846d80cbd6356cc0d04b7fabd Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 5 May 2026 12:56:15 +0530
Subject: [PATCH 46/57] UN-2946 [REFACTOR] DRF-ify Usage internal batch
 endpoint + squash migration
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- UsageBatchCreateView raises DRF exceptions (drf-standardized-errors
  envelope) instead of hand-rolled JsonResponse — serializer validation
  via raise_exception=True, dedicated UsagePersistError(APIException)
  for the bulk_create failure path.
- Records validated through UsageBatchCreateSerializer / nested
  UsageRecordCreateSerializer so adapter_instance_id, model_name,
  usage_type are required and the rest get explicit defaults.
- Fold 0006_alter_usage_status_and_more (UsageStatus choices +
  reference_pair CheckConstraint) into 0004 — branch hasn't merged to
  main, so squashing avoids an extra ALTER on deploy.
---
 backend/usage_v2/internal_views.py            | 51 +++++++++----------
 .../migrations/0004_usage_metrics_fields.py   | 22 ++++++++
 .../0006_alter_usage_status_and_more.py       | 42 ---------------
 backend/usage_v2/serializers.py               | 33 ++++++++++++
 4 files changed, 80 insertions(+), 68 deletions(-)
 delete mode 100644 backend/usage_v2/migrations/0006_alter_usage_status_and_more.py

diff --git a/backend/usage_v2/internal_views.py b/backend/usage_v2/internal_views.py
index 9cfa9699c6..59d1f5204d 100644
--- a/backend/usage_v2/internal_views.py
+++ b/backend/usage_v2/internal_views.py
@@ -1,10 +1,15 @@
-"""Internal API views for Usage access by workers."""
+"""Internal API views for Usage access by workers.
+
+Mounted under ``/internal/`` and gated by ``InternalAPIAuthMiddleware``.
+"""
 
 import logging
 
 from django.http import JsonResponse
 from rest_framework import status
+from rest_framework.exceptions import APIException, ValidationError
 from rest_framework.request import Request
+from rest_framework.response import Response
 from rest_framework.views import APIView
 from utils.user_context import UserContext
 
@@ -12,10 +17,17 @@
 
 from .helper import UsageHelper
 from .models import Usage
+from .serializers import UsageBatchCreateSerializer
 
 logger = logging.getLogger(__name__)
 
 
+class UsagePersistError(APIException):
+    status_code = status.HTTP_500_INTERNAL_SERVER_ERROR
+    default_detail = "Failed to persist usage records."
+    default_code = "usage_persist_failed"
+
+
 class UsageInternalView(APIView):
     """Internal API view for workers to access usage data.
 
@@ -140,10 +152,12 @@ def get(self, request: Request, file_execution_id: str) -> JsonResponse:
 class UsageBatchCreateView(APIView):
     """Bulk create usage records from worker finalization."""
 
-    def post(self, request: Request) -> JsonResponse:
-        records = request.data.get("records", [])
+    def post(self, request: Request) -> Response:
+        input_serializer = UsageBatchCreateSerializer(data=request.data)
+        input_serializer.is_valid(raise_exception=True)
+        records = input_serializer.validated_data["records"]
         if not records:
-            return JsonResponse({"created": 0}, status=200)
+            return Response({"created": 0}, status=status.HTTP_200_OK)
 
         organization = UserContext.get_organization()
         if organization is None:
@@ -152,13 +166,8 @@ def post(self, request: Request) -> JsonResponse:
                 "refusing to write rows that would be invisible to tenant dashboards",
                 len(records),
             )
-            return JsonResponse(
-                {
-                    "success": False,
-                    "error": "Organization context missing. "
-                    "Worker must send X-Organization-ID.",
-                },
-                status=status.HTTP_400_BAD_REQUEST,
+            raise ValidationError(
+                "Organization context missing. Worker must send X-Organization-ID."
             )
 
         usage_objects = []
@@ -171,11 +180,7 @@ def post(self, request: Request) -> JsonResponse:
                     adapter_instance_id=r.get("adapter_instance_id", ""),
                     run_id=r.get("run_id"),
                     usage_type=r.get("usage_type", "llm"),
-                    # ``llm_usage_reason`` has a fixed choice set and a
-                    # cross-field CheckConstraint vs. ``usage_type``. Coerce
-                    # missing/empty to None so embedding rows don't trip
-                    # the constraint and so we don't silently store ""
-                    # which isn't a valid choice.
+                    # Coerce "" to None so the cross-field CheckConstraint passes.
                     llm_usage_reason=r.get("llm_usage_reason") or None,
                     model_name=r.get("model_name", ""),
                     embedding_tokens=r.get("embedding_tokens", 0),
@@ -192,21 +197,15 @@ def post(self, request: Request) -> JsonResponse:
             )
 
         try:
-            # Chunk to bound transaction size on the billing-critical table.
+            # Bound transaction size on the billing-critical table.
             created = Usage.objects.bulk_create(usage_objects, batch_size=500)
         except Exception as e:
             logger.error(
                 "bulk_create failed for %d usage records (org=%s): %s",
                 len(usage_objects),
-                organization.organization_id if organization else None,
+                organization.organization_id,
                 e,
                 exc_info=True,
             )
-            return JsonResponse(
-                {
-                    "success": False,
-                    "error": "Failed to persist usage records",
-                },
-                status=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            )
-        return JsonResponse({"created": len(created)}, status=201)
+            raise UsagePersistError() from e
+        return Response({"created": len(created)}, status=status.HTTP_201_CREATED)
diff --git a/backend/usage_v2/migrations/0004_usage_metrics_fields.py b/backend/usage_v2/migrations/0004_usage_metrics_fields.py
index 182cfb6ca2..8405a319b4 100644
--- a/backend/usage_v2/migrations/0004_usage_metrics_fields.py
+++ b/backend/usage_v2/migrations/0004_usage_metrics_fields.py
@@ -70,6 +70,11 @@ class Migration(migrations.Migration):
             name="status",
             field=models.CharField(
                 blank=True,
+                choices=[
+                    ("SUCCESS", "Success"),
+                    ("ERROR", "Error"),
+                    ("SKIPPED", "Skipped"),
+                ],
                 db_comment="Operation outcome: SUCCESS, ERROR, or SKIPPED",
                 max_length=16,
                 null=True,
@@ -84,6 +89,23 @@ class Migration(migrations.Migration):
                 null=True,
             ),
         ),
+        # reference_id and reference_type must both be NULL or both be set
+        # so reference_id is always decodable.
+        migrations.AddConstraint(
+            model_name="usage",
+            constraint=models.CheckConstraint(
+                check=models.Q(
+                    models.Q(
+                        ("reference_id__isnull", True), ("reference_type__isnull", True)
+                    ),
+                    models.Q(
+                        ("reference_id__isnull", False), ("reference_type__isnull", False)
+                    ),
+                    _connector="OR",
+                ),
+                name="usage_reference_pair_consistent",
+            ),
+        ),
         # Index creation moved to 0005 so it can run CONCURRENTLY — the usage
         # table is billing-critical and a plain AddIndex takes a share-update
         # lock for the duration of the build on large tables.
diff --git a/backend/usage_v2/migrations/0006_alter_usage_status_and_more.py b/backend/usage_v2/migrations/0006_alter_usage_status_and_more.py
deleted file mode 100644
index c15203bb60..0000000000
--- a/backend/usage_v2/migrations/0006_alter_usage_status_and_more.py
+++ /dev/null
@@ -1,42 +0,0 @@
-# Generated by Django 4.2.1 on 2026-04-28 08:22
-
-from django.db import migrations, models
-
-
-class Migration(migrations.Migration):
-    dependencies = [
-        ("usage_v2", "0005_usage_reason_ref_created_idx"),
-    ]
-
-    operations = [
-        migrations.AlterField(
-            model_name="usage",
-            name="status",
-            field=models.CharField(
-                blank=True,
-                choices=[
-                    ("SUCCESS", "Success"),
-                    ("ERROR", "Error"),
-                    ("SKIPPED", "Skipped"),
-                ],
-                db_comment="Operation outcome: SUCCESS, ERROR, or SKIPPED",
-                max_length=16,
-                null=True,
-            ),
-        ),
-        migrations.AddConstraint(
-            model_name="usage",
-            constraint=models.CheckConstraint(
-                check=models.Q(
-                    models.Q(
-                        ("reference_id__isnull", True), ("reference_type__isnull", True)
-                    ),
-                    models.Q(
-                        ("reference_id__isnull", False), ("reference_type__isnull", False)
-                    ),
-                    _connector="OR",
-                ),
-                name="usage_reference_pair_consistent",
-            ),
-        ),
-    ]
diff --git a/backend/usage_v2/serializers.py b/backend/usage_v2/serializers.py
index a823297083..47c6f1f11f 100644
--- a/backend/usage_v2/serializers.py
+++ b/backend/usage_v2/serializers.py
@@ -21,3 +21,36 @@ class UsageSerializer(serializers.ModelSerializer):
     class Meta:
         model = Usage
         fields = "__all__"
+
+
+class UsageRecordCreateSerializer(serializers.Serializer):
+    """Worker-emitted usage record. Required fields anchor billing-critical attribution."""
+
+    adapter_instance_id = serializers.CharField(required=True, allow_blank=False)
+    model_name = serializers.CharField(required=True, allow_blank=False)
+    usage_type = serializers.CharField(required=True, allow_blank=False)
+
+    workflow_id = serializers.CharField(required=False, allow_blank=True, default="")
+    execution_id = serializers.CharField(required=False, allow_blank=True, default="")
+    run_id = serializers.CharField(required=False, allow_null=True, default=None)
+    llm_usage_reason = serializers.CharField(
+        required=False, allow_null=True, allow_blank=True, default=None
+    )
+    embedding_tokens = serializers.IntegerField(required=False, default=0)
+    prompt_tokens = serializers.IntegerField(required=False, default=0)
+    completion_tokens = serializers.IntegerField(required=False, default=0)
+    total_tokens = serializers.IntegerField(required=False, default=0)
+    cost_in_dollars = serializers.FloatField(required=False, default=0.0)
+    reference_id = serializers.CharField(required=False, allow_null=True, default=None)
+    reference_type = serializers.CharField(required=False, allow_null=True, default=None)
+    execution_time_ms = serializers.IntegerField(
+        required=False, allow_null=True, default=None
+    )
+    status = serializers.CharField(required=False, allow_null=True, default=None)
+    error_message = serializers.CharField(
+        required=False, allow_null=True, allow_blank=True, default=None
+    )
+
+
+class UsageBatchCreateSerializer(serializers.Serializer):
+    records = UsageRecordCreateSerializer(many=True, allow_empty=True)

From 1104cf48d11bb8b3bad1ae7e89284292f0280500 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 5 May 2026 12:58:15 +0530
Subject: [PATCH 47/57] UN-2946 [REFACTOR] Harden SDK / worker billing path +
 extract lookup helpers
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- llm.py: token_counter fallback when prompt_tokens=0; rsplit('/',1) for
  multi-segment provider IDs; spread _usage_kwargs first so explicit
  billing fields win.
- utils/common.py: stamp every record appended during the call window
  (was clobbering only the last entry).
- legacy_executor.py: extract run_lookup_enrichment / run_webhook_postprocessing
  / is_blank into workers/executor/executors/lookup_enrichment.py — caller
  passes shim/state in, plugin returns usage_records for the caller to
  extend its billing batch. Orchestrator stays pure dispatch.
- ide_callback/tasks.py: drop the chars ÷ 4 token-estimate heuristic;
  context-manage the API clients so HTTP sessions don't leak.
---
 unstract/sdk1/src/unstract/sdk1/llm.py        |  38 ++--
 .../sdk1/src/unstract/sdk1/utils/common.py    |  15 +-
 workers/executor/executors/legacy_executor.py | 205 +++---------------
 .../executor/executors/lookup_enrichment.py   | 145 +++++++++++++
 workers/ide_callback/tasks.py                 | 187 ++++++++--------
 5 files changed, 294 insertions(+), 296 deletions(-)
 create mode 100644 workers/executor/executors/lookup_enrichment.py

diff --git a/unstract/sdk1/src/unstract/sdk1/llm.py b/unstract/sdk1/src/unstract/sdk1/llm.py
index 08a0077768..14bc4b33ca 100644
--- a/unstract/sdk1/src/unstract/sdk1/llm.py
+++ b/unstract/sdk1/src/unstract/sdk1/llm.py
@@ -653,11 +653,10 @@ def get_last_usage(self) -> Mapping[str, int]:
         }
 
     def get_last_usage_record(self) -> dict | None:
-        """Full usage record for the most recent LLM call (sync, async, or streaming).
+        """Full usage record for the most recent LLM call.
 
-        Returns the complete record (tokens + cost + model + reason
-        metadata) so callers don't have to reach into ``_pending_usage``
-        directly. ``None`` if no call has been made yet.
+        Returns tokens + cost + model + reason metadata; ``None`` if no
+        call has been made yet.
         """
         if not self._pending_usage:
             return None
@@ -669,7 +668,7 @@ def get_usage_reason(self) -> object:
     def flush_pending_usage(self) -> list[dict]:
         """Return and clear all pending usage records.
 
-        Called by the executor at finalization to collect records for batch write.
+        Called at executor finalization.
         """
         records = self._pending_usage
         self._pending_usage = []
@@ -687,6 +686,20 @@ def _record_usage(
         completion_tokens = usage_data.get("completion_tokens", 0)
         total_tokens = usage_data.get("total_tokens", 0)
 
+        # Fall back to litellm when providers omit prompt tokens — avoids 0-token billing.
+        if prompt_tokens == 0 and messages:
+            try:
+                prompt_tokens = litellm.token_counter(model=model, messages=messages)
+                if total_tokens == 0:
+                    total_tokens = prompt_tokens + completion_tokens
+            except Exception:
+                logger.warning(
+                    "[sdk1][LLM][%s] prompt_tokens missing on response and "
+                    "litellm.token_counter() fallback failed; recording 0",
+                    model,
+                    exc_info=True,
+                )
+
         logger.info(
             "[sdk1][LLM][%s][%s] Usage: prompt=%d completion=%d total=%d",
             model,
@@ -711,14 +724,10 @@ def _record_usage(
             )
             cost = 0.0
 
-        # rsplit so multi-segment IDs (e.g. ``bedrock/anthropic/claude``)
-        # collapse to the trailing segment, matching legacy Audit semantics.
+        # Trailing segment matches legacy Audit semantics (e.g. bedrock/anthropic/claude).
         display_model = model.rsplit("/", 1)[-1] if model else model
 
-        # ``_usage_kwargs`` spread first so explicit fields below win — those
-        # are the canonical billing values (tokens, cost, status); we only
-        # want callers to provide context (reference_id, reference_type),
-        # not override computed numbers.
+        # Spread _usage_kwargs first so computed billing fields below win.
         self._pending_usage.append(
             {
                 **self._usage_kwargs,
@@ -728,13 +737,10 @@ def _record_usage(
                 "adapter_instance_id": self.platform_kwargs.get(
                     "adapter_instance_id", ""
                 ),
-                # ``run_id`` lands in a UUIDField column; "" would fail the
-                # cast — keep absent values as None so the bulk-create view
-                # writes NULL.
+                # run_id lands in a UUIDField — "" fails the cast; keep None.
                 "run_id": self.platform_kwargs.get("run_id") or None,
                 "execution_id": self.platform_kwargs.get("execution_id", ""),
-                # ``llm_usage_reason`` has a fixed choice set; "" isn't a
-                # valid choice, so write None when missing.
+                # "" isn't a valid choice for llm_usage_reason.
                 "llm_usage_reason": self.platform_kwargs.get("llm_usage_reason") or None,
                 "prompt_tokens": prompt_tokens,
                 "completion_tokens": completion_tokens,
diff --git a/unstract/sdk1/src/unstract/sdk1/utils/common.py b/unstract/sdk1/src/unstract/sdk1/utils/common.py
index c2c3fdbca5..68a3fe0688 100644
--- a/unstract/sdk1/src/unstract/sdk1/utils/common.py
+++ b/unstract/sdk1/src/unstract/sdk1/utils/common.py
@@ -223,6 +223,10 @@ def wrapper(self: object, *args: object, **kwargs: object) -> object:
         if self._run_id and self._capture_metrics:
             metrics_mixin = MetricsMixin(run_id=self._run_id)
 
+        # Snapshot index so timing stamps every row appended during this call —
+        # internal retries would otherwise leave NULL execution_time_ms rows.
+        pending_at_entry = len(getattr(self, "_pending_usage", []))
+
         try:
             result = func(self, *args, **kwargs)
         finally:
@@ -250,12 +254,13 @@ def wrapper(self: object, *args: object, **kwargs: object) -> object:
                     # If the key isn't in self._metrics, set it to new_metrics
                     self._metrics = new_metrics
 
-                # Stamp timing onto the most recent pending usage record
+                # Stamp timing on every record appended during this call.
                 pending = getattr(self, "_pending_usage", [])
-                if pending:
-                    time_taken = new_metrics.get(time_taken_key)
-                    if time_taken is not None:
-                        pending[-1]["execution_time_ms"] = int(time_taken * 1000)
+                time_taken = new_metrics.get(time_taken_key)
+                if time_taken is not None and len(pending) > pending_at_entry:
+                    elapsed_ms = int(time_taken * 1000)
+                    for record in pending[pending_at_entry:]:
+                        record["execution_time_ms"] = elapsed_ms
 
         return result
 
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 052f349602..afa33b7c00 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -21,6 +21,10 @@
 )
 from executor.executors.exceptions import ExtractionError, LegacyExecutorError
 from executor.executors.file_utils import FileUtils
+from executor.executors.lookup_enrichment import (
+    run_lookup_enrichment,
+    run_webhook_postprocessing,
+)
 
 from unstract.sdk1.adapters.exceptions import AdapterError
 from unstract.sdk1.adapters.x2text.constants import X2TextConstants
@@ -37,21 +41,6 @@
 logger = logging.getLogger(__name__)
 
 
-def _is_blank(value: Any) -> bool:
-    """Treat None / whitespace strings / empty containers as no-value.
-
-    Boolean ``False`` and numeric ``0`` are *not* blank — they're valid
-    inputs for boolean / number prompts whose lookups should still run.
-    """
-    if value is None:
-        return True
-    if isinstance(value, str):
-        return not value.strip()
-    if isinstance(value, (list, dict)):
-        return not value
-    return False
-
-
 @ExecutorRegistry.register
 class LegacyExecutor(BaseExecutor):
     """Executor that wraps the full prompt-service extraction pipeline.
@@ -73,11 +62,8 @@ class LegacyExecutor(BaseExecutor):
     }
 
     def __init__(self) -> None:
-        # Per-request state — overwritten on every ``execute()`` call.
-        # ``_usage_records`` initialised here too so the orchestrator's
-        # ``getattr(executor, "_usage_records", None)`` always sees a real
-        # list — an early-init crash inside ``execute()`` would otherwise
-        # silently drop billing rows.
+        # Per-request state, overwritten in execute(). Seed _usage_records here
+        # so an early-init crash still exposes a real list to the orchestrator.
         self._log_events_id: str = ""
         self._log_component: dict[str, str] = {}
         self._execution_id: str | None = None
@@ -172,9 +158,7 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
                         level=LogLevel.ERROR,
                     )
                 except Exception:
-                    # Best-effort — don't mask the original error, but log
-                    # so the secondary failure (broker down, serialization
-                    # bug, etc.) is recoverable.
+                    # Don't mask the original error; log the secondary failure at DEBUG.
                     logger.debug(
                         "Failed to stream error to FE for run_id=%s",
                         context.run_id,
@@ -1716,16 +1700,18 @@ def _execute_single_prompt(
             )
             shim.stream_log(f"Applied type conversion for: `{prompt_name}`")
 
-            self._run_lookup_enrichment(
-                output=output,
-                structured_output=structured_output,
-                metadata=metadata,
-                metrics=metrics,
-                shim=shim,
-                usage_kwargs=usage_kwargs,
-                llm_cls=llm_cls,
+            self._usage_records.extend(
+                run_lookup_enrichment(
+                    output=output,
+                    structured_output=structured_output,
+                    metadata=metadata,
+                    metrics=metrics,
+                    shim=shim,
+                    usage_kwargs=usage_kwargs,
+                    llm_cls=llm_cls,
+                )
             )
-            self._run_webhook_postprocessing(
+            run_webhook_postprocessing(
                 output=output,
                 structured_output=structured_output,
                 metadata=metadata,
@@ -1831,15 +1817,20 @@ def _flush_per_prompt_metrics(
             }
         )
         self._usage_records.extend(llm.flush_pending_usage())
-        if chunk_size > 0 and embedding is not None:
-            # Public adapters (``is_public_adapter() is True``) construct
-            # ``EmbeddingCompat`` without a callback_manager, so there's
-            # nothing to flush. Skip silently rather than catching the
-            # AttributeError — the broad catch was masking real bugs.
-            if embedding.callback_manager is not None:
-                for handler in embedding.callback_manager.handlers:
-                    if hasattr(handler, "flush_pending_usage"):
-                        self._usage_records.extend(handler.flush_pending_usage())
+        # Public adapters are built without a callback_manager; nothing to flush.
+        if chunk_size > 0 and embedding is not None and embedding.callback_manager:
+            for handler in embedding.callback_manager.handlers:
+                if not hasattr(handler, "flush_pending_usage"):
+                    continue
+                # Per-handler guard so one bad handler doesn't drop the rest.
+                try:
+                    self._usage_records.extend(handler.flush_pending_usage())
+                except Exception:
+                    logger.warning(
+                        "Failed to flush usage from embedding handler %s",
+                        type(handler).__name__,
+                        exc_info=True,
+                    )
         if vector_db:
             vector_db.close()
 
@@ -2000,138 +1991,6 @@ def _run_line_item_extraction(
                 level=LogLevel.ERROR,
             )
 
-    def _run_lookup_enrichment(
-        self,
-        output: dict[str, Any],
-        structured_output: dict[str, Any],
-        metadata: dict[str, Any],
-        metrics: dict[str, Any],
-        shim: Any,
-        llm_cls: Any,
-        usage_kwargs: dict[str, Any] | None = None,
-    ) -> None:
-        """Run lookup enrichment plugin if enabled and available.
-
-        ``llm_cls`` is passed in by the caller so we don't re-unpack the
-        7-tuple returned by ``_get_prompt_deps()`` on every prompt.
-        """
-        from executor.executors.constants import PromptServiceConstants as PSKeys
-        from executor.executors.plugins import ExecutorPluginLoader
-
-        prompt_name = output[PSKeys.NAME]
-        current_value = structured_output.get(prompt_name)
-
-        lookup_config = output.get("lookup_config")
-        lookup_cls = ExecutorPluginLoader.get("lookup-enrichment")
-        if not (lookup_config and lookup_cls):
-            return
-        if _is_blank(current_value):
-            # Surface a skip log instead of silently no-op-ing — the user
-            # configured a lookup and would otherwise wonder why it didn't run.
-            lookup_name = lookup_config.get("lookup_name") or "lookup"
-            shim.stream_log(
-                f"Skipping lookup `{lookup_name}` for `{prompt_name}` — "
-                f"source prompt produced no value."
-            )
-            return
-
-        try:
-            outcome = lookup_cls.run_with_metrics(
-                llm_cls=llm_cls,
-                lookup_config=lookup_config,
-                structured_output=structured_output,
-                current_value=current_value,
-                metadata=metadata,
-                prompt_name=prompt_name,
-                shim=shim,
-                usage_kwargs=usage_kwargs,
-            )
-            # Inside the try so a missing/renamed attribute on the outcome
-            # (plugin contract drift) hits the same graceful-degrade branch.
-            self._usage_records.extend(outcome.usage_records)
-            metrics.setdefault(prompt_name, {})[lookup_cls.METRICS_KEY] = (
-                outcome.llm_metrics
-            )
-        except Exception:
-            # Enrichment is post-extraction — degrade gracefully on
-            # plugin contract drift (missing METRICS_KEY, unexpected
-            # outcome shape) rather than aborting the whole prompt run
-            # and losing the answer-prompt billing rows.
-            lookup_name = lookup_config.get("lookup_name") or "lookup"
-            logger.exception(
-                "Lookup enrichment failed for prompt=%s lookup=%s",
-                prompt_name,
-                lookup_name,
-            )
-            shim.stream_log(
-                f"Lookup `{lookup_name}` failed for `{prompt_name}`; "
-                f"continuing without enrichment.",
-                level=LogLevel.WARN,
-            )
-            return
-
-    @staticmethod
-    def _run_webhook_postprocessing(
-        output: dict[str, Any],
-        structured_output: dict[str, Any],
-        metadata: dict[str, Any],
-        shim: Any,
-    ) -> None:
-        """Run webhook postprocessing if enabled (JSON outputs only)."""
-        from executor.executors.answer_prompt import AnswerPromptService
-        from executor.executors.constants import PromptServiceConstants as PSKeys
-
-        prompt_name = output[PSKeys.NAME]
-        output_type = output.get(PSKeys.TYPE, "")
-        webhook_enabled = output.get(PSKeys.ENABLE_POSTPROCESSING_WEBHOOK, False)
-        if not webhook_enabled:
-            return
-        # Pre-refactor, the webhook lived inside ``handle_json`` after its
-        # parse-failure early-return, so a malformed JSON answer (which sets
-        # ``structured_output[prompt_name] = {}``) never fired a webhook.
-        # The new explicit gate keeps that contract — empty / None payloads
-        # are skipped with a log rather than dispatched.
-        parsed_value = structured_output.get(prompt_name)
-        if not isinstance(parsed_value, (dict, list)) or not parsed_value:
-            logger.warning(
-                "Webhook postprocessing skipped: prompt=%s parsed payload "
-                "is empty or non-JSON (likely a parse failure)",
-                prompt_name,
-            )
-            return
-        if output_type != PSKeys.JSON:
-            # The pre-refactor behaviour fired the webhook regardless of
-            # output_type. The new restriction is intentional, but the
-            # user enabled a webhook URL and would otherwise see no call
-            # firing — surface the skip in the IDE log panel.
-            logger.warning(
-                "Webhook postprocessing supports JSON outputs only; "
-                "skipping for prompt=%s (output_type=%s)",
-                prompt_name,
-                output_type,
-            )
-            shim.stream_log(
-                f"Webhook postprocessing supports JSON outputs only; "
-                f"skipping for `{prompt_name}`.",
-                level=LogLevel.WARN,
-            )
-            return
-
-        webhook_url = output.get(PSKeys.POSTPROCESSING_WEBHOOK_URL)
-        highlight_data = None
-        if metadata and PSKeys.HIGHLIGHT_DATA in metadata:
-            highlight_data = metadata.get(PSKeys.HIGHLIGHT_DATA, {}).get(prompt_name)
-        processed, updated_highlights = AnswerPromptService._run_webhook_postprocess(
-            parsed_data=structured_output.get(prompt_name),
-            webhook_url=webhook_url,
-            highlight_data=highlight_data,
-        )
-        structured_output[prompt_name] = processed
-        if updated_highlights is not None and metadata:
-            metadata.setdefault(PSKeys.HIGHLIGHT_DATA, {})[prompt_name] = (
-                updated_highlights
-            )
-
     @staticmethod
     def _apply_type_conversion(
         output: dict[str, Any],
diff --git a/workers/executor/executors/lookup_enrichment.py b/workers/executor/executors/lookup_enrichment.py
new file mode 100644
index 0000000000..0b224badb5
--- /dev/null
+++ b/workers/executor/executors/lookup_enrichment.py
@@ -0,0 +1,145 @@
+"""Lookup enrichment + webhook postprocessing helpers.
+
+Extracted from ``LegacyExecutor`` so the orchestrator stays focused on
+dispatch. Both helpers are free functions — callers pass shim/state in.
+"""
+
+from __future__ import annotations
+
+import logging
+from typing import Any
+
+from executor.executors.constants import PromptServiceConstants as PSKeys
+from executor.executors.plugins import ExecutorPluginLoader
+
+from unstract.sdk1.constants import LogLevel
+
+logger = logging.getLogger(__name__)
+
+
+def is_blank(value: Any) -> bool:
+    """Treat None / whitespace strings / empty containers as no-value.
+
+    Boolean False / numeric 0 are NOT blank — valid inputs for
+    boolean/number prompts whose lookups should still run.
+    """
+    if value is None:
+        return True
+    if isinstance(value, str):
+        return not value.strip()
+    if isinstance(value, (list, dict)):
+        return not value
+    return False
+
+
+def run_lookup_enrichment(
+    output: dict[str, Any],
+    structured_output: dict[str, Any],
+    metadata: dict[str, Any],
+    metrics: dict[str, Any],
+    shim: Any,
+    llm_cls: Any,
+    usage_kwargs: dict[str, Any] | None = None,
+) -> list[dict[str, Any]]:
+    """Run lookup enrichment plugin if enabled and available.
+
+    Returns the plugin outcome's usage records (kept even if storing
+    metrics fails; empty if the plugin call itself raises) for billing.
+    """
+    prompt_name = output[PSKeys.NAME]
+    current_value = structured_output.get(prompt_name)
+
+    lookup_config = output.get("lookup_config")
+    lookup_cls = ExecutorPluginLoader.get("lookup-enrichment")
+    if not (lookup_config and lookup_cls):
+        return []
+    if is_blank(current_value):
+        # Surface a skip log instead of silently no-op-ing.
+        lookup_name = lookup_config.get("lookup_name") or "lookup"
+        shim.stream_log(
+            f"Skipping lookup `{lookup_name}` for `{prompt_name}` — "
+            f"source prompt produced no value."
+        )
+        return []
+
+    outcome = None
+    try:
+        outcome = lookup_cls.run_with_metrics(
+            llm_cls=llm_cls,
+            lookup_config=lookup_config,
+            structured_output=structured_output,
+            current_value=current_value,
+            metadata=metadata,
+            prompt_name=prompt_name,
+            shim=shim,
+            usage_kwargs=usage_kwargs,
+        )
+        metrics.setdefault(prompt_name, {})[lookup_cls.METRICS_KEY] = outcome.llm_metrics
+    except Exception:
+        # Degrade gracefully on plugin contract drift.
+        lookup_name = lookup_config.get("lookup_name") or "lookup"
+        logger.exception(
+            "Lookup enrichment failed for prompt=%s lookup=%s",
+            prompt_name,
+            lookup_name,
+        )
+        shim.stream_log(
+            f"Lookup `{lookup_name}` failed for `{prompt_name}`; "
+            f"continuing without enrichment.",
+            level=LogLevel.WARN,
+        )
+
+    if outcome is not None and getattr(outcome, "usage_records", None):
+        return list(outcome.usage_records)
+    return []
+
+
+def run_webhook_postprocessing(
+    output: dict[str, Any],
+    structured_output: dict[str, Any],
+    metadata: dict[str, Any],
+    shim: Any,
+) -> None:
+    """Run webhook postprocessing if enabled (JSON outputs only)."""
+    from executor.executors.answer_prompt import AnswerPromptService
+
+    prompt_name = output[PSKeys.NAME]
+    output_type = output.get(PSKeys.TYPE, "")
+    webhook_enabled = output.get(PSKeys.ENABLE_POSTPROCESSING_WEBHOOK, False)
+    if not webhook_enabled:
+        return
+    # Empty / non-JSON payloads are skipped — typically a parse failure.
+    parsed_value = structured_output.get(prompt_name)
+    if not isinstance(parsed_value, (dict, list)) or not parsed_value:
+        logger.warning(
+            "Webhook postprocessing skipped: prompt=%s parsed payload "
+            "is empty or non-JSON (likely a parse failure)",
+            prompt_name,
+        )
+        return
+    if output_type != PSKeys.JSON:
+        logger.warning(
+            "Webhook postprocessing supports JSON outputs only; "
+            "skipping for prompt=%s (output_type=%s)",
+            prompt_name,
+            output_type,
+        )
+        shim.stream_log(
+            f"Webhook postprocessing supports JSON outputs only; "
+            f"skipping for `{prompt_name}`.",
+            level=LogLevel.WARN,
+        )
+        return
+
+    webhook_url = output.get(PSKeys.POSTPROCESSING_WEBHOOK_URL)
+    highlight_data = None
+    if metadata and PSKeys.HIGHLIGHT_DATA in metadata:
+        highlight_data = metadata.get(PSKeys.HIGHLIGHT_DATA, {}).get(prompt_name)
+    processed, updated_highlights = AnswerPromptService._run_webhook_postprocess(
+        parsed_data=structured_output.get(prompt_name),
+        webhook_url=webhook_url,
+        highlight_data=highlight_data,
+    )
+    structured_output[prompt_name] = processed
+    if updated_highlights is not None and metadata:
+        metadata.setdefault(PSKeys.HIGHLIGHT_DATA, {})[prompt_name] = updated_highlights
diff --git a/workers/ide_callback/tasks.py b/workers/ide_callback/tasks.py
index 345bf06c9e..000b61eba6 100644
--- a/workers/ide_callback/tasks.py
+++ b/workers/ide_callback/tasks.py
@@ -551,97 +551,79 @@ def extraction_complete(
     ws_room = cb.get("ws_room", "")
     ws_event = cb.get("ws_event", "")
 
-    api = _get_extraction_client()
-    ps_api = _get_api_client()
+    with _get_extraction_client() as api, _get_api_client() as ps_api:
+        try:
+            # Check executor-level failure
+            if not result_dict.get("success", False):
+                error_msg = result_dict.get("error", _UNKNOWN_EXECUTOR_ERROR)
+                logger.error(
+                    "extraction executor reported failure: source=%s file=%s error=%s",
+                    source,
+                    file_id,
+                    error_msg,
+                )
+                api.mark_extraction_error(
+                    source=source,
+                    file_id=file_id,
+                    error=error_msg,
+                    organization_id=org_id,
+                )
+                if ws_room and ws_event:
+                    _emit_websocket(
+                        ps_api,
+                        room=ws_room,
+                        event=ws_event,
+                        data={
+                            "file_id": file_id,
+                            "status": "ERROR",
+                            "error": error_msg[:500],
+                        },
+                    )
+                return {"status": "failed", "error": error_msg}
 
-    try:
-        # Check executor-level failure
-        if not result_dict.get("success", False):
-            error_msg = result_dict.get("error", _UNKNOWN_EXECUTOR_ERROR)
-            logger.error(
-                "extraction executor reported failure: source=%s file=%s error=%s",
-                source,
-                file_id,
-                error_msg,
-            )
-            api.mark_extraction_error(
+            api.mark_extraction_complete(
                 source=source,
                 file_id=file_id,
-                error=error_msg,
+                extracted_text_path=extracted_text_path,
                 organization_id=org_id,
             )
+
             if ws_room and ws_event:
                 _emit_websocket(
                     ps_api,
                     room=ws_room,
                     event=ws_event,
-                    data={
-                        "file_id": file_id,
-                        "status": "ERROR",
-                        "error": error_msg[:500],
-                    },
+                    data={"file_id": file_id, "status": "COMPLETED"},
                 )
-            return {"status": "failed", "error": error_msg}
 
-        # ``result_dict["data"]`` may be explicitly ``None`` on early-return
-        # paths; guard against AttributeError so a benign empty-data response
-        # doesn't escalate to a generic "ERROR" callback.
-        extracted_text = (result_dict.get("data") or {}).get("extracted_text", "")
-        token_count = len(extracted_text) // 4
-
-        api.mark_extraction_complete(
-            source=source,
-            file_id=file_id,
-            token_count=token_count,
-            extracted_text_path=extracted_text_path,
-            organization_id=org_id,
-        )
+            logger.info("Extraction completed: source=%s file=%s", source, file_id)
+            return {"status": "completed", "file_id": file_id}
 
-        if ws_room and ws_event:
-            _emit_websocket(
-                ps_api,
-                room=ws_room,
-                event=ws_event,
-                data={
-                    "file_id": file_id,
-                    "status": "COMPLETED",
-                    "token_count": token_count,
-                },
+        except Exception as e:
+            logger.exception(
+                "extraction_complete callback failed: source=%s file=%s",
+                source,
+                file_id,
             )
-
-        logger.info(
-            "Extraction completed: source=%s file=%s tokens=%d",
-            source,
-            file_id,
-            token_count,
-        )
-        return {"status": "completed", "file_id": file_id, "token_count": token_count}
-
-    except Exception as e:
-        logger.exception(
-            "extraction_complete callback failed: source=%s file=%s", source, file_id
-        )
-        if ws_room and ws_event:
-            try:
-                _emit_websocket(
-                    ps_api,
-                    room=ws_room,
-                    event=ws_event,
-                    data={
-                        "file_id": file_id,
-                        "status": "ERROR",
-                        "error": str(e)[:500],
-                    },
-                )
-            except Exception:
-                # ``_emit_websocket`` already swallows-and-logs internally,
-                # but if anything reaches this far we'd rather see the
-                # secondary failure in the log than lose it silently.
-                logger.debug(
-                    "Failed to emit ws ERROR event in extraction_complete fallback",
-                    exc_info=True,
-                )
-        raise
+            if ws_room and ws_event:
+                try:
+                    _emit_websocket(
+                        ps_api,
+                        room=ws_room,
+                        event=ws_event,
+                        data={
+                            "file_id": file_id,
+                            "status": "ERROR",
+                            "error": str(e)[:500],
+                        },
+                    )
+                except Exception:
+                    # _emit_websocket swallows internally; log if anything escapes.
+                    logger.debug(
+                        "Failed to emit ws ERROR event in extraction_complete fallback",
+                        exc_info=True,
+                    )
+            raise
 
 
 @app.task(name="extraction_error")
@@ -657,31 +639,32 @@ def extraction_error(
     ws_room = cb.get("ws_room", "")
     ws_event = cb.get("ws_event", "")
 
-    api = _get_extraction_client()
-    ps_api = _get_api_client()
+    # Context-manage clients to avoid per-task session leaks.
+    with _get_extraction_client() as api, _get_api_client() as ps_api:
+        try:
+            error_msg = _get_task_error(failed_task_id, default="Text extraction failed")
 
-    try:
-        error_msg = _get_task_error(failed_task_id, default="Text extraction failed")
-
-        api.mark_extraction_error(
-            source=source,
-            file_id=file_id,
-            error=error_msg,
-            organization_id=org_id,
-        )
+            api.mark_extraction_error(
+                source=source,
+                file_id=file_id,
+                error=error_msg,
+                organization_id=org_id,
+            )
 
-        if ws_room and ws_event:
-            _emit_websocket(
-                ps_api,
-                room=ws_room,
-                event=ws_event,
-                data={
-                    "file_id": file_id,
-                    "status": "ERROR",
-                    "error": error_msg[:500],
-                },
+            if ws_room and ws_event:
+                _emit_websocket(
+                    ps_api,
+                    room=ws_room,
+                    event=ws_event,
+                    data={
+                        "file_id": file_id,
+                        "status": "ERROR",
+                        "error": error_msg[:500],
+                    },
+                )
+        except Exception:
+            logger.exception(
+                "extraction_error callback failed: source=%s file=%s",
+                source,
+                file_id,
             )
-    except Exception:
-        logger.exception(
-            "extraction_error callback failed: source=%s file=%s", source, file_id
-        )

From dab3ffa64489227c69327de65dabfe3392cc1acc Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 5 May 2026 12:59:07 +0530
Subject: [PATCH 48/57] UN-2946 [FIX] Lookup-related FE polish + DRF error
 envelope
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- prompt_studio/views.py: _multi_var_lookup_block_response uses
  ``detail`` instead of ``error`` to match drf-standardized-errors.
- CombinedOutput.jsx: hoist build helpers to module scope (selectedProfile
  passed as arg) — no per-render allocation, fewer useEffect closures.
- DocumentParser.jsx: hoist UUID_RE to module scope (no per-render compile).
- PromptOutput.jsx: silent ``catch {}`` on plugin dynamic-import failures
  so OSS doesn't surface noisy warnings for cloud-only modules.
- SideNavBar.jsx: hide the lookups submenu item when the lookup-studio
  plugin isn't loaded (keeps OSS nav clean).
---
 .../prompt_studio_core_v2/views.py            |   2 +-
 .../combined-output/CombinedOutput.jsx        | 104 +++++++++---------
 .../document-parser/DocumentParser.jsx        |   9 +-
 .../custom-tools/prompt-card/PromptOutput.jsx |  19 +---
 .../navigations/side-nav-bar/SideNavBar.jsx   |  17 +--
 5 files changed, 74 insertions(+), 77 deletions(-)

diff --git a/backend/prompt_studio/prompt_studio_core_v2/views.py b/backend/prompt_studio/prompt_studio_core_v2/views.py
index 6043d1a57a..30ea7045e2 100644
--- a/backend/prompt_studio/prompt_studio_core_v2/views.py
+++ b/backend/prompt_studio/prompt_studio_core_v2/views.py
@@ -108,7 +108,7 @@ def _multi_var_lookup_block_response(custom_tool, prompt_ids=None):
         return None
     return Response(
         {
-            "error": (
+            "detail": (
                 "Multi-variable lookup(s) "
                 f"{', '.join(names)} are linked to prompts in this project. "
                 "These can only run in single pass extraction mode. "
diff --git a/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx b/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
index 9aeffdff54..7e30a99339 100644
--- a/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
+++ b/frontend/src/components/custom-tools/combined-output/CombinedOutput.jsx
@@ -47,8 +47,7 @@ try {
   // The component will remain null if it is not available
 }
 
-// Cloud plugin hook — OSS falls back to passthrough helpers that leave
-// the payload untouched and report "no enrichment".
+// OSS falls back to passthrough helpers — no enrichment.
 let splitCombinedData = (data) => ({ combined: data, bundle: null });
 let buildEnrichedFromBundle = (_output, _bundle, _formatter) => ({});
 let getEnrichmentFromItem = (_item) => null;
@@ -59,6 +58,56 @@ try {
   getEnrichmentFromItem = mod.getEnrichmentFromItem;
 } catch {}
 
+const buildDefaultProfileOutputs = (data) => {
+  const { combined: payload, bundle } = splitCombinedData(data);
+  const output = Object.entries(payload).reduce((acc, [key, value]) => {
+    acc[key] = displayPromptResult(value, false);
+    return acc;
+  }, {});
+  const enriched = buildEnrichedFromBundle(output, bundle, displayPromptResult);
+  return {
+    output,
+    enriched,
+    hasEnriched: bundle != null && Object.keys(enriched).length > 0,
+  };
+};
+
+const buildPerPromptOutput = (item, data, selectedProfile) => {
+  const profileManager = selectedProfile || item?.profile_manager;
+  const outputDetails = data.find(
+    (outputValue) =>
+      outputValue?.prompt_id === item?.prompt_id &&
+      outputValue?.profile_manager === profileManager,
+  );
+  const value =
+    outputDetails?.output?.length > 0
+      ? displayPromptResult(outputDetails?.output, false)
+      : "";
+  const enrichment = getEnrichmentFromItem(outputDetails);
+  const enrichedValue = enrichment?.output
+    ? displayPromptResult(enrichment.output, false)
+    : value;
+  return { value, enrichedValue, hasEnriched: !!enrichment?.output };
+};
+
+const buildSelectedProfileOutputs = (data, prompts, selectedProfile) => {
+  const output = {};
+  const enriched = {};
+  let hasEnriched = false;
+  for (const item of prompts) {
+    if (item?.prompt_type === promptType.notes) continue;
+    const {
+      value,
+      enrichedValue,
+      hasEnriched: enrichedHit,
+    } = buildPerPromptOutput(item, data, selectedProfile);
+    output[item?.prompt_key] = value;
+    enriched[item?.prompt_key] = enrichedValue;
+    hasEnriched = hasEnriched || enrichedHit;
+  }
+  return { output, enriched: hasEnriched ? enriched : {}, hasEnriched };
+};
+
 function CombinedOutput({ docId, setFilledFields, selectedPrompts }) {
   const {
     details,
@@ -120,55 +169,6 @@ function CombinedOutput({ docId, setFilledFields, selectedPrompts }) {
       return;
     }
 
-    const buildDefaultProfileOutputs = (data) => {
-      const { combined: payload, bundle } = splitCombinedData(data);
-      const output = Object.entries(payload).reduce((acc, [key, value]) => {
-        acc[key] = displayPromptResult(value, false);
-        return acc;
-      }, {});
-      return {
-        output,
-        enriched: buildEnrichedFromBundle(output, bundle, displayPromptResult),
-        hasEnriched: true,
-      };
-    };
-
-    const buildPerPromptOutput = (item, data) => {
-      const profileManager = selectedProfile || item?.profile_manager;
-      const outputDetails = data.find(
-        (outputValue) =>
-          outputValue?.prompt_id === item?.prompt_id &&
-          outputValue?.profile_manager === profileManager,
-      );
-      const value =
-        outputDetails?.output?.length > 0
-          ? displayPromptResult(outputDetails?.output, false)
-          : "";
-      const enrichment = getEnrichmentFromItem(outputDetails);
-      const enrichedValue = enrichment?.output
-        ? displayPromptResult(enrichment.output, false)
-        : value;
-      return { value, enrichedValue, hasEnriched: !!enrichment?.output };
-    };
-
-    const buildSelectedProfileOutputs = (data, prompts) => {
-      const output = {};
-      const enriched = {};
-      let hasEnriched = false;
-      for (const item of prompts) {
-        if (item?.prompt_type === promptType.notes) continue;
-        const {
-          value,
-          enrichedValue,
-          hasEnriched: enrichedHit,
-        } = buildPerPromptOutput(item, data);
-        output[item?.prompt_key] = value;
-        enriched[item?.prompt_key] = enrichedValue;
-        hasEnriched = hasEnriched || enrichedHit;
-      }
-      return { output, enriched: hasEnriched ? enriched : {}, hasEnriched };
-    };
-
     const fetchCombinedOutput = async () => {
       setIsOutputLoading(true);
       setCombinedOutput({});
@@ -180,7 +180,7 @@ function CombinedOutput({ docId, setFilledFields, selectedPrompts }) {
         const useDefaultProfile = activeKey === "0" && !isSimplePromptStudio;
         const { output, enriched } = useDefaultProfile
           ? buildDefaultProfileOutputs(data)
-          : buildSelectedProfileOutputs(data, prompts);
+          : buildSelectedProfileOutputs(data, prompts, selectedProfile);
         setCombinedOutput(output);
         setEnrichedOutput(enriched);
       } catch (err) {
diff --git a/frontend/src/components/custom-tools/document-parser/DocumentParser.jsx b/frontend/src/components/custom-tools/document-parser/DocumentParser.jsx
index 2b55e26807..63b1a037c5 100644
--- a/frontend/src/components/custom-tools/document-parser/DocumentParser.jsx
+++ b/frontend/src/components/custom-tools/document-parser/DocumentParser.jsx
@@ -33,6 +33,10 @@ try {
   // The component will remain null of it is not available
 }
 
+// Module-scoped to avoid per-render recompilation.
+const UUID_RE =
+  /^[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$/i;
+
 function DocumentParser({
   addPromptInstance,
   scrollToBottom,
@@ -110,9 +114,7 @@ function DocumentParser({
     }
   }, [scrollToBottom]);
 
-  // Handle scrollTo query param for cross-linking from Lookup Studio
-  const UUID_RE =
-    /^[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$/i;
+  // Cross-link from Lookup Studio: scroll to a specific prompt.
   useEffect(() => {
     const scrollToPromptId = searchParams.get("scrollTo");
     if (
@@ -130,7 +132,6 @@ function DocumentParser({
       setTimeout(() => el.classList.remove("highlighted-prompt"), 2000);
     }
 
-    // Clear the param so it doesn't re-trigger
     searchParams.delete("scrollTo");
     setSearchParams(searchParams, { replace: true });
   }, [details?.prompts, searchParams]);
diff --git a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
index c9d9c44143..b8aaa4b393 100644
--- a/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
+++ b/frontend/src/components/custom-tools/prompt-card/PromptOutput.jsx
@@ -57,11 +57,8 @@ try {
     "../../../plugins/lookup-studio/prompt-card/LookupOutputTabs"
   );
   LookupOutputTabs = mod.LookupOutputTabs;
-} catch (error) {
-  // OSS: plugin may not exist; cloud: surface unexpected chunk-load
-  // failures so they don't degrade silently to OSS-mode behaviour.
-  // eslint-disable-next-line no-console
-  console.warn("[PromptOutput] LookupOutputTabs unavailable:", error);
+} catch {
+  // Cloud-only plugin — absent in OSS builds; LookupOutputTabs stays null.
 }
 
 let getEnrichedCopyText;
@@ -70,14 +67,11 @@ try {
     "../../../plugins/lookup-studio/prompt-card/getEnrichedCopyText"
   );
   getEnrichedCopyText = mod.getEnrichedCopyText;
-} catch (error) {
-  // eslint-disable-next-line no-console
-  console.warn("[PromptOutput] getEnrichedCopyText unavailable:", error);
+} catch {
+  // Cloud-only plugin — absent in OSS builds; falls back to raw copy text.
 }
 
-// Resolve enriched copy text with fallback so a plugin-side throw
-// can't break the Copy button. ``getEnrichedCopyText`` may not exist
-// in OSS (plugin import failed) or may throw on a malformed enrichment.
+// Fallback to raw text — plugin throw on malformed enrichment shouldn't break Copy.
 const resolveCopyText = (promptOutputId, fallbackText) => {
   if (!getEnrichedCopyText) {
     return fallbackText;
@@ -92,8 +86,7 @@ const resolveCopyText = (promptOutputId, fallbackText) => {
   }
 };
 
-// Wraps children in LookupOutputTabs when available (cloud),
-// passes through children directly in OSS.
+// Cloud wraps children in LookupOutputTabs; OSS passes through.
 const renderWithLookupWrapper = (lookupProps, children) =>
   LookupOutputTabs ? (
     <LookupOutputTabs {...lookupProps}>{children}</LookupOutputTabs>
diff --git a/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx b/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
index 724c241e7c..164fdab145 100644
--- a/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
+++ b/frontend/src/components/navigations/side-nav-bar/SideNavBar.jsx
@@ -512,13 +512,16 @@ const SideNavBar = ({ collapsed, setCollapsed }) => {
     });
   }
 
-  // Extend Prompt Studio active state to include /lookups paths
-  if (lookupStudioEnabled && isUnstract) {
-    const psItem = data[0]?.subMenu?.find((el) => el.id === 1.1);
-    if (psItem) {
-      psItem.active =
-        psItem.active ||
-        globalThis.location.pathname.startsWith(`/${orgName}/lookups`);
+  // Keep Prompt Studio highlighted on /lookups. Replace, don't mutate —
+  // `data` may alias the `menu` prop.
+  if (lookupStudioEnabled && isUnstract && data[0]?.subMenu) {
+    const onLookupPath = globalThis.location.pathname.startsWith(
+      `/${orgName}/lookups`,
+    );
+    if (onLookupPath) {
+      data[0].subMenu = data[0].subMenu.map((el) =>
+        el.id === 1.1 ? { ...el, active: true } : el,
+      );
     }
   }
 

From 4b9e0fd28ae6094527636f24dfa3baa57f0db1e5 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Tue, 5 May 2026 15:47:51 +0530
Subject: [PATCH 49/57] UN-2946 [FIX] Type run_id / reference_id as UUIDField
 in batch serializer
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Both columns are UUIDField on the Usage model — leaving them as
CharField in the serializer let invalid UUIDs slip through to bulk_create
and surface as a 500. UUIDField catches them at validation with a
standard DRF 400.
---
 backend/usage_v2/serializers.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/backend/usage_v2/serializers.py b/backend/usage_v2/serializers.py
index 47c6f1f11f..5fb44f5423 100644
--- a/backend/usage_v2/serializers.py
+++ b/backend/usage_v2/serializers.py
@@ -32,7 +32,7 @@ class UsageRecordCreateSerializer(serializers.Serializer):
 
     workflow_id = serializers.CharField(required=False, allow_blank=True, default="")
     execution_id = serializers.CharField(required=False, allow_blank=True, default="")
-    run_id = serializers.CharField(required=False, allow_null=True, default=None)
+    run_id = serializers.UUIDField(required=False, allow_null=True, default=None)
     llm_usage_reason = serializers.CharField(
         required=False, allow_null=True, allow_blank=True, default=None
     )
@@ -41,7 +41,7 @@ class UsageRecordCreateSerializer(serializers.Serializer):
     completion_tokens = serializers.IntegerField(required=False, default=0)
     total_tokens = serializers.IntegerField(required=False, default=0)
     cost_in_dollars = serializers.FloatField(required=False, default=0.0)
-    reference_id = serializers.CharField(required=False, allow_null=True, default=None)
+    reference_id = serializers.UUIDField(required=False, allow_null=True, default=None)
     reference_type = serializers.CharField(required=False, allow_null=True, default=None)
     execution_time_ms = serializers.IntegerField(
         required=False, allow_null=True, default=None

From 4bbf2dee64ce4f14f97e28dfa86817f3e75ad5c4 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Wed, 6 May 2026 03:57:39 +0530
Subject: [PATCH 50/57] UN-2946 [DOCS] Tighten extraction_complete docstring
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Drops the stale "Computes token count" line — the callback no longer
derives a token count.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 workers/ide_callback/tasks.py | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/workers/ide_callback/tasks.py b/workers/ide_callback/tasks.py
index 000b61eba6..c6494e036f 100644
--- a/workers/ide_callback/tasks.py
+++ b/workers/ide_callback/tasks.py
@@ -540,8 +540,7 @@ def extraction_complete(
 ) -> dict[str, Any]:
     """Celery link callback after successful text extraction.
 
-    Computes token count from extracted text, persists result via
-    internal API, and emits a WebSocket event.
+    Persists the result via internal API and emits a WebSocket event.
     """
     cb = callback_kwargs or {}
     source = cb.get("source", "")

From 3734332679f50046834bdff956368dfc3c8f8db6 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Wed, 6 May 2026 13:48:31 +0530
Subject: [PATCH 51/57] UN-2946 [FIX] Pre-bind validated_file_execution_id in
 usage client

If _validate_file_execution_id raised, the except handler hit
UnboundLocalError and masked the original ValueError. Pre-bind a
str(file_execution_id) fallback so the error response carries the
real cause. Also gitignore Codex's AGENTS.md scratchpad.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .gitignore                             | 3 +++
 workers/shared/clients/usage_client.py | 2 ++
 2 files changed, 5 insertions(+)

diff --git a/.gitignore b/.gitignore
index 0901e18b4c..6c099a4071 100644
--- a/.gitignore
+++ b/.gitignore
@@ -700,6 +700,9 @@ CLAUDE.md
 CONTRIBUTION_GUIDE.md
 .mcp.json
 
+# Codex
+AGENTS.md
+
 # Windsurf
 .qodo
 .windsurfrules
diff --git a/workers/shared/clients/usage_client.py b/workers/shared/clients/usage_client.py
index acd6dd4c4d..0bbaba9f67 100644
--- a/workers/shared/clients/usage_client.py
+++ b/workers/shared/clients/usage_client.py
@@ -119,6 +119,8 @@ def get_aggregated_token_count(
         Returns:
             UsageResponse containing aggregated usage data
         """
+        # Pre-bind so the except handler can log even if validation raises.
+        validated_file_execution_id = str(file_execution_id)
         try:
             validated_file_execution_id = self._validate_file_execution_id(
                 file_execution_id

From e67be152967970b2478782f772ee0a65bc4f4b04 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Thu, 7 May 2026 11:31:21 +0530
Subject: [PATCH 52/57] [CHORE] Ignore .pi/ tooling directory

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .gitignore | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/.gitignore b/.gitignore
index 6c099a4071..c655f4acff 100644
--- a/.gitignore
+++ b/.gitignore
@@ -703,6 +703,9 @@ CONTRIBUTION_GUIDE.md
 # Codex
 AGENTS.md
 
+# Pi
+.pi/
+
 # Windsurf
 .qodo
 .windsurfrules

From a4de618a1e6f5d29d82e45486da5df3a6f85525c Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Fri, 8 May 2026 10:49:32 +0530
Subject: [PATCH 53/57] UN-3494 [REFACTOR] Replace polymorphic Usage
 attribution with typed columns + post-write hooks
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Drop reference_id / reference_type from Usage in favour of typed
project_id / prompt_id columns indexed CONCURRENTLY for dashboard
rollups. Cloud-only attribution (e.g. lookup_version_id) now flows
through an opaque cloud_extras carrier on the batch endpoint, which
forwards it verbatim to plugin-registered post-write hooks invoked
inside the same atomic transaction as bulk_create — a hook failure
rolls back the Usage rows so attribution stays consistent or nothing
is written.

Removes the need for cloud to subclass UsageBatchCreateView or prepend
a URL override; the hook seam is generic for any future cloud feature.
---
 backend/usage_v2/hooks.py                     | 25 ++++++++++
 backend/usage_v2/internal_views.py            | 12 +++--
 .../migrations/0004_usage_metrics_fields.py   | 47 +++++--------------
 .../0005_usage_reason_ref_created_idx.py      | 37 ++++++++++-----
 backend/usage_v2/models.py                    | 47 +++++--------------
 backend/usage_v2/serializers.py               |  6 ++-
 6 files changed, 86 insertions(+), 88 deletions(-)
 create mode 100644 backend/usage_v2/hooks.py

diff --git a/backend/usage_v2/hooks.py b/backend/usage_v2/hooks.py
new file mode 100644
index 0000000000..615fa667ea
--- /dev/null
+++ b/backend/usage_v2/hooks.py
@@ -0,0 +1,25 @@
+"""Post-write hooks for ``UsageBatchCreateView``.
+
+Hooks fire inside the view's transaction; a failure rolls the batch back
+so Usage rows and any side-table writes stay consistent. Records carry
+an opaque ``cloud_extras`` dict that OSS forwards verbatim — plugins
+read only the keys they own.
+"""
+
+from collections.abc import Callable
+
+from .models import Usage
+
+PostWriteHook = Callable[[list[dict], list[Usage]], None]
+
+_post_write_hooks: list[PostWriteHook] = []
+
+
+def register_post_write_hook(fn: PostWriteHook) -> PostWriteHook:
+    _post_write_hooks.append(fn)
+    return fn
+
+
+def run_post_write_hooks(records: list[dict], usage_objects: list[Usage]) -> None:
+    for hook in _post_write_hooks:
+        hook(records, usage_objects)
diff --git a/backend/usage_v2/internal_views.py b/backend/usage_v2/internal_views.py
index 59d1f5204d..9c5c8caaeb 100644
--- a/backend/usage_v2/internal_views.py
+++ b/backend/usage_v2/internal_views.py
@@ -5,6 +5,7 @@
 
 import logging
 
+from django.db import transaction
 from django.http import JsonResponse
 from rest_framework import status
 from rest_framework.exceptions import APIException, ValidationError
@@ -16,6 +17,7 @@
 from unstract.core.data_models import UsageResponseData
 
 from .helper import UsageHelper
+from .hooks import run_post_write_hooks
 from .models import Usage
 from .serializers import UsageBatchCreateSerializer
 
@@ -188,8 +190,8 @@ def post(self, request: Request) -> Response:
                     completion_tokens=r.get("completion_tokens", 0),
                     total_tokens=r.get("total_tokens", 0),
                     cost_in_dollars=r.get("cost_in_dollars", 0.0),
-                    reference_id=r.get("reference_id"),
-                    reference_type=r.get("reference_type"),
+                    project_id=r.get("project_id"),
+                    prompt_id=r.get("prompt_id"),
                     execution_time_ms=r.get("execution_time_ms"),
                     status=r.get("status"),
                     error_message=r.get("error_message"),
@@ -197,8 +199,10 @@ def post(self, request: Request) -> Response:
             )
 
         try:
-            # Bound transaction size on the billing-critical table.
-            created = Usage.objects.bulk_create(usage_objects, batch_size=500)
+            # Atomic with hooks: orphan Usage rows are worse than retrying.
+            with transaction.atomic():
+                created = Usage.objects.bulk_create(usage_objects, batch_size=500)
+                run_post_write_hooks(records, created)
         except Exception as e:
             logger.error(
                 "bulk_create failed for %d usage records (org=%s): %s",
diff --git a/backend/usage_v2/migrations/0004_usage_metrics_fields.py b/backend/usage_v2/migrations/0004_usage_metrics_fields.py
index 8405a319b4..191a31dd27 100644
--- a/backend/usage_v2/migrations/0004_usage_metrics_fields.py
+++ b/backend/usage_v2/migrations/0004_usage_metrics_fields.py
@@ -26,33 +26,27 @@ class Migration(migrations.Migration):
         ),
         migrations.AddField(
             model_name="usage",
-            name="reference_id",
+            name="project_id",
             field=models.UUIDField(
                 blank=True,
                 db_comment=(
-                    "Polymorphic correlation ID (no FK constraint) linking to the "
-                    "entity that triggered this usage. Interpret via reference_type. "
-                    "OSS values: prompt_key UUID. "
-                    "NULL for most operations; survives entity deletion."
+                    "Prompt Studio project (tool) the call belongs to (no FK; "
+                    "survives tool deletion). NULL for embeddings and historical "
+                    "rows."
                 ),
                 null=True,
             ),
         ),
         migrations.AddField(
             model_name="usage",
-            name="reference_type",
-            field=models.CharField(
+            name="prompt_id",
+            field=models.UUIDField(
                 blank=True,
-                choices=[
-                    ("prompt_key", "Prompt Key"),
-                    ("lookup_version", "Lookup Version"),
-                ],
                 db_comment=(
-                    "Discriminator for reference_id. "
-                    "OSS values: 'prompt_key'. "
-                    "NULL when reference_id is NULL."
+                    "Prompt key UUID that triggered the call (no FK; survives "
+                    "prompt deletion). NULL for single-pass / embeddings / "
+                    "historical rows."
                 ),
-                max_length=64,
                 null=True,
             ),
         ),
@@ -89,24 +83,7 @@ class Migration(migrations.Migration):
                 null=True,
             ),
         ),
-        # reference_id and reference_type must both be NULL or both be set
-        # so reference_id is always decodable.
-        migrations.AddConstraint(
-            model_name="usage",
-            constraint=models.CheckConstraint(
-                check=models.Q(
-                    models.Q(
-                        ("reference_id__isnull", True), ("reference_type__isnull", True)
-                    ),
-                    models.Q(
-                        ("reference_id__isnull", False), ("reference_type__isnull", False)
-                    ),
-                    _connector="OR",
-                ),
-                name="usage_reference_pair_consistent",
-            ),
-        ),
-        # Index creation moved to 0005 so it can run CONCURRENTLY — the usage
-        # table is billing-critical and a plain AddIndex takes a share-update
-        # lock for the duration of the build on large tables.
+        # Indexes on project_id / prompt_id moved to 0005 so they can run
+        # CONCURRENTLY — usage is billing-critical and a plain AddIndex takes
+        # a SHARE lock (blocking writes) for the duration of the build on large tables.
     ]
diff --git a/backend/usage_v2/migrations/0005_usage_reason_ref_created_idx.py b/backend/usage_v2/migrations/0005_usage_reason_ref_created_idx.py
index 4d56d4efe7..58bac40acb 100644
--- a/backend/usage_v2/migrations/0005_usage_reason_ref_created_idx.py
+++ b/backend/usage_v2/migrations/0005_usage_reason_ref_created_idx.py
@@ -2,12 +2,12 @@
 
 
 class Migration(migrations.Migration):
-    """Build the lookup-usage dashboard index without locking the table.
+    """Build the project_id / prompt_id dashboard indexes without locking.
 
-    CONCURRENTLY requires that the migration itself runs outside a
-    transaction, hence atomic = False. We use RunSQL with IF NOT EXISTS so
-    a partial-apply (process killed between SQL success and django_migrations
-    insert) is recoverable on retry without manual --fake intervention.
+    CONCURRENTLY requires the migration to run outside a transaction, hence
+    atomic = False. RunSQL with IF NOT EXISTS makes a partial-apply
+    (process killed between SQL success and django_migrations insert)
+    recoverable on retry without manual --fake intervention.
     """
 
     atomic = False
@@ -20,18 +20,33 @@ class Migration(migrations.Migration):
         migrations.RunSQL(
             sql=(
                 "CREATE INDEX CONCURRENTLY IF NOT EXISTS "
-                "idx_usage_reason_ref_created "
-                'ON "usage" (llm_usage_reason, reference_id, created_at DESC);'
+                "idx_usage_project_created "
+                'ON "usage" (project_id, created_at DESC);'
             ),
-            reverse_sql=(
-                "DROP INDEX CONCURRENTLY IF EXISTS idx_usage_reason_ref_created;"
+            reverse_sql=("DROP INDEX CONCURRENTLY IF EXISTS idx_usage_project_created;"),
+            state_operations=[
+                migrations.AddIndex(
+                    model_name="usage",
+                    index=models.Index(
+                        fields=["project_id", "-created_at"],
+                        name="idx_usage_project_created",
+                    ),
+                ),
+            ],
+        ),
+        migrations.RunSQL(
+            sql=(
+                "CREATE INDEX CONCURRENTLY IF NOT EXISTS "
+                "idx_usage_prompt_created "
+                'ON "usage" (prompt_id, created_at DESC);'
             ),
+            reverse_sql=("DROP INDEX CONCURRENTLY IF EXISTS idx_usage_prompt_created;"),
             state_operations=[
                 migrations.AddIndex(
                     model_name="usage",
                     index=models.Index(
-                        fields=["llm_usage_reason", "reference_id", "-created_at"],
-                        name="idx_usage_reason_ref_created",
+                        fields=["prompt_id", "-created_at"],
+                        name="idx_usage_prompt_created",
                     ),
                 ),
             ],
diff --git a/backend/usage_v2/models.py b/backend/usage_v2/models.py
index 8b04240aef..b1ff6a297b 100644
--- a/backend/usage_v2/models.py
+++ b/backend/usage_v2/models.py
@@ -29,21 +29,12 @@ class UsageStatus(models.TextChoices):
     ("lookup", "Lookup"),
 ]
 
-REFERENCE_TYPE_CHOICES: list[tuple[str, str]] = [
-    ("prompt_key", "Prompt Key"),
-    ("lookup_version", "Lookup Version"),
-]
-
 
 class UsageModelManager(DefaultOrganizationManagerMixin, BaseModelManager):
     pass
 
 
 class Usage(DefaultOrganizationMixin, BaseModel):
-    # reference_type → reference_id (no FK; survives entity deletion):
-    #   "prompt_key"     → ToolStudioPrompt UUID (OSS)
-    #   "lookup_version" → LookupVersion UUID (cloud)
-
     id = models.UUIDField(
         primary_key=True,
         default=uuid.uuid4,
@@ -87,25 +78,20 @@ class Usage(DefaultOrganizationMixin, BaseModel):
     )
     total_tokens = models.IntegerField(db_comment="Total number of tokens used")
     cost_in_dollars = models.FloatField(db_comment="Total number of tokens used")
-    reference_id = models.UUIDField(
+    project_id = models.UUIDField(
         null=True,
         blank=True,
         db_comment=(
-            "Polymorphic correlation ID (no FK constraint) linking to the "
-            "entity that triggered this usage. Interpret via reference_type. "
-            "OSS values: prompt_key UUID. "
-            "NULL for most operations; survives entity deletion."
+            "Prompt Studio project (tool) the call belongs to (no FK; survives "
+            "tool deletion). NULL for embeddings and historical rows."
         ),
     )
-    reference_type = models.CharField(
-        max_length=64,
-        choices=REFERENCE_TYPE_CHOICES,
+    prompt_id = models.UUIDField(
         null=True,
         blank=True,
         db_comment=(
-            "Discriminator for reference_id. "
-            "OSS values: 'prompt_key'. "
-            "NULL when reference_id is NULL."
+            "Prompt key UUID that triggered the call (no FK; survives prompt "
+            "deletion). NULL for single-pass / embeddings / historical rows."
         ),
     )
     execution_time_ms = models.IntegerField(
@@ -137,22 +123,11 @@ class Meta:
             models.Index(fields=["run_id"]),
             models.Index(fields=["execution_id"]),
             models.Index(
-                fields=["llm_usage_reason", "reference_id", "-created_at"],
-                name="idx_usage_reason_ref_created",
+                fields=["project_id", "-created_at"],
+                name="idx_usage_project_created",
             ),
-        ]
-        constraints = [
-            # Both NULL or both set; a half-populated row is undecodable
-            # at billing-aggregation time.
-            models.CheckConstraint(
-                check=(
-                    models.Q(reference_id__isnull=True, reference_type__isnull=True)
-                    | models.Q(reference_id__isnull=False, reference_type__isnull=False)
-                ),
-                name="usage_reference_pair_consistent",
+            models.Index(
+                fields=["prompt_id", "-created_at"],
+                name="idx_usage_prompt_created",
             ),
-            # TODO: add (usage_type, llm_usage_reason) consistency constraint
-            # via ``ADD CONSTRAINT ... NOT VALID`` + batched ``VALIDATE`` —
-            # legacy embedding rows have ``llm_usage_reason=''`` and the
-            # default full-table scan would lock the billing table.
         ]
diff --git a/backend/usage_v2/serializers.py b/backend/usage_v2/serializers.py
index 5fb44f5423..7b7f8aaed5 100644
--- a/backend/usage_v2/serializers.py
+++ b/backend/usage_v2/serializers.py
@@ -41,8 +41,8 @@ class UsageRecordCreateSerializer(serializers.Serializer):
     completion_tokens = serializers.IntegerField(required=False, default=0)
     total_tokens = serializers.IntegerField(required=False, default=0)
     cost_in_dollars = serializers.FloatField(required=False, default=0.0)
-    reference_id = serializers.UUIDField(required=False, allow_null=True, default=None)
-    reference_type = serializers.CharField(required=False, allow_null=True, default=None)
+    project_id = serializers.UUIDField(required=False, allow_null=True, default=None)
+    prompt_id = serializers.UUIDField(required=False, allow_null=True, default=None)
     execution_time_ms = serializers.IntegerField(
         required=False, allow_null=True, default=None
     )
@@ -50,6 +50,8 @@ class UsageRecordCreateSerializer(serializers.Serializer):
     error_message = serializers.CharField(
         required=False, allow_null=True, allow_blank=True, default=None
     )
+    # Opaque carrier forwarded to post-write hooks; OSS never reads it.
+    cloud_extras = serializers.DictField(required=False, allow_null=True, default=None)
 
 
 class UsageBatchCreateSerializer(serializers.Serializer):

From c935d5891197489586c12246a12a75018395eceb Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Fri, 8 May 2026 13:49:15 +0530
Subject: [PATCH 54/57] UN-3494 [REVIEW] Idempotent hook registration +
 lookup-usage partial index

- register_post_write_hook now dedupes by identity so AppConfig.ready()
  re-firing under test reloads or dev autoreload can't queue a second
  LookupUsage write that would IntegrityError and roll back the batch.
- usage_objects builder collapsed to a comprehension (review polish).
- New 0005 migration step adds a partial index
  idx_usage_lookup_recent on (organization_id, created_at DESC)
  WHERE llm_usage_reason='lookup', so the per-(run x prompt) dashboard
  aggregation stops heap-scanning all Usage rows when filtering by
  organisation + reason.
---
 backend/usage_v2/hooks.py                     |  4 +-
 backend/usage_v2/internal_views.py            | 47 +++++++++----------
 .../0005_usage_reason_ref_created_idx.py      | 22 +++++++++
 backend/usage_v2/models.py                    |  6 +++
 4 files changed, 54 insertions(+), 25 deletions(-)

diff --git a/backend/usage_v2/hooks.py b/backend/usage_v2/hooks.py
index 615fa667ea..31d576e693 100644
--- a/backend/usage_v2/hooks.py
+++ b/backend/usage_v2/hooks.py
@@ -16,7 +16,9 @@
 
 
 def register_post_write_hook(fn: PostWriteHook) -> PostWriteHook:
-    _post_write_hooks.append(fn)
+    # Idempotent: ready() can re-fire under test reloads / dev autoreload.
+    if fn not in _post_write_hooks:
+        _post_write_hooks.append(fn)
     return fn
 
 
diff --git a/backend/usage_v2/internal_views.py b/backend/usage_v2/internal_views.py
index 9c5c8caaeb..85c20c16e4 100644
--- a/backend/usage_v2/internal_views.py
+++ b/backend/usage_v2/internal_views.py
@@ -172,31 +172,30 @@ def post(self, request: Request) -> Response:
                 "Organization context missing. Worker must send X-Organization-ID."
             )
 
-        usage_objects = []
-        for r in records:
-            usage_objects.append(
-                Usage(
-                    organization=organization,
-                    workflow_id=r.get("workflow_id", ""),
-                    execution_id=r.get("execution_id", ""),
-                    adapter_instance_id=r.get("adapter_instance_id", ""),
-                    run_id=r.get("run_id"),
-                    usage_type=r.get("usage_type", "llm"),
-                    # Coerce "" to None so the cross-field CheckConstraint passes.
-                    llm_usage_reason=r.get("llm_usage_reason") or None,
-                    model_name=r.get("model_name", ""),
-                    embedding_tokens=r.get("embedding_tokens", 0),
-                    prompt_tokens=r.get("prompt_tokens", 0),
-                    completion_tokens=r.get("completion_tokens", 0),
-                    total_tokens=r.get("total_tokens", 0),
-                    cost_in_dollars=r.get("cost_in_dollars", 0.0),
-                    project_id=r.get("project_id"),
-                    prompt_id=r.get("prompt_id"),
-                    execution_time_ms=r.get("execution_time_ms"),
-                    status=r.get("status"),
-                    error_message=r.get("error_message"),
-                )
+        usage_objects = [
+            Usage(
+                organization=organization,
+                workflow_id=r.get("workflow_id", ""),
+                execution_id=r.get("execution_id", ""),
+                adapter_instance_id=r.get("adapter_instance_id", ""),
+                run_id=r.get("run_id"),
+                usage_type=r.get("usage_type", "llm"),
+                # Coerce "" to None so a blank reason is stored as NULL, not "".
+                llm_usage_reason=r.get("llm_usage_reason") or None,
+                model_name=r.get("model_name", ""),
+                embedding_tokens=r.get("embedding_tokens", 0),
+                prompt_tokens=r.get("prompt_tokens", 0),
+                completion_tokens=r.get("completion_tokens", 0),
+                total_tokens=r.get("total_tokens", 0),
+                cost_in_dollars=r.get("cost_in_dollars", 0.0),
+                project_id=r.get("project_id"),
+                prompt_id=r.get("prompt_id"),
+                execution_time_ms=r.get("execution_time_ms"),
+                status=r.get("status"),
+                error_message=r.get("error_message"),
             )
+            for r in records
+        ]
 
         try:
             # Atomic with hooks: orphan Usage rows are worse than retrying.
diff --git a/backend/usage_v2/migrations/0005_usage_reason_ref_created_idx.py b/backend/usage_v2/migrations/0005_usage_reason_ref_created_idx.py
index 58bac40acb..c93d4de605 100644
--- a/backend/usage_v2/migrations/0005_usage_reason_ref_created_idx.py
+++ b/backend/usage_v2/migrations/0005_usage_reason_ref_created_idx.py
@@ -1,4 +1,5 @@
 from django.db import migrations, models
+from django.db.models import Q
 
 
 class Migration(migrations.Migration):
@@ -51,4 +52,25 @@ class Migration(migrations.Migration):
                 ),
             ],
         ),
+        # Partial — only lookup-reason rows. Avoids heap-scanning all
+        # Usage rows when the dashboard groups by (run × prompt).
+        migrations.RunSQL(
+            sql=(
+                "CREATE INDEX CONCURRENTLY IF NOT EXISTS "
+                "idx_usage_lookup_recent "
+                'ON "usage" (organization_id, created_at DESC) '
+                "WHERE llm_usage_reason = 'lookup';"
+            ),
+            reverse_sql=("DROP INDEX CONCURRENTLY IF EXISTS idx_usage_lookup_recent;"),
+            state_operations=[
+                migrations.AddIndex(
+                    model_name="usage",
+                    index=models.Index(
+                        fields=["organization", "-created_at"],
+                        name="idx_usage_lookup_recent",
+                        condition=Q(llm_usage_reason="lookup"),
+                    ),
+                ),
+            ],
+        ),
     ]
diff --git a/backend/usage_v2/models.py b/backend/usage_v2/models.py
index b1ff6a297b..0267d4a68f 100644
--- a/backend/usage_v2/models.py
+++ b/backend/usage_v2/models.py
@@ -1,6 +1,7 @@
 import uuid
 
 from django.db import models
+from django.db.models import Q
 from utils.models.base_model import BaseModel, BaseModelManager
 from utils.models.organization_mixin import (
     DefaultOrganizationManagerMixin,
@@ -130,4 +131,9 @@ class Meta:
                 fields=["prompt_id", "-created_at"],
                 name="idx_usage_prompt_created",
             ),
+            models.Index(
+                fields=["organization", "-created_at"],
+                name="idx_usage_lookup_recent",
+                condition=Q(llm_usage_reason="lookup"),
+            ),
         ]

From a4969ffecd5919a602f4753463f4637f9d4e4b92 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Fri, 8 May 2026 17:21:34 +0530
Subject: [PATCH 55/57] UN-3494 [FIX] Forward answer-step metadata in structure
 pipeline
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The SP cloud plugin returns its usage_records via ExecutionResult.metadata;
the non-SP path recovers them via self._usage_records in
LegacyExecutor.execute(). _handle_structure_pipeline only honoured the
second carrier — every SP-mode API deployment lost its extraction +
lookup billing rows silently because tasks.py guards the flush behind
``if usage_records:`` and the empty list short-circuits the post.

Forwarding answer_result.metadata closes the gap. Surface drift here
deserves a follow-up to consolidate to a single carrier; tracked
separately.
---
 workers/executor/executors/legacy_executor.py | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index afa33b7c00..795cbfe27e 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -665,7 +665,13 @@ def _handle_structure_pipeline(self, context: ExecutionContext) -> ExecutionResu
         )
 
         shim.stream_log("Pipeline completed successfully")
-        return ExecutionResult(success=True, data=structured_output)
+        # SP plugin returns usage_records via metadata; non-SP recovers
+        # them via self._usage_records in execute(). Forward either way.
+        return ExecutionResult(
+            success=True,
+            data=structured_output,
+            metadata=answer_result.metadata or {},
+        )
 
     def _run_pipeline_answer_step(
         self,

From c53c51d260d761f56ea800cd1dcff36795e8220f Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Fri, 8 May 2026 19:53:53 +0530
Subject: [PATCH 56/57] UN-3494 [REFACTOR] Unify usage-records carrier and
 propagate execution_id
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Collapses the dual-carrier pattern in the executor worker so every
handler returns its rows via ExecutionResult.metadata["usage_records"].
LegacyExecutor's instance attribute and recovery hook are removed; each
helper returns its records, orchestrators absorb child metadata into a
single list, and partial rows survive a mid-pipeline failure via
LegacyExecutorError.partial_usage_records. tasks.py now logs an INFO
line when an LLM-bearing op succeeds with zero rows so future drift
surfaces immediately.

Also fixes the long-standing dispatcher gap where structure_tool_task
omitted execution_id and file_execution_id when constructing
ExecutionContext for structure_pipeline / table_extract. The fields were
only stuffed inside executor_params, so context.execution_id was None
for every downstream handler. The legacy answer-prompt handler dug into
executor_params and worked, but the SP plugin and summarize handlers
fell back to "" — and the dashboard's classifier mapped an empty
execution_id to the IDE bucket. Setting the dataclass field at dispatch
plus reading context.execution_id in _handle_summarize lets workflow
rows classify as WF/API.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 workers/executor/executors/exceptions.py      |  13 +-
 workers/executor/executors/legacy_executor.py | 452 +++++++++++-------
 workers/executor/tasks.py                     |  18 +
 .../file_processing/structure_tool_task.py    |   4 +
 4 files changed, 299 insertions(+), 188 deletions(-)

diff --git a/workers/executor/executors/exceptions.py b/workers/executor/executors/exceptions.py
index 69cd0a8a16..d73c56d970 100644
--- a/workers/executor/executors/exceptions.py
+++ b/workers/executor/executors/exceptions.py
@@ -9,18 +9,25 @@ class is replaced with ``LegacyExecutorError`` so these exceptions
 class LegacyExecutorError(Exception):
     """Base exception for legacy executor errors.
 
-    Replaces Flask's ``APIError`` — carries ``message`` and ``code``
-    attributes so callers can map to ``ExecutionResult.failure()``.
+    ``partial_usage_records`` lets each layer that catches this error
+    prepend its in-flight records before re-raising, so rows already
+    paid for survive a mid-pipeline failure.
     """
 
     code: int = 500
     message: str = "Internal executor error"
 
-    def __init__(self, message: str | None = None, code: int | None = None):
+    def __init__(
+        self,
+        message: str | None = None,
+        code: int | None = None,
+        partial_usage_records: list[dict] | None = None,
+    ):
         if message is not None:
             self.message = message
         if code is not None:
             self.code = code
+        self.partial_usage_records: list[dict] = list(partial_usage_records or [])
         super().__init__(self.message)
 
 
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 795cbfe27e..773684aa07 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -62,14 +62,12 @@ class LegacyExecutor(BaseExecutor):
     }
 
     def __init__(self) -> None:
-        # Per-request state, overwritten in execute(). Seed _usage_records here
-        # so an early-init crash still exposes a real list to the orchestrator.
+        # Per-request state, overwritten in execute().
         self._log_events_id: str = ""
         self._log_component: dict[str, str] = {}
         self._execution_id: str | None = None
         self._file_execution_id: str | None = None
         self._organization_id: str | None = None
-        self._usage_records: list[dict[str, Any]] = []
 
     @property
     def name(self) -> str:
@@ -91,7 +89,6 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
         self._log_component: dict[str, str] = (
             getattr(context, "_log_component", None) or {}
         )
-        self._usage_records = []
         self._execution_id = context.execution_id
         self._file_execution_id = context.file_execution_id
         self._organization_id = context.organization_id
@@ -133,11 +130,6 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
                 context.run_id,
                 result.success,
             )
-            # Attach collected usage records to the result metadata
-            if self._usage_records:
-                result.metadata.setdefault("usage_records", []).extend(
-                    self._usage_records
-                )
             return result
         except LegacyExecutorError as exc:
             elapsed = time.monotonic() - start
@@ -164,12 +156,11 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
                         context.run_id,
                         exc_info=True,
                     )
-            # Preserve any usage rows collected before the failure so the task
-            # wrapper still flushes them. Without this, transient errors that
-            # trigger Celery autoretry re-run LLMs and lose billing rows.
+            # Handlers attach partial records to the exception so a
+            # mid-pipeline failure still flushes rows already paid for.
             failure_metadata: dict[str, Any] = {}
-            if self._usage_records:
-                failure_metadata["usage_records"] = list(self._usage_records)
+            if exc.partial_usage_records:
+                failure_metadata["usage_records"] = list(exc.partial_usage_records)
             return ExecutionResult.failure(error=exc.message, metadata=failure_metadata)
 
     def _build_shim(
@@ -371,12 +362,10 @@ def _get_indexing_deps():
 
     def _run_summarize_step(
         self, summarize_params: dict, context: ExecutionContext
-    ) -> ExecutionResult | None:
+    ) -> ExecutionResult:
         """Run summarization if not already cached.
 
-        Returns:
-            ``None`` on success (summary written or cached), or an
-            ``ExecutionResult`` failure to propagate to the caller.
+        Cache hit returns success with empty metadata (no LLM call).
         """
         extract_file_path = summarize_params.get("extract_file_path", "")
         summarize_file_path = summarize_params.get("summarize_file_path", "")
@@ -391,7 +380,7 @@ def _run_summarize_step(
         if fs.exists(summarize_file_path):
             existing = fs.read(path=summarize_file_path, mode="r")
             if existing:
-                return None
+                return ExecutionResult(success=True, data={})
 
         doc_context = fs.read(path=extract_file_path, mode="r")
         if not doc_context:
@@ -428,7 +417,9 @@ def _run_summarize_step(
             mode="w",
             data=summarize_result.data.get("data", ""),
         )
-        return None
+        return ExecutionResult(
+            success=True, data={}, metadata=dict(summarize_result.metadata or {})
+        )
 
     # ------------------------------------------------------------------
     # Phase 5C — Compound IDE index handler (extract + index)
@@ -465,60 +456,81 @@ def _handle_ide_index(self, context: ExecutionContext) -> ExecutionResult:
                 error=f"ide_index missing required params: {', '.join(missing)}"
             )
 
-        # Step 1: Extract (or reuse pre-extracted text on marker hit)
-        pre_extracted_text = index_params.get(IKeys.EXTRACTED_TEXT, "") or ""
-        if pre_extracted_text:
-            logger.info(
-                "ide_index: marker hit, skipping extract step (len=%d, run_id=%s)",
-                len(pre_extracted_text),
-                context.run_id,
-            )
-            extracted_text = pre_extracted_text
-        else:
-            extract_ctx = ExecutionContext(
+        # Aggregated across child steps so the caller sees one list.
+        ide_records: list[dict[str, Any]] = []
+
+        def _absorb(child: ExecutionResult) -> None:
+            child_records = (child.metadata or {}).get("usage_records") or []
+            if child_records:
+                ide_records.extend(child_records)
+
+        def _failure(child: ExecutionResult) -> ExecutionResult:
+            metadata = dict(child.metadata or {})
+            existing = metadata.get("usage_records") or []
+            metadata["usage_records"] = ide_records + list(existing)
+            return ExecutionResult.failure(error=child.error, metadata=metadata)
+
+        try:
+            # Step 1: Extract (or reuse pre-extracted text on marker hit)
+            pre_extracted_text = index_params.get(IKeys.EXTRACTED_TEXT, "") or ""
+            if pre_extracted_text:
+                logger.info(
+                    "ide_index: marker hit, skipping extract step (len=%d, run_id=%s)",
+                    len(pre_extracted_text),
+                    context.run_id,
+                )
+                extracted_text = pre_extracted_text
+            else:
+                extract_ctx = ExecutionContext(
+                    executor_name=context.executor_name,
+                    operation=Operation.EXTRACT.value,
+                    run_id=context.run_id,
+                    execution_source=context.execution_source,
+                    organization_id=context.organization_id,
+                    executor_params=extract_params,
+                    request_id=context.request_id,
+                    log_events_id=context.log_events_id,
+                    execution_id=context.execution_id,
+                    file_execution_id=context.file_execution_id,
+                )
+                extract_result = self._handle_extract(extract_ctx)
+                if not extract_result.success:
+                    return _failure(extract_result)
+                _absorb(extract_result)
+                extracted_text = extract_result.data.get(IKeys.EXTRACTED_TEXT, "")
+
+            # Step 2: Optional summarize
+            summarize_params = params.get("summarize_params")
+            summarize_file_path = ""
+            if summarize_params:
+                summarize_file_path = summarize_params.get("summarize_file_path", "")
+                summarize_result = self._run_summarize_step(summarize_params, context)
+                if not summarize_result.success:
+                    return _failure(summarize_result)
+                _absorb(summarize_result)
+
+            # Step 3: Index — inject extracted text
+            index_params[IKeys.EXTRACTED_TEXT] = extracted_text
+
+            index_ctx = ExecutionContext(
                 executor_name=context.executor_name,
-                operation=Operation.EXTRACT.value,
+                operation=Operation.INDEX.value,
                 run_id=context.run_id,
                 execution_source=context.execution_source,
                 organization_id=context.organization_id,
-                executor_params=extract_params,
+                executor_params=index_params,
                 request_id=context.request_id,
                 log_events_id=context.log_events_id,
                 execution_id=context.execution_id,
                 file_execution_id=context.file_execution_id,
             )
-            extract_result = self._handle_extract(extract_ctx)
-            if not extract_result.success:
-                return extract_result
-            extracted_text = extract_result.data.get(IKeys.EXTRACTED_TEXT, "")
-
-        # Step 2: Optional summarize
-        summarize_params = params.get("summarize_params")
-        summarize_file_path = ""
-        if summarize_params:
-            summarize_file_path = summarize_params.get("summarize_file_path", "")
-            result = self._run_summarize_step(summarize_params, context)
-            if result is not None:
-                return result
-
-        # Step 3: Index — inject extracted text
-        index_params[IKeys.EXTRACTED_TEXT] = extracted_text
-
-        index_ctx = ExecutionContext(
-            executor_name=context.executor_name,
-            operation=Operation.INDEX.value,
-            run_id=context.run_id,
-            execution_source=context.execution_source,
-            organization_id=context.organization_id,
-            executor_params=index_params,
-            request_id=context.request_id,
-            log_events_id=context.log_events_id,
-            execution_id=context.execution_id,
-            file_execution_id=context.file_execution_id,
-        )
-        index_result = self._handle_index(index_ctx)
-        if not index_result.success:
-            return index_result
+            index_result = self._handle_index(index_ctx)
+            if not index_result.success:
+                return _failure(index_result)
+            _absorb(index_result)
+        except LegacyExecutorError as e:
+            e.partial_usage_records = ide_records + e.partial_usage_records
+            raise
 
         return ExecutionResult(
             success=True,
@@ -526,6 +538,7 @@ def _handle_ide_index(self, context: ExecutionContext) -> ExecutionResult:
                 IKeys.DOC_ID: index_result.data.get(IKeys.DOC_ID, ""),
                 "summarize_file_path": summarize_file_path,
             },
+            metadata={"usage_records": ide_records},
         )
 
     # ------------------------------------------------------------------
@@ -579,81 +592,101 @@ def _handle_structure_pipeline(self, context: ExecutionContext) -> ExecutionResu
 
         extracted_text = ""
         index_metrics: dict = {}
+        # Aggregated across child steps so the caller sees one list.
+        pipeline_records: list[dict[str, Any]] = []
+
+        def _absorb(child_result: ExecutionResult) -> None:
+            child_records = (child_result.metadata or {}).get("usage_records") or []
+            if child_records:
+                pipeline_records.extend(child_records)
+
+        def _failure(child_result: ExecutionResult) -> ExecutionResult:
+            metadata = dict(child_result.metadata or {})
+            existing = metadata.get("usage_records") or []
+            metadata["usage_records"] = pipeline_records + list(existing)
+            return ExecutionResult.failure(error=child_result.error, metadata=metadata)
 
         shim = self._build_shim(
             platform_api_key=extract_params.get("platform_api_key", ""),
         )
         step = 1
 
-        # ---- Step 1: Extract ----
-        if not skip_extraction:
-            shim.stream_log(f"Pipeline step {step}: Extracting text from document...")
-            step += 1
-            extract_ctx = ExecutionContext(
-                executor_name=context.executor_name,
-                operation=Operation.EXTRACT.value,
-                run_id=context.run_id,
-                execution_source=context.execution_source,
-                organization_id=context.organization_id,
-                executor_params=extract_params,
-                request_id=context.request_id,
-                log_events_id=context.log_events_id,
-                execution_id=context.execution_id,
-                file_execution_id=context.file_execution_id,
-            )
-            extract_result = self._handle_extract(extract_ctx)
-            if not extract_result.success:
-                return extract_result
-            extracted_text = extract_result.data.get(IKeys.EXTRACTED_TEXT, "")
-
-        # ---- Step 2: Summarize (if enabled) ----
-        if is_summarization:
-            shim.stream_log(f"Pipeline step {step}: Summarizing extracted text...")
-            step += 1
-            summarize_result = self._run_pipeline_summarize(
-                context=context,
-                summarize_params=summarize_params or {},
-                answer_params=answer_params,
-            )
-            if not summarize_result.success:
-                return summarize_result
-            # answer_params file_path/hash updated in-place by helper
-        elif skip_extraction:
-            # Smart table: use original source file
-            answer_params["file_path"] = input_file_path
-        elif not is_single_pass:
-            # ---- Step 3: Index per output with dedup ----
-            shim.stream_log(
-                f"Pipeline step {step}: Indexing document into vector store..."
-            )
-            step += 1
-            index_metrics = self._run_pipeline_index(
-                context=context,
-                index_template=index_template,
-                answer_params=answer_params,
-                extracted_text=extracted_text,
-                usage_kwargs=extract_params.get("usage_kwargs", {}),
-            )
+        try:
+            # ---- Step 1: Extract ----
+            if not skip_extraction:
+                shim.stream_log(f"Pipeline step {step}: Extracting text from document...")
+                step += 1
+                extract_ctx = ExecutionContext(
+                    executor_name=context.executor_name,
+                    operation=Operation.EXTRACT.value,
+                    run_id=context.run_id,
+                    execution_source=context.execution_source,
+                    organization_id=context.organization_id,
+                    executor_params=extract_params,
+                    request_id=context.request_id,
+                    log_events_id=context.log_events_id,
+                    execution_id=context.execution_id,
+                    file_execution_id=context.file_execution_id,
+                )
+                extract_result = self._handle_extract(extract_ctx)
+                if not extract_result.success:
+                    return _failure(extract_result)
+                _absorb(extract_result)
+                extracted_text = extract_result.data.get(IKeys.EXTRACTED_TEXT, "")
+
+            # ---- Step 2: Summarize (if enabled) ----
+            if is_summarization:
+                shim.stream_log(f"Pipeline step {step}: Summarizing extracted text...")
+                step += 1
+                summarize_result = self._run_pipeline_summarize(
+                    context=context,
+                    summarize_params=summarize_params or {},
+                    answer_params=answer_params,
+                )
+                if not summarize_result.success:
+                    return _failure(summarize_result)
+                _absorb(summarize_result)
+                # answer_params file_path/hash updated in-place by helper
+            elif skip_extraction:
+                # Smart table: use original source file
+                answer_params["file_path"] = input_file_path
+            elif not is_single_pass:
+                # ---- Step 3: Index per output with dedup ----
+                shim.stream_log(
+                    f"Pipeline step {step}: Indexing document into vector store..."
+                )
+                step += 1
+                index_metrics = self._run_pipeline_index(
+                    context=context,
+                    index_template=index_template,
+                    answer_params=answer_params,
+                    extracted_text=extracted_text,
+                    usage_kwargs=extract_params.get("usage_kwargs", {}),
+                )
 
-        # ---- Step 4: Table settings injection ----
-        if not is_single_pass:
-            self._inject_table_settings(
+            # ---- Step 4: Table settings injection ----
+            if not is_single_pass:
+                self._inject_table_settings(
+                    answer_params=answer_params,
+                    index_template=index_template,
+                    skip_extraction=skip_extraction,
+                    input_file_path=input_file_path,
+                )
+
+            # ---- Step 5: Answer prompt / Single pass ----
+            answer_result = self._run_pipeline_answer_step(
+                context=context,
                 answer_params=answer_params,
-                index_template=index_template,
-                skip_extraction=skip_extraction,
-                input_file_path=input_file_path,
+                is_single_pass=is_single_pass,
+                shim=shim,
+                step=step,
             )
-
-        # ---- Step 5: Answer prompt / Single pass ----
-        answer_result = self._run_pipeline_answer_step(
-            context=context,
-            answer_params=answer_params,
-            is_single_pass=is_single_pass,
-            shim=shim,
-            step=step,
-        )
-        if not answer_result.success:
-            return answer_result
+            if not answer_result.success:
+                return _failure(answer_result)
+            _absorb(answer_result)
+        except LegacyExecutorError as e:
+            e.partial_usage_records = pipeline_records + e.partial_usage_records
+            raise
 
         # ---- Step 6: Merge results ----
         structured_output = answer_result.data
@@ -665,12 +698,17 @@ def _handle_structure_pipeline(self, context: ExecutionContext) -> ExecutionResu
         )
 
         shim.stream_log("Pipeline completed successfully")
-        # SP plugin returns usage_records via metadata; non-SP recovers
-        # them via self._usage_records in execute(). Forward either way.
+        # Forward non-usage_records metadata keys as-is.
+        out_metadata = {
+            k: v
+            for k, v in (answer_result.metadata or {}).items()
+            if k != "usage_records"
+        }
+        out_metadata["usage_records"] = pipeline_records
         return ExecutionResult(
             success=True,
             data=structured_output,
-            metadata=answer_result.metadata or {},
+            metadata=out_metadata,
         )
 
     def _run_pipeline_answer_step(
@@ -834,13 +872,17 @@ def _run_pipeline_summarize(
                 mode="w",
                 data=summarized_context,
             )
+            forward_metadata = dict(summarize_result.metadata or {})
+        else:
+            # Cache hit: no LLM call.
+            forward_metadata = {}
 
         # Update answer_params
         summarize_file_hash = fs.get_hash_from_file(path=summarize_file_path)
         answer_params["file_hash"] = summarize_file_hash
         answer_params["file_path"] = str(summarize_file_path)
 
-        return ExecutionResult(success=True, data={})
+        return ExecutionResult(success=True, data={}, metadata=forward_metadata)
 
     def _run_pipeline_index(
         self,
@@ -1334,19 +1376,26 @@ def _handle_answer_prompt(self, context: ExecutionContext) -> ExecutionResult:
             embedding_compat_cls,
             vector_db_cls,
         )
-        for output in prompts:
-            self._execute_single_prompt(
-                output=output,
-                context=context,
-                structured_output=structured_output,
-                metadata=metadata,
-                metrics=metrics,
-                variable_names=variable_names,
-                context_retrieval_metrics=context_retrieval_metrics,
-                deps=_deps,
-                tool_settings=tool_settings,
-                process_text_fn=process_text_fn,
-            )
+        usage_records: list[dict[str, Any]] = []
+        try:
+            for output in prompts:
+                usage_records.extend(
+                    self._execute_single_prompt(
+                        output=output,
+                        context=context,
+                        structured_output=structured_output,
+                        metadata=metadata,
+                        metrics=metrics,
+                        variable_names=variable_names,
+                        context_retrieval_metrics=context_retrieval_metrics,
+                        deps=_deps,
+                        tool_settings=tool_settings,
+                        process_text_fn=process_text_fn,
+                    )
+                )
+        except LegacyExecutorError as e:
+            e.partial_usage_records = usage_records + e.partial_usage_records
+            raise
 
         pipeline_shim.stream_log(f"All {len(prompts)} prompts processed successfully")
         logger.info(
@@ -1366,6 +1415,7 @@ def _handle_answer_prompt(self, context: ExecutionContext) -> ExecutionResult:
                 PSKeys.METADATA: metadata,
                 PSKeys.METRICS: metrics,
             },
+            metadata={"usage_records": usage_records},
         )
 
     @staticmethod
@@ -1422,19 +1472,19 @@ def _run_challenge_if_enabled(
         metadata: dict[str, Any],
         shim: Any,
         prompt_name: str,
-    ) -> None:
-        """Run challenge verification plugin if enabled and available."""
+    ) -> list[dict[str, Any]]:
+        """Run the challenge plugin if enabled. Returns its usage rows."""
         from executor.executors.constants import PromptServiceConstants as PSKeys
         from executor.executors.plugins import ExecutorPluginLoader
 
         if not tool_settings.get(PSKeys.ENABLE_CHALLENGE):
-            return
+            return []
         challenge_cls = ExecutorPluginLoader.get("challenge")
         if not challenge_cls:
-            return
+            return []
         challenge_llm_id = tool_settings.get(PSKeys.CHALLENGE_LLM)
         if not challenge_llm_id:
-            return
+            return []
         shim.stream_log(f"Running challenge for: `{prompt_name}`")
         challenge_llm = llm_cls(
             adapter_instance_id=challenge_llm_id,
@@ -1455,12 +1505,16 @@ def _run_challenge_if_enabled(
         )
         try:
             challenger.run()
-        finally:
-            # Flush even on exception so transient errors don't drop the
-            # challenge LLM's billing rows.
-            self._usage_records.extend(challenge_llm.flush_pending_usage())
+        except LegacyExecutorError as e:
+            # Flush before bubbling so partial rows survive.
+            e.partial_usage_records = (
+                list(challenge_llm.flush_pending_usage()) + e.partial_usage_records
+            )
+            raise
+        records = list(challenge_llm.flush_pending_usage())
         shim.stream_log(f"Challenge verification completed for: `{prompt_name}`")
         logger.info("Challenge completed: prompt=%s", prompt_name)
+        return records
 
     @staticmethod
     def _run_evaluation_if_enabled(
@@ -1506,8 +1560,8 @@ def _execute_single_prompt(
         deps: tuple,
         tool_settings: dict[str, Any],
         process_text_fn: Any,
-    ) -> None:
-        """Execute one prompt: variable replacement, retrieval, LLM, post-process."""
+    ) -> list[dict[str, Any]]:
+        """Run one prompt end-to-end; return its usage rows."""
         from executor.executors.constants import PromptServiceConstants as PSKeys
         from executor.executors.constants import RetrievalStrategy
 
@@ -1598,7 +1652,7 @@ def _execute_single_prompt(
                 prompt_name=prompt_name,
                 shim=shim,
             )
-            return
+            return []
 
         if output.get(PSKeys.TYPE) == PSKeys.LINE_ITEM:
             self._run_line_item_extraction(
@@ -1620,7 +1674,7 @@ def _execute_single_prompt(
                 },
                 shim=shim,
             )
-            return
+            return []
 
         usage_kwargs = {"run_id": run_id, "execution_id": execution_id}
         llm, embedding, vector_db = self._init_llm_and_retrieval(
@@ -1635,6 +1689,7 @@ def _execute_single_prompt(
         )
 
         context_list: list[str] = []
+        records: list[dict[str, Any]] = []
         try:
             answer = "NA"
             retrieval_strategy = output.get(PSKeys.RETRIEVAL_STRATEGY)
@@ -1706,7 +1761,7 @@ def _execute_single_prompt(
             )
             shim.stream_log(f"Applied type conversion for: `{prompt_name}`")
 
-            self._usage_records.extend(
+            records.extend(
                 run_lookup_enrichment(
                     output=output,
                     structured_output=structured_output,
@@ -1724,19 +1779,21 @@ def _execute_single_prompt(
                 shim=shim,
             )
 
-            self._run_challenge_if_enabled(
-                tool_settings=tool_settings,
-                output=output,
-                structured_output=structured_output,
-                context_list=context_list,
-                llm=llm,
-                llm_cls=llm_cls,
-                usage_kwargs=usage_kwargs,
-                run_id=run_id,
-                platform_api_key=platform_api_key,
-                metadata=metadata,
-                shim=shim,
-                prompt_name=prompt_name,
+            records.extend(
+                self._run_challenge_if_enabled(
+                    tool_settings=tool_settings,
+                    output=output,
+                    structured_output=structured_output,
+                    context_list=context_list,
+                    llm=llm,
+                    llm_cls=llm_cls,
+                    usage_kwargs=usage_kwargs,
+                    run_id=run_id,
+                    platform_api_key=platform_api_key,
+                    metadata=metadata,
+                    shim=shim,
+                    prompt_name=prompt_name,
+                )
             )
             self._run_evaluation_if_enabled(
                 output=output,
@@ -1751,7 +1808,20 @@ def _execute_single_prompt(
             val = structured_output.get(prompt_name)
             if isinstance(val, str):
                 structured_output[prompt_name] = val.rstrip("\n")
-        finally:
+        except LegacyExecutorError as e:
+            # Flush before bubbling so partial rows survive.
+            flushed = self._flush_per_prompt_metrics(
+                metrics=metrics,
+                context_retrieval_metrics=context_retrieval_metrics,
+                prompt_name=prompt_name,
+                llm=llm,
+                embedding=embedding,
+                vector_db=vector_db,
+                chunk_size=chunk_size,
+            )
+            e.partial_usage_records = records + flushed + e.partial_usage_records
+            raise
+        records.extend(
             self._flush_per_prompt_metrics(
                 metrics=metrics,
                 context_retrieval_metrics=context_retrieval_metrics,
@@ -1761,6 +1831,8 @@ def _execute_single_prompt(
                 vector_db=vector_db,
                 chunk_size=chunk_size,
             )
+        )
+        return records
 
     def _init_llm_and_retrieval(
         self,
@@ -1815,14 +1887,15 @@ def _flush_per_prompt_metrics(
         embedding: Any,
         vector_db: Any,
         chunk_size: int,
-    ) -> None:
+    ) -> list[dict[str, Any]]:
+        """Flush LLM + embedding usage rows and return them."""
         metrics.setdefault(prompt_name, {}).update(
             {
                 "context_retrieval": context_retrieval_metrics.get(prompt_name, {}),
                 f"{llm.get_usage_reason()}_llm": llm.get_metrics(),
             }
         )
-        self._usage_records.extend(llm.flush_pending_usage())
+        records: list[dict[str, Any]] = list(llm.flush_pending_usage())
         # Public adapters skip the callback_manager, so there's nothing to flush.
         if chunk_size > 0 and embedding is not None and embedding.callback_manager:
             for handler in embedding.callback_manager.handlers:
@@ -1830,7 +1903,7 @@ def _flush_per_prompt_metrics(
                     continue
                 # Per-handler guard so one bad handler doesn't drop the rest.
                 try:
-                    self._usage_records.extend(handler.flush_pending_usage())
+                    records.extend(handler.flush_pending_usage())
                 except Exception:
                     logger.warning(
                         "Failed to flush usage from embedding handler %s",
@@ -1839,6 +1912,7 @@ def _flush_per_prompt_metrics(
                     )
         if vector_db:
             vector_db.close()
+        return records
 
     def _run_table_extraction(
         self,
@@ -2197,14 +2271,17 @@ def _handle_summarize(self, context: ExecutionContext) -> ExecutionResult:
         )
 
         shim = self._build_shim(platform_api_key=platform_api_key)
+        # ``execution_id`` drives Usage-row classification on the dashboard.
         usage_kwargs = {
             "run_id": context.run_id,
+            "execution_id": context.execution_id or "",
             PSKeys.LLM_USAGE_REASON: PSKeys.SUMMARIZE,
         }
 
         _, _, _, _, llm_cls, _, _ = self._get_prompt_deps()
 
         shim.stream_log("Initializing LLM for summarization...")
+        llm: Any = None
         try:
             llm = llm_cls(
                 adapter_instance_id=llm_adapter_id,
@@ -2216,22 +2293,27 @@ def _handle_summarize(self, context: ExecutionContext) -> ExecutionResult:
             )
 
             shim.stream_log("Running document summarization...")
-            try:
-                summary = answer_prompt_svc.run_completion(llm=llm, prompt=prompt)
-            finally:
-                # Flush even on exception so the summarization LLM's
-                # billing rows aren't lost on transient errors.
-                self._usage_records.extend(llm.flush_pending_usage())
+            summary = answer_prompt_svc.run_completion(llm=llm, prompt=prompt)
+            records = list(llm.flush_pending_usage())
             logger.info("Summarization completed: run_id=%s", context.run_id)
             shim.stream_log("Summarization completed")
             return ExecutionResult(
                 success=True,
                 data={"data": summary},
+                metadata={"usage_records": records},
             )
         except Exception as e:
+            # Flush before re-raising so partial rows survive.
+            partial: list[dict] = []
+            if llm is not None:
+                try:
+                    partial = list(llm.flush_pending_usage())
+                except Exception:
+                    logger.debug("flush_pending_usage failed during error path")
             logger.error("Summarization failed: error=%s", str(e))
             status_code = getattr(e, "status_code", None) or 500
             raise LegacyExecutorError(
                 message=f"Error during summarization: {e}",
                 code=status_code,
+                partial_usage_records=partial,
             ) from e
diff --git a/workers/executor/tasks.py b/workers/executor/tasks.py
index 49fbfe8746..dc817dc099 100644
--- a/workers/executor/tasks.py
+++ b/workers/executor/tasks.py
@@ -17,6 +17,16 @@
 
 logger = WorkerLogger.get_logger(__name__)
 
+# Operations that always make LLM calls; used by the empty-records guard.
+_LLM_BEARING_OPS = frozenset(
+    {
+        "answer_prompt",
+        "single_pass_extraction",
+        "summarize",
+        "structure_pipeline",
+    }
+)
+
 
 @shared_task(
     bind=True,
@@ -128,6 +138,14 @@ def execute_extraction(self, execution_context_dict: dict) -> dict:
                 context.organization_id,
                 exc_info=True,
             )
+    elif result.success and context.operation in _LLM_BEARING_OPS:
+        logger.info(
+            "No usage_records emitted for op=%s run_id=%s organization_id=%s "
+            "(unexpected for an LLM-bearing operation)",
+            context.operation,
+            context.run_id,
+            context.organization_id,
+        )
 
     logger.info(
         "execute_extraction complete: celery_task_id=%s request_id=%s success=%s",
diff --git a/workers/file_processing/structure_tool_task.py b/workers/file_processing/structure_tool_task.py
index c0fdee1c00..502e48ff32 100644
--- a/workers/file_processing/structure_tool_task.py
+++ b/workers/file_processing/structure_tool_task.py
@@ -459,6 +459,8 @@ def _execute_structure_tool_impl(params: dict) -> dict:
             execution_source="tool",
             organization_id=organization_id,
             request_id=file_execution_id,
+            execution_id=execution_id,
+            file_execution_id=file_execution_id,
             executor_params=agentic_params,
         )
         at_result = dispatcher.dispatch(at_ctx, timeout=EXECUTOR_TIMEOUT)
@@ -488,6 +490,8 @@ def _execute_structure_tool_impl(params: dict) -> dict:
             execution_source="tool",
             organization_id=organization_id,
             request_id=file_execution_id,
+            execution_id=execution_id,
+            file_execution_id=file_execution_id,
             executor_params={
                 "extract_params": extract_params,
                 "index_template": index_template,

From ff85c38b84782ba5aee5000512977f066f656ae9 Mon Sep 17 00:00:00 2001
From: Chandrasekharan M <chandrasekharan@zipstack.com>
Date: Mon, 11 May 2026 11:06:16 +0530
Subject: [PATCH 57/57] UN-3494 [REVIEW] Trim verbose code comments

Drop WHAT-comments, references to PR/conversation context, and
multi-line explanations that didn't add WHY. Comments now describe
behavior generically so they make sense without prior context.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 workers/executor/executors/exceptions.py      |  4 +---
 workers/executor/executors/legacy_executor.py | 10 ++--------
 workers/executor/tasks.py                     |  9 ++-------
 3 files changed, 5 insertions(+), 18 deletions(-)

diff --git a/workers/executor/executors/exceptions.py b/workers/executor/executors/exceptions.py
index d73c56d970..3db8358827 100644
--- a/workers/executor/executors/exceptions.py
+++ b/workers/executor/executors/exceptions.py
@@ -9,9 +9,7 @@ class is replaced with ``LegacyExecutorError`` so these exceptions
 class LegacyExecutorError(Exception):
     """Base exception for legacy executor errors.
 
-    ``partial_usage_records`` lets each layer that catches this error
-    prepend its in-flight records before re-raising, so rows already
-    paid for survive a mid-pipeline failure.
+    ``partial_usage_records`` preserves billing rows across mid-pipeline failures.
     """
 
     code: int = 500
diff --git a/workers/executor/executors/legacy_executor.py b/workers/executor/executors/legacy_executor.py
index 773684aa07..0ddb29e261 100644
--- a/workers/executor/executors/legacy_executor.py
+++ b/workers/executor/executors/legacy_executor.py
@@ -62,7 +62,6 @@ class LegacyExecutor(BaseExecutor):
     }
 
     def __init__(self) -> None:
-        # Per-request state, overwritten in execute().
         self._log_events_id: str = ""
         self._log_component: dict[str, str] = {}
         self._execution_id: str | None = None
@@ -156,8 +155,7 @@ def execute(self, context: ExecutionContext) -> ExecutionResult:
                         context.run_id,
                         exc_info=True,
                     )
-            # Handlers attach partial records to the exception so a
-            # mid-pipeline failure still flushes rows already paid for.
+            # Preserve partial usage rows from a mid-pipeline failure.
             failure_metadata: dict[str, Any] = {}
             if exc.partial_usage_records:
                 failure_metadata["usage_records"] = list(exc.partial_usage_records)
@@ -456,7 +454,6 @@ def _handle_ide_index(self, context: ExecutionContext) -> ExecutionResult:
                 error=f"ide_index missing required params: {', '.join(missing)}"
             )
 
-        # Aggregated across child steps so the caller sees one list.
         ide_records: list[dict[str, Any]] = []
 
         def _absorb(child: ExecutionResult) -> None:
@@ -592,7 +589,6 @@ def _handle_structure_pipeline(self, context: ExecutionContext) -> ExecutionResu
 
         extracted_text = ""
         index_metrics: dict = {}
-        # Aggregated across child steps so the caller sees one list.
         pipeline_records: list[dict[str, Any]] = []
 
         def _absorb(child_result: ExecutionResult) -> None:
@@ -698,7 +694,6 @@ def _failure(child_result: ExecutionResult) -> ExecutionResult:
         )
 
         shim.stream_log("Pipeline completed successfully")
-        # Forward non-usage_records metadata keys as-is.
         out_metadata = {
             k: v
             for k, v in (answer_result.metadata or {}).items()
@@ -874,7 +869,6 @@ def _run_pipeline_summarize(
             )
             forward_metadata = dict(summarize_result.metadata or {})
         else:
-            # Cache hit: no LLM call.
             forward_metadata = {}
 
         # Update answer_params
@@ -2271,7 +2265,7 @@ def _handle_summarize(self, context: ExecutionContext) -> ExecutionResult:
         )
 
         shim = self._build_shim(platform_api_key=platform_api_key)
-        # ``execution_id`` drives Usage-row classification on the dashboard.
+        # execution_id drives usage-row classification; "" is sent when it is unset.
         usage_kwargs = {
             "run_id": context.run_id,
             "execution_id": context.execution_id or "",
diff --git a/workers/executor/tasks.py b/workers/executor/tasks.py
index dc817dc099..a30243bca3 100644
--- a/workers/executor/tasks.py
+++ b/workers/executor/tasks.py
@@ -17,7 +17,6 @@
 
 logger = WorkerLogger.get_logger(__name__)
 
-# Operations that always make LLM calls; used by the empty-records guard.
 _LLM_BEARING_OPS = frozenset(
     {
         "answer_prompt",
@@ -109,20 +108,16 @@ def execute_extraction(self, execution_context_dict: dict) -> dict:
     orchestrator = ExecutionOrchestrator()
     result = orchestrator.execute(context)
 
-    # Batch write usage records collected during execution
     usage_records = result.metadata.get("usage_records", [])
     if usage_records:
         try:
             config = WorkerConfig()
             with UsageAPIClient(config) as usage_client:
-                # ``set_organization_context`` covers the org for every
-                # request on this client; passing it again as a kwarg was
-                # redundant.
+                # Org context is set on the client; no need to pass it per call.
                 usage_client.set_organization_context(context.organization_id)
                 ok = usage_client.bulk_create_usage(usage_records)
             if not ok:
-                # Promote to ERROR so on-call has the run_id/org/count to
-                # recover dropped billing rows from logs.
+                # ERROR severity so dropped billing rows are recoverable from logs.
                 logger.error(
                     "bulk_create_usage returned failure for %d records "
                     "(run_id=%s organization_id=%s)",