Open-Source-Legal
diff --git a/‎CHANGELOG.md‎
Lines changed: 1 addition & 0 deletions b/‎CHANGELOG.md‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎compose/local/django/celery/worker/start‎
100644100755
Lines changed: 1 addition & 1 deletion b/‎compose/local/django/celery/worker/start‎
100644100755
Lines changed: 1 addition & 1 deletion
diff --git a/‎frontend/playwright.video.config.ts‎
Lines changed: 16 additions & 0 deletions b/‎frontend/playwright.video.config.ts‎
Lines changed: 16 additions & 0 deletions
diff --git a/‎frontend/src/components/documents/ModernDocumentItem.tsx‎
Lines changed: 4 additions & 0 deletions b/‎frontend/src/components/documents/ModernDocumentItem.tsx‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎frontend/src/views/Documents.tsx‎
Lines changed: 9 additions & 0 deletions b/‎frontend/src/views/Documents.tsx‎
Lines changed: 9 additions & 0 deletions
diff --git a/‎frontend/tests/e2e/extract-pdf-workflow.spec.ts‎
Lines changed: 202 additions & 0 deletions b/‎frontend/tests/e2e/extract-pdf-workflow.spec.ts‎
Lines changed: 202 additions & 0 deletions
@@ -9,6 +9,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 
 ### Added
 
+- **`frontend/tests/e2e/extract-pdf-workflow.spec.ts`** — full-stack Playwright E2E spec for the extract pipeline: login → create corpus → upload two PDFs (`frontend/tests/fixtures/{usc-title-1,eton-agreement}.pdf`) → wait for parse + embedding → create extract with one column → run with a real OpenAI call → CSV export → assert non-empty cells. Adds new helpers to `frontend/tests/e2e/helpers.ts` (`uploadPdfViaUI`, `waitForDocumentReady`, `createExtractViaUI`, `openExtractByName`, `addColumnViaUI`, `addDocumentsToExtractViaUI`, `runExtractAndWaitForFinish`). Gated on `E2E_RUN_LLM_TESTS=true`; skipped in CI until LLM responses can be mocked over the wire. Runs on the live `local.yml` stack; required tweaks to disable Auth0 (`.envs/.local/.django USE_AUTH0=false`) and to widen the celeryworker `watchfiles --ignore-paths` (in `compose/local/django/celery/worker/start` and the `local.yml` command pointer) so editor / Playwright artifact writes don't hot-reload the worker mid-task. Also adds `data-testid="document-card"` + `data-title` (+ `data-processing` on the `/documents`-view variants) to `frontend/src/views/Documents.tsx` and `data-testid="document-card"` + `data-title` to `frontend/src/components/documents/ModernDocumentItem.tsx`, so tests can poll for the `backendLock` UI signal without depending on hover-only action menus.
 - **Mypy: type analyzer, shared, agents, badges, worker_uploads; introduce shared protocols** (Issue #1335): Brought the five smaller, interface-rich target packages over the ≥70% return-annotation bar called for by the issue and seeded `opencontractserver/types/protocols.py` with the four protocols requested in the scope:
   - `VectorStoreProtocol` — minimum surface (`search` / `async_search`) implemented by `CoreAnnotationVectorStore` (`opencontractserver/llms/vector_stores/core_vector_stores.py`); imported and re-exported from that module so consumers can annotate against the protocol rather than the concrete dataclass.
   - `PipelineComponentProtocol` — `title` / `description` / `author` / `dependencies` surface that the pipeline registry duck-types against; imported from `opencontractserver/pipeline/base/base_component.py` so any future parser/embedder/thumbnailer registered outside the inheritance hierarchy still type-checks against the same contract.
 
@@ -4,4 +4,4 @@ set -o errexit
 set -o nounset
 
 
-watchfiles --target-type command "celery -A config.celery_app worker -l INFO --concurrency=1 -Q celery,worker_uploads"
+watchfiles --ignore-paths frontend,node_modules,.git,__pycache__,.mypy_cache,.pytest_cache,media,staticfiles,docs,.claude,.playwright-mcp,playwright-report-e2e,test-results --target-type command "celery -A config.celery_app worker -l INFO --concurrency=1 -Q celery,worker_uploads"
@@ -0,0 +1,16 @@
+import baseConfig from "./playwright.config";
+import { defineConfig } from "@playwright/test";
+
+/**
+ * Playwright config override that forces video recording for every test.
+ * Use only for capturing demo footage (`yarn playwright test -c playwright.video.config.ts ...`);
+ * the default config keeps `video: "retain-on-failure"` to avoid bloat.
+ */
+export default defineConfig({
+  ...baseConfig,
+  use: {
+    ...baseConfig.use,
+    video: "on",
+    viewport: { width: 1280, height: 800 },
+  },
+});
@@ -1286,6 +1286,8 @@ export const ModernDocumentItem: React.FC<ModernDocumentItemProps> = ({
       <>
         <CardContainer
           ref={setNodeRef}
+          data-testid="document-card"
+          data-title={title || ""}
           className={`${is_selected ? "is-selected" : ""} ${
             isProcessing ? "backend-locked" : ""
           } ${isFailed ? "failed" : ""} ${
@@ -1497,6 +1499,8 @@ export const ModernDocumentItem: React.FC<ModernDocumentItemProps> = ({
     <>
       <ListContainer
         ref={setNodeRef}
+        data-testid="document-card"
+        data-title={title || ""}
         className={`${is_selected ? "is-selected" : ""} ${
           isProcessing ? "backend-locked" : ""
         } ${isFailed ? "failed" : ""} ${isLongPressing ? "long-pressing" : ""}`}
 
@@ -1380,6 +1380,9 @@ export const Documents = () => {
                       key={doc.id}
                       role="button"
                       tabIndex={0}
+                      data-testid="document-card"
+                      data-title={doc.title || ""}
+                      data-processing={doc.backendLock ? "true" : "false"}
                       aria-label={`Open document ${doc.title || "Untitled"}`}
                       $selected={selected_document_ids.includes(doc.id)}
                       onClick={() => handleDocumentClick(doc)}
@@ -1502,6 +1505,9 @@ export const Documents = () => {
                       key={doc.id}
                       role="row"
                       tabIndex={0}
+                      data-testid="document-card"
+                      data-title={doc.title || ""}
+                      data-processing={doc.backendLock ? "true" : "false"}
                       aria-label={`Open document ${doc.title || "Untitled"}`}
                       $selected={selected_document_ids.includes(doc.id)}
                       onClick={() => handleDocumentClick(doc)}
@@ -1569,6 +1575,9 @@ export const Documents = () => {
                       key={doc.id}
                       role="listitem"
                       tabIndex={0}
+                      data-testid="document-card"
+                      data-title={doc.title || ""}
+                      data-processing={doc.backendLock ? "true" : "false"}
                       aria-label={`Open document ${doc.title || "Untitled"}`}
                       $selected={selected_document_ids.includes(doc.id)}
                       onClick={() => handleDocumentClick(doc)}
 
@@ -0,0 +1,202 @@
+/**
+ * E2E integration test: PDF upload → ingest → extract → CSV export.
+ *
+ * Drives the full Vite + Django + Postgres + Celery + OpenAI stack:
+ *
+ *   1. Logs in via the password form.
+ *   2. Creates a corpus.
+ *   3. Uploads two distinct PDFs into the corpus.
+ *   4. Polls until both documents finish parsing + embedding.
+ *   5. Creates a new Extract on the corpus with one column ("Document
+ *      Title") prompting for each PDF's title.
+ *   6. Runs the extract, polls until cells finish.
+ *   7. Exports to CSV and asserts each row produced *some* non-empty
+ *      title-related content (body-text or metadata fallback).
+ *
+ * Gated on `E2E_RUN_LLM_TESTS=true` because step 6 makes a real OpenAI
+ * call. CI does not set the gate, so this spec is skipped there until
+ * we have a way to mock LLM responses over the wire.
+ *
+ * INTENTIONAL ASSERTION SCOPE: this spec validates the *pipeline*
+ * (upload → parse → embed → extract → export), not LLM commit behavior.
+ * The default extraction model tends to echo upload-time metadata when
+ * the prompt is permissive, and to enter a `failure_mode=no_final_response`
+ * tool-loop when the prompt is strict (verbatim from page 1). Both
+ * behaviors are tracked separately in the follow-up issue at
+ * `docs/superpowers/specs/2026-04-29-followup-issue-no-final-response.md`.
+ * Until that lands, the assertions here accept either body-text or
+ * description-fallback cell contents — empty cells still fail loudly.
+ */
+
+import { test, expect } from "./fixtures";
+import {
+  TEST_USER,
+  loginViaUI,
+  createCorpusViaUI,
+  uploadPdfViaUI,
+  waitForDocumentReady,
+  createExtractViaUI,
+  openExtractByName,
+  addColumnViaUI,
+  addDocumentsToExtractViaUI,
+  runExtractAndWaitForFinish,
+} from "./helpers";
+import fs from "fs";
+import path from "path";
+
+const FIXTURE_DIR = path.resolve(__dirname, "../fixtures");
+const FIXTURE_USC = path.join(FIXTURE_DIR, "usc-title-1.pdf");
+const FIXTURE_ETON = path.join(FIXTURE_DIR, "eton-agreement.pdf");
+
+// Unique per-run names so back-to-back local runs don't collide on
+// existing rows (the test does not currently clean up).
+const RUN_ID = Date.now();
+const CORPUS_TITLE = `E2E Extract PDF Corpus ${RUN_ID}`;
+const CORPUS_DESCRIPTION = "Corpus created by extract-pdf-workflow E2E spec.";
+const DOC_USC_TITLE = `USC Title 1 ${RUN_ID}`;
+const DOC_ETON_TITLE = `Eton Agreement ${RUN_ID}`;
+const EXTRACT_NAME = `Extract Titles ${RUN_ID}`;
+const COLUMN_NAME = "Document Title";
+// Permissive query. A strict "read first page verbatim" wording reliably
+// triggers the `failure_mode=no_final_response` issue — the agent reads
+// every byte sequentially and never commits — see the follow-up issue
+// for the agent-behavior fix. For this E2E test we only want to exercise
+// the upload → ingest → extract → CSV-export *pipeline*, not validate
+// model commit behavior, so we keep the query simple and the assertions
+// tolerant of either body-text or metadata-fallback answers.
+const COLUMN_QUERY = "What is the title of this document?";
+
+test.describe("Extract PDF workflow (LLM-gated)", () => {
+  test.skip(
+    process.env.E2E_RUN_LLM_TESTS !== "true",
+    "Requires E2E_RUN_LLM_TESTS=true and a backend OPENAI_API_KEY. " +
+      "Local-only until LLM responses are mocked in CI."
+  );
+
+  test.setTimeout(20 * 60 * 1000);
+
+  test("uploads two PDFs, runs an extract, exports CSV", async ({ page }) => {
+    await test.step("login", async () => {
+      await loginViaUI(page, TEST_USER.username, TEST_USER.password);
+    });
+
+    await test.step("create corpus", async () => {
+      await createCorpusViaUI(page, CORPUS_TITLE, CORPUS_DESCRIPTION);
+    });
+
+    await test.step("upload USC Title 1 PDF", async () => {
+      await uploadPdfViaUI(
+        page,
+        FIXTURE_USC,
+        DOC_USC_TITLE,
+        "USC Title 1 fixture",
+        CORPUS_TITLE
+      );
+    });
+
+    await test.step("upload Eton agreement PDF", async () => {
+      await uploadPdfViaUI(
+        page,
+        FIXTURE_ETON,
+        DOC_ETON_TITLE,
+        "Eton agreement fixture",
+        CORPUS_TITLE
+      );
+    });
+
+    await test.step("wait for USC Title 1 to finish ingest", async () => {
+      await waitForDocumentReady(page, DOC_USC_TITLE);
+    });
+
+    await test.step("wait for Eton agreement to finish ingest", async () => {
+      await waitForDocumentReady(page, DOC_ETON_TITLE);
+    });
+
+    await test.step("create extract on the corpus", async () => {
+      await createExtractViaUI(page, EXTRACT_NAME, CORPUS_TITLE);
+    });
+
+    await test.step("open extract detail", async () => {
+      await openExtractByName(page, EXTRACT_NAME);
+    });
+
+    await test.step("add 'Document Title' column", async () => {
+      await addColumnViaUI(page, COLUMN_NAME, COLUMN_QUERY);
+    });
+
+    await test.step("add both documents to the extract", async () => {
+      await addDocumentsToExtractViaUI(page, [DOC_USC_TITLE, DOC_ETON_TITLE]);
+    });
+
+    await test.step("run extract and wait for finish", async () => {
+      await runExtractAndWaitForFinish(page);
+    });
+
+    await test.step("each row's title cell is non-empty", async () => {
+      // Both rows present in the grid.
+      await expect(page.getByText(DOC_USC_TITLE).first()).toBeVisible();
+      await expect(page.getByText(DOC_ETON_TITLE).first()).toBeVisible();
+
+      // We assert every row has a non-empty Document Title cell whose
+      // content isn't just the row's own document title. This catches a
+      // regression where extraction silently produces empty cells, but
+      // does NOT validate that the LLM reads the PDF body — that's a
+      // separate concern tracked in the follow-up issue (see
+      // docs/superpowers/specs/2026-04-29-followup-issue-no-final-response.md).
+      // AG-Grid uses role="cell" for data cells.
+      for (const docTitle of [DOC_USC_TITLE, DOC_ETON_TITLE]) {
+        const row = page.getByRole("row").filter({ hasText: docTitle });
+        const cells = row.getByRole("cell");
+        const cellCount = await cells.count();
+        expect(cellCount).toBeGreaterThan(0);
+        let nonEmptySeen = false;
+        for (let i = 0; i < cellCount; i++) {
+          const text = (await cells.nth(i).textContent())?.trim() ?? "";
+          if (text.length > 0 && text !== docTitle) {
+            nonEmptySeen = true;
+            break;
+          }
+        }
+        expect(
+          nonEmptySeen,
+          `Row "${docTitle}" has no non-empty extracted cell — extract may have failed`
+        ).toBe(true);
+      }
+    });
+
+    await test.step("export CSV and verify contents", async () => {
+      const downloadPromise = page.waitForEvent("download");
+      await page
+        .getByRole("button", { name: /Export CSV/i })
+        .first()
+        .click();
+      const download = await downloadPromise;
+
+      const csvPath = await download.path();
+      expect(
+        csvPath,
+        "Playwright did not give us a download path"
+      ).not.toBeNull();
+      const csv = fs.readFileSync(csvPath!, "utf-8");
+
+      // Header line.
+      expect(csv).toMatch(/Document Title/);
+
+      // At least three non-empty lines: header + one row per document.
+      const dataLines = csv.split("\n").filter((l) => l.trim().length > 0);
+      expect(dataLines.length).toBeGreaterThanOrEqual(3);
+
+      // CSV must contain SOME title-related text for each document.
+      // Match either the body-text title (best case) or the upload-time
+      // description fallback. The pipeline-only assertion is intentional:
+      // the agent's tendency to echo metadata over body text is tracked
+      // separately (see the follow-up issue). If ALL rows are empty, the
+      // pipeline failed, and these regexes won't match anything either,
+      // so the test still catches that.
+      // USC: body says "TITLE 1 — GENERAL PROVISIONS"; description fallback "USC Title 1 fixture"
+      expect(csv).toMatch(/general provisions|usc\s*title|title\s*1/i);
+      // Eton: body says "EXCLUSIVE LICENSE AND PRODUCT DEVELOPMENT AGREEMENT"; fallback "Eton agreement fixture"
+      expect(csv).toMatch(/exclusive license|development agreement|eton/i);
+    });
+  });
+});
Original file line number	Diff line number	Diff line change
`@@ -4,4 +4,4 @@ set -o errexit`
`4`	`4`	`set -o nounset`
`5`	`5`
`6`	`6`
`7`		`-watchfiles --target-type command "celery -A config.celery_app worker -l INFO --concurrency=1 -Q celery,worker_uploads"`
	`7`	`+watchfiles --ignore-paths frontend,node_modules,.git,__pycache__,.mypy_cache,.pytest_cache,media,staticfiles,docs,.claude,.playwright-mcp,playwright-report-e2e,test-results --target-type command "celery -A config.celery_app worker -l INFO --concurrency=1 -Q celery,worker_uploads"`