fix: add debug log and null company_id comment to webhook scheduling

feat: emit case-status webhook on status change in PUT /api/cases/:case
fix: include case details in webhook failure warning log
2026-05-16 17:13:07 +00:00 · 2026-05-16 17:10:30 +00:00 · 2026-05-16 17:08:33 +00:00 · 2026-05-16 17:06:37 +00:00 · 2026-05-10 18:54:44 +00:00 · 2026-05-10 18:38:05 +00:00
8 changed files with 150 additions and 34 deletions
--- a/mcp-server/src/legal_mcp/services/block_writer.py
+++ b/mcp-server/src/legal_mcp/services/block_writer.py
@@ -360,13 +360,9 @@ async def write_block(
        post_hearing_context=post_hearing_context,
    )
-    # Restructure: sources first, then instructions
+    # source_context is already embedded inside formatted_prompt via {source_context} in the
-    prompt = (
+    # template. Do NOT prepend it again — doing so doubles the prompt size (was 465K chars).
-        f"## חומרי מקור (מסמכים מלאים — צטט מהם מילה במילה כשאפשר):\n\n"
+    prompt = formatted_prompt
        f"{source_context}\n\n"
        f"---\n\n"
        f"{formatted_prompt}"
    )
    if instructions:
        prompt += f"\n\n## הנחיות נוספות:\n{instructions}"
@@ -377,6 +373,19 @@ async def write_block(
        if not dir_doc.get("approved"):
            raise ValueError("לא ניתן לכתוב בלוק דיון ללא כיוון מאושר. הפעל brainstorm → approve_direction קודם.")
    # Guard against context overflow before calling claude -p.
    # Sonnet: 200K context → ~800K chars max; Opus: 200K context → same.
    # In practice the CLI has crashed on prompts above ~400K chars, so use
    # that as a conservative ceiling (well below the token limit).
    _MAX_PROMPT_CHARS = 400_000
    if len(prompt) > _MAX_PROMPT_CHARS:
        raise RuntimeError(
            f"Prompt too large for {block_id}: {len(prompt):,} chars "
            f"(limit {_MAX_PROMPT_CHARS:,}). "
            f"source_context: {len(source_context):,} chars. "
            f"Reduce documents or call extract_appraiser_facts first."
        )
    # Call Claude via Claude Code session (no API)
    model_key = block_cfg["model"]
    timeout = claude_session.LONG_TIMEOUT if model_key == "opus" else claude_session.DEFAULT_TIMEOUT
@@ -414,16 +423,35 @@ def _build_case_context(case: dict, decision: dict | None) -> str:
 - תוצאה: {outcome_heb}"""
 # Which doc_types are relevant per block.
 # None  → skip source docs entirely (block uses other context, e.g. claims_context)
 # []    → include all doc types (default for unspecified blocks)
 # [..] → include only the listed doc_type values
 _BLOCK_DOC_TYPES: dict[str, list[str] | None] = {
    "block-he":    None,                      # only case_context needed; no full docs
    "block-vav":   ["appeal", "protocol"],    # כתב ערר + פרוטוקול ועדה
    "block-zayin": None,                      # claims_context is sufficient
    "block-chet":  ["protocol"],              # פרוטוקול + השלמות טיעון
    "block-tet":   ["appraisal"],             # שומות בלבד
    # block-yod, block-yod-alef, block-he etc. default → all docs
 }
 async def _build_source_context(case_id: UUID, block_id: str) -> str:
-    """Get full document texts for the block.
+    """Get document texts for the block, filtered by relevance.
    Per Anthropic best practices: send full source documents, not truncated excerpts.
-    Place documents at the TOP of the prompt (before instructions) for 30% better recall.
+    Per-block filtering prevents context overflow on large cases (9+ docs).
    For grounding: instruct Claude to cite word-for-word from these documents.
    """
    allowed = _BLOCK_DOC_TYPES.get(block_id, [])  # [] sentinel = not in map → all docs
    if allowed is None:
        return ""  # this block doesn't need raw source docs
    docs = await db.list_documents(case_id)
    context_parts = []
    for doc in docs:
        if allowed and doc["doc_type"] not in allowed:
            continue
        text = await db.get_document_text(UUID(doc["id"]))
        if text:
            context_parts.append(f"--- מסמך: {doc['title']} ({doc['doc_type']}) ---\n{text}")
--- a/mcp-server/src/legal_mcp/services/claude_session.py
+++ b/mcp-server/src/legal_mcp/services/claude_session.py
@@ -72,6 +72,9 @@ async def query(
    """
    full_prompt = f"{system}\n\n{prompt}" if system else prompt
    if len(full_prompt) > 150_000:
        logger.warning("Large prompt: %d chars — may hit context limits", len(full_prompt))
    cmd = [
        "claude", "-p",
        "--output-format", "json",
@@ -110,7 +113,8 @@ async def query(
    if proc.returncode != 0:
        stderr = stderr_b.decode("utf-8", errors="replace").strip()[:500] or "unknown error"
-        raise RuntimeError(f"Claude CLI failed (exit {proc.returncode}): {stderr}")
+        size_info = f"; prompt_len={len(full_prompt):,} chars" if len(full_prompt) > 100_000 else ""
        raise RuntimeError(f"Claude CLI failed (exit {proc.returncode}): {stderr}{size_info}")
    stdout = stdout_b.decode("utf-8", errors="replace").strip()
    if not stdout:
--- a/mcp-server/src/legal_mcp/services/db.py
+++ b/mcp-server/src/legal_mcp/services/db.py
@@ -2052,9 +2052,19 @@ async def list_external_case_law(
    offset: int = 0,
    source_kind: str = "external_upload",
 ) -> list[dict]:
-    """List chair-uploaded precedents, with simple filters."""
+    """List chair-uploaded precedents, with simple filters.
    source_kind="all_committees" expands to: source_kind='internal_committee'
    OR (source_kind='external_upload' AND source_type='appeals_committee').
    """
    pool = await get_pool()
-    conditions = [f"source_kind = '{source_kind}'"]
+    if source_kind == "all_committees":
        conditions = [
            "(source_kind = 'internal_committee' OR "
            "(source_kind = 'external_upload' AND source_type = 'appeals_committee'))"
        ]
    else:
        conditions = [f"source_kind = '{source_kind}'"]
    params: list = []
    idx = 1
    if practice_area:
@@ -2488,19 +2498,17 @@ async def precedent_library_stats() -> dict:
    pool = await get_pool()
    async with pool.acquire() as conn:
        total = await conn.fetchval(
-            "SELECT COUNT(*) FROM case_law WHERE source_kind = 'external_upload'"
+            "SELECT COUNT(*) FROM case_law"
        )
        by_practice = await conn.fetch(
            """SELECT practice_area, COUNT(*) AS n
               FROM case_law
               WHERE source_kind = 'external_upload'
               GROUP BY practice_area
               ORDER BY n DESC"""
        )
        by_level = await conn.fetch(
            """SELECT precedent_level, COUNT(*) AS n
               FROM case_law
               WHERE source_kind = 'external_upload'
               GROUP BY precedent_level
               ORDER BY n DESC"""
        )
--- a/mcp-server/src/legal_mcp/services/lessons.py
+++ b/mcp-server/src/legal_mcp/services/lessons.py
@@ -123,7 +123,7 @@ SUMMARY_STRATEGIES = {
 DISCUSSION_RULES: dict[str, list[str]] = {
    "universal": [
-        "פרק הדיון = אסה רציפה. אין כותרות משנה (H2/H3). מעברים רק עם ביטויי מעבר טקסטואליים.",
+        "פרק הדיון = מאסה רציפה. אין כותרות משנה (H2/H3). מעברים רק עם ביטויי מעבר טקסטואליים.",
        "חריג יחיד לכותרות משנה: נושאים נפרדים לחלוטין (למשל: הקלה בגובה + התייחסות לטענות נוספות).",
        "טווח אורך סעיפים: 20 עד 600+ מילים. סעיף עם ציטוט מקיף = בלוק אחד שלם, לא שבירה לסעיפים קצרים.",
    ],
--- a/web-ui/src/components/precedents/library-list-panel.tsx
+++ b/web-ui/src/components/precedents/library-list-panel.tsx
@@ -1,6 +1,7 @@
 "use client";
 import { useState } from "react";
 import Link from "next/link";
 import { Trash2, Plus, Pencil, Wand2 } from "lucide-react";
 import { toast } from "sonner";
 import {
@@ -151,7 +152,9 @@ function CourtRow({ p, onEdit }: { p: Precedent; onEdit: (id: string) => void })
        className="font-semibold text-navy text-right whitespace-normal break-words min-w-[280px] max-w-[420px] py-3"
        dir="rtl"
      >
-        <span dir="auto">{cleanCitation(p.case_number)}</span>
+        <Link href={`/precedents/${p.id}`} className="hover:underline hover:text-gold-deep" dir="auto">
          {cleanCitation(p.case_number)}
        </Link>
      </TableCell>
      <TableCell className="text-ink whitespace-normal break-words max-w-[260px] py-3">
        <div className="font-medium">{cleanCitation(p.case_name)}</div>
@@ -233,7 +236,9 @@ function CommitteeRow({ p, onEdit }: { p: Precedent; onEdit: (id: string) => voi
        className="font-semibold text-navy text-right whitespace-normal break-words min-w-[200px] max-w-[320px] py-3"
        dir="rtl"
      >
-        <span dir="auto">{cleanCitation(p.case_number)}</span>
+        <Link href={`/precedents/${p.id}`} className="hover:underline hover:text-gold-deep" dir="auto">
          {cleanCitation(p.case_number)}
        </Link>
      </TableCell>
      <TableCell className="text-ink whitespace-normal break-words max-w-[220px] py-3">
        <div className="font-medium">{cleanCitation(p.case_name)}</div>
@@ -308,8 +313,8 @@ export function LibraryListPanel() {
    limit: 200,
  };
-  const courts = usePrecedents({ ...sharedFilters, sourceKind: "external_upload" });
+  const courts = usePrecedents({ ...sharedFilters, sourceKind: "external_upload", sourceType: "court_ruling" });
-  const committee = usePrecedents({ ...sharedFilters, sourceKind: "internal_committee" });
+  const committee = usePrecedents({ ...sharedFilters, sourceKind: "all_committees" });
  return (
    <div className="space-y-8">
--- a/web-ui/src/components/precedents/precedent-edit-sheet.tsx
+++ b/web-ui/src/components/precedents/precedent-edit-sheet.tsx
@@ -1,6 +1,6 @@
 "use client";
-import { useEffect, useState } from "react";
+import { useState } from "react";
 import { Save, Sparkles } from "lucide-react";
 import { toast } from "sonner";
 import {
@@ -65,10 +65,12 @@ export function PrecedentEditSheet({ caseLawId, onOpenChange }: Props) {
  const [form, setForm] = useState<FormState>(EMPTY);
-  // Hydrate form when the record loads.
+  // React-approved derived-state pattern: sync form whenever a different
-  useEffect(() => {
+  // record arrives (including after save+refetch). Using setState during
-    if (!record) return;
+  // render avoids the one-frame flash that useEffect would produce.
-    // eslint-disable-next-line react-hooks/set-state-in-effect
+  const [syncedRecordId, setSyncedRecordId] = useState<string | null>(null);
  if (record && record.id !== syncedRecordId) {
    setSyncedRecordId(record.id as string);
    setForm({
      citation: record.case_number || "",
      case_name: record.case_name || "",
@@ -84,7 +86,7 @@ export function PrecedentEditSheet({ caseLawId, onOpenChange }: Props) {
      headnote: record.headnote || "",
      key_quote: (record as { key_quote?: string }).key_quote || "",
    });
-  }, [record]);
+  }
  const onSubmit = async (e: React.FormEvent) => {
    e.preventDefault();
--- a/web/app.py
+++ b/web/app.py
@@ -20,7 +20,7 @@ sys.path.insert(0, str(Path(__file__).resolve().parent.parent / "mcp-server" / "
 import zipfile
-from fastapi import FastAPI, File, Form, HTTPException, UploadFile
+from fastapi import BackgroundTasks, FastAPI, File, Form, HTTPException, UploadFile
 from fastapi.responses import FileResponse, StreamingResponse
 from typing import Any, Literal
 from pydantic import BaseModel
@@ -44,7 +44,7 @@ from web.mcp_env_catalog import (
    normalize_for_compare,
 )
 from web.progress_store import ProgressStore
-from web.paperclip_api import pc_request
+from web.paperclip_api import emit_case_status_webhook, pc_request
 from web.paperclip_client import (
    COMPANIES as PAPERCLIP_COMPANIES,
    accept_interaction as pc_accept_interaction,
@@ -1337,8 +1337,12 @@ async def api_case_get(case_number: str):
@app.put("/api/cases/{case_number}")
-async def api_case_update(case_number: str, req: CaseUpdateRequest):
+async def api_case_update(case_number: str, req: CaseUpdateRequest, background_tasks: BackgroundTasks):
    """Update case details."""
    # Capture old status before the update so we can detect changes.
    existing = await db.get_case_by_number(case_number)
    old_status = (existing or {}).get("status", "")
    result = await cases_tools.case_update(
        case_number=case_number,
        status=req.status,
@@ -1351,10 +1355,30 @@ async def api_case_update(case_number: str, req: CaseUpdateRequest):
        expected_outcome=req.expected_outcome,
    )
    try:
-        return json.loads(result)
+        parsed = json.loads(result)
    except json.JSONDecodeError:
        raise HTTPException(404, result)
    # Emit webhook when status changes (fire-and-forget via BackgroundTasks).
    new_status = req.status
    if new_status and old_status != new_status:
        prefix = case_number[:1]
        company_id = (
            PAPERCLIP_COMPANIES["licensing"] if prefix == "1"
            else PAPERCLIP_COMPANIES["betterment"] if prefix in ("8", "9")
            else None
        )
        background_tasks.add_task(
            emit_case_status_webhook,
            case_number=case_number,
            old_status=old_status,
            new_status=new_status,
            company_id=company_id,  # None is safe — plugin handles unknown company gracefully
        )
        logger.debug("webhook scheduled: case %s %s → %s", case_number, old_status, new_status)
    return parsed
@app.delete("/api/cases")
 async def api_case_delete(case_number: str, remove_files: bool = False):
@@ -3057,8 +3081,16 @@ async def api_get_methodology(category: str):
    items = {}
    for key, default_val in defaults.items():
        if key in overrides:
            raw = overrides[key]["rule_value"]
            # asyncpg returns JSONB as a raw JSON string when no codec is registered.
            # Parse it back to a Python object so the frontend receives the correct type.
            if isinstance(raw, str):
                try:
                    raw = json.loads(raw)
                except (json.JSONDecodeError, TypeError):
                    pass
            items[key] = {
-                "value": overrides[key]["rule_value"],
+                "value": raw,
                "is_override": True,
                "updated_at": overrides[key]["created_at"].isoformat() if overrides[key]["created_at"] else None,
            }
@@ -3095,10 +3127,14 @@ async def api_update_methodology(category: str, key: str, req: MethodologyUpdate
            raise HTTPException(422, "content_checklists value must be a non-empty string")
    pool = await db.get_pool()
    # json.dumps → text, then PostgreSQL casts text→jsonb.
    # Passing a Python list directly causes "expected str, got list" in asyncpg;
    # passing a str with ::jsonb causes double-encoding (stored as JSONB string).
    # ::text::jsonb bypasses asyncpg's codec and lets PostgreSQL parse the JSON.
    await pool.execute(
        "INSERT INTO appeal_type_rules (id, appeal_type, rule_category, rule_key, rule_value) "
-        "VALUES (gen_random_uuid(), '_global', $1, $2, $3::jsonb) "
+        "VALUES (gen_random_uuid(), '_global', $1, $2, $3::text::jsonb) "
-        "ON CONFLICT (appeal_type, rule_category, rule_key) DO UPDATE SET rule_value = $3::jsonb",
+        "ON CONFLICT (appeal_type, rule_category, rule_key) DO UPDATE SET rule_value = $3::text::jsonb",
        category, key, json.dumps(req.value, ensure_ascii=False),
    )
--- a/web/paperclip_api.py
+++ b/web/paperclip_api.py
@@ -19,6 +19,7 @@ from __future__ import annotations
 import logging
 import os
 from datetime import datetime
 from typing import Any
 import httpx
@@ -81,3 +82,35 @@ async def pc_request(
    if raise_on_error:
        resp.raise_for_status()
    return resp
 async def emit_case_status_webhook(
    case_number: str,
    old_status: str,
    new_status: str,
    company_id: str | None = None,
    run_id: str | None = None,
 ) -> None:
    """Notify the Paperclip plugin that a case status changed.
    Fire-and-forget: logs errors but never raises, so callers aren't blocked.
    """
    try:
        await pc_request(
            "POST",
            "/api/plugins/marcusgroup.legal-ai/webhooks/case-status",
            json={
                "caseNumber": case_number,
                "oldStatus": old_status,
                "newStatus": new_status,
                "companyId": company_id,
                "timestamp": datetime.utcnow().isoformat() + "Z",
            },
            run_id=run_id,
            timeout=5.0,
        )
    except Exception as exc:
        logger.warning(
            "emit_case_status_webhook failed for case %s (%s → %s): %s",
            case_number, old_status, new_status, exc,
        )
Author	SHA1	Message	Date
Chaim	015e553d06	fix: add debug log and null company_id comment to webhook scheduling All checks were successful Build & Deploy / build-and-deploy (push) Successful in 4m16s Details	2026-05-16 17:13:07 +00:00
Chaim	6bdf9786ac	feat: emit case-status webhook on status change in PUT /api/cases/:case	2026-05-16 17:10:30 +00:00
Chaim	d87f9c5a5f	fix: include case details in webhook failure warning log	2026-05-16 17:08:33 +00:00
Chaim	a0fab1f6de	feat: add emit_case_status_webhook helper	2026-05-16 17:06:37 +00:00
Chaim	d5043100a7	fix: json.loads JSONB overrides on GET — asyncpg has no codec registered All checks were successful Build & Deploy / build-and-deploy (push) Successful in 8s Details asyncpg returns JSONB columns as raw JSON strings when no type codec is configured (only pgvector is registered in _init_connection). The stored value is a correct JSONB array (jsonb_typeof=array confirmed), but asyncpg decodes it as str. Parse it explicitly in the GET handler so the frontend receives the correct Python list/dict. Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>	2026-05-10 18:54:44 +00:00
Chaim	932cc7191c	fix: use ::text::jsonb to store methodology overrides correctly All checks were successful Build & Deploy / build-and-deploy (push) Successful in 8s Details asyncpg cannot encode a Python list as JSONB directly (expects str). Passing str with ::jsonb causes double-encoding (stored as JSONB string). Solution: json.dumps() the value → pass as text → PostgreSQL parses with ::text::jsonb cast, storing it as the correct JSONB array/object. Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>	2026-05-10 18:38:05 +00:00
chaim	d983cfdd3b	Merge pull request 'fix: prevent JSONB double-encoding on methodology save' (#6 ) from fix/methodology-jsonb-double-encoding into main All checks were successful Build & Deploy / build-and-deploy (push) Successful in 1m39s Details	2026-05-10 18:34:03 +00:00
Chaim	50649baeed	fix: prevent JSONB double-encoding on methodology save Pass req.value directly to asyncpg instead of json.dumps(req.value). When a Python string was passed with ::jsonb, asyncpg encoded it as a JSONB string (not an array), causing the frontend spread operator to split it into individual characters — one textarea per character. Also fix typo in DISCUSSION_RULES default: "אסה" → "מאסה". Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>	2026-05-10 18:30:49 +00:00
Chaim	a9cd8aeb12	fix: prevent write_interim_draft context overflow (465K → ≤300K chars) Two bugs caused all 5 interim blocks to fail with "Claude CLI failed (exit 1): unknown error": 1. source_context was embedded BOTH inside the prompt template (via {source_context}) AND prepended again in write_block — doubling every block's context size (232K chars × 2 = 465K chars). 2. _build_source_context loaded all 9 case documents for every block regardless of relevance. Fixes: - Remove the duplicate source_context prepend in write_block; the template already contains it via {source_context} - Add per-block document filtering (_BLOCK_DOC_TYPES): block-he/zayin → empty, block-chet → protocol only, block-tet → appraisals only - Add 400K char guard before calling claude -p with a descriptive error (vs opaque "exit 1: unknown error") - Add prompt-size warning and size info in claude_session error messages Result: block-he 0 chars, block-zayin 0 chars, block-vav ~172K, block-chet ~45K, block-tet ~300K (all under 400K limit) Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>	2026-05-10 10:49:47 +00:00
Chaim	10a63fb9e0	fix(precedents): separate court rulings from committee decisions correctly All checks were successful Build & Deploy / build-and-deploy (push) Successful in 1m37s Details - DB: add 'all_committees' virtual source_kind covering internal_committee + external_upload appeals_committee rows in one query - DB: stats now count all case_law rows (not just external_upload), fixing the precedents_total that excluded 44 internal-committee records - UI: courts table filters to source_type=court_ruling only; committees table uses the new all_committees query Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>	2026-05-10 09:59:30 +00:00
Chaim	f94201c577	feat(precedents): make citation link to detail page All checks were successful Build & Deploy / build-and-deploy (push) Successful in 34s Details Both CourtRow and CommitteeRow citation cells are now Next.js Links → /precedents/{id}, letting users navigate directly from the list. Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>	2026-05-10 09:01:26 +00:00
Chaim	026457dac4	fix(precedent-edit): sync form from record without useEffect flash All checks were successful Build & Deploy / build-and-deploy (push) Successful in 36s Details Replace useEffect-based form hydration with React's approved derived-state pattern (setState-during-render). This eliminates the one-frame flash where the precedent_level Select showed "—" before useEffect fired, and fixes cases where the same record reference returned from TanStack cache caused useEffect to not re-run after save+invalidate. Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>	2026-05-10 08:35:04 +00:00
chaim	75493ce233	Merge pull request 'feat: link related precedents across court instances (SCHEMA_V11)' (#4 ) from feat/related-precedents-v11 into main All checks were successful Build & Deploy / build-and-deploy (push) Successful in 1m41s Details Reviewed-on: #4	2026-05-10 07:54:37 +00:00