Add consensus correlator: rules + Gemini LLM with smart tiebreaker

Refactor incident_correlator.py to a decision/commit split (preview_correlation / apply_correlation) so the rules engine and LLM can both produce decisions before anything is written to Firestore. Add llm_correlator.py: cheap Gemini Flash first-pass + Gemini Pro tiebreaker. Wire _correlate_with_consensus in upload.py — rules-only fallback when key is absent or call is thin; agreed/tiebreak consensus written to corr_debug.
2026-06-01 00:56:11 -04:00
parent 6bf4333b72
commit cbcc85f7b1
4 changed files with 619 additions and 119 deletions
@@ -26,6 +26,11 @@ class Settings(BaseSettings):
    # Gemini (intelligence extraction, embeddings, incident summaries)
    gemini_api_key: Optional[str] = None
    # Correlation consensus models
    # corr_cheap_model  — first-pass LLM correlator (runs on every call)
    # corr_smart_model  — tiebreaker (only fires when rules and cheap LLM disagree)
    corr_cheap_model: str = "gemini-2.0-flash"
    corr_smart_model: str = "gemini-1.5-pro"
    summary_interval_minutes: int = 2          # how often the summary loop runs
    correlation_window_hours: int = 2          # slow/location path: max hours since last call
    embedding_similarity_threshold: float = 0.93  # slow-path: requires location corroboration
@@ -172,7 +172,7 @@ def _incident_idle_minutes(inc: dict, now: datetime) -> float:
 # ─────────────────────────────────────────────────────────────────────────────
-# Public entry point
+# Public API
 # ─────────────────────────────────────────────────────────────────────────────
 async def correlate_call(
@@ -194,47 +194,155 @@ async def correlate_call(
 ) -> Optional[str]:
    """
    Link call_id to an existing incident or create a new one.
-
+    Thin wrapper: builds context → runs rules decision → commits.
    reference_time — time anchor for the time-limited paths (location + slow).
                     Defaults to now. Pass call.started_at when re-correlating
                     orphaned calls so the window is anchored to when the call
                     actually happened, not when the sweep runs.
    create_if_new  — when False, skip new-incident creation (re-correlation only
                     links to existing incidents; it never creates new ones).
    Returns the incident_id, or None if skipped.
    """
    ctx = await _build_context(
        call_id=call_id, units=units, vehicles=vehicles, cleared_units=cleared_units,
        location_coords=location_coords, reference_time=reference_time,
        system_id=system_id, talkgroup_id=talkgroup_id, talkgroup_name=talkgroup_name,
        tags=tags, incident_type=incident_type, location=location,
        reassignment=reassignment, create_if_new=create_if_new,
    )
    decision = _run_decision(ctx)
    return await _apply_and_log(decision, ctx)
 async def preview_correlation(
    call_id: str,
    node_id: str,
    system_id: Optional[str],
    talkgroup_id: Optional[int],
    talkgroup_name: Optional[str],
    tags: list[str],
    incident_type: Optional[str],
    location: Optional[str] = None,
    location_coords: Optional[dict] = None,
    reference_time: Optional[datetime] = None,
    create_if_new: bool = True,
    units: Optional[list[str]] = None,
    vehicles: Optional[list[str]] = None,
    cleared_units: Optional[list[str]] = None,
    reassignment: bool = False,
 ) -> dict:
    """
    Run the rules engine and return the decision WITHOUT committing to Firestore.
    Returns {"decision": {...}, "ctx": {...}}.
    Pass the result to apply_correlation() to commit, or use the decision
    fields directly for comparison in the consensus correlator.
    decision keys:
      action           "link" | "new" | "orphan"
      matched_incident  the candidate incident doc  (action == "link")
      incident_type     resolved type after tag inference  (action == "new")
      corr_debug        fields to persist on the call doc
    """
    ctx = await _build_context(
        call_id=call_id, units=units, vehicles=vehicles, cleared_units=cleared_units,
        location_coords=location_coords, reference_time=reference_time,
        system_id=system_id, talkgroup_id=talkgroup_id, talkgroup_name=talkgroup_name,
        tags=tags, incident_type=incident_type, location=location,
        reassignment=reassignment, create_if_new=create_if_new,
    )
    decision = _run_decision(ctx)
    return {"decision": decision, "ctx": ctx}
 async def apply_correlation(preview: dict) -> Optional[str]:
    """
    Commit the decision returned by preview_correlation() to Firestore.
    Returns the incident_id, or None if the call was orphaned.
    """
    return await _apply_and_log(preview["decision"], preview["ctx"])
 # ─────────────────────────────────────────────────────────────────────────────
 # Context builder — fetches all Firestore data needed for correlation
 # ─────────────────────────────────────────────────────────────────────────────
 async def _build_context(
    call_id: str,
    units: Optional[list[str]],
    vehicles: Optional[list[str]],
    cleared_units: Optional[list[str]],
    location_coords: Optional[dict],
    reference_time: Optional[datetime],
    system_id: Optional[str],
    talkgroup_id: Optional[int],
    talkgroup_name: Optional[str],
    tags: list[str],
    incident_type: Optional[str],
    location: Optional[str],
    reassignment: bool,
    create_if_new: bool,
 ) -> dict:
    now    = reference_time or datetime.now(timezone.utc)
    window = timedelta(hours=settings.correlation_window_hours)
    # Fetch all active incidents cross-type (mutual aid needs this)
    all_active = await fstore.collection_list("incidents", status="active")
    recent     = [inc for inc in all_active if _within_window_of(inc, now, window)]
-    # Fetch call doc once — reused for disambiguation, embedding merge, unit accumulation
+    call_doc       = await fstore.doc_get("calls", call_id) or {}
-    call_doc      = await fstore.doc_get("calls", call_id) or {}
+    call_embedding = call_doc.get("embedding")
-    call_embedding: Optional[list] = call_doc.get("embedding")
+    call_units     = units         if units         is not None else (call_doc.get("units")         or [])
-    # Prefer explicitly passed units/vehicles (per-scene, from intelligence extraction)
+    call_vehicles  = vehicles      if vehicles      is not None else (call_doc.get("vehicles")      or [])
-    # over the call doc, which merges units from ALL scenes in a multi-scene recording.
+    call_cleared   = cleared_units if cleared_units is not None else (call_doc.get("cleared_units") or [])
-    # Falling back to the call doc is correct for recorrelation sweeps where we have no
+    call_severity  = call_doc.get("severity") or "unknown"
-    # scene-level breakdown.
+    coords         = location_coords or call_doc.get("location_coords")
-    call_units:    list[str] = units    if units    is not None else (call_doc.get("units")    or [])
+    is_thin_call   = not call_units and not call_vehicles and not coords
-    call_vehicles: list[str] = vehicles if vehicles is not None else (call_doc.get("vehicles") or [])
+
-    call_cleared:  list[str] = cleared_units if cleared_units is not None else (call_doc.get("cleared_units") or [])
+    return {
-    call_severity: str             = call_doc.get("severity") or "unknown"
+        "call_id": call_id, "all_active": all_active, "recent": recent,
-    # Use passed coords first (freshly geocoded), fall back to what's on the call doc
+        "call_doc": call_doc, "call_embedding": call_embedding,
-    coords: Optional[dict] = location_coords or call_doc.get("location_coords")
+        "call_units": call_units, "call_vehicles": call_vehicles,
        "call_cleared": call_cleared, "call_severity": call_severity,
        "coords": coords, "is_thin_call": is_thin_call, "now": now,
        "system_id": system_id, "talkgroup_id": talkgroup_id,
        "talkgroup_name": talkgroup_name, "tags": tags,
        "incident_type": incident_type, "location": location,
        "location_coords": location_coords, "reassignment": reassignment,
        "create_if_new": create_if_new,
    }
 # ─────────────────────────────────────────────────────────────────────────────
 # Rules decision engine — pure logic, no Firestore writes
 # ─────────────────────────────────────────────────────────────────────────────
 def _run_decision(ctx: dict) -> dict:
    """
    Run the hybrid rules correlation engine against a pre-built context.
    No Firestore reads or writes — all data comes from ctx.
    Returns:
      action           "link" | "new" | "orphan"
      matched_incident  incident doc to update  (action == "link")
      incident_type     resolved type            (action == "new")
      corr_debug        fields to write to the call doc
    """
    all_active     = ctx["all_active"]
    recent         = ctx["recent"]
    call_doc       = ctx["call_doc"]
    call_embedding = ctx["call_embedding"]
    call_units     = ctx["call_units"]
    call_vehicles  = ctx["call_vehicles"]
    coords         = ctx["coords"]
    is_thin_call   = ctx["is_thin_call"]
    now            = ctx["now"]
    system_id      = ctx["system_id"]
    talkgroup_id   = ctx["talkgroup_id"]
    talkgroup_name = ctx["talkgroup_name"]
    tags           = ctx["tags"]
    incident_type  = ctx["incident_type"]
    location       = ctx["location"]
    location_coords= ctx["location_coords"]
    reassignment   = ctx["reassignment"]
    create_if_new  = ctx["create_if_new"]
    call_id        = ctx["call_id"]
    matched_incident: Optional[dict] = None
    corr_debug: dict = {}
    # A "thin" call carries no scene-identifying information — it is a pure
    # status transmission (10-4, en route, acknowledgement).  Detected by the
    # absence of extracted units, vehicles, AND geocoded coordinates.  Thin
    # calls should link to wherever the last active conversation on this TGID
    # was happening rather than running the full scene-verification logic.
    is_thin_call = not call_units and not call_vehicles and not coords
    # ── 1. Fast path: talkgroup match with recency gate ──────────────────────
    #
    # Only considers incidents updated within tg_fast_path_idle_minutes (default 30 min).
@@ -589,103 +697,153 @@ async def correlate_call(
                    f"call {call_id} → {best_inc['incident_id']} (sim={best_score:.3f})"
                )
-    # ── Update existing or create new ────────────────────────────────────────
+    # ── Decision output ───────────────────────────────────────────────────────
    if matched_incident:
-        incident_id = matched_incident["incident_id"]
+        return {
            "action": "link",
            "matched_incident": matched_incident,
            "incident_type": incident_type,
            "corr_debug": corr_debug,
        }
    if not create_if_new:
        return {"action": "orphan", "matched_incident": None, "incident_type": None, "corr_debug": corr_debug}
    # Attempt type inference from tags before giving up on creation
    resolved_type = incident_type
    if not resolved_type and tags:
        resolved_type = _infer_type_from_tags(tags)
        if resolved_type:
            logger.info(
                f"Correlator: inferred incident_type={resolved_type!r} from tags {tags} for call {call_id}"
            )
    if not resolved_type:
        return {"action": "orphan", "matched_incident": None, "incident_type": None, "corr_debug": corr_debug}
    return {
        "action": "new",
        "matched_incident": None,
        "incident_type": resolved_type,
        "corr_debug": corr_debug,
    }
 # ─────────────────────────────────────────────────────────────────────────────
 # Commit layer — writes decisions to Firestore
 # ─────────────────────────────────────────────────────────────────────────────
 async def _apply_and_log(decision: dict, ctx: dict) -> Optional[str]:
    """Commit a rules decision and persist the corr_debug fields to the call doc."""
    incident_id = await _apply_decision(decision, ctx)
    corr_debug = decision.get("corr_debug") or {}
    if corr_debug:
        try:
            await fstore.doc_set("calls", ctx["call_id"], corr_debug)
        except Exception as e:
            logger.warning(f"Could not write corr_debug for call {ctx['call_id']}: {e}")
    return incident_id
 async def _apply_decision(decision: dict, ctx: dict) -> Optional[str]:
    """
    Execute a correlation decision produced by _run_decision().
    Handles all Firestore writes; returns the incident_id or None.
    """
    action = decision["action"]
    if action == "orphan":
        return None
    call_id         = ctx["call_id"]
    talkgroup_id    = ctx["talkgroup_id"]
    talkgroup_name  = ctx["talkgroup_name"]
    system_id       = ctx["system_id"]
    tags            = ctx["tags"]
    location        = ctx["location"]
    location_coords = ctx["location_coords"]
    call_units      = ctx["call_units"]
    call_vehicles   = ctx["call_vehicles"]
    call_embedding  = ctx["call_embedding"]
    call_severity   = ctx["call_severity"]
    call_cleared    = ctx["call_cleared"]
    coords          = ctx["coords"]
    now             = ctx["now"]
    incident_type   = decision["incident_type"]
    if action == "link":
        matched_incident = decision["matched_incident"]
        await _update_incident(
            matched_incident, call_id, talkgroup_id, system_id, tags,
            location, location_coords, call_units, call_vehicles, call_embedding, now,
            talkgroup_name=talkgroup_name, incident_type=incident_type,
            cleared_units=call_cleared,
        )
-    elif create_if_new:
+        return matched_incident["incident_id"]
        # If GPT returned no type (missing talkgroup context is common), attempt
        # to recover a type from the extracted tags before giving up on creation.
        if not incident_type and tags:
            incident_type = _infer_type_from_tags(tags)
            if incident_type:
                logger.info(
                    f"Correlator: inferred incident_type={incident_type!r} from tags "
                    f"{tags} for call {call_id} (no GPT type)"
                )
        if not incident_type:
            # No type and none inferred — nothing to create
            return None
-        # ── Cross-system parent detection ─────────────────────────────────────
+    # action == "new"
-        # Before creating a standalone incident, check whether this call belongs
+    # ── Cross-system parent detection ─────────────────────────────────────────
-        # to an incident already opened by a different agency (multi-agency chase,
+    # Before creating a standalone incident, check whether this call belongs
-        # mutual aid, etc.).  If a parent candidate is found:
+    # to an incident already opened by a different agency (multi-agency chase,
-        #   • The existing candidate is demoted to a child (incident_type → "child")
+    # mutual aid, etc.).  If a parent candidate is found:
-        #   • A new master shell is created linking both children
+    #   • The existing candidate is demoted to a child (incident_type → "child")
-        #   • The new call's incident is created as a second child of the master
+    #   • A new master shell is created linking both children
-        cross_parent: Optional[dict] = None
+    #   • The new call's incident is created as a second child of the master
-        if system_id:
+    cross_parent: Optional[dict] = None
-            cross_parent = await _find_cross_system_parent(
+    if system_id:
-                system_id=system_id,
+        cross_parent = await _find_cross_system_parent(
-                incident_type=incident_type,
+            system_id=system_id,
-                location=location,
+            incident_type=incident_type,
-                location_coords=coords,
+            location=location,
-                call_embedding=call_embedding,
+            location_coords=coords,
-                recent=recent,
+            call_embedding=call_embedding,
            recent=ctx["recent"],
        )
    if cross_parent:
        existing_child_id  = cross_parent["incident_id"]
        existing_master_id = cross_parent.get("parent_incident_id")
        # Create the new agency's child incident first
        incident_id = await _create_incident(
            call_id, incident_type, talkgroup_id, talkgroup_name, system_id,
            tags, location, location_coords,
            call_units, call_vehicles, call_embedding, call_severity, now,
        )
        if existing_master_id:
            # Candidate is already a child — link new child to the existing master
            await _demote_to_child(incident_id, existing_master_id)
            await _add_child_to_master(existing_master_id, incident_id, now)
            decision["corr_debug"]["corr_path"] = "new/cross-system-child"
            logger.info(
                f"Correlator cross-system: call {call_id} → new child {incident_id} "
                f"under existing master {existing_master_id}"
            )
        if cross_parent:
            existing_child_id = cross_parent["incident_id"]
            existing_master_id = cross_parent.get("parent_incident_id")
            # Create the new agency's child incident first
            incident_id = await _create_incident(
                call_id, incident_type, talkgroup_id, talkgroup_name, system_id,
                tags, location, location_coords,
                call_units, call_vehicles, call_embedding, call_severity, now,
            )
            if existing_master_id:
                # Candidate is already a child — link new child to the existing master
                await _demote_to_child(incident_id, existing_master_id)
                await _add_child_to_master(existing_master_id, incident_id, now)
                corr_debug["corr_path"] = "new/cross-system-child"
                logger.info(
                    f"Correlator cross-system: call {call_id} → new child {incident_id} "
                    f"under existing master {existing_master_id}"
                )
            else:
                # Candidate is a standalone master — create master shell, demote both
                master_id = await _create_master_incident(
                    first_child_id=existing_child_id,
                    second_child_id=incident_id,
                    operational_type=incident_type,
                    location=cross_parent.get("location") or location,
                    location_coords=cross_parent.get("location_coords") or coords,
                    now=now,
                )
                await _demote_to_child(existing_child_id, master_id)
                await _demote_to_child(incident_id, master_id)
                corr_debug["corr_path"] = "new/cross-system-master"
                logger.info(
                    f"Correlator cross-system: created master {master_id}, "
                    f"demoted {existing_child_id} + new {incident_id} as children"
                )
        else:
-            # Normal single-agency incident creation
+            # Candidate is a standalone — create master shell, demote both
-            incident_id = await _create_incident(
+            master_id = await _create_master_incident(
-                call_id, incident_type, talkgroup_id, talkgroup_name, system_id,
+                first_child_id=existing_child_id,
-                tags, location, location_coords,
+                second_child_id=incident_id,
-                call_units, call_vehicles, call_embedding, call_severity, now,
+                operational_type=incident_type,
                location=cross_parent.get("location") or location,
                location_coords=cross_parent.get("location_coords") or coords,
                now=now,
            )
            await _demote_to_child(existing_child_id, master_id)
            await _demote_to_child(incident_id, master_id)
            decision["corr_debug"]["corr_path"] = "new/cross-system-master"
            logger.info(
                f"Correlator cross-system: created master {master_id}, "
                f"demoted {existing_child_id} + new {incident_id} as children"
            )
            corr_debug["corr_path"] = "new"
    else:
-        # Creation suppressed (re-correlation sweep) — nothing to do
+        # Normal single-agency incident creation
-        return None
+        incident_id = await _create_incident(
-
+            call_id, incident_type, talkgroup_id, talkgroup_name, system_id,
-    # Persist the correlation decision to the call document so it can be
+            tags, location, location_coords,
-    # inspected in Firestore or the admin UI without log-scraping.
+            call_units, call_vehicles, call_embedding, call_severity, now,
-    if corr_debug:
+        )
-        try:
+        decision["corr_debug"]["corr_path"] = "new"
            await fstore.doc_set("calls", call_id, corr_debug)
        except Exception as e:
            logger.warning(f"Could not write corr_debug for call {call_id}: {e}")
    return incident_id
@@ -0,0 +1,278 @@
 """
 LLM-based incident correlator using Gemini.
 Two functions are exposed:
  decide(call_id, ctx)                           — cheap first-pass (corr_cheap_model)
  tiebreak(rules_decision, llm_decision, ctx)    — smart tiebreaker (corr_smart_model)
 Both return a decision dict compatible with _run_decision() in incident_correlator:
  {"action": "link"|"new"|"orphan",
   "matched_incident": dict|None,
   "incident_type": str|None,
   "corr_debug": dict,
   "reasoning": str}     ← extra field for logging/tiebreak comparison
 decide() is skipped for thin calls (no content to reason about) and when
 GEMINI_API_KEY is not set — in those cases returns None so the caller knows
 to fall back to the rules decision.
 Error handling: any Gemini failure returns None from decide() and the
 rules_decision from tiebreak() so the pipeline never stalls.
 """
 import asyncio
 import json
 from datetime import datetime, timezone
 from typing import Optional
 from app.internal.logger import logger
 from app.config import settings
 # ─────────────────────────────────────────────────────────────────────────────
 # Prompt helpers
 # ─────────────────────────────────────────────────────────────────────────────
 def _fmt_idle(inc: dict, now: datetime) -> str:
    try:
        raw = inc.get("updated_at") or inc.get("started_at") or ""
        dt  = datetime.fromisoformat(str(raw).replace("Z", "+00:00"))
        if dt.tzinfo is None:
            dt = dt.replace(tzinfo=timezone.utc)
        minutes = int((now - dt).total_seconds() / 60)
        return f"{minutes}min ago" if minutes < 60 else f"{minutes // 60}h{minutes % 60:02d}m ago"
    except Exception:
        return "?"
 def _inc_summary(inc: dict, now: datetime) -> str:
    parts = [f"id:{inc['incident_id']}", f"type:{inc.get('type') or '?'}"]
    if inc.get("location"):
        parts.append(f"loc:{inc['location']}")
    units = inc.get("units") or []
    if units:
        parts.append(f"units:[{', '.join(units[:6])}]")
    tags = inc.get("tags") or []
    if tags:
        parts.append(f"tags:[{', '.join(tags[:4])}]")
    parts.append(f"idle:{_fmt_idle(inc, now)}")
    return " | ".join(parts)
 def _call_block(ctx: dict) -> str:
    lines = []
    call_doc = ctx["call_doc"]
    transcript = call_doc.get("transcript_corrected") or call_doc.get("transcript")
    if transcript:
        lines.append(f"Transcript: {transcript[:700]}")
    if ctx["tags"]:
        lines.append(f"Tags: {ctx['tags']}")
    if ctx["incident_type"]:
        lines.append(f"Incident type: {ctx['incident_type']}")
    if ctx["location"]:
        lines.append(f"Location: {ctx['location']}")
    if ctx["call_units"]:
        lines.append(f"Units: {ctx['call_units']}")
    if ctx["call_vehicles"]:
        lines.append(f"Vehicles: {ctx['call_vehicles']}")
    if ctx["talkgroup_name"]:
        lines.append(f"Talkgroup: {ctx['talkgroup_name']}")
    return "\n".join(lines) if lines else "(no details)"
 _SCHEMA = '{"action": "link" | "new" | "orphan", "incident_id": "<id_string or null>", "reasoning": "<one sentence>"}'
 _RULES = """
 Rules:
 - "link" only with clear positive evidence: same units, same geocoded location, or semantically identical scene on the same talkgroup within the last few minutes.
 - A call on a DIFFERENT talkgroup than an incident requires unit overlap or geocoded location match — topic similarity alone is not enough.
 - "new" only if the call has a clear incident_type AND describes a distinct, identifiable scene.
 - "orphan" when in doubt — conservative is always correct.
 - Do NOT link just because both calls involve police or both mention a road.
 """
 def _build_decide_prompt(ctx: dict) -> str:
    now    = ctx["now"]
    recent = ctx["recent"]
    inc_block = (
        "\n".join(_inc_summary(inc, now) for inc in recent[:20])
        if recent else "(none)"
    )
    return (
        "You are an incident correlator for a public safety radio monitoring system.\n\n"
        "A new radio call has arrived. Decide whether it belongs to an existing active incident, "
        "represents a new incident, or should be orphaned (not enough information).\n\n"
        f"NEW CALL:\n{_call_block(ctx)}\n\n"
        f"ACTIVE INCIDENTS ({len(recent)} recent):\n{inc_block}\n"
        f"{_RULES}\n"
        f"Respond with JSON only (no markdown):\n{_SCHEMA}"
    )
 def _build_tiebreak_prompt(rules_decision: dict, llm_decision: dict, ctx: dict) -> str:
    now    = ctx["now"]
    recent = ctx["recent"]
    inc_block = (
        "\n".join(_inc_summary(inc, now) for inc in recent[:20])
        if recent else "(none)"
    )
    def _fmt(d: dict, name: str) -> str:
        action  = d.get("action", "?")
        inc     = d.get("matched_incident")
        inc_id  = inc["incident_id"] if inc else (d.get("incident_id") or "null")
        reason  = d.get("reasoning") or (d.get("corr_debug") or {}).get("corr_fit_signal") or "—"
        return f"  {name}: action={action}, incident_id={inc_id}, reasoning={reason!r}"
    return (
        "You are a senior incident correlator for a public safety radio monitoring system.\n\n"
        "Two correlation engines disagree. You must make the final decision.\n\n"
        f"NEW CALL:\n{_call_block(ctx)}\n\n"
        f"ACTIVE INCIDENTS ({len(recent)} recent):\n{inc_block}\n\n"
        "DISAGREEMENT:\n"
        f"{_fmt(rules_decision, 'Rules engine')}\n"
        f"{_fmt(llm_decision, 'LLM correlator')}\n"
        f"{_RULES}\n"
        f"Respond with JSON only (no markdown):\n{_SCHEMA}"
    )
 # ─────────────────────────────────────────────────────────────────────────────
 # Gemini API call (sync, runs in thread pool)
 # ─────────────────────────────────────────────────────────────────────────────
 def _sync_gemini(model_name: str, prompt: str) -> dict:
    import google.generativeai as genai  # lazy import — only when needed
    genai.configure(api_key=settings.gemini_api_key)
    model = genai.GenerativeModel(
        model_name,
        generation_config={"response_mime_type": "application/json"},
    )
    response = model.generate_content(prompt)
    return json.loads(response.text)
 # ─────────────────────────────────────────────────────────────────────────────
 # Decision parsing
 # ─────────────────────────────────────────────────────────────────────────────
 def _parse_response(raw: dict, ctx: dict) -> dict:
    """
    Convert raw Gemini JSON output to a decision dict compatible with _run_decision().
    Resolves incident_id → full incident doc from ctx["all_active"].
    Handles type inference for "new" actions the same way as the rules engine.
    """
    from app.internal.incident_correlator import _infer_type_from_tags  # same-package import
    action    = raw.get("action", "orphan")
    reasoning = raw.get("reasoning", "")
    if action not in ("link", "new", "orphan"):
        action = "orphan"
    matched_incident: Optional[dict] = None
    if action == "link":
        inc_id = raw.get("incident_id")
        if inc_id:
            matched_incident = next(
                (i for i in ctx["all_active"] if i.get("incident_id") == inc_id),
                None,
            )
        if not matched_incident:
            logger.warning(
                f"LLM correlator: incident_id={inc_id!r} not in active incidents — orphaning"
            )
            action = "orphan"
    incident_type: Optional[str] = None
    if action in ("link", "new"):
        incident_type = ctx["incident_type"]
        if not incident_type:
            incident_type = _infer_type_from_tags(ctx["tags"])
        if action == "new" and not incident_type:
            # Can't create an incident without a type — demote to orphan
            action = "orphan"
            matched_incident = None
    return {
        "action":            action,
        "matched_incident":  matched_incident,
        "incident_type":     incident_type,
        "corr_debug":        {"corr_llm_reasoning": reasoning},
        "reasoning":         reasoning,
    }
 # ─────────────────────────────────────────────────────────────────────────────
 # Public API
 # ─────────────────────────────────────────────────────────────────────────────
 async def decide(call_id: str, ctx: dict) -> Optional[dict]:
    """
    Run the cheap LLM correlator (corr_cheap_model) on the call.
    Returns a decision dict or None if:
      - GEMINI_API_KEY is not configured
      - the call is thin (content-free — no value from LLM)
      - there are no recent active incidents to reason about
      - Gemini fails
    Callers should treat None as "fall back to rules decision".
    """
    if not settings.gemini_api_key:
        return None
    if ctx["is_thin_call"]:
        return None  # thin calls have no transcript/units/coords to reason about
    if not ctx["recent"]:
        return None  # no incidents to correlate against — rules handles new-only
    try:
        prompt   = _build_decide_prompt(ctx)
        raw      = await asyncio.to_thread(_sync_gemini, settings.corr_cheap_model, prompt)
        decision = _parse_response(raw, ctx)
        _id = (decision["matched_incident"] or {}).get("incident_id", "null")
        logger.info(
            f"LLM correlator ({settings.corr_cheap_model}): call {call_id} → "
            f"action={decision['action']} incident={_id} "
            f"reasoning={decision['reasoning']!r}"
        )
        return decision
    except Exception as e:
        logger.warning(f"LLM correlator failed for call {call_id}: {e}")
        return None
 async def tiebreak(rules_decision: dict, llm_decision: dict, ctx: dict) -> dict:
    """
    Run the smart tiebreaker (corr_smart_model) when rules and LLM disagree.
    Falls back to rules_decision on any error.
    """
    call_id = ctx["call_id"]
    try:
        prompt   = _build_tiebreak_prompt(rules_decision, llm_decision, ctx)
        raw      = await asyncio.to_thread(_sync_gemini, settings.corr_smart_model, prompt)
        decision = _parse_response(raw, ctx)
        _id = (decision["matched_incident"] or {}).get("incident_id", "null")
        logger.info(
            f"LLM tiebreak ({settings.corr_smart_model}): call {call_id} → "
            f"action={decision['action']} incident={_id} "
            f"reasoning={decision['reasoning']!r}"
        )
        return decision
    except Exception as e:
        logger.warning(f"LLM tiebreak failed for call {call_id}: {e} — using rules decision")
        return rules_decision
 def decisions_agree(rules: dict, llm: dict) -> bool:
    """True if both decisions agree on action and (when action=="link") on the target incident."""
    if rules["action"] != llm["action"]:
        return False
    if rules["action"] == "link":
        r_id = (rules.get("matched_incident") or {}).get("incident_id")
        l_id = (llm.get("matched_incident")   or {}).get("incident_id")
        return r_id == l_id
    return True
@@ -83,6 +83,65 @@ def _public_url_to_gcs_uri(url: str) -> Optional[str]:
    return None
 async def _correlate_with_consensus(
    call_id: str,
    node_id: str,
    system_id: Optional[str],
    talkgroup_id: Optional[int],
    talkgroup_name: Optional[str],
    tags: list[str],
    incident_type: Optional[str],
    location: Optional[str],
    location_coords: Optional[dict],
    units: Optional[list] = None,
    vehicles: Optional[list] = None,
    cleared_units: Optional[list] = None,
    reassignment: bool = False,
 ) -> Optional[str]:
    """
    Consensus correlator: runs the rules engine and the cheap LLM in sequence.
    If they agree the rules decision is committed directly.
    If they disagree a smarter tiebreaker LLM makes the final call.
    Falls back to rules-only when GEMINI_API_KEY is absent, the call is
    content-free (thin), or any LLM call fails.
    """
    from app.internal import incident_correlator, llm_correlator
    preview = await incident_correlator.preview_correlation(
        call_id=call_id, node_id=node_id, system_id=system_id,
        talkgroup_id=talkgroup_id, talkgroup_name=talkgroup_name,
        tags=tags, incident_type=incident_type, location=location,
        location_coords=location_coords, units=units, vehicles=vehicles,
        cleared_units=cleared_units, reassignment=reassignment,
    )
    ctx             = preview["ctx"]
    rules_decision  = preview["decision"]
    llm_decision = await llm_correlator.decide(call_id, ctx)
    if llm_decision is None:
        # LLM unavailable, skipped (thin call), or errored — rules wins.
        rules_decision["corr_debug"]["corr_consensus"] = "rules_only"
        return await incident_correlator.apply_correlation(preview)
    if llm_correlator.decisions_agree(rules_decision, llm_decision):
        rules_decision["corr_debug"]["corr_consensus"] = "agreed"
        rules_decision["corr_debug"]["corr_llm_reasoning"] = llm_decision.get("reasoning", "")
        return await incident_correlator.apply_correlation(preview)
    # Disagree — escalate to the smarter tiebreaker.
    logger.info(
        f"Consensus disagreement for call {call_id}: "
        f"rules={rules_decision['action']} vs llm={llm_decision['action']} — tiebreak"
    )
    final = await llm_correlator.tiebreak(rules_decision, llm_decision, ctx)
    final["corr_debug"]["corr_consensus"]    = "tiebreak"
    final["corr_debug"]["corr_rules_action"] = rules_decision["action"]
    final["corr_debug"]["corr_llm_action"]   = llm_decision["action"]
    return await incident_correlator.apply_correlation({"decision": final, "ctx": ctx})
 async def _run_extraction_pipeline(
    call_id: str,
    node_id: str,
@@ -114,7 +173,7 @@ async def _run_extraction_pipeline(
        # overlap so the new scene doesn't chain into the unit's previous incident.
        is_reassignment = bool(scene.get("reassignment"))
        corr_units = [] if is_reassignment else scene.get("units")
-        incident_id = await incident_correlator.correlate_call(
+        incident_id = await _correlate_with_consensus(
            call_id=call_id,
            node_id=node_id,
            system_id=system_id,
@@ -217,7 +276,7 @@ async def _run_intelligence_pipeline(
            all_tags.extend(scene["tags"])
            is_reassignment = bool(scene.get("reassignment"))
            corr_units = [] if is_reassignment else scene.get("units")
-            incident_id = await incident_correlator.correlate_call(
+            incident_id = await _correlate_with_consensus(
                call_id=call_id,
                node_id=node_id,
                system_id=system_id,
@@ -246,7 +305,7 @@ async def _run_intelligence_pipeline(
        if not scenes:
            _call_doc = await fstore.doc_get("calls", call_id)
            if not (_call_doc or {}).get("skip_reason"):
-                incident_id = await incident_correlator.correlate_call(
+                incident_id = await _correlate_with_consensus(
                    call_id=call_id,
                    node_id=node_id,
                    system_id=system_id,