diff --git a/.gitignore b/.gitignore
index 02414e2b..6fad4cde 100644
--- a/.gitignore
+++ b/.gitignore
@@ -48,5 +48,7 @@ nul
 /.github/plans
 *.xlsx
 /artifacts/tests
+/artifacts/tmp/*
+/artifacts/tmp
 scripts/agent.json
 scripts/me.json
diff --git a/application/single_app/config.py b/application/single_app/config.py
index dd712ec8..e8c682fe 100644
--- a/application/single_app/config.py
+++ b/application/single_app/config.py
@@ -94,7 +94,7 @@
 EXECUTOR_TYPE = 'thread'
 EXECUTOR_MAX_WORKERS = 30
 SESSION_TYPE = 'filesystem'
-VERSION = "0.240.020"
+VERSION = "0.240.056"
 
 SECRET_KEY = os.getenv('SECRET_KEY', 'dev-secret-key-change-in-production')
 
diff --git a/application/single_app/functions_conversation_metadata.py b/application/single_app/functions_conversation_metadata.py
index 1b83752d..0a993ee9 100644
--- a/application/single_app/functions_conversation_metadata.py
+++ b/application/single_app/functions_conversation_metadata.py
@@ -104,6 +104,53 @@ def _build_primary_context_from_scope_selection(
     return None
 
 
+def _extract_document_id_from_search_result(doc):
+    """Return the parent document ID for a search hit, or None if it has none.
+
+    An explicit 'document_id' wins; otherwise the ID is the chunk 'id' with
+    its final underscore-separated segment removed.
+    """
+    explicit_id = str(doc.get('document_id') or '').strip()
+    if explicit_id:
+        return explicit_id
+
+    chunk_key = str(doc.get('id') or '').strip()
+    if not chunk_key:
+        return None
+    return chunk_key.rsplit('_', 1)[0] if '_' in chunk_key else chunk_key
+
+
+def _build_last_grounded_document_refs(document_map):
+    """Turn the per-document map of a search-backed turn into reusable refs.
+
+    Entries missing a document ID, scope type, or scope ID are skipped. Each
+    ref repeats the scope ID under 'group_id', 'public_workspace_id', or (for
+    any other scope type) 'user_id'.
+    """
+    refs = []
+    for doc_id, info in document_map.items():
+        scope = info.get('scope') or {}
+        kind, owner_id = scope.get('scope'), scope.get('id')
+        if not (doc_id and kind and owner_id):
+            continue
+
+        owner_key = (
+            'group_id' if kind == 'group'
+            else 'public_workspace_id' if kind == 'public'
+            else 'user_id'
+        )
+        refs.append({
+            'document_id': doc_id,
+            'scope': kind,
+            'scope_id': owner_id,
+            'file_name': info.get('file_name'),
+            'classification': info.get('classification'),
+            owner_key: owner_id,
+        })
+
+    return refs
+
+
 def collect_conversation_metadata(user_message, conversation_id, user_id, active_group_id=None, 
                                 document_scope=None, selected_document_id=None, model_deployment=None,
                                 hybrid_search_enabled=False, 
@@ -179,20 +226,17 @@ def collect_conversation_metadata(user_message, conversation_id, user_id, active
             chunk_id = doc.get('id')
             doc_scope_result = _determine_document_scope(doc, user_id, active_group_id)
             classification = doc.get('document_classification', 'None')
-            
-            if chunk_id:
-                # Extract document ID from chunk ID (assumes format: doc_id_chunkNumber)
-                if '_' in chunk_id:
-                    document_id = '_'.join(chunk_id.split('_')[:-1])  # Remove last part (chunk number)
-                else:
-                    document_id = chunk_id  # Use full ID if no underscore
+            document_id = _extract_document_id_from_search_result(doc)
+
+            if document_id and chunk_id:
                 
                 # Initialize document entry if not exists
                 if document_id not in document_map:
                     document_map[document_id] = {
                         'scope': doc_scope_result,
                         'chunk_ids': [],
-                        'classification': classification
+                        'classification': classification,
+                        'file_name': doc.get('file_name') or doc.get('title') or 'Unknown Document'
                     }
                 
                 # Add chunk ID to this document
@@ -538,6 +582,9 @@ def collect_conversation_metadata(user_message, conversation_id, user_id, active
             current_tags[semantic_key] = semantic_tag    # Update the tags array
     conversation_item['tags'] = list(current_tags.values())
 
+    if document_map:
+        conversation_item['last_grounded_document_refs'] = _build_last_grounded_document_refs(document_map)
+
     # --- Scope Lock Logic ---
     current_scope_locked = conversation_item.get('scope_locked')
 
diff --git a/application/single_app/functions_documents.py b/application/single_app/functions_documents.py
index 4dec6803..2ff2fc95 100644
--- a/application/single_app/functions_documents.py
+++ b/application/single_app/functions_documents.py
@@ -15,6 +15,540 @@ def allowed_file(filename, allowed_extensions=None):
         allowed_extensions = ALLOWED_EXTENSIONS
     return '.' in filename and \
            filename.rsplit('.', 1)[1].lower() in allowed_extensions
+
+
+ARCHIVED_SCOPE_PREFIX = "__archived__::"
+CURRENT_ALIAS_BLOB_PATH_MODE = "current_alias"
+ARCHIVED_REVISION_BLOB_PATH_MODE = "archived_revision"
+
+
+def _get_blob_container_name(group_id=None, public_workspace_id=None):
+    """Return the blob container name for the scope: public workspace, then group, else user."""
+    if public_workspace_id is not None:
+        return storage_account_public_documents_container_name
+    is_personal = group_id is None
+    return storage_account_user_documents_container_name if is_personal else storage_account_group_documents_container_name
+
+
+def _get_document_scope_id(document_item=None, user_id=None, group_id=None, public_workspace_id=None):
+    """Return the first truthy of public workspace, group, then user ID.
+
+    An ID passed as None is looked up on document_item when one is given.
+    """
+    item = document_item if document_item is not None else {}
+    workspace = item.get("public_workspace_id") if public_workspace_id is None else public_workspace_id
+    group = item.get("group_id") if group_id is None else group_id
+    return workspace or group or (item.get("user_id") if user_id is None else user_id)
+
+
+def build_current_blob_path(blob_filename, user_id=None, group_id=None, public_workspace_id=None):
+    """Build the "<scope_id>/<blob_filename>" path of a document's current blob.
+
+    Returns None when no scope ID can be resolved or the filename is empty.
+    """
+    owner_scope = _get_document_scope_id(user_id=user_id, group_id=group_id, public_workspace_id=public_workspace_id)
+
+    if owner_scope and blob_filename:
+        return f"{owner_scope}/{blob_filename}"
+    return None
+
+
+def build_archived_blob_path(document_item):
+    """Build "<scope>/<family>/<doc id>/<file name>" for an archived revision.
+
+    The family segment falls back to the document's own ID. Returns None when
+    any segment is missing.
+    """
+    doc_id, name = document_item.get("id"), document_item.get("file_name")
+    family = document_item.get("revision_family_id") or doc_id
+    scope = _get_document_scope_id(document_item=document_item)
+    return f"{scope}/{family}/{doc_id}/{name}" if all((scope, family, doc_id, name)) else None
+
+
+def get_document_blob_storage_info(document_item, user_id=None, group_id=None, public_workspace_id=None, prefer_archived=False):
+    """Resolve the (container name, blob path) pair for a document's blob.
+
+    Path precedence: the archived path when prefer_archived is set, the
+    stored blob_path, the archived path of a document in archived-revision
+    mode, and finally a path rebuilt from the scope IDs and file name.
+    Returns (None, None) for a falsy document_item.
+    """
+    if not document_item:
+        return None, None
+
+    owner_group = group_id or document_item.get("group_id")
+    owner_workspace = public_workspace_id or document_item.get("public_workspace_id")
+    container = document_item.get("blob_container") or _get_blob_container_name(
+        group_id=owner_group, public_workspace_id=owner_workspace
+    )
+
+    archived = document_item.get("archived_blob_path")
+    in_archived_mode = document_item.get("blob_path_mode") == ARCHIVED_REVISION_BLOB_PATH_MODE
+    chosen = (archived if prefer_archived else None) or document_item.get("blob_path")
+    chosen = chosen or (archived if in_archived_mode else None)
+    if not chosen:
+        chosen = build_current_blob_path(
+            document_item.get("file_name"), user_id=user_id or document_item.get("user_id"),
+            group_id=owner_group, public_workspace_id=owner_workspace,
+        )
+    return container, chosen
+
+
+def get_document_blob_delete_targets(document_item, user_id=None, group_id=None, public_workspace_id=None):
+    """List the unique (container, blob path) pairs to delete for a document.
+
+    Covers the blob resolved by get_document_blob_storage_info plus the
+    archived revision blob when that is a different path. Returns an empty
+    list for a falsy document_item or when no container can be resolved.
+    """
+    if not document_item:
+        return []
+
+    container_name, primary_blob_path = get_document_blob_storage_info(
+        document_item,
+        user_id=user_id,
+        group_id=group_id,
+        public_workspace_id=public_workspace_id,
+    )
+    if not container_name:
+        return []
+
+    candidate_paths = (primary_blob_path, document_item.get("archived_blob_path"))
+    # dict.fromkeys de-duplicates while keeping first-seen order.
+    unique_paths = dict.fromkeys(path for path in candidate_paths if path)
+    return [(container_name, path) for path in unique_paths]
+
+
+def _get_blob_service_client():  # shared blob service client; raises when it is not configured
+    client = CLIENTS.get("storage_account_office_docs_client")
+    if client:
+        return client
+    raise Exception("Blob service client not available or not configured.")
+
+
+def _blob_exists(container_name, blob_path):
+    """Report whether the blob exists; False when either reference is empty."""
+    if not (container_name and blob_path):
+        return False
+    return _get_blob_service_client().get_blob_client(
+        container=container_name, blob=blob_path
+    ).exists()
+
+
+def _copy_blob_to_blob(source_container_name, source_blob_path, destination_container_name, destination_blob_path, overwrite=False):
+    """Copy a blob and its metadata by streaming it through a local temp file.
+
+    Returns destination_blob_path without copying when both references name
+    the same blob, or when the destination exists and overwrite is False.
+    Raises ValueError for an empty reference and FileNotFoundError when the
+    source blob does not exist.
+    """
+    if not (source_container_name and source_blob_path):
+        raise ValueError("Source blob reference is required")
+    if not (destination_container_name and destination_blob_path):
+        raise ValueError("Destination blob reference is required")
+    if (source_container_name, source_blob_path) == (destination_container_name, destination_blob_path):
+        return destination_blob_path
+
+    service = _get_blob_service_client()
+    source = service.get_blob_client(container=source_container_name, blob=source_blob_path)
+    target = service.get_blob_client(container=destination_container_name, blob=destination_blob_path)
+
+    if target.exists() and not overwrite:
+        return destination_blob_path
+    if not source.exists():
+        raise FileNotFoundError(f"Source blob not found: {source_container_name}/{source_blob_path}")
+
+    source_properties = source.get_blob_properties()
+    metadata = dict(source_properties.metadata) if source_properties.metadata else None
+    staging_path = None
+    try:
+        # delete=False keeps the file on disk after the handle closes so it can be reopened for upload.
+        with tempfile.NamedTemporaryFile(delete=False) as staging_file:
+            staging_path = staging_file.name
+            for chunk in source.download_blob().chunks():
+                staging_file.write(chunk)
+        with open(staging_path, "rb") as upload_handle:
+            target.upload_blob(upload_handle, overwrite=overwrite, metadata=metadata)
+    finally:
+        if staging_path and os.path.exists(staging_path):
+            os.remove(staging_path)
+    return destination_blob_path
+
+
+def _archive_previous_document_blob(previous_document, user_id=None, group_id=None, public_workspace_id=None):
+    """Ensure the prior revision's blob exists at its archived path.
+
+    Copies the blob from its current path when the archived copy is missing,
+    then points previous_document at the archived path in archived-revision
+    mode. Returns the archived path, or None when previous_document is falsy,
+    the path cannot be determined, or no blob could be archived.
+    """
+    if not previous_document:
+        return None
+
+    container_name, live_path = get_document_blob_storage_info(
+        previous_document, user_id=user_id, group_id=group_id, public_workspace_id=public_workspace_id,
+    )
+    archive_path = previous_document.get("archived_blob_path") or build_archived_blob_path(previous_document)
+    if not (container_name and archive_path):
+        return None
+
+    is_archived = _blob_exists(container_name, archive_path)
+    can_copy = (
+        not is_archived
+        and archive_path != live_path
+        and bool(live_path)
+        and _blob_exists(container_name, live_path)
+    )
+    if can_copy:
+        _copy_blob_to_blob(container_name, live_path, container_name, archive_path, overwrite=False)
+        is_archived = True
+
+    if not is_archived:
+        print(
+            f"Warning: Could not archive prior revision blob for document {previous_document.get('id')}"
+        )
+        return None
+
+    previous_document.update({
+        "blob_container": container_name,
+        "blob_path": archive_path,
+        "archived_blob_path": archive_path,
+        "blob_path_mode": ARCHIVED_REVISION_BLOB_PATH_MODE,
+    })
+    return archive_path
+
+
+def _promote_document_blob_to_current_alias(promoted_document, user_id=None, group_id=None, public_workspace_id=None):
+    """Make a revision the current one by copying its blob to the current path.
+
+    The source is the document's archived path, else its stored blob_path; it
+    is copied over the current path only when it exists and differs from it.
+    The document is then pointed at the current path in current-alias mode.
+    Returns the current path, or None when it cannot be determined.
+    """
+    if not promoted_document:
+        return None
+
+    owner_group = group_id or promoted_document.get("group_id")
+    owner_workspace = public_workspace_id or promoted_document.get("public_workspace_id")
+    container_name = promoted_document.get("blob_container") or _get_blob_container_name(
+        group_id=owner_group, public_workspace_id=owner_workspace
+    )
+    alias_path = build_current_blob_path(
+        promoted_document.get("file_name"),
+        user_id=user_id or promoted_document.get("user_id"),
+        group_id=owner_group,
+        public_workspace_id=owner_workspace,
+    )
+    if not (container_name and alias_path):
+        return None
+
+    origin_path = promoted_document.get("archived_blob_path") or promoted_document.get("blob_path")
+    if origin_path and origin_path != alias_path and _blob_exists(container_name, origin_path):
+        _copy_blob_to_blob(container_name, origin_path, container_name, alias_path, overwrite=True)
+        if not promoted_document.get("archived_blob_path"):
+            promoted_document["archived_blob_path"] = origin_path
+    promoted_document["blob_container"] = container_name
+    promoted_document["blob_path"] = alias_path
+    promoted_document["blob_path_mode"] = CURRENT_ALIAS_BLOB_PATH_MODE
+    return alias_path
+
+
+def _safe_int(value):  # int(value), or 0 when value cannot be converted
+    try:
+        return int(value)
+    except (TypeError, ValueError, OverflowError):  # OverflowError: int(float("inf"))
+        return 0
+
+
+def _get_documents_container(group_id=None, public_workspace_id=None):
+    """Return the Cosmos documents container for the scope: public workspace, then group, else user."""
+    if public_workspace_id is not None:
+        return cosmos_public_documents_container
+    is_personal = group_id is None
+    return cosmos_user_documents_container if is_personal else cosmos_group_documents_container
+
+
+def _get_search_client(group_id=None, public_workspace_id=None):
+    """Return the search client for the scope: public workspace, then group, else user."""
+    if public_workspace_id is not None:
+        return CLIENTS["search_client_public"]
+    client_key = "search_client_user" if group_id is None else "search_client_group"
+    return CLIENTS[client_key]
+
+
+def _get_document_family_key(document_item):
+    """Return the key that groups a document with its other revisions.
+
+    Uses revision_family_id when set; otherwise builds a
+    "legacy::<scope id>::<file name>" key from the owning scope and file name.
+    """
+    family_id = document_item.get("revision_family_id")
+    if family_id:
+        return family_id
+
+    scope_fields = ("public_workspace_id", "group_id", "user_id")
+    owner = next((document_item[f] for f in scope_fields if document_item.get(f)), "unknown")
+    return f"legacy::{owner}::{document_item.get('file_name', '')}"
+
+
+def _document_revision_sort_key(document_item):
+    """Order revisions by version, then upload date string, then the _ts field."""
+    version = _safe_int(document_item.get("version"))
+    uploaded = str(document_item.get("upload_date") or "")
+    timestamp = _safe_int(document_item.get("_ts"))
+    return version, uploaded, timestamp
+
+
+def _choose_current_document(family_documents):
+    """Pick the highest-sorting revision, preferring those flagged is_current_version=True."""
+    flagged = [doc for doc in family_documents if doc.get("is_current_version") is True]
+    return max(flagged or family_documents, key=_document_revision_sort_key)
+
+
+def select_current_documents(documents):
+    """Return one current document per revision family.
+
+    Families appear in the order their first document occurs in `documents`;
+    a falsy `documents` yields an empty list.
+    """
+    grouped = {}
+    for item in documents or []:
+        key = _get_document_family_key(item)
+        grouped.setdefault(key, []).append(item)
+
+    return [_choose_current_document(members) for members in grouped.values()]
+
+
+def sort_documents(documents, sort_by="_ts", sort_order="DESC"):
+    """Return documents sorted by a field; descending unless sort_order is "asc".
+
+    "_ts" is compared as an integer. Other fields compare numbers numerically
+    and everything else as lower-cased text (None as ""). Keys are tagged so
+    numbers sort before text instead of raising TypeError on mixed values.
+    """
+    def sort_key(document_item):
+        value = document_item.get(sort_by)
+        if sort_by == "_ts":
+            return (0, _safe_int(value))
+        if isinstance(value, (int, float)):
+            return (0, value)
+        return (1, "" if value is None else str(value).lower())
+
+    return sorted(documents or [], key=sort_key, reverse=str(sort_order).lower() != "asc")
+
+
+def _query_accessible_documents(user_id, group_id=None, public_workspace_id=None):
+    """Query every document visible in the scope, including ones shared into it.
+
+    Public workspaces match on ownership only; group and personal scopes also
+    match documents whose shared ID list holds the ID or an entry starting with "<id>,".
+    """
+    cosmos_container = _get_documents_container(group_id=group_id, public_workspace_id=public_workspace_id)
+
+    if public_workspace_id is not None:
+        query = """
+            SELECT *
+            FROM c
+            WHERE c.public_workspace_id = @public_workspace_id
+        """
+        parameters = [{"name": "@public_workspace_id", "value": public_workspace_id}]
+    elif group_id is not None:
+        query = """
+            SELECT *
+            FROM c
+            WHERE c.group_id = @group_id
+                OR ARRAY_CONTAINS(c.shared_group_ids, @group_id)
+                OR EXISTS(SELECT VALUE s FROM s IN c.shared_group_ids WHERE STARTSWITH(s, @group_id_prefix))
+        """
+        parameters = [
+            {"name": "@group_id", "value": group_id},
+            {"name": "@group_id_prefix", "value": f"{group_id},"}
+        ]
+    else:
+        query = """
+            SELECT *
+            FROM c
+            WHERE c.user_id = @user_id
+                OR ARRAY_CONTAINS(c.shared_user_ids, @user_id)
+                OR EXISTS(SELECT VALUE s FROM s IN c.shared_user_ids WHERE STARTSWITH(s, @user_id_prefix))
+        """
+        parameters = [
+            {"name": "@user_id", "value": user_id},
+            {"name": "@user_id_prefix", "value": f"{user_id},"}
+        ]
+
+    matches = cosmos_container.query_items(
+        query=query, parameters=parameters, enable_cross_partition_query=True
+    )
+    return list(matches)
+
+
+def _build_archived_scope_value(scope_value):  # prefix a scope ID with ARCHIVED_SCOPE_PREFIX
+    return f"{ARCHIVED_SCOPE_PREFIX}{scope_value}"
+
+
+def set_document_chunk_visibility(document_item, active=True):
+    """Show or hide a document's search chunks by rewriting their scope fields.
+
+    With active=False the owning scope ID on every chunk is replaced by its
+    archived-prefixed form and share lists are emptied; active=True restores
+    the values from document_item. Returns the number of chunks re-uploaded
+    (0 when the document has no ID or no chunks).
+    """
+    document_id = document_item.get("id")
+    if not document_id:
+        return 0
+
+    group_id = document_item.get("group_id")
+    public_workspace_id = document_item.get("public_workspace_id")
+    user_id = document_item.get("user_id")
+    search_client = _get_search_client(group_id=group_id, public_workspace_id=public_workspace_id)
+
+    # OData string literals escape a single quote by doubling it; without this
+    # an ID containing "'" breaks (or alters) the filter expression.
+    escaped_id = str(document_id).replace("'", "''")
+    chunks = list(search_client.search(search_text="*", filter=f"document_id eq '{escaped_id}'"))
+    if not chunks:
+        return 0
+
+    for chunk in chunks:
+        if public_workspace_id is not None:
+            chunk["public_workspace_id"] = public_workspace_id if active else _build_archived_scope_value(public_workspace_id)
+        elif group_id is not None:
+            chunk["group_id"] = group_id if active else _build_archived_scope_value(group_id)
+            chunk["shared_group_ids"] = document_item.get("shared_group_ids", []) if active else []
+        else:
+            chunk["user_id"] = user_id if active else _build_archived_scope_value(user_id)
+            chunk["shared_user_ids"] = document_item.get("shared_user_ids", []) if active else []
+
+    # NOTE(review): upload_documents sends each chunk back whole — confirm every index field is retrievable.
+    search_client.upload_documents(documents=chunks)
+    return len(chunks)
+
+
+def normalize_document_revision_families(user_id, group_id=None, public_workspace_id=None, document_items=None):
+    """Repair revision bookkeeping so each multi-member family has one current document.
+
+    Documents (queried for the scope unless document_items is given) are
+    grouped by family key. In every family with more than one member, each
+    document gets the shared revision_family_id, the right is_current_version
+    flag, and a search_visibility_state of "active" (current) or "archived"
+    (others); search chunks are re-scoped when visibility flips. Changed
+    documents are upserted. Returns True if any document was changed.
+    """
+    if document_items is None:
+        document_items = _query_accessible_documents(
+            user_id=user_id, group_id=group_id, public_workspace_id=public_workspace_id
+        )
+    cosmos_container = _get_documents_container(group_id=group_id, public_workspace_id=public_workspace_id)
+
+    grouped = {}
+    for item in document_items:
+        grouped.setdefault(_get_document_family_key(item), []).append(item)
+
+    changes_made = False
+    for members in grouped.values():
+        if len(members) <= 1:
+            continue
+
+        current = _choose_current_document(members)
+        family_id = current.get("revision_family_id") or current.get("id")
+
+        for item in members:
+            is_current = item.get("id") == current.get("id")
+            wanted_state = "active" if is_current else "archived"
+            previous_state = item.get("search_visibility_state")
+            dirty = False
+
+            if item.get("revision_family_id") != family_id:
+                item["revision_family_id"] = family_id
+                dirty = True
+            if item.get("is_current_version") != is_current:
+                item["is_current_version"] = is_current
+                dirty = True
+            if previous_state != wanted_state:
+                # Only a real visibility flip touches the search chunks; an unset state is just recorded.
+                if previous_state == "archived" or not is_current:
+                    set_document_chunk_visibility(item, active=is_current)
+                item["search_visibility_state"] = wanted_state
+                dirty = True
+
+            if dirty:
+                cosmos_container.upsert_item(item)
+                changes_made = True
+
+    return changes_made
+
+
+def _get_document_family_items_from_document(document_item, user_id, group_id=None, public_workspace_id=None):
+    """Fetch every stored document sharing this document's file name and owner.
+
+    The owner is the public workspace, else the document's group (falling back
+    to group_id), else the document's user (falling back to user_id).
+    """
+    cosmos_container = _get_documents_container(group_id=group_id, public_workspace_id=public_workspace_id)
+    file_name = document_item.get("file_name")
+
+    if public_workspace_id is not None:
+        query = """
+            SELECT *
+            FROM c
+            WHERE c.file_name = @file_name
+                AND c.public_workspace_id = @public_workspace_id
+        """
+        parameters = [
+            {"name": "@file_name", "value": file_name},
+            {"name": "@public_workspace_id", "value": public_workspace_id},
+        ]
+    elif group_id is not None:
+        query = """
+            SELECT *
+            FROM c
+            WHERE c.file_name = @file_name
+                AND c.group_id = @group_id
+        """
+        parameters = [
+            {"name": "@file_name", "value": file_name},
+            {"name": "@group_id", "value": document_item.get("group_id") or group_id},
+        ]
+    else:
+        query = """
+            SELECT *
+            FROM c
+            WHERE c.file_name = @file_name
+                AND c.user_id = @owner_user_id
+        """
+        parameters = [
+            {"name": "@file_name", "value": file_name},
+            {"name": "@owner_user_id", "value": document_item.get("user_id") or user_id},
+        ]
+
+    matches = cosmos_container.query_items(
+        query=query, parameters=parameters, enable_cross_partition_query=True
+    )
+    return list(matches)
+
+
+def _build_carried_forward_metadata(document_item, is_group=False):
+    """Collect the metadata a new revision inherits from an earlier one.
+
+    Authors are normalised with ensure_list. The share list copied is
+    shared_group_ids when is_group is set, otherwise shared_user_ids.
+    """
+    share_key = "shared_group_ids" if is_group else "shared_user_ids"
+    return {
+        "title": document_item.get("title"),
+        "abstract": document_item.get("abstract"),
+        "keywords": document_item.get("keywords"),
+        "publication_date": document_item.get("publication_date"),
+        "authors": ensure_list(document_item.get("authors")),
+        "document_classification": document_item.get("document_classification", "None"),
+        "tags": document_item.get("tags", []),
+        share_key: document_item.get(share_key, []),
+    }
     
 def create_document(file_name, user_id, document_id, num_file_chunks, status, group_id=None, public_workspace_id=None):
     current_time = datetime.now(timezone.utc).strftime('%Y-%m-%dT%H:%M:%SZ')
@@ -64,14 +598,56 @@ def create_document(file_name, user_id, document_id, num_file_chunks, status, gr
         ]
 
     try:
-        existing_document = list(
+        existing_documents = list(
             cosmos_container.query_items(
                 query=query,
                 parameters=parameters,
                 enable_cross_partition_query=True
             )
         )
-        version = existing_document[0]['version'] + 1 if existing_document else 1
+        existing_documents = sorted(existing_documents, key=_document_revision_sort_key, reverse=True)
+
+        latest_existing_document = existing_documents[0] if existing_documents else None
+        revision_family_id = latest_existing_document.get('revision_family_id') if latest_existing_document else None
+        revision_family_id = revision_family_id or (latest_existing_document.get('id') if latest_existing_document else document_id)
+        version = (_safe_int(latest_existing_document.get('version')) + 1) if latest_existing_document else 1
+
+        if latest_existing_document:
+            carried_forward = _build_carried_forward_metadata(
+                latest_existing_document,
+                is_group=is_group,
+            )
+        else:
+            carried_forward = {
+                'title': None,
+                'abstract': None,
+                'keywords': None,
+                'publication_date': None,
+                'authors': [],
+                'document_classification': 'None',
+                'tags': [],
+                'shared_group_ids': [] if is_group else None,
+                'shared_user_ids': [] if not is_group else None,
+            }
+
+        for existing_document in existing_documents:
+            update_existing_document = False
+
+            if existing_document.get('revision_family_id') != revision_family_id:
+                existing_document['revision_family_id'] = revision_family_id
+                update_existing_document = True
+
+            if existing_document.get('is_current_version') is not False:
+                existing_document['is_current_version'] = False
+                update_existing_document = True
+
+            if existing_document.get('search_visibility_state') != 'archived':
+                set_document_chunk_visibility(existing_document, active=False)
+                existing_document['search_visibility_state'] = 'archived'
+                update_existing_document = True
+
+            if update_existing_document:
+                cosmos_container.upsert_item(existing_document)
         
         if is_public_workspace:
             document_metadata = {
@@ -84,13 +660,25 @@ def create_document(file_name, user_id, document_id, num_file_chunks, status, gr
                 "upload_date": current_time,
                 "last_updated": current_time,
                 "version": version,
+                "revision_family_id": revision_family_id,
+                "is_current_version": True,
+                "search_visibility_state": "active",
                 "status": status,
                 "percentage_complete": 0,
-                "document_classification": "None",
+                "document_classification": carried_forward.get("document_classification", "None"),
                 "type": "document_metadata",
                 "public_workspace_id": public_workspace_id,
                 "user_id": user_id,
-                "tags": []
+                "blob_container": _get_blob_container_name(public_workspace_id=public_workspace_id),
+                "blob_path": None,
+                "archived_blob_path": None,
+                "blob_path_mode": None,
+                "title": carried_forward.get("title"),
+                "abstract": carried_forward.get("abstract"),
+                "keywords": carried_forward.get("keywords"),
+                "publication_date": carried_forward.get("publication_date"),
+                "authors": ensure_list(carried_forward.get("authors")),
+                "tags": carried_forward.get("tags", [])
             }
         elif is_group:
             document_metadata = {
@@ -103,13 +691,25 @@ def create_document(file_name, user_id, document_id, num_file_chunks, status, gr
                 "upload_date": current_time,
                 "last_updated": current_time,
                 "version": version,
+                "revision_family_id": revision_family_id,
+                "is_current_version": True,
+                "search_visibility_state": "active",
                 "status": status,
                 "percentage_complete": 0,
-                "document_classification": "None",
+                "document_classification": carried_forward.get("document_classification", "None"),
                 "type": "document_metadata",
                 "group_id": group_id,
-                "shared_group_ids": [],
-                "tags": []
+                "blob_container": _get_blob_container_name(group_id=group_id),
+                "blob_path": None,
+                "archived_blob_path": None,
+                "blob_path_mode": None,
+                "shared_group_ids": carried_forward.get("shared_group_ids", []),
+                "title": carried_forward.get("title"),
+                "abstract": carried_forward.get("abstract"),
+                "keywords": carried_forward.get("keywords"),
+                "publication_date": carried_forward.get("publication_date"),
+                "authors": ensure_list(carried_forward.get("authors")),
+                "tags": carried_forward.get("tags", [])
             }
         else:
             document_metadata = {
@@ -122,15 +722,27 @@ def create_document(file_name, user_id, document_id, num_file_chunks, status, gr
                 "upload_date": current_time,
                 "last_updated": current_time,
                 "version": version,
+                "revision_family_id": revision_family_id,
+                "is_current_version": True,
+                "search_visibility_state": "active",
                 "status": status,
                 "percentage_complete": 0,
-                "document_classification": "None",
+                "document_classification": carried_forward.get("document_classification", "None"),
                 "type": "document_metadata",
                 "user_id": user_id,
-                "shared_user_ids": [],
+                "blob_container": _get_blob_container_name(),
+                "blob_path": None,
+                "archived_blob_path": None,
+                "blob_path_mode": None,
+                "shared_user_ids": carried_forward.get("shared_user_ids", []),
                 "embedding_tokens": 0,
                 "embedding_model_deployment_name": None,
-                "tags": []
+                "title": carried_forward.get("title"),
+                "abstract": carried_forward.get("abstract"),
+                "keywords": carried_forward.get("keywords"),
+                "publication_date": carried_forward.get("publication_date"),
+                "authors": ensure_list(carried_forward.get("authors")),
+                "tags": carried_forward.get("tags", [])
             }
 
         cosmos_container.upsert_item(document_metadata)
@@ -1379,7 +1991,7 @@ def update_document(**kwargs):
                         chunk_updates['title'] = existing_document.get('title')
                     if 'authors' in updated_fields_requiring_chunk_sync:
                          # Ensure authors is a list for the chunk metadata if needed
-                        chunk_updates['author'] = existing_document.get('authors')
+                        chunk_updates['author'] = ensure_list(existing_document.get('authors'))
                     if 'file_name' in updated_fields_requiring_chunk_sync:
                         chunk_updates['file_name'] = existing_document.get('file_name')
                     if 'document_classification' in updated_fields_requiring_chunk_sync:
@@ -1517,8 +2129,9 @@ def save_chunks(page_text_content, page_number, file_name, user_id, document_id,
         chunk_id = f"{document_id}_{page_number}"
         chunk_keywords = []
         chunk_summary = ""
-        author = []
-        title = ""
+        author = ensure_list(metadata.get('authors')) if metadata else []
+        title = metadata.get('title', '') if metadata else ''
+        document_classification = metadata.get('document_classification', 'None') if metadata else 'None'
         
         # Check if this document has vision analysis and append it to chunk_text
         vision_analysis = metadata.get('vision_analysis')
@@ -1567,7 +2180,7 @@ def save_chunks(page_text_content, page_number, file_name, user_id, document_id,
                 "page_number": page_number,
                 "author": author,
                 "title": title,
-                "document_classification": "None",
+                "document_classification": document_classification,
                 "document_tags": metadata.get('tags', []),
                 "chunk_sequence": page_number,  # or you can keep an incremental idx
                 "upload_date": current_time,
@@ -1589,7 +2202,7 @@ def save_chunks(page_text_content, page_number, file_name, user_id, document_id,
                 "page_number": page_number,
                 "author": author,
                 "title": title,
-                "document_classification": "None",
+                "document_classification": document_classification,
                 "document_tags": metadata.get('tags', []),
                 "chunk_sequence": page_number,  # or you can keep an incremental idx
                 "upload_date": current_time,
@@ -1613,7 +2226,7 @@ def save_chunks(page_text_content, page_number, file_name, user_id, document_id,
                 "page_number": page_number,
                 "author": author,
                 "title": title,
-                "document_classification": "None",
+                "document_classification": document_classification,
                 "document_tags": metadata.get('tags', []),
                 "chunk_sequence": page_number,  # or you can keep an incremental idx
                 "upload_date": current_time,
@@ -2023,7 +2636,10 @@ def update_chunk_metadata(chunk_id, user_id, group_id=None, public_workspace_id=
             
         for field in updatable_fields:
             if field in kwargs:
-                chunk_item[field] = kwargs[field]
+                if field == 'author':
+                    chunk_item[field] = ensure_list(kwargs[field])
+                else:
+                    chunk_item[field] = kwargs[field]
 
         search_client.upload_documents(documents=[chunk_item])
 
@@ -2082,62 +2698,14 @@ def chunk_pdf(input_pdf_path: str, max_pages: int = 500) -> list:
     return chunks
 
 def get_documents(user_id, group_id=None, public_workspace_id=None):
+    """Return ``(jsonify(...), status)``: the sorted current documents with 200, or an error payload with 500."""
-    is_group = group_id is not None
-    is_public_workspace = public_workspace_id is not None
-
-    # Choose the correct cosmos_container and query parameters
-    if is_public_workspace:
-        cosmos_container = cosmos_public_documents_container
-    elif is_group:
-        cosmos_container = cosmos_group_documents_container
-    else:
-        cosmos_container = cosmos_user_documents_container
-
-    if is_public_workspace:
-        query = """
-            SELECT TOP 1 * 
-            FROM c
-            WHERE c.public_workspace_id = @public_workspace_id
-        """
-        parameters = [
-            {"name": "@public_workspace_id", "value": public_workspace_id}
-        ]
-    elif is_group:
-        query = """
-            SELECT *
-            FROM c
-            WHERE c.group_id = @group_id OR ARRAY_CONTAINS(c.shared_group_ids, @group_id)
-        """
-        parameters = [
-            {"name": "@group_id", "value": group_id}
-        ]
-    else:
-        query = """
-            SELECT *
-            FROM c
-            WHERE c.user_id = @user_id OR ARRAY_CONTAINS(c.shared_user_ids, @user_id)
-        """
-        parameters = [
-            {"name": "@user_id", "value": user_id}
-        ]
-    
     try:       
-        documents = list(
-            cosmos_container.query_items(
-                query=query,
-                parameters=parameters, 
-                enable_cross_partition_query=True
-            )
+        accessible_documents = _query_accessible_documents(
+            user_id=user_id, group_id=group_id, public_workspace_id=public_workspace_id,
         )
-
-        latest_documents = {}
-
-        for doc in documents:
-            file_name = doc['file_name']
-            if file_name not in latest_documents or doc['version'] > latest_documents[file_name]['version']:
-                latest_documents[file_name] = doc
-                
-        return jsonify({"documents": list(latest_documents.values())}), 200
+        # Narrow to the current documents first, then sort them for the response.
+        current_only = select_current_documents(accessible_documents)
+        return jsonify({"documents": sort_documents(current_only)}), 200
     except Exception as e:
         return jsonify({'error': f'Error retrieving documents: {str(e)}'}), 500
 
@@ -2209,72 +2777,23 @@ def get_document(user_id, document_id, group_id=None, public_workspace_id=None):
 
         return jsonify(document_results[0]), 200
 
-    except Exception as e:
-        return jsonify({'error': f'Error retrieving document: {str(e)}'}), 500
-
-def get_latest_version(document_id, user_id, group_id=None, public_workspace_id=None):
-    is_group = group_id is not None
-    is_public_workspace = public_workspace_id is not None
-
-    # Choose the correct cosmos_container and query parameters
-    if is_public_workspace:
-        cosmos_container = cosmos_public_documents_container
-    elif is_group:
-        cosmos_container = cosmos_group_documents_container
-    else:
-        cosmos_container = cosmos_user_documents_container
-
-    if is_public_workspace:
-        query = """
-            SELECT TOP 1 * 
-            FROM c
-            WHERE c.id = @document_id 
-                AND c.public_workspace_id = @public_workspace_id
-            ORDER BY c.version DESC
-        """
-        parameters = [
-            {"name": "@document_id", "value": document_id},
-            {"name": "@public_workspace_id", "value": public_workspace_id}
-        ]
-    elif is_group:
-        query = """
-            SELECT c.version
-            FROM c
-            WHERE c.id = @document_id
-                AND (c.group_id = @group_id OR ARRAY_CONTAINS(c.shared_group_ids, @group_id))
-            ORDER BY c.version DESC
-        """
-        parameters = [
-            {"name": "@document_id", "value": document_id},
-            {"name": "@group_id", "value": group_id}
-        ]
-    else:
-        query = """
-            SELECT c.version
-            FROM c
-            WHERE c.id = @document_id
-                AND (c.user_id = @user_id OR ARRAY_CONTAINS(c.shared_user_ids, @user_id))
-            ORDER BY c.version DESC
-        """
-        parameters = [
-            {"name": "@document_id", "value": document_id},
-            {"name": "@user_id", "value": user_id}
-        ]
-
-    try:
-        results = list(
-            cosmos_container.query_items(
-                query=query, 
-                parameters=parameters, 
-                enable_cross_partition_query=True
-            )
-        )
-
-        if results:
-            return results[0]['version']
-        else:
-            return None
+    except Exception as e:
+        return jsonify({'error': f'Error retrieving document: {str(e)}'}), 500
 
+def get_latest_version(document_id, user_id, group_id=None, public_workspace_id=None):
+    """Return the 'version' of the document chosen as current in document_id's family, else None."""
+    try:
+        documents_container = _get_documents_container(
+            group_id=group_id, public_workspace_id=public_workspace_id,
+        )
+        anchor_document = documents_container.read_item(item=document_id, partition_key=document_id)
+        family_documents = _get_document_family_items_from_document(
+            anchor_document, user_id=user_id, group_id=group_id, public_workspace_id=public_workspace_id,
+        )
+        chosen = _choose_current_document(family_documents)
+        if not chosen:
+            return None
+        return chosen.get('version')
     except Exception as e:
         return None
 
@@ -2349,51 +2868,37 @@ def get_document_version(user_id, document_id, version, group_id=None, public_wo
     except Exception as e:
         return jsonify({'error': f'Error retrieving document version: {str(e)}'}), 500
 
-def delete_from_blob_storage(document_id, user_id, file_name, group_id=None, public_workspace_id=None):
+def delete_from_blob_storage(document_item, user_id=None, group_id=None, public_workspace_id=None):
     """Delete a document from Azure Blob Storage."""
-    is_group = group_id is not None
-    is_public_workspace = public_workspace_id is not None
-    
-    if is_public_workspace:
-        storage_account_container_name = storage_account_public_documents_container_name
-    elif is_group:
-        storage_account_container_name = storage_account_group_documents_container_name
-    else:
-        storage_account_container_name = storage_account_user_documents_container_name
-    
+
     # Check if enhanced citations are enabled and blob client is available
     settings = get_settings()
     enable_enhanced_citations = settings.get("enable_enhanced_citations", False)
-    
+
     if not enable_enhanced_citations:
         return  # No need to proceed if enhanced citations are disabled
-    
+
     try:
-        # Construct the blob path using the same format as in upload_to_blob
-        blob_path = f"{group_id}/{file_name}" if is_group else f"{user_id}/{file_name}"
-        
-        # Get the blob client
         blob_service_client = CLIENTS.get("storage_account_office_docs_client")
         if not blob_service_client:
-            print(f"Warning: Enhanced citations enabled but blob service client not configured.")
-            return
-            
-        # Get container client
-        container_client = blob_service_client.get_container_client(storage_account_container_name)
-        if not container_client:
-            print(f"Warning: Could not get container client for {storage_account_container_name}")
+            print("Warning: Enhanced citations enabled but blob service client not configured.")
             return
-            
-        # Get blob client
-        blob_client = container_client.get_blob_client(blob_path)
-        
-        # Delete the blob if it exists
-        if blob_client.exists():
-            blob_client.delete_blob()
-            print(f"Successfully deleted blob at {blob_path}")
-        else:
-            print(f"No blob found at {blob_path} to delete")
-            
+
+        delete_targets = get_document_blob_delete_targets(
+            document_item,
+            user_id=user_id,
+            group_id=group_id,
+            public_workspace_id=public_workspace_id,
+        )
+
+        for container_name, blob_path in delete_targets:
+            blob_client = blob_service_client.get_blob_client(container=container_name, blob=blob_path)
+            if blob_client.exists():
+                blob_client.delete_blob()
+                print(f"Successfully deleted blob at {container_name}/{blob_path}")
+            else:
+                print(f"No blob found at {container_name}/{blob_path} to delete")
+
     except Exception as e:
         print(f"Error deleting document from blob storage: {str(e)}")
         # Don't raise the exception, as we want the Cosmos DB deletion to proceed
@@ -2466,13 +2971,14 @@ def delete_document(user_id, document_id, group_id=None, public_workspace_id=Non
             if document_item.get('user_id') != user_id:
                 raise Exception("Unauthorized access to document - only document owner can delete")
             
-        # Get the file name from the document to use for blob deletion
-        file_name = document_item.get('file_name')
-
         # Delete from blob storage
         try:
-            if file_name:
-                delete_from_blob_storage(document_id, user_id, file_name, group_id, public_workspace_id)
+            delete_from_blob_storage(
+                document_item,
+                user_id=user_id,
+                group_id=group_id,
+                public_workspace_id=public_workspace_id,
+            )
         except Exception as blob_error:
             # Log the error but continue with Cosmos DB deletion
             print(f"Error deleting from blob storage (continuing with document deletion): {str(blob_error)}")
@@ -2488,6 +2994,81 @@ def delete_document(user_id, document_id, group_id=None, public_workspace_id=Non
     except Exception as e:
         raise
 
+
+def delete_document_revision(user_id, document_id, delete_mode="all_versions", group_id=None, public_workspace_id=None):
+    """Delete one revision of a document, or every revision in its family.
+
+    delete_mode "all_versions" deletes every family member and its chunks.
+    "current_only" deletes only document_id; if that document was the one
+    chosen as the family's current revision, a remaining revision is promoted
+    (flagged current/active, blob alias promoted, chunks activated, upserted).
+
+    Returns a dict with deleted_mode, deleted_document_ids and
+    promoted_document_id. Raises ValueError for an unknown delete_mode.
+    """
+    if delete_mode not in {"all_versions", "current_only"}:
+        raise ValueError("Unsupported delete mode")
+
+    scope = {'group_id': group_id, 'public_workspace_id': public_workspace_id}
+
+    def _purge(revision_id):
+        # Same order for every revision: delete_document, then its search chunks.
+        delete_document(user_id=user_id, document_id=revision_id, **scope)
+        delete_document_chunks(document_id=revision_id, **scope)
+
+    cosmos_container = _get_documents_container(**scope)
+    target_document = cosmos_container.read_item(item=document_id, partition_key=document_id)
+    family_documents = _get_document_family_items_from_document(
+        target_document,
+        user_id=user_id,
+        **scope,
+    )
+    current_document = _choose_current_document(family_documents)
+    target_is_current = current_document and current_document.get('id') == document_id
+
+    if delete_mode == "all_versions":
+        deleted_document_ids = []
+        for family_document in family_documents:
+            _purge(family_document['id'])
+            deleted_document_ids.append(family_document['id'])
+
+        return {
+            'deleted_mode': 'all_versions',
+            'deleted_document_ids': deleted_document_ids,
+            'promoted_document_id': None,
+        }
+
+    _purge(document_id)
+
+    result = {
+        'deleted_mode': 'current_only',
+        'deleted_document_ids': [document_id],
+        'promoted_document_id': None,
+    }
+    if not target_is_current:
+        return result
+
+    remaining_documents = [doc for doc in family_documents if doc.get('id') != document_id]
+    if not remaining_documents:
+        return result
+
+    promoted_document = _choose_current_document(remaining_documents)
+    inherited_family_id = (
+        target_document.get('revision_family_id')
+        or promoted_document.get('revision_family_id')
+        or promoted_document.get('id')
+    )
+    promoted_document['revision_family_id'] = inherited_family_id
+    promoted_document['is_current_version'] = True
+    promoted_document['search_visibility_state'] = 'active'
+    _promote_document_blob_to_current_alias(promoted_document, user_id=user_id, **scope)
+    # Re-activate the chunks first; the metadata upsert is the final step.
+    set_document_chunk_visibility(promoted_document, active=True)
+    cosmos_container.upsert_item(promoted_document)
+
+    result['promoted_document_id'] = promoted_document.get('id')
+    return result
+
 def delete_document_chunks(document_id, group_id=None, public_workspace_id=None):
     """Delete document chunks from Azure Cognitive Search index."""
 
@@ -2533,66 +3114,26 @@ def delete_document_version_chunks(document_id, version, group_id=None, public_w
     )
 
 def get_document_versions(user_id, document_id, group_id=None, public_workspace_id=None):
+    """Return id, file_name, version, upload_date and is_current_version per family revision ([] on any error)."""
-    """ Get all versions of a document for a user."""
-    is_group = group_id is not None
-    is_public_workspace = public_workspace_id is not None
-
-    if is_public_workspace:
-        cosmos_container = cosmos_public_documents_container
-    elif is_group:
-        cosmos_container = cosmos_group_documents_container
-    else:
-        cosmos_container = cosmos_user_documents_container
-
-    if is_public_workspace:
-        query = """
-            SELECT c.id, c.file_name, c.version, c.upload_date
-            FROM c
-            WHERE c.id = @document_id 
-                AND c.public_workspace_id = @public_workspace_id
-            ORDER BY c.version DESC
-        """
-        parameters = [
-            {"name": "@document_id", "value": document_id},
-            {"name": "@public_workspace_id", "value": public_workspace_id}
-        ]
-    elif is_group:
-        query = """
-            SELECT c.id, c.file_name, c.version, c.upload_date
-            FROM c
-            WHERE c.id = @document_id
-                AND (c.group_id = @group_id OR ARRAY_CONTAINS(c.shared_group_ids, @group_id))
-            ORDER BY c.version DESC
-        """
-        parameters = [
-            {"name": "@document_id", "value": document_id},
-            {"name": "@group_id", "value": group_id}
-        ]
-    else:
-        query = """
-            SELECT c.id, c.file_name, c.version, c.upload_date
-            FROM c
-            WHERE c.id = @document_id
-                AND (c.user_id = @user_id OR ARRAY_CONTAINS(c.shared_user_ids, @user_id))
-            ORDER BY c.version DESC
-        """
-        parameters = [
-            {"name": "@document_id", "value": document_id},
-            {"name": "@user_id", "value": user_id}
-        ]
-
     try:
-        versions_results = list(
-            cosmos_container.query_items(
-                query=query, 
-                parameters=parameters, 
-                enable_cross_partition_query=True
-            )
+        cosmos_container = _get_documents_container(group_id=group_id, public_workspace_id=public_workspace_id)
+        target_document = cosmos_container.read_item(item=document_id, partition_key=document_id)
+        family_documents = _get_document_family_items_from_document(
+            target_document, user_id=user_id, group_id=group_id, public_workspace_id=public_workspace_id,
         )
-
-        if not versions_results:
-            return []
-        return versions_results
+        # Resolve the current revision once instead of per row, and tolerate a None result.
+        current_document = _choose_current_document(family_documents)
+        current_id = current_document.get('id') if current_document else None
+        return [
+            {
+                'id': doc.get('id'),
+                'file_name': doc.get('file_name'),
+                'version': doc.get('version'),
+                'upload_date': doc.get('upload_date'),
+                'is_current_version': current_document is not None and doc.get('id') == current_id,
+            }
+            for doc in sorted(family_documents, key=_document_revision_sort_key, reverse=True)
+        ]
 
     except Exception as e:
         return []
@@ -2697,7 +3238,7 @@ def process_metadata_extraction_background(document_id, user_id, group_id=None,
             "document_id": document_id,
             "user_id": user_id,
             "title": metadata.get('title'),
-            "authors": metadata.get('authors'),
+            "authors": ensure_list(metadata.get('authors')),
             "abstract": metadata.get('abstract'),
             "keywords": metadata.get('keywords'),
             "publication_date": metadata.get('publication_date'),
@@ -3221,23 +3762,34 @@ def clean_json_codeFence(response_content: str) -> str:
 
 def ensure_list(value, delimiters=r"[;,]"):
     """
-    Ensures the provided value is returned as a list of strings.
-    - If `value` is already a list, it is returned as-is.
-    - If `value` is a string, it is split on the given delimiters
-      (default: commas and semicolons).
-    - Otherwise, return an empty list.
+    Normalize `value` into a list of stripped, non-empty strings.
+    - None yields an empty list.
+    - A string is split on `delimiters` (a regex; commas and semicolons by default).
+    - A list, tuple, or set is normalized element by element.
+    - Any other value is treated as a single item and converted with str().
     """
-    if isinstance(value, list):
-        return value
-    elif isinstance(value, str):
-        # Split on the given delimiters (commas, semicolons, etc.)
-        items = re.split(delimiters, value)
-        # Strip whitespace and remove empty strings
-        items = [item.strip() for item in items if item.strip()]
-        return items
-    else:
+    if value is None:
         return []
 
+    if isinstance(value, str):
+        candidates = re.split(delimiters, value)
+    elif isinstance(value, (list, tuple, set)):
+        candidates = value
+    else:
+        candidates = (value,)
+
+    # None entries are skipped up front so they never turn into the text "None".
+    stringified = (
+        candidate if isinstance(candidate, str) else str(candidate)
+        for candidate in candidates
+        if candidate is not None
+    )
+
+    # Trim surrounding whitespace and discard anything left blank.
+    return [
+        text for text in (item.strip() for item in stringified) if text
+    ]
+
 def is_effectively_empty(value):
     """
     Returns True if the value is 'worthless' or empty.
@@ -3548,27 +4100,42 @@ def analyze_image_with_vision_model(image_path, user_id, document_id, settings):
 def upload_to_blob(temp_file_path, user_id, document_id, blob_filename, update_callback, group_id=None, public_workspace_id=None):
     """Uploads the file to Azure Blob Storage."""
 
-    is_group = group_id is not None
-    is_public_workspace = public_workspace_id is not None
-    
-    if is_public_workspace:
-        storage_account_container_name = storage_account_public_documents_container_name
-    elif is_group:
-        storage_account_container_name = storage_account_group_documents_container_name
-    else:
-        storage_account_container_name = storage_account_user_documents_container_name
-
     try:
-        if is_public_workspace:
-            blob_path = f"{public_workspace_id}/{blob_filename}"
-        elif is_group:
-            blob_path = f"{group_id}/{blob_filename}"
-        else:
-            blob_path = f"{user_id}/{blob_filename}"
+        cosmos_container = _get_documents_container(group_id=group_id, public_workspace_id=public_workspace_id)
+        current_document = cosmos_container.read_item(item=document_id, partition_key=document_id)
+        storage_account_container_name = current_document.get("blob_container") or _get_blob_container_name(
+            group_id=group_id,
+            public_workspace_id=public_workspace_id,
+        )
+        blob_path = build_current_blob_path(
+            blob_filename,
+            user_id=user_id,
+            group_id=group_id,
+            public_workspace_id=public_workspace_id,
+        )
 
-        blob_service_client = CLIENTS.get("storage_account_office_docs_client")
-        if not blob_service_client:
-            raise Exception("Blob service client not available or not configured.")
+        previous_family_documents = [
+            family_document
+            for family_document in _get_document_family_items_from_document(
+                current_document,
+                user_id=user_id,
+                group_id=group_id,
+                public_workspace_id=public_workspace_id,
+            )
+            if family_document.get("id") != document_id
+        ]
+        previous_document = max(previous_family_documents, key=_document_revision_sort_key) if previous_family_documents else None
+        if previous_document:
+            archived_blob_path = _archive_previous_document_blob(
+                previous_document,
+                user_id=user_id,
+                group_id=group_id,
+                public_workspace_id=public_workspace_id,
+            )
+            if archived_blob_path:
+                cosmos_container.upsert_item(previous_document)
+
+        blob_service_client = _get_blob_service_client()
 
         blob_client = blob_service_client.get_blob_client(
             container=storage_account_container_name,
@@ -3577,8 +4144,8 @@ def upload_to_blob(temp_file_path, user_id, document_id, blob_filename, update_c
 
         metadata = {
             "document_id": str(document_id),
-            "group_id": str(group_id) if is_group else None,
-            "user_id": str(user_id) if not is_group else None
+            "group_id": str(group_id) if group_id is not None else None,
+            "user_id": str(user_id) if group_id is None else None
         }
 
         metadata = {k: v for k, v in metadata.items() if v is not None}
@@ -3588,6 +4155,13 @@ def upload_to_blob(temp_file_path, user_id, document_id, blob_filename, update_c
         with open(temp_file_path, "rb") as f:
             blob_client.upload_blob(f, overwrite=True, metadata=metadata)
 
+        current_document["blob_container"] = storage_account_container_name
+        current_document["blob_path"] = blob_path
+        current_document["blob_path_mode"] = CURRENT_ALIAS_BLOB_PATH_MODE
+        if current_document.get("archived_blob_path") is None:
+            current_document["archived_blob_path"] = None
+        cosmos_container.upsert_item(current_document)
+
         print(f"Successfully uploaded {blob_filename} to blob storage at {blob_path}")
         return blob_path
 
@@ -4809,6 +5383,173 @@ def process_json(document_id, user_id, temp_file_path, original_filename, enable
     # Return the count of chunks actually saved
     return total_chunks_saved, total_embedding_tokens, embedding_model_name
 
+TABULAR_SCHEMA_SUMMARY_MAX_SHEETS = 8  # sheets named/previewed per workbook summary
+TABULAR_SCHEMA_SUMMARY_MAX_COLUMNS = 12  # columns listed/previewed before truncation
+TABULAR_SCHEMA_SUMMARY_MAX_PREVIEW_ROWS = 3  # data rows read for each preview
+TABULAR_SCHEMA_SUMMARY_MAX_CELL_CHARS = 60  # default character cap for a compacted value
+
+
+def _compact_tabular_schema_value(value, max_chars=TABULAR_SCHEMA_SUMMARY_MAX_CELL_CHARS):
+    """Render value as single-line text of at most max_chars characters ("..." marks truncation)."""
+    text = "" if value is None else " ".join(str(value).split())
+    if len(text) <= max_chars:
+        return text
+    if max_chars < 3:  # no room for the "..." marker: hard-truncate instead of over-running
+        return text[:max(max_chars, 0)]
+    return f"{text[:max_chars - 3]}..."
+
+
+def _compact_tabular_columns(columns, max_columns=TABULAR_SCHEMA_SUMMARY_MAX_COLUMNS):
+    """Return compacted column labels, capped at max_columns plus a "+N more columns" marker."""
+    labels = []
+    for raw_label in columns:
+        compacted = _compact_tabular_schema_value(raw_label, max_chars=80)
+        labels.append(compacted if compacted else "(blank)")
+
+    hidden = len(labels) - max_columns
+    shown = labels[:max_columns]
+    if hidden > 0:
+        shown.append(f"... +{hidden} more columns")
+    return shown
+
+
+def _build_compact_tabular_preview(df_preview):
+    """Render the leading rows/columns of df_preview as compact aligned text.
+
+    Cell values are compacted before the headers are relabelled, so headers
+    that collapse to the same label (e.g. differing only in whitespace)
+    cannot break the per-column transformation.
+    """
+    if df_preview is None or df_preview.empty:
+        return "[No preview rows available]"
+
+    preview_df = df_preview.iloc[
+        :TABULAR_SCHEMA_SUMMARY_MAX_PREVIEW_ROWS,
+        :TABULAR_SCHEMA_SUMMARY_MAX_COLUMNS,
+    ].apply(lambda column: column.map(_compact_tabular_schema_value))
+    preview_df.columns = [
+        _compact_tabular_schema_value(column, max_chars=80) or "(blank)"
+        for column in preview_df.columns
+    ]
+
+    preview_text = preview_df.to_string(index=False)
+    omitted_column_count = len(df_preview.columns) - TABULAR_SCHEMA_SUMMARY_MAX_COLUMNS
+    if omitted_column_count > 0:
+        preview_text += (
+            f"\n[Preview truncated to the first {TABULAR_SCHEMA_SUMMARY_MAX_COLUMNS} columns; "
+            f"{omitted_column_count} additional columns omitted.]"
+        )
+    return preview_text
+
+
+def _build_minimal_tabular_summary(temp_file_path, original_filename, file_ext):
+    """Build a brief best-effort summary naming the file and its columns (CSV) or sheets (Excel)."""
+    plugin_note = "This file is stored in blob storage for detailed analysis via the Tabular Processing plugin."
+
+    if file_ext == '.csv':
+        column_summary = "Column discovery unavailable"
+        try:
+            # nrows=0 parses the header only, so no data rows are loaded.
+            header_df = pandas.read_csv(temp_file_path, keep_default_na=False, dtype=str, nrows=0)
+            compact_columns = _compact_tabular_columns(header_df.columns.tolist())
+            if compact_columns:
+                column_summary = ", ".join(compact_columns)
+        except Exception:
+            pass  # best effort: keep the "unavailable" placeholder
+
+        return (
+            f"Tabular data file: {original_filename}\n"
+            f"Columns: {column_summary}\n"
+            f"{plugin_note}"
+        )
+
+    if file_ext in ('.xlsx', '.xls', '.xlsm'):
+        sheet_summary = "Sheet discovery unavailable"
+        try:
+            engine = 'openpyxl' if file_ext in ('.xlsx', '.xlsm') else 'xlrd'
+            # Close the workbook handle as soon as the sheet names have been read.
+            with pandas.ExcelFile(temp_file_path, engine=engine) as excel_file:
+                sheet_names = list(excel_file.sheet_names)
+            visible_sheets = [
+                _compact_tabular_schema_value(sheet_name, max_chars=80)
+                for sheet_name in sheet_names[:TABULAR_SCHEMA_SUMMARY_MAX_SHEETS]
+            ]
+            omitted_sheet_count = len(sheet_names) - TABULAR_SCHEMA_SUMMARY_MAX_SHEETS
+            if visible_sheets:
+                sheet_summary = ", ".join(visible_sheets)
+                if omitted_sheet_count > 0:
+                    sheet_summary += f", ... +{omitted_sheet_count} more sheets"
+        except Exception:
+            pass  # best effort: keep the "unavailable" placeholder
+
+        return (
+            f"Tabular workbook: {original_filename}\n"
+            f"Sheets: {sheet_summary}\n"
+            f"{plugin_note}"
+        )
+
+    return f"Tabular file: {original_filename}\n{plugin_note}"
+
+
+def _build_tabular_schema_summary(temp_file_path, original_filename, file_ext):
+    """Build a schema summary (columns plus preview rows) for a CSV or Excel file.
+
+    Raises ValueError for any other extension; read/parse errors are not caught here.
+    """
+    plugin_note = "This file is available for detailed analysis via the Tabular Processing plugin."
+
+    if file_ext == '.csv':
+        df_preview = pandas.read_csv(
+            temp_file_path, keep_default_na=False, dtype=str, nrows=TABULAR_SCHEMA_SUMMARY_MAX_PREVIEW_ROWS,
+        )
+        compact_columns = _compact_tabular_columns(df_preview.columns.tolist())
+        preview_rows = _build_compact_tabular_preview(df_preview)
+
+        return (
+            f"Tabular data file: {original_filename}\n"
+            f"Columns ({len(df_preview.columns)}): {', '.join(compact_columns) if compact_columns else 'None'}\n"
+            f"Preview (first {min(len(df_preview), TABULAR_SCHEMA_SUMMARY_MAX_PREVIEW_ROWS)} rows):\n{preview_rows}\n\n"
+            f"{plugin_note}"
+        )
+
+    # Reject unknown extensions up front so the workbook branch below stays flat.
+    if file_ext not in ('.xlsx', '.xls', '.xlsm'):
+        raise ValueError(f"Unsupported tabular file type: {file_ext}")
+
+    engine = 'openpyxl' if file_ext in ('.xlsx', '.xlsm') else 'xlrd'
+    workbook_sections = []
+    # The context manager releases the workbook file handle once parsing is done.
+    with pandas.ExcelFile(temp_file_path, engine=engine) as excel_file:
+        all_sheet_names = list(excel_file.sheet_names)
+        visible_sheet_names = all_sheet_names[:TABULAR_SCHEMA_SUMMARY_MAX_SHEETS]
+        for sheet_name in visible_sheet_names:
+            df_preview = excel_file.parse(
+                sheet_name, keep_default_na=False, dtype=str, nrows=TABULAR_SCHEMA_SUMMARY_MAX_PREVIEW_ROWS,
+            )
+            compact_columns = _compact_tabular_columns(df_preview.columns.tolist())
+            preview_rows = _build_compact_tabular_preview(df_preview)
+            workbook_sections.append(
+                f"Sheet: {_compact_tabular_schema_value(sheet_name, max_chars=80)}\n"
+                f"Columns ({len(df_preview.columns)}): {', '.join(compact_columns) if compact_columns else 'None'}\n"
+                f"Preview (first {min(len(df_preview), TABULAR_SCHEMA_SUMMARY_MAX_PREVIEW_ROWS)} rows):\n{preview_rows}"
+            )
+
+    sheet_summary = ", ".join(
+        _compact_tabular_schema_value(sheet_name, max_chars=80)
+        for sheet_name in visible_sheet_names
+    )
+    omitted_sheet_count = len(all_sheet_names) - TABULAR_SCHEMA_SUMMARY_MAX_SHEETS
+    if omitted_sheet_count > 0:
+        sheet_summary += f", ... +{omitted_sheet_count} more sheets"
+
+    return (
+        f"Tabular workbook: {original_filename}\n"
+        f"Sheets ({len(all_sheet_names)}): {sheet_summary if sheet_summary else 'None'}\n\n"
+        + "\n\n".join(workbook_sections)
+        + f"\n\n{plugin_note}"
+    )
+
+
 def process_single_tabular_sheet(df, document_id, user_id, file_name, update_callback, group_id=None, public_workspace_id=None):
     """Chunks a pandas DataFrame from a CSV or Excel sheet."""
     is_group = group_id is not None
@@ -4924,78 +5665,74 @@ def process_tabular(document_id, user_id, temp_file_path, original_filename, fil
     # When enhanced citations is on, index a single schema summary chunk
     # instead of row-by-row chunking. The tabular processing plugin handles analysis.
     if enable_enhanced_citations:
-        try:
-            if file_ext == '.csv':
-                df_preview = pandas.read_csv(temp_file_path, keep_default_na=False, dtype=str, nrows=5)
-                full_df = pandas.read_csv(temp_file_path, keep_default_na=False, dtype=str)
-                row_count = len(full_df)
-                columns = [str(column) for column in df_preview.columns]
-                preview_rows = df_preview.head(5).to_string(index=False)
-
-                schema_summary = (
-                    f"Tabular data file: {original_filename}\n"
-                    f"Columns ({len(columns)}): {', '.join(columns)}\n"
-                    f"Total rows: {row_count}\n"
-                    f"Preview (first 5 rows):\n{preview_rows}\n\n"
-                    f"This file is available for detailed analysis via the Tabular Processing plugin."
-                )
-            elif file_ext in ('.xlsx', '.xls', '.xlsm'):
-                engine = 'openpyxl' if file_ext in ('.xlsx', '.xlsm') else 'xlrd'
-                excel_file = pandas.ExcelFile(temp_file_path, engine=engine)
-                workbook_sections = []
-
-                for sheet_name in excel_file.sheet_names:
-                    df_preview = excel_file.parse(sheet_name, keep_default_na=False, dtype=str, nrows=3)
-                    full_df = excel_file.parse(sheet_name, keep_default_na=False, dtype=str)
-                    columns = [str(column) for column in df_preview.columns]
-                    preview_rows = df_preview.head(3).to_string(index=False)
-                    workbook_sections.append(
-                        f"Sheet: {sheet_name}\n"
-                        f"Columns ({len(columns)}): {', '.join(columns)}\n"
-                        f"Total rows: {len(full_df)}\n"
-                        f"Preview (first 3 rows):\n{preview_rows}"
-                    )
-
-                schema_summary = (
-                    f"Tabular workbook: {original_filename}\n"
-                    f"Sheets ({len(excel_file.sheet_names)}): {', '.join(excel_file.sheet_names)}\n\n"
-                    + "\n\n".join(workbook_sections)
-                    + "\n\nThis workbook is available for detailed analysis via the Tabular Processing plugin."
-                )
-            else:
-                raise ValueError(f"Unsupported tabular file type: {file_ext}")
+        save_args = {
+            "page_number": 1,
+            "file_name": original_filename,
+            "user_id": user_id,
+            "document_id": document_id,
+        }
+        if is_public_workspace:
+            save_args["public_workspace_id"] = public_workspace_id
+        elif is_group:
+            save_args["group_id"] = group_id
 
+        try:
+            schema_summary = _build_tabular_schema_summary(
+                temp_file_path,
+                original_filename,
+                file_ext,
+            )
             update_callback(number_of_pages=1, status=f"Indexing schema summary for {original_filename}...")
+        except Exception as schema_error:
+            log_event(
+                f"[process_tabular] Error building bounded schema summary for {original_filename}; using compact fallback summary: {schema_error}",
+                level=logging.WARNING,
+            )
+            schema_summary = _build_minimal_tabular_summary(
+                temp_file_path,
+                original_filename,
+                file_ext,
+            )
+            update_callback(number_of_pages=1, status=f"Indexing compact schema summary for {original_filename}...")
 
-            save_args = {
-                "page_text_content": schema_summary,
-                "page_number": 1,
-                "file_name": original_filename,
-                "user_id": user_id,
-                "document_id": document_id
-            }
-            if is_public_workspace:
-                save_args["public_workspace_id"] = public_workspace_id
-            elif is_group:
-                save_args["group_id"] = group_id
-
+        try:
+            save_args["page_text_content"] = schema_summary
             token_usage = save_chunks(**save_args)
-            total_chunks_saved = 1
-            if token_usage:
-                total_embedding_tokens = token_usage.get('total_tokens', 0)
-                embedding_model_name = token_usage.get('model_deployment_name')
+        except Exception as schema_index_error:
+            minimal_summary = _build_minimal_tabular_summary(
+                temp_file_path,
+                original_filename,
+                file_ext,
+            )
 
-            # Don't return here — fall through to metadata extraction below
-        except Exception as e:
-            log_event(f"[process_tabular] Error creating schema summary, falling back to row-by-row: {e}", level=logging.WARNING)
-            # Fall through to existing row-by-row processing
+            if minimal_summary == schema_summary:
+                raise Exception(
+                    f"Failed indexing enhanced tabular schema summary for {original_filename}: {schema_index_error}"
+                ) from schema_index_error
+
+            log_event(
+                f"[process_tabular] Retrying compact schema summary for {original_filename} after schema summary indexing error: {schema_index_error}",
+                level=logging.WARNING,
+            )
+            update_callback(number_of_pages=1, status=f"Retrying compact schema summary for {original_filename}...")
 
-    # Only do row-by-row chunking if schema-only didn't produce chunks
-    if total_chunks_saved == 0:
+            try:
+                save_args["page_text_content"] = minimal_summary
+                token_usage = save_chunks(**save_args)
+            except Exception as minimal_summary_error:
+                raise Exception(
+                    f"Failed indexing enhanced tabular summary for {original_filename}: {minimal_summary_error}"
+                ) from minimal_summary_error
+
+        total_chunks_saved = 1
+        if token_usage:
+            total_embedding_tokens = token_usage.get('total_tokens', 0)
+            embedding_model_name = token_usage.get('model_deployment_name')
+
+    # Only do row-by-row chunking when enhanced citations is disabled.
+    if total_chunks_saved == 0 and not enable_enhanced_citations:
         try:
             if file_ext == '.csv':
-                # Process CSV
-                # Read CSV, attempt to infer header, keep data as string initially
                 df = pandas.read_csv(
                     temp_file_path,
                     keep_default_na=False,
@@ -5025,7 +5762,6 @@ def process_tabular(document_id, user_id, temp_file_path, original_filename, fil
                     total_chunks_saved = result
 
             elif file_ext in ('.xlsx', '.xls', '.xlsm'):
-                # Process Excel (potentially multiple sheets)
                 excel_file = pandas.ExcelFile(
                     temp_file_path,
                     engine='openpyxl' if file_ext in ('.xlsx', '.xlsm') else 'xlrd'
@@ -5036,11 +5772,7 @@ def process_tabular(document_id, user_id, temp_file_path, original_filename, fil
                 accumulated_total_chunks = 0
                 for sheet_name in sheet_names:
                     update_callback(status=f"Processing sheet '{sheet_name}'...")
-                    # Read specific sheet, get values (not formulas), keep data as string
-                    # Note: pandas typically reads values, not formulas by default.
                     df = excel_file.parse(sheet_name, keep_default_na=False, dtype=str)
-
-                    # Create effective filename for this sheet
                     effective_filename = f"{base_name}-{sheet_name}{ext}" if len(sheet_names) > 1 else original_filename
 
                     args = {
@@ -5066,7 +5798,7 @@ def process_tabular(document_id, user_id, temp_file_path, original_filename, fil
                     else:
                         accumulated_total_chunks += result
 
-                total_chunks_saved = accumulated_total_chunks # Total across all sheets
+                total_chunks_saved = accumulated_total_chunks
 
         except pandas.errors.EmptyDataError:
             log_event(f"[process_tabular] Warning: Tabular file or sheet is empty: {original_filename}", level=logging.WARNING)
@@ -5074,7 +5806,6 @@ def process_tabular(document_id, user_id, temp_file_path, original_filename, fil
         except Exception as e:
             raise Exception(f"Failed processing Tabular file {original_filename}: {e}")
 
-    # Extract metadata if enabled and chunks were processed
     settings = get_settings()
     enable_extract_meta_data = settings.get('enable_extract_meta_data', False)
     if enable_extract_meta_data and total_chunks_saved > 0:
@@ -5091,7 +5822,7 @@ def process_tabular(document_id, user_id, temp_file_path, original_filename, fil
                 args["group_id"] = group_id
 
             document_metadata = extract_document_metadata(**args)
-            
+
             if document_metadata:
                 update_fields = {k: v for k, v in document_metadata.items() if v is not None and v != ""}
                 if update_fields:
@@ -5102,7 +5833,7 @@ def process_tabular(document_id, user_id, temp_file_path, original_filename, fil
         except Exception as e:
             print(f"Warning: Error extracting final metadata for Tabular document {document_id}: {str(e)}")
             update_callback(status=f"Processing complete (metadata extraction warning)")
-            
+
     return total_chunks_saved, total_embedding_tokens, embedding_model_name
 
 def process_di_document(document_id, user_id, temp_file_path, original_filename, file_ext, enable_enhanced_citations, update_callback, group_id=None, public_workspace_id=None):
@@ -6775,10 +7506,10 @@ def get_workspace_tags(user_id, group_id=None, public_workspace_id=None):
         workspace_type = 'personal'
     
     try:
-        # Query all documents with tags
+        # Query documents with enough metadata to collapse revisions to the current version.
         if is_public_workspace:
             query = """
-                SELECT c.tags
+                SELECT c.id, c.file_name, c.version, c._ts, c.upload_date, c.tags, c.revision_family_id, c.is_current_version
                 FROM c
                 WHERE c.public_workspace_id = @partition_key
                     AND IS_DEFINED(c.tags)
@@ -6786,7 +7517,7 @@ def get_workspace_tags(user_id, group_id=None, public_workspace_id=None):
             """
         elif is_group:
             query = """
-                SELECT c.tags
+                SELECT c.id, c.file_name, c.version, c._ts, c.upload_date, c.tags, c.revision_family_id, c.is_current_version, c.group_id
                 FROM c
                 WHERE c.group_id = @partition_key
                     AND IS_DEFINED(c.tags)
@@ -6794,7 +7525,7 @@ def get_workspace_tags(user_id, group_id=None, public_workspace_id=None):
             """
         else:
             query = """
-                SELECT c.tags
+                SELECT c.id, c.file_name, c.version, c._ts, c.upload_date, c.tags, c.revision_family_id, c.is_current_version, c.user_id
                 FROM c
                 WHERE c.user_id = @partition_key
                     AND IS_DEFINED(c.tags)
@@ -6811,7 +7542,9 @@ def get_workspace_tags(user_id, group_id=None, public_workspace_id=None):
             )
         )
         
-        # Count tag occurrences
+        documents = select_current_documents(documents)
+
+        # Count tag occurrences on current revisions only.
         tag_counts = {}
         for doc in documents:
             for tag in doc.get('tags', []):
@@ -6990,22 +7723,16 @@ def propagate_tags_to_blob_metadata(document_id, tags, user_id, group_id=None, p
             cosmos_container = cosmos_user_documents_container
 
         doc_item = cosmos_container.read_item(document_id, partition_key=document_id)
-        file_name = doc_item.get('file_name')
-        if not file_name:
-            print(f"Warning: No file_name found for document {document_id}, skipping blob metadata update")
+        storage_account_container_name, blob_path = get_document_blob_storage_info(
+            doc_item,
+            user_id=user_id,
+            group_id=group_id,
+            public_workspace_id=public_workspace_id,
+        )
+        if not blob_path:
+            print(f"Warning: No blob path found for document {document_id}, skipping blob metadata update")
             return
 
-        # Determine container and blob path
-        if is_public_workspace:
-            storage_account_container_name = storage_account_public_documents_container_name
-            blob_path = f"{public_workspace_id}/{file_name}"
-        elif is_group:
-            storage_account_container_name = storage_account_group_documents_container_name
-            blob_path = f"{group_id}/{file_name}"
-        else:
-            storage_account_container_name = storage_account_user_documents_container_name
-            blob_path = f"{user_id}/{file_name}"
-
         blob_service_client = CLIENTS.get("storage_account_office_docs_client")
         if not blob_service_client:
             print(f"Warning: Blob service client not available, skipping blob metadata update")
diff --git a/application/single_app/functions_search.py b/application/single_app/functions_search.py
index 4ea75404..6851778f 100644
--- a/application/single_app/functions_search.py
+++ b/application/single_app/functions_search.py
@@ -120,6 +120,37 @@ def hybrid_search(query, user_id, document_id=None, document_ids=None, top_n=12,
     elif document_id:
         document_ids = [document_id]
 
+    normalization_changed = False
+    try:
+        from functions_documents import normalize_document_revision_families
+
+        if doc_scope in ("all", "personal"):
+            normalization_changed = normalize_document_revision_families(user_id=user_id) or normalization_changed
+
+        if doc_scope in ("all", "group") and active_group_ids:
+            for current_group_id in active_group_ids:
+                normalization_changed = normalize_document_revision_families(
+                    user_id=user_id,
+                    group_id=current_group_id,
+                ) or normalization_changed
+
+        if doc_scope in ("all", "public"):
+            if doc_scope == "public" and active_public_workspace_id:
+                public_workspace_ids = [active_public_workspace_id]
+            else:
+                public_workspace_ids = get_user_visible_public_workspace_ids_from_settings(user_id)
+
+            for workspace_id in public_workspace_ids:
+                normalization_changed = normalize_document_revision_families(
+                    user_id=user_id,
+                    public_workspace_id=workspace_id,
+                ) or normalization_changed
+    except Exception as normalization_error:
+        debug_print(
+            f"Revision normalization failed before search: {normalization_error}",
+            "SEARCH",
+        )
+
     # Build document ID filter clause
     doc_id_filter = None
     if document_ids and len(document_ids) > 0:
@@ -144,13 +175,15 @@ def hybrid_search(query, user_id, document_id=None, document_ids=None, top_n=12,
     )
 
     # Check cache first (pass scope parameters for correct partition key)
-    cached_results = get_cached_search_results(
-        cache_key,
-        user_id,
-        doc_scope,
-        active_group_ids=active_group_ids,
-        active_public_workspace_id=active_public_workspace_id
-    )
+    cached_results = None
+    if not normalization_changed:
+        cached_results = get_cached_search_results(
+            cache_key,
+            user_id,
+            doc_scope,
+            active_group_ids=active_group_ids,
+            active_public_workspace_id=active_public_workspace_id
+        )
     if cached_results is not None:
         debug_print(
             "Returning CACHED search results",
@@ -361,38 +394,44 @@ def hybrid_search(query, user_id, document_id=None, document_ids=None, top_n=12,
 
     elif doc_scope == "personal":
         if doc_id_filter:
+            user_base_filter = (
+                (
+                    f"(user_id eq '{user_id}' or shared_user_ids/any(u: u eq '{user_id},approved')) "
+                    if enable_file_sharing else
+                    f"user_id eq '{user_id}' "
+                ) +
+                f"and {doc_id_filter}"
+            )
+            user_filter = f"{user_base_filter} and {tags_filter_clause}" if tags_filter_clause else user_base_filter
+
             user_results = search_client_user.search(
                 search_text=query,
                 vector_queries=[vector_query],
-                filter=(
-                    (
-                        f"(user_id eq '{user_id}' or shared_user_ids/any(u: u eq '{user_id},approved')) "
-                        if enable_file_sharing else
-                        f"user_id eq '{user_id}' "
-                    ) +
-                    f"and {doc_id_filter}"
-                ),
+                filter=user_filter,
                 query_type="semantic",
                 semantic_configuration_name="nexus-user-index-semantic-configuration",
                 query_caption="extractive",
                 query_answer="extractive",
-                select=["id", "chunk_text", "chunk_id", "file_name", "user_id", "version", "chunk_sequence", "upload_date", "document_classification", "page_number", "author", "chunk_keywords", "title", "chunk_summary"]
+                select=["id", "chunk_text", "chunk_id", "file_name", "user_id", "version", "chunk_sequence", "upload_date", "document_classification", "document_tags", "page_number", "author", "chunk_keywords", "title", "chunk_summary"]
             )
             results = extract_search_results(user_results, top_n)
         else:
+            user_base_filter = (
+                f"(user_id eq '{user_id}' or shared_user_ids/any(u: u eq '{user_id},approved')) "
+                if enable_file_sharing else
+                f"user_id eq '{user_id}' "
+            )
+            user_filter = f"{user_base_filter} and {tags_filter_clause}" if tags_filter_clause else user_base_filter.strip()
+
             user_results = search_client_user.search(
                 search_text=query,
                 vector_queries=[vector_query],
-                filter=(
-                    f"(user_id eq '{user_id}' or shared_user_ids/any(u: u eq '{user_id},approved')) "
-                    if enable_file_sharing else
-                    f"user_id eq '{user_id}' "
-                ),
+                filter=user_filter,
                 query_type="semantic",
                 semantic_configuration_name="nexus-user-index-semantic-configuration",
                 query_caption="extractive",
                 query_answer="extractive",
-                select=["id", "chunk_text", "chunk_id", "file_name", "user_id", "version", "chunk_sequence", "upload_date", "document_classification", "page_number", "author", "chunk_keywords", "title", "chunk_summary"]
+                select=["id", "chunk_text", "chunk_id", "file_name", "user_id", "version", "chunk_sequence", "upload_date", "document_classification", "document_tags", "page_number", "author", "chunk_keywords", "title", "chunk_summary"]
             )
             results = extract_search_results(user_results, top_n)
 
@@ -402,33 +441,35 @@ def hybrid_search(query, user_id, document_id=None, document_ids=None, top_n=12,
         elif doc_id_filter:
             group_conditions = " or ".join([f"group_id eq '{gid}'" for gid in active_group_ids])
             shared_conditions = " or ".join([f"shared_group_ids/any(g: g eq '{gid},approved')" for gid in active_group_ids])
+            group_base_filter = f"({group_conditions} or {shared_conditions}) and {doc_id_filter}"
+            group_filter = f"{group_base_filter} and {tags_filter_clause}" if tags_filter_clause else group_base_filter
+
             group_results = search_client_group.search(
                 search_text=query,
                 vector_queries=[vector_query],
-                filter=(
-                    f"({group_conditions} or {shared_conditions}) and {doc_id_filter}"
-                ),
+                filter=group_filter,
                 query_type="semantic",
                 semantic_configuration_name="nexus-group-index-semantic-configuration",
                 query_caption="extractive",
                 query_answer="extractive",
-                select=["id", "chunk_text", "chunk_id", "file_name", "group_id", "version", "chunk_sequence", "upload_date", "document_classification", "page_number", "author", "chunk_keywords", "title", "chunk_summary"]
+                select=["id", "chunk_text", "chunk_id", "file_name", "group_id", "version", "chunk_sequence", "upload_date", "document_classification", "document_tags", "page_number", "author", "chunk_keywords", "title", "chunk_summary"]
             )
             results = extract_search_results(group_results, top_n)
         else:
             group_conditions = " or ".join([f"group_id eq '{gid}'" for gid in active_group_ids])
             shared_conditions = " or ".join([f"shared_group_ids/any(g: g eq '{gid},approved')" for gid in active_group_ids])
+            group_base_filter = f"({group_conditions} or {shared_conditions})"
+            group_filter = f"{group_base_filter} and {tags_filter_clause}" if tags_filter_clause else group_base_filter
+
             group_results = search_client_group.search(
                 search_text=query,
                 vector_queries=[vector_query],
-                filter=(
-                    f"({group_conditions} or {shared_conditions})"
-                ),
+                filter=group_filter,
                 query_type="semantic",
                 semantic_configuration_name="nexus-group-index-semantic-configuration",
                 query_caption="extractive",
                 query_answer="extractive",
-                select=["id", "chunk_text", "chunk_id", "file_name", "group_id", "version", "chunk_sequence", "upload_date", "document_classification", "page_number", "author", "chunk_keywords", "title", "chunk_summary"]
+                select=["id", "chunk_text", "chunk_id", "file_name", "group_id", "version", "chunk_sequence", "upload_date", "document_classification", "document_tags", "page_number", "author", "chunk_keywords", "title", "chunk_summary"]
             )
             results = extract_search_results(group_results, top_n)
     
@@ -441,11 +482,13 @@ def hybrid_search(query, user_id, document_id=None, document_ids=None, top_n=12,
             if visible_public_workspace_ids:
                 # Use 'or' conditions instead of 'in' operator for OData compatibility
                 workspace_conditions = " or ".join([f"public_workspace_id eq '{id}'" for id in visible_public_workspace_ids])
-                public_filter = f"({workspace_conditions}) and {doc_id_filter}"
+                public_base_filter = f"({workspace_conditions}) and {doc_id_filter}"
             else:
                 # Fallback to active_public_workspace_id if no visible workspaces
-                public_filter = f"public_workspace_id eq '{active_public_workspace_id}' and {doc_id_filter}"
-                
+                public_base_filter = f"public_workspace_id eq '{active_public_workspace_id}' and {doc_id_filter}"
+
+            public_filter = f"{public_base_filter} and {tags_filter_clause}" if tags_filter_clause else public_base_filter
+
             public_results = search_client_public.search(
                 search_text=query,
                 vector_queries=[vector_query],
@@ -454,22 +497,24 @@ def hybrid_search(query, user_id, document_id=None, document_ids=None, top_n=12,
                 semantic_configuration_name="nexus-public-index-semantic-configuration",
                 query_caption="extractive",
                 query_answer="extractive",
-                select=["id", "chunk_text", "chunk_id", "file_name", "public_workspace_id", "version", "chunk_sequence", "upload_date", "document_classification", "page_number", "author", "chunk_keywords", "title", "chunk_summary"]
+                select=["id", "chunk_text", "chunk_id", "file_name", "public_workspace_id", "version", "chunk_sequence", "upload_date", "document_classification", "document_tags", "page_number", "author", "chunk_keywords", "title", "chunk_summary"]
             )
             results = extract_search_results(public_results, top_n)
         else:
             # Get visible public workspace IDs from user settings
             visible_public_workspace_ids = get_user_visible_public_workspace_ids_from_settings(user_id)
-            
+
             # Create filter for visible public workspaces
             if visible_public_workspace_ids:
                 # Use 'or' conditions instead of 'in' operator for OData compatibility
                 workspace_conditions = " or ".join([f"public_workspace_id eq '{id}'" for id in visible_public_workspace_ids])
-                public_filter = f"({workspace_conditions})"
+                public_base_filter = f"({workspace_conditions})"
             else:
                 # Fallback to active_public_workspace_id if no visible workspaces
-                public_filter = f"public_workspace_id eq '{active_public_workspace_id}'"
-                
+                public_base_filter = f"public_workspace_id eq '{active_public_workspace_id}'"
+
+            public_filter = f"{public_base_filter} and {tags_filter_clause}" if tags_filter_clause else public_base_filter
+
             public_results = search_client_public.search(
                 search_text=query,
                 vector_queries=[vector_query],
@@ -478,7 +523,7 @@ def hybrid_search(query, user_id, document_id=None, document_ids=None, top_n=12,
                 semantic_configuration_name="nexus-public-index-semantic-configuration",
                 query_caption="extractive",
                 query_answer="extractive",
-                select=["id", "chunk_text", "chunk_id", "file_name", "public_workspace_id", "version", "chunk_sequence", "upload_date", "document_classification", "page_number", "author", "chunk_keywords", "title", "chunk_summary"]
+                select=["id", "chunk_text", "chunk_id", "file_name", "public_workspace_id", "version", "chunk_sequence", "upload_date", "document_classification", "document_tags", "page_number", "author", "chunk_keywords", "title", "chunk_summary"]
             )
             results = extract_search_results(public_results, top_n)
     
diff --git a/application/single_app/route_backend_chats.py b/application/single_app/route_backend_chats.py
index 92ff4dd3..26a71f41 100644
--- a/application/single_app/route_backend_chats.py
+++ b/application/single_app/route_backend_chats.py
@@ -5,6 +5,7 @@
 from semantic_kernel.contents.chat_message_content import ChatMessageContent
 from semantic_kernel.connectors.ai.prompt_execution_settings import PromptExecutionSettings
 from semantic_kernel.connectors.ai.chat_completion_client_base import ChatCompletionClientBase
+from semantic_kernel.connectors.ai.open_ai.prompt_execution_settings.azure_chat_prompt_execution_settings import AzureChatPromptExecutionSettings
 from semantic_kernel_fact_memory_store import FactMemoryStore
 from semantic_kernel_loader import initialize_semantic_kernel
 from semantic_kernel_plugins.plugin_invocation_thoughts import (
@@ -45,7 +46,9 @@
 from functions_keyvault import SecretReturnType, keyvault_model_endpoint_get_helper
 from functions_message_artifacts import (
     build_agent_citation_artifact_documents,
+    build_message_artifact_payload_map,
     filter_assistant_artifact_items,
+    hydrate_agent_citations_from_artifacts,
 )
 from functions_thoughts import ThoughtTracker
 
@@ -192,8 +195,33 @@ def is_tabular_entity_lookup_question(user_question):
         'installment',
         'related',
     )
+    explanatory_keywords = (
+        'because',
+        'detail',
+        'details',
+        'explain',
+        'reason',
+        'summary',
+        'why',
+    )
     if any(phrase in normalized_question for phrase in direct_phrases) and any(
-        keyword in normalized_question for keyword in relationship_keywords
+        keyword in normalized_question for keyword in relationship_keywords + explanatory_keywords
+    ):
+        return True
+
+    identifier_like_reference = bool(re.search(
+        r'\b(?:ret|tp|case|account|acct|payment|pay|notice|audit|w2|1099)[-_]?[a-z0-9]*\d{2,}[a-z0-9_-]*\b',
+        normalized_question,
+    ))
+    anchored_entity_reference = any(
+        re.search(pattern, normalized_question)
+        for pattern in (
+            r'\bfor\s+(?:return|taxpayer|case|account|payment|notice|audit)\b',
+            r'\b(?:return|taxpayer|case|account|payment|notice|audit)\s+[`"\']?[a-z0-9_-]*\d{2,}[a-z0-9_-]*[`"\']?\b',
+        )
+    )
+    if anchored_entity_reference and identifier_like_reference and any(
+        keyword in normalized_question for keyword in relationship_keywords + explanatory_keywords
     ):
         return True
 
@@ -204,6 +232,44 @@ def is_tabular_entity_lookup_question(user_question):
     return any(re.search(pattern, normalized_question) for pattern in entity_lookup_patterns)
 
 
+def is_tabular_distinct_value_question(user_question):
+    """Return True for unique-value questions that should start with get_distinct_values.
+
+    Args:
+        user_question: Raw question text. Falsy input (None, '') becomes ''; anything
+            else is str()-coerced, then whitespace-collapsed and lower-cased.
+
+    Returns:
+        bool: True when the question names a target (link, location, sharepoint,
+        site, url, value) together with a distinct-value or counting cue. False for
+        empty input and for questions is_tabular_schema_summary_question accepts.
+    """
+    normalized_question = re.sub(r'\s+', ' ', str(user_question or '').strip().lower())
+    if not normalized_question or is_tabular_schema_summary_question(normalized_question):
+        return False
+
+    distinct_keywords = ('different', 'discrete', 'distinct', 'unique')
+    count_keywords = ('count', 'counts', 'how many', 'number of')
+    target_keywords = (
+        'link', 'links', 'location', 'locations', 'sharepoint',
+        'site', 'sites', 'url', 'urls', 'value', 'values',
+    )
+
+    def _mentions_any(keywords):
+        # Match whole words/phrases only. A bare substring test lets 'count' fire
+        # inside 'account' or 'discount' and 'site' inside 'website', which routes
+        # unrelated questions to get_distinct_values.
+        return any(
+            re.search(rf'\b{re.escape(keyword)}\b', normalized_question)
+            for keyword in keywords
+        )
+
+    has_distinct_intent = _mentions_any(distinct_keywords)
+    has_count_intent = _mentions_any(count_keywords)
+    has_target = _mentions_any(target_keywords)
+    return (has_distinct_intent or has_count_intent) and has_target
+
+
 def is_tabular_cross_sheet_bridge_question(user_question):
     """Return True for grouped analytical questions that may need multiple worksheets."""
     normalized_question = re.sub(r'\s+', ' ', str(user_question or '').strip().lower())
@@ -302,10 +368,209 @@ def build_tabular_computed_results_system_message(source_label, tabular_analysis
         f"{rendered_analysis}\n\n"
         "These are tool-backed results derived from the full underlying tabular data, not just retrieved schema excerpts. "
         "Treat them as authoritative for row-level facts, calculations, and numeric conclusions. "
-        "Do not say that you lack direct access to the data if the answer is present in these computed results."
+        "Do not say that you lack direct access to the data if the answer is present in these computed results. "
+        "If a tool summary includes a full scalar value list, you may enumerate those values directly in the final answer. "
+        "If a tool summary includes the full matching rows from a row or text search, use the surrounding cell context in those rows when deciding which content is relevant to the user's question."
     )
 
 
+MULTI_FILE_TABULAR_DISTINCT_URL_EXTRACT_PATTERN = (  # case-insensitive http(s) URL whose path contains sites/, sitecollection/ or teams/
+    r'(?i)https?://[^\s/]+/[^\s]*?(?:sites/|sitecollection/|teams/)[^\s"\']+'
+)
+
+
+def get_multi_file_tabular_analysis_mode(user_question, execution_mode='analysis', analysis_file_contexts=None):
+    """Return the deterministic multi-file mode ('distinct_url_union') that bypasses SK planning, or None when it does not apply."""
+    normalized_execution_mode = str(execution_mode or 'analysis').strip().lower()  # a blank/None mode is treated as 'analysis'
+    normalized_contexts = dedupe_tabular_file_contexts(analysis_file_contexts)
+    if normalized_execution_mode != 'analysis' or len(normalized_contexts) <= 1:  # needs analysis mode and 2+ deduplicated contexts
+        return None
+
+    if is_tabular_distinct_url_question(user_question):  # NOTE(review): helper is not defined in this part of the file - confirm it exists
+        return 'distinct_url_union'
+
+    return None
+
+
+def score_tabular_distinct_url_column(column_name):
+    """Score how URL-like a column name is: 0-5 for a whole-name match, 10+ for a token match, None when nothing matches."""
+    normalized_column_name = re.sub(r'\s+', ' ', str(column_name or '').strip().lower())  # collapse whitespace, lowercase
+    if not normalized_column_name:
+        return None
+
+    exact_priority = {  # scores used when the whole normalized name equals the key
+        'location': 0,
+        'locations': 0,
+        'url': 1,
+        'urls': 1,
+        'link': 2,
+        'links': 2,
+        'site': 3,
+        'sites': 3,
+        'path': 4,
+        'paths': 4,
+        'address': 5,
+        'addresses': 5,
+    }
+    if normalized_column_name in exact_priority:
+        return exact_priority[normalized_column_name]
+
+    token_priority = {  # scores for individual tokens found inside a longer name
+        'location': 0,
+        'locations': 0,
+        'url': 1,
+        'urls': 1,
+        'link': 2,
+        'links': 2,
+        'site': 3,
+        'sites': 3,
+        'sharepoint': 4,
+        'path': 5,
+        'paths': 5,
+        'address': 6,
+        'addresses': 6,
+    }
+    token_scores = [
+        token_priority[token]
+        for token in re.split(r'[^a-z0-9]+', normalized_column_name)  # tokens are runs of lowercase letters/digits
+        if token and token in token_priority
+    ]
+    if not token_scores:
+        return None
+
+    return min(token_scores) + 10  # the +10 offset keeps every token match above (worse than) every whole-name score
+
+
+def select_tabular_distinct_url_column(column_names):
+    """Return the column name with the lowest URL score, ties broken by casefolded name, or None when no column scores."""
+    best_column_name = None
+    best_comparison_key = None
+
+    for candidate_column in column_names or []:
+        rendered_column_name = str(candidate_column or '').strip()
+        if not rendered_column_name:
+            continue
+
+        column_score = score_tabular_distinct_url_column(rendered_column_name)
+        if column_score is None:  # name contains no URL-like keyword
+            continue
+
+        comparison_key = (column_score, rendered_column_name.casefold())  # lower score wins, then alphabetical order
+        if best_comparison_key is None or comparison_key < best_comparison_key:
+            best_comparison_key = comparison_key
+            best_column_name = rendered_column_name  # the stripped name is what gets returned
+
+    return best_column_name
+
+
+def select_tabular_distinct_url_sheet_and_column(schema_info):
+    """Pick the best (sheet_name, column_name) pair for URL extraction; either element may be None when nothing suitable is found."""
+    if not isinstance(schema_info, Mapping):
+        return None, None
+
+    per_sheet_schemas = schema_info.get('per_sheet_schemas', {})
+    if isinstance(per_sheet_schemas, Mapping) and per_sheet_schemas:
+        ranked_sheet_candidates = []
+        for raw_sheet_name, raw_sheet_schema in per_sheet_schemas.items():
+            if not isinstance(raw_sheet_schema, Mapping):
+                continue
+
+            selected_column = select_tabular_distinct_url_column(raw_sheet_schema.get('columns', []))
+            if not selected_column:  # this sheet has no URL-like column
+                continue
+
+            row_count = raw_sheet_schema.get('row_count', 0)
+            try:
+                normalized_row_count = int(row_count)
+            except (TypeError, ValueError):
+                normalized_row_count = 0  # an unparseable row count ranks as an empty sheet
+
+            ranked_sheet_candidates.append((  # tuple order is the sort order used below
+                score_tabular_distinct_url_column(selected_column),
+                -normalized_row_count,  # negated so sheets with more rows sort first
+                str(raw_sheet_name or '').casefold(),
+                str(raw_sheet_name or '').strip() or None,  # a blank sheet name is reported as None
+                selected_column,
+            ))
+
+        if ranked_sheet_candidates:
+            _, _, _, selected_sheet_name, selected_column_name = sorted(ranked_sheet_candidates)[0]
+            return selected_sheet_name, selected_column_name
+
+    return None, select_tabular_distinct_url_column(schema_info.get('columns', []))  # fall back to the top-level column list
+
+
+def normalize_multi_file_tabular_distinct_value(value):
+    """Return the stripped, casefolded text of value as a de-duplication key, or None when value is None or blank."""
+    rendered_value = '' if value is None else str(value).strip()  # only None is empty; falsy scalars such as 0 keep their text
+    if not rendered_value:
+        return None
+
+    return rendered_value.casefold()
+
+
+def build_multi_file_tabular_distinct_value_analysis(successful_results, failed_results=None):
+    """Return a JSON string with the case-insensitive union of per-file distinct values plus per-file details, or None without results."""
+    successful_results = list(successful_results or [])
+    failed_results = list(failed_results or [])
+    if not successful_results:
+        return None
+
+    combined_values_by_key = {}  # casefolded key -> first-seen original spelling
+    per_file_results = []
+    any_values_limited = False
+    files_with_matches = 0
+
+    for result_payload in successful_results:
+        file_values = []
+        for raw_value in result_payload.get('values') or []:
+            rendered_value = '' if raw_value is None else str(raw_value).strip()  # keep falsy scalars such as 0; skip only None/blank
+            if not rendered_value:
+                continue
+
+            file_values.append(rendered_value)
+            normalized_value_key = normalize_multi_file_tabular_distinct_value(rendered_value)
+            if normalized_value_key and normalized_value_key not in combined_values_by_key:
+                combined_values_by_key[normalized_value_key] = rendered_value
+
+        distinct_count = parse_tabular_result_count(result_payload.get('distinct_count'))
+        returned_values = parse_tabular_result_count(result_payload.get('returned_values'))
+        if distinct_count is None:  # fall back to the number of values actually present
+            distinct_count = len(file_values)
+        if returned_values is None:
+            returned_values = len(file_values)
+
+        values_limited = bool(result_payload.get('values_limited', False))
+        any_values_limited = any_values_limited or values_limited  # one truncated file marks the whole union as limited
+        if returned_values > 0:
+            files_with_matches += 1
+
+        per_file_results.append({
+            'filename': result_payload.get('filename'),
+            'selected_sheet': result_payload.get('selected_sheet'),
+            'column': result_payload.get('column'),
+            'distinct_count': distinct_count,
+            'returned_values': returned_values,
+            'values_limited': values_limited,
+            'values': file_values,
+        })
+
+    combined_values = sorted(combined_values_by_key.values(), key=lambda item: item.casefold())  # stable, case-insensitive order
+    return json.dumps({
+        'analysis_type': 'multi_file_distinct_url_union',
+        'files_requested': len(successful_results) + len(failed_results),
+        'files_analyzed': len(successful_results),
+        'files_with_matches': files_with_matches,
+        'files_failed': len(failed_results),
+        'distinct_count': len(combined_values),
+        'returned_values': len(combined_values),
+        'values_limited': any_values_limited,
+        'values': combined_values,
+        'per_file_results': per_file_results,
+        'failed_files': failed_results,
+    }, indent=2, default=str)
+
+
 def get_kernel():
     return getattr(g, 'kernel', None) or getattr(builtins, 'kernel', None)
 
@@ -774,6 +1039,12 @@ def describe_tabular_invocation_conditions(invocation):
     if query_expression:
         return query_expression
 
+    search_value = str(parameters.get('search_value') or '').strip()
+    if search_value:
+        search_columns = str(parameters.get('search_columns') or '').strip() or 'ALL COLUMNS'
+        search_operator = str(parameters.get('search_operator') or 'contains').strip()
+        return f"search_value={search_value}; search_operator={search_operator}; search_columns={search_columns}"
+
     column_name = str(parameters.get('column') or '').strip()
     operator = str(parameters.get('operator') or '').strip()
     value = parameters.get('value')
@@ -785,6 +1056,17 @@ def describe_tabular_invocation_conditions(invocation):
     if lookup_column:
         return f"{lookup_column} == {lookup_value}"
 
+    extract_mode = str(parameters.get('extract_mode') or '').strip()
+    if extract_mode:
+        extraction_bits = [f"extract_mode={extract_mode}"]
+        extract_pattern = str(parameters.get('extract_pattern') or '').strip()
+        url_path_segments = parameters.get('url_path_segments')
+        if extract_pattern:
+            extraction_bits.append(f"extract_pattern={extract_pattern}")
+        if url_path_segments not in (None, ''):
+            extraction_bits.append(f"url_path_segments={url_path_segments}")
+        return ', '.join(extraction_bits)
+
     return None
 
 
@@ -841,7 +1123,7 @@ def get_tabular_query_overlap_summary(invocations, max_rows=10):
 
     for invocation in invocations or []:
         function_name = getattr(invocation, 'function_name', '')
-        if function_name not in {'query_tabular_data', 'filter_rows'}:
+        if function_name not in {'query_tabular_data', 'filter_rows', 'search_rows'}:
             continue
 
         rows = get_tabular_invocation_data_rows(invocation)
@@ -941,6 +1223,49 @@ def get_tabular_invocation_compact_payload(invocation, max_rows=5):
             'operation': compact_tabular_fallback_value(result_payload.get('operation')),
             'result': compact_tabular_fallback_value(result_payload.get('result')),
         })
+    elif function_name == 'get_distinct_values':
+        for key_name in (
+            'column',
+            'filter_applied',
+            'normalize_match',
+            'extract_mode',
+            'extract_pattern',
+            'url_path_segments',
+            'matched_cell_count',
+            'extracted_match_count',
+            'distinct_count',
+            'returned_values',
+            'values_limited',
+        ):
+            if key_name in result_payload:
+                compact_payload[key_name] = compact_tabular_fallback_value(result_payload.get(key_name))
+
+        raw_values = result_payload.get('values')
+        if isinstance(raw_values, list):
+            compact_values = []
+            rendered_values_length = 0
+            max_values_in_payload = 200
+            max_rendered_values_chars = 14000
+
+            for raw_value in raw_values:
+                compact_value = compact_tabular_fallback_value(raw_value)
+                rendered_value = json.dumps(compact_value, default=str)
+                projected_length = rendered_values_length + len(rendered_value) + 2
+
+                if compact_values and (
+                    len(compact_values) >= max_values_in_payload
+                    or projected_length > max_rendered_values_chars
+                ):
+                    break
+
+                compact_values.append(compact_value)
+                rendered_values_length = projected_length
+
+            compact_payload['values'] = compact_values
+            compact_payload['full_values_included'] = len(compact_values) == len(raw_values)
+            if len(compact_values) != len(raw_values):
+                compact_payload['values_limited'] = True
+                compact_payload['returned_values'] = len(compact_values)
     elif function_name in {'group_by_aggregate', 'group_by_datetime_component'}:
         for key_name in (
             'group_by',
@@ -975,18 +1300,46 @@ def get_tabular_invocation_compact_payload(invocation, max_rows=5):
                 for row in data_rows[:max_rows]
             ]
             compact_payload['sample_rows_limited'] = len(data_rows) > max_rows
-    elif function_name in {'query_tabular_data', 'filter_rows'}:
+    elif function_name in {'query_tabular_data', 'filter_rows', 'search_rows'}:
+        for key_name in ('search_value', 'search_operator', 'searched_columns', 'matched_columns', 'return_columns'):
+            if key_name in result_payload:
+                compact_payload[key_name] = compact_tabular_fallback_value(result_payload.get(key_name))
+
         for key_name in ('total_matches', 'returned_rows'):
             if key_name in result_payload:
                 compact_payload[key_name] = compact_tabular_fallback_value(result_payload.get(key_name))
 
         data_rows = get_tabular_invocation_data_rows(invocation)
         if data_rows:
+            desired_max_rows = max_rows
+            total_matches = result_payload.get('total_matches')
+            returned_rows = result_payload.get('returned_rows')
+            try:
+                total_matches = int(total_matches)
+            except (TypeError, ValueError):
+                total_matches = None
+            try:
+                returned_rows = int(returned_rows)
+            except (TypeError, ValueError):
+                returned_rows = len(data_rows)
+
+            if (
+                total_matches is not None
+                and returned_rows == total_matches
+                and total_matches <= 25
+            ):
+                desired_max_rows = max(desired_max_rows, total_matches)
+
             compact_payload['sample_rows'] = [
                 compact_tabular_fallback_value(row)
-                for row in data_rows[:max_rows]
+                for row in data_rows[:desired_max_rows]
             ]
-            compact_payload['sample_rows_limited'] = len(data_rows) > max_rows
+            compact_payload['sample_rows_limited'] = len(data_rows) > desired_max_rows
+            compact_payload['full_rows_included'] = (
+                total_matches is not None
+                and total_matches == returned_rows
+                and len(compact_payload['sample_rows']) == len(data_rows)
+            )
 
         rendered_conditions = describe_tabular_invocation_conditions(invocation)
         if rendered_conditions:
@@ -1061,6 +1414,15 @@ def build_tabular_analysis_fallback_from_invocations(invocations):
         if 'sample_rows' in shrunk_payload:
             shrunk_payload['sample_rows'] = shrunk_payload['sample_rows'][:2]
             shrunk_payload['sample_rows_limited'] = True
+            shrunk_payload['full_rows_included'] = False
+        if isinstance(shrunk_payload.get('values'), list) and len(shrunk_payload['values']) > 25:
+            shrunk_payload['values'] = shrunk_payload['values'][:25]
+            shrunk_payload['values_limited'] = True
+            shrunk_payload['full_values_included'] = False
+            shrunk_payload['returned_values'] = min(
+                int(shrunk_payload.get('returned_values') or len(shrunk_payload['values'])),
+                len(shrunk_payload['values']),
+            )
         if isinstance(shrunk_payload.get('top_results'), dict):
             shrunk_payload['top_results'] = dict(list(shrunk_payload['top_results'].items())[:3])
 
@@ -1072,6 +1434,15 @@ def build_tabular_analysis_fallback_from_invocations(invocations):
         if len(candidate_text) > (max_fallback_chars - coverage_note_reserve):
             shrunk_payload.pop('sample_rows', None)
             shrunk_payload['sample_rows_limited'] = True
+            shrunk_payload['full_rows_included'] = False
+            if isinstance(shrunk_payload.get('values'), list) and len(shrunk_payload['values']) > 10:
+                shrunk_payload['values'] = shrunk_payload['values'][:10]
+                shrunk_payload['values_limited'] = True
+                shrunk_payload['full_values_included'] = False
+                shrunk_payload['returned_values'] = min(
+                    int(shrunk_payload.get('returned_values') or len(shrunk_payload['values'])),
+                    len(shrunk_payload['values']),
+                )
             shrunk_payload['result_summary_truncated'] = True
             if isinstance(shrunk_payload.get('top_results'), dict):
                 shrunk_payload['top_results'] = dict(list(shrunk_payload['top_results'].items())[:2])
@@ -1219,163 +1590,1485 @@ def summarize_tabular_invocation_errors(invocations):
     return unique_errors
 
 
-def filter_tabular_citation_invocations(invocations):
-    """Hide discovery-only citation noise when analytical tabular calls exist."""
-    if not invocations:
-        return []
-
-    successful_analytical_invocations, _ = split_tabular_analysis_invocations(invocations)
-    if successful_analytical_invocations:
-        return successful_analytical_invocations
+def summarize_tabular_discovery_invocations(invocations, max_sheet_names=6):
+    """Return one compact '; '-joined summary string per successful describe_tabular_file invocation, for retry prompts."""
+    discovery_summaries = []
 
-    successful_schema_summary_invocations = []
     for invocation in invocations or []:
         if getattr(invocation, 'function_name', '') != 'describe_tabular_file':
             continue
         if get_tabular_invocation_error_message(invocation):
             continue
-        successful_schema_summary_invocations.append(invocation)
 
-    if successful_schema_summary_invocations:
-        return successful_schema_summary_invocations
+        result_payload = get_tabular_invocation_result_payload(invocation) or {}
+        filename = str(result_payload.get('filename') or '').strip()
+        if not filename:  # a summary without a filename is skipped
+            continue
 
-    return []
+        sheet_names = result_payload.get('sheet_names') or []
+        if not isinstance(sheet_names, list):
+            sheet_names = []
 
+        relationship_hints = result_payload.get('relationship_hints') or []
+        if not isinstance(relationship_hints, list):
+            relationship_hints = []
 
-def format_tabular_thought_parameter_value(value):
-    """Render a concise parameter value for tabular thought details."""
-    if value is None:
-        return None
+        summary_parts = [filename]
+        if result_payload.get('is_workbook'):
+            summary_parts.append(f"sheet_count={result_payload.get('sheet_count', len(sheet_names))}")
+        if sheet_names:
+            rendered_sheet_names = ', '.join(str(sheet_name) for sheet_name in sheet_names[:max_sheet_names])
+            if len(sheet_names) > max_sheet_names:  # note how many sheet names were left out
+                rendered_sheet_names += f", +{len(sheet_names) - max_sheet_names} more"
+            summary_parts.append(f"sheets={rendered_sheet_names}")
+        if relationship_hints:
+            summary_parts.append(f"relationship_hints={len(relationship_hints)}")  # only the hint count is reported
 
-    if isinstance(value, (dict, list, tuple)):
-        rendered_value = json.dumps(value, default=str)
-    else:
-        rendered_value = str(value)
+        discovery_summaries.append('; '.join(summary_parts))
 
-    if not rendered_value:
+    return discovery_summaries
+
+
+def extract_json_object_from_text(text):
+    """Return the first substring of text that decodes as a JSON object (dict), or None when there is none."""
+    rendered_text = str(text or '').strip()
+    if not rendered_text:
         return None
 
-    if len(rendered_value) > 120:
-        rendered_value = rendered_value[:117] + '...'
+    json_decoder = json.JSONDecoder()
+    for character_index, character in enumerate(rendered_text):
+        if character != '{':  # a JSON object can only start at an opening brace
+            continue
 
-    return rendered_value
+        try:
+            payload, _ = json_decoder.raw_decode(rendered_text[character_index:])  # raw_decode tolerates trailing text
+        except Exception:  # best-effort scan: any decode failure just moves on to the next brace
+            continue
 
+        if isinstance(payload, dict):
+            return payload
 
-def get_tabular_tool_thought_payloads(invocations):
-    """Convert tabular plugin invocations into user-visible thought payloads."""
-    thought_payloads = []
+    return None
 
-    for invocation in invocations or []:
-        function_name = getattr(invocation, 'function_name', 'unknown_tool')
-        duration_ms = getattr(invocation, 'duration_ms', None)
-        error_message = get_tabular_invocation_error_message(invocation)
-        success = getattr(invocation, 'success', True) and not error_message
-        parameters = getattr(invocation, 'parameters', {}) or {}
 
-        filename = parameters.get('filename')
-        sheet_name = parameters.get('sheet_name')
-        duration_suffix = f" ({int(duration_ms)}ms)" if duration_ms else ""
-        content = f"Tabular tool {function_name}{duration_suffix}"
-        if filename:
-            content = f"Tabular tool {function_name} on {filename}{duration_suffix}"
-        if filename and sheet_name:
-            content = f"Tabular tool {function_name} on {filename} [{sheet_name}]{duration_suffix}"
-        if not success:
-            content = f"{content} failed"
+def normalize_tabular_reviewer_function_name(function_name):
+    """Return the bare function name: 'tabular_processing-' is removed and only the text after the last '.' is kept."""
+    normalized_function_name = str(function_name or '').strip()
+    if not normalized_function_name:
+        return ''
 
-        detail_parts = []
-        for parameter_name, parameter_value in parameters.items():
-            if parameter_name in get_tabular_thought_excluded_parameter_names():
-                continue
+    normalized_function_name = normalized_function_name.replace('tabular_processing-', '')  # removes every occurrence
+    if '.' in normalized_function_name:
+        normalized_function_name = normalized_function_name.split('.')[-1]  # keep the last dotted segment
 
-            rendered_value = format_tabular_thought_parameter_value(parameter_value)
-            if rendered_value is None:
-                continue
+    return normalized_function_name.strip()
 
-            detail_parts.append(f"{parameter_name}={rendered_value}")
 
-        rendered_error_message = format_tabular_thought_parameter_value(error_message)
-        if rendered_error_message:
-            detail_parts.append(f"error={rendered_error_message}")
+def parse_tabular_reviewer_plan(review_text):
+    """Return a list of {'function_name', 'arguments'} dicts parsed from the reviewer's JSON plan; [] when nothing usable is found."""
+    payload = extract_json_object_from_text(review_text)
+    if not isinstance(payload, dict):
+        return []
 
-        detail_parts.append(f"success={success}")
-        detail = "; ".join(detail_parts) if detail_parts else None
-        thought_payloads.append((content, detail))
+    raw_calls = payload.get('calls')
+    if not isinstance(raw_calls, list):  # also accept a single call object under the 'call' key
+        raw_call = payload.get('call')
+        raw_calls = [raw_call] if isinstance(raw_call, dict) else []
 
-    return thought_payloads
+    normalized_calls = []
+    for raw_call in raw_calls:
+        if not isinstance(raw_call, dict):
+            continue
 
+        function_name = normalize_tabular_reviewer_function_name(
+            raw_call.get('function') or raw_call.get('function_name')
+        )
+        arguments = raw_call.get('arguments') or raw_call.get('args') or {}  # missing arguments become an empty dict
+        if not function_name or not isinstance(arguments, dict):  # entries without a name or with non-dict arguments are dropped
+            continue
 
-def get_tabular_status_thought_payloads(invocations, analysis_succeeded):
-    """Return additional tabular status thoughts for retries and fallbacks."""
-    successful_analytical_invocations, failed_analytical_invocations = split_tabular_analysis_invocations(invocations)
-    if not failed_analytical_invocations:
-        return []
+        normalized_calls.append({
+            'function_name': function_name,
+            'arguments': dict(arguments),
+        })
 
-    error_messages = summarize_tabular_invocation_errors(failed_analytical_invocations)
-    detail = "; ".join(error_messages) if error_messages else None
+    return normalized_calls
 
-    if analysis_succeeded and successful_analytical_invocations:
-        return [(
-            "Tabular analysis recovered after retrying tool errors",
-            detail,
-        )]
 
-    if analysis_succeeded:
-        return [(
-            "Tabular analysis recovered via internal fallback after tool errors",
-            detail,
-        )]
+def get_tabular_reviewer_function_manifest():
+    """Return a dict mapping each analytical function name to its 'best_for' hint and required/optional argument names for the reviewer LLM."""
+    return {
+        'lookup_value': {
+            'best_for': 'one exact row or entity and one target column value',
+            'required_arguments': ['filename', 'lookup_column', 'lookup_value', 'target_column'],
+            'optional_arguments': ['match_operator', 'normalize_match', 'sheet_name', 'sheet_index', 'max_rows'],
+        },
+        'get_distinct_values': {
+            'best_for': 'unique values, discrete counts, canonical site lists, embedded URL or regex extraction, and deterministic de-duplication after the relevant text cohort has been narrowed',
+            'required_arguments': ['filename', 'column'],
+            'optional_arguments': ['query_expression', 'filter_column', 'filter_operator', 'filter_value', 'additional_filter_column', 'additional_filter_operator', 'additional_filter_value', 'extract_mode', 'extract_pattern', 'url_path_segments', 'normalize_match', 'sheet_name', 'sheet_index', 'max_values'],
+        },
+        'count_rows': {
+            'best_for': 'deterministic how-many questions after a filter or query',
+            'required_arguments': ['filename'],
+            'optional_arguments': ['query_expression', 'filter_column', 'filter_operator', 'filter_value', 'additional_filter_column', 'additional_filter_operator', 'additional_filter_value', 'normalize_match', 'sheet_name', 'sheet_index'],
+        },
+        'search_rows': {
+            'best_for': 'searching one column, several columns, or an entire sheet/workbook for a topic, phrase, path, code, or other value when the relevant column is unclear',
+            'required_arguments': ['filename', 'search_value'],
+            'optional_arguments': ['search_columns', 'search_operator', 'return_columns', 'query_expression', 'filter_column', 'filter_operator', 'filter_value', 'additional_filter_column', 'additional_filter_operator', 'additional_filter_value', 'normalize_match', 'sheet_name', 'sheet_index', 'max_rows'],
+        },
+        'filter_rows': {
+            'best_for': 'searching a text column for matching cells while preserving full row context before a second analytical step',
+            'required_arguments': ['filename', 'column', 'operator', 'value'],
+            'optional_arguments': ['additional_filter_column', 'additional_filter_operator', 'additional_filter_value', 'normalize_match', 'sheet_name', 'sheet_index', 'max_rows'],
+        },
+        'query_tabular_data': {
+            'best_for': 'compound boolean filters expressed with pandas DataFrame.query()',
+            'required_arguments': ['filename', 'query_expression'],
+            'optional_arguments': ['sheet_name', 'sheet_index', 'max_rows'],
+        },
+        'filter_rows_by_related_values': {
+            'best_for': 'joining a cohort from one sheet to matching rows on another sheet',
+            'required_arguments': ['filename', 'source_sheet_name', 'source_value_column', 'target_sheet_name', 'target_match_column'],
+            'optional_arguments': ['source_query_expression', 'source_filter_column', 'source_filter_operator', 'source_filter_value', 'target_query_expression', 'target_filter_column', 'target_filter_operator', 'target_filter_value', 'normalize_match', 'max_rows'],
+        },
+        'count_rows_by_related_values': {
+            'best_for': 'deterministic counts for cross-sheet cohort membership or related-record questions',
+            'required_arguments': ['filename', 'source_sheet_name', 'source_value_column', 'target_sheet_name', 'target_match_column'],
+            'optional_arguments': ['source_query_expression', 'source_filter_column', 'source_filter_operator', 'source_filter_value', 'target_query_expression', 'target_filter_column', 'target_filter_operator', 'target_filter_value', 'normalize_match'],
+        },
+        'aggregate_column': {
+            'best_for': 'sum, mean, min, max, median, std, count, nunique, or value_counts on one column',
+            'required_arguments': ['filename', 'column', 'operation'],
+            'optional_arguments': ['sheet_name', 'sheet_index'],
+        },
+        'group_by_aggregate': {
+            'best_for': 'grouped metrics by category or entity',
+            'required_arguments': ['filename', 'group_by', 'aggregate_column', 'operation'],
+            'optional_arguments': ['query_expression', 'sheet_name', 'sheet_index', 'top_n'],
+        },
+        'group_by_datetime_component': {
+            'best_for': 'time-based grouped analysis by year, quarter, month, week, day, or hour',
+            'required_arguments': ['filename', 'datetime_column', 'date_component', 'aggregate_column', 'operation'],
+            'optional_arguments': ['query_expression', 'sheet_name', 'sheet_index', 'top_n'],
+        },
+    }
 
-    return [(
-        "Tabular analysis encountered tool errors before fallback",
-        detail,
-    )]
 
+def resolve_tabular_reviewer_call_arguments(raw_arguments, analysis_file_contexts,
+                                            fallback_source_hint='workspace',
+                                            fallback_group_id=None,
+                                            fallback_public_workspace_id=None):
+    """Return (arguments, None) with filename/source/scope ids injected, or (None, error_message) when no file context resolves."""
+    raw_arguments = dict(raw_arguments or {})  # copy so the caller's dict is never mutated
+    normalized_contexts = analysis_file_contexts or []
+    file_context_by_exact_name = {
+        file_context['file_name']: file_context
+        for file_context in normalized_contexts
+        if file_context.get('file_name')
+    }
+    file_context_by_lower_name = {  # case-insensitive fallback lookup
+        str(file_context.get('file_name') or '').strip().lower(): file_context
+        for file_context in normalized_contexts
+        if file_context.get('file_name')
+    }
 
-def _normalize_tabular_sheet_token(token):
-    """Normalize question and sheet-name tokens for lightweight matching."""
-    normalized = re.sub(r'[^a-z0-9]+', '', str(token or '').lower())
-    if len(normalized) > 4 and normalized.endswith('ies'):
-        return normalized[:-3] + 'y'
-    if len(normalized) > 3 and normalized.endswith('s') and not normalized.endswith('ss'):
-        return normalized[:-1]
-    return normalized
+    requested_filename = str(raw_arguments.get('filename') or '').strip()
+    resolved_file_context = None
+    if requested_filename:
+        resolved_file_context = (
+            file_context_by_exact_name.get(requested_filename)
+            or file_context_by_lower_name.get(requested_filename.lower())
+        )
+    elif len(normalized_contexts) == 1:  # no filename given: unambiguous only when exactly one file is available
+        resolved_file_context = normalized_contexts[0]
+
+    if not resolved_file_context:
+        if requested_filename:
+            return None, f"Reviewer selected unknown filename '{requested_filename}'."
+        return None, 'Reviewer did not select a filename and multiple files were available.'
+
+    normalized_arguments = dict(raw_arguments)
+    normalized_arguments['filename'] = resolved_file_context['file_name']  # always use the context's spelling of the name
+    normalized_arguments['source'] = (  # precedence: file context, fallback hint, reviewer-supplied value, 'workspace'
+        resolved_file_context.get('source_hint')
+        or fallback_source_hint
+        or normalized_arguments.get('source')
+        or 'workspace'
+    )
 
+    resolved_group_id = resolved_file_context.get('group_id') or fallback_group_id
+    resolved_public_workspace_id = (
+        resolved_file_context.get('public_workspace_id')
+        or fallback_public_workspace_id
+    )
+    if resolved_group_id:
+        normalized_arguments['group_id'] = resolved_group_id
+    if resolved_public_workspace_id:
+        normalized_arguments['public_workspace_id'] = resolved_public_workspace_id
 
-def _tokenize_tabular_sheet_text(text):
-    """Tokenize free text into normalized sheet-matching tokens."""
-    original_text = re.sub(r'(?i)w[\s\-_]*2', ' w2 ', str(text or ''))
-    expanded_text = re.sub(r'([a-z])([A-Z])', r'\1 \2', original_text)
-    expanded_text = re.sub(r'([A-Za-z])([0-9])', r'\1 \2', expanded_text)
-    expanded_text = re.sub(r'([0-9])([A-Za-z])', r'\1 \2', expanded_text)
-    expanded_text = re.sub(r'[_\-]+', ' ', expanded_text)
-    tokens = []
-    seen_tokens = set()
+    if not str(normalized_arguments.get('sheet_name') or '').strip():  # drop blank sheet selectors instead of passing them on
+        normalized_arguments.pop('sheet_name', None)
+    if normalized_arguments.get('sheet_index') in ('', None):
+        normalized_arguments.pop('sheet_index', None)
 
-    for raw_text in (original_text, expanded_text):
-        for raw_token in re.split(r'[^a-z0-9]+', raw_text.lower()):
-            normalized_token = _normalize_tabular_sheet_token(raw_token)
-            if not normalized_token or len(normalized_token) <= 1:
-                continue
-            if normalized_token in seen_tokens:
-                continue
-            seen_tokens.add(normalized_token)
-            tokens.append(normalized_token)
+    return normalized_arguments, None
 
-    return tokens
 
+def normalize_tabular_reviewer_argument_value(argument_name, argument_value):
+    """Normalize scalar reviewer-planned values to plugin-friendly argument types."""
+    if argument_value is None:
+        return None
 
-def _extract_tabular_entity_anchor_terms(question_text):
-    """Extract likely primary-entity terms from an entity lookup question."""
-    normalized_question = str(question_text or '').strip().lower()
+    if isinstance(argument_value, bool):
+        return 'true' if argument_value else 'false'
+
+    if argument_name in {'max_rows', 'max_values', 'sheet_index', 'top_n'} and isinstance(argument_value, (int, float)):
+        return str(int(argument_value))
+
+    return argument_value
+
+
+def is_tabular_distinct_url_question(user_question):
+    """Return True when the user is asking for unique or counted URL/site values."""
+    normalized_question = re.sub(r'\s+', ' ', str(user_question or '').strip().lower())
     if not normalized_question:
-        return []
+        return False
 
-    stopwords = {
-        'and',
-        'any',
-        'by',
-        'detail',
+    count_keywords = (
+        'count',
+        'counts',
+        'how many',
+        'number of',
+        'different',
+        'discrete',
+        'distinct',
+        'unique',
+    )
+    url_keywords = (
+        'http',
+        'https',
+        'link',
+        'links',
+        'sharepoint',
+        'site',
+        'sites',
+        'url',
+        'urls',
+    )
+    return any(keyword in normalized_question for keyword in count_keywords) and any(
+        keyword in normalized_question for keyword in url_keywords
+    )
+
+
+def question_requests_tabular_row_context(user_question):
+    """Return True when the user question implies a need for matching-row context."""
+    normalized_question = re.sub(r'\s+', ' ', str(user_question or '').strip().lower())
+    if not normalized_question:
+        return False
+
+    row_context_keywords = (
+        'appear',
+        'appears',
+        'appearing',
+        'find',
+        'found',
+        'search',
+        'show',
+        'where',
+    )
+    return any(keyword in normalized_question for keyword in row_context_keywords)
+
+
+def question_requests_tabular_exhaustive_results(user_question):
+    """Return True when the user explicitly asks for a full list or all matching results."""
+    normalized_question = re.sub(r'\s+', ' ', str(user_question or '').strip().lower())
+    if not normalized_question:
+        return False
+
+    explicit_phrases = (
+        'all results',
+        'all rows',
+        'all values',
+        'all of them',
+        'complete list',
+        'each one',
+        'every one',
+        'exhaustive',
+        'full list',
+        'list all',
+        'list each',
+        'list every',
+        'list them all',
+        'list them out',
+        'return all',
+        'show all',
+        'show me all',
+    )
+    if any(phrase in normalized_question for phrase in explicit_phrases):
+        return True
+
+    return (
+        'list' in normalized_question
+        and any(token in normalized_question for token in (' all ', ' them', ' out', ' each ', ' every '))
+    )
+
+
+def parse_tabular_result_count(value):
+    """Parse a numeric count from invocation metadata or payloads."""
+    try:
+        parsed_value = int(value)
+    except (TypeError, ValueError):
+        return None
+
+    return parsed_value if parsed_value >= 0 else None
+
+
+def determine_tabular_follow_up_limit(total_available, returned_count, max_cap=200):
+    """Return a larger result limit when the current tool call returned only a partial slice."""
+    total_count = parse_tabular_result_count(total_available)
+    current_count = parse_tabular_result_count(returned_count)
+    if total_count is None or current_count is None or total_count <= current_count:
+        return None
+
+    target_count = min(total_count, max_cap)
+    if target_count <= current_count:
+        return None
+
+    return str(target_count)
+
+
+def extract_tabular_high_signal_search_terms(user_question, max_terms=2):
+    """Extract a short list of likely literal search terms from the user question."""
+    question_text = str(user_question or '').strip()
+    if not question_text:
+        return []
+
+    normalized_question = re.sub(r'\s+', ' ', question_text)
+    lowercase_question = normalized_question.lower()
+    prioritized_terms = []
+    seen_terms = set()
+
+    def add_term(raw_term):
+        rendered_term = str(raw_term or '').strip()
+        if not rendered_term:
+            return
+
+        normalized_term = rendered_term.casefold()
+        if normalized_term in seen_terms:
+            return
+
+        seen_terms.add(normalized_term)
+        prioritized_terms.append(rendered_term)
+
+    for quoted_term in re.findall(r'["\']([^"\']{2,80})["\']', normalized_question):
+        add_term(quoted_term)
+
+    special_terms = (
+        ('sharepoint', 'SharePoint'),
+        ('onedrive', 'OneDrive'),
+        ('teams', 'Teams'),
+        ('ccore', 'CCORe'),
+        ('o365', 'O365'),
+    )
+    for token, rendered_term in special_terms:
+        if token in lowercase_question:
+            add_term(rendered_term)
+
+    ignored_tokens = {
+        'all',
+        'and',
+        'appear',
+        'appears',
+        'are',
+        'cell',
+        'cells',
+        'column',
+        'columns',
+        'count',
+        'counts',
+        'discrete',
+        'distinct',
+        'document',
+        'documents',
+        'does',
+        'every',
+        'file',
+        'for',
+        'from',
+        'get',
+        'how',
+        'in',
+        'is',
+        'it',
+        'link',
+        'links',
+        'location',
+        'locations',
+        'many',
+        'number',
+        'of',
+        'on',
+        'or',
+        'out',
+        'please',
+        'reason',
+        'row',
+        'rows',
+        'search',
+        'sheet',
+        'sheets',
+        'show',
+        'site',
+        'sites',
+        'that',
+        'the',
+        'them',
+        'these',
+        'they',
+        'this',
+        'to',
+        'topic',
+        'unique',
+        'url',
+        'urls',
+        'value',
+        'values',
+        'what',
+        'where',
+        'which',
+        'word',
+        'workbook',
+        'list',
+        'listed',
+        'lists',
+        'lsit',
+    }
+
+    for raw_token in re.findall(r'[A-Za-z0-9][A-Za-z0-9._\-/]{2,}', normalized_question):
+        lowercase_token = raw_token.casefold()
+        if lowercase_token in ignored_tokens:
+            continue
+        add_term(raw_token)
+        if len(prioritized_terms) >= max_terms:
+            break
+
+    return prioritized_terms[:max_terms]
+
+
+def extract_tabular_secondary_filter_terms(user_question, primary_terms=None, max_terms=3):
+    """Return likely cohort/filter terms after excluding the primary topic terms."""
+    excluded_terms = {
+        str(term or '').strip().casefold()
+        for term in (primary_terms or [])
+        if str(term or '').strip()
+    }
+    secondary_terms = []
+
+    for candidate_term in extract_tabular_high_signal_search_terms(
+        user_question,
+        max_terms=max_terms + len(excluded_terms) + 3,
+    ):
+        normalized_candidate_term = str(candidate_term or '').strip().casefold()
+        if not normalized_candidate_term or normalized_candidate_term in excluded_terms:
+            continue
+
+        secondary_terms.append(candidate_term)
+        if len(secondary_terms) >= max_terms:
+            break
+
+    return secondary_terms
+
+
+def normalize_tabular_row_text(value):
+    """Normalize a row cell value for lightweight controller-side term matching."""
+    if value is None:
+        return ''
+
+    return re.sub(r'\s+', ' ', str(value).casefold()).strip()
+
+
+def parse_tabular_column_candidates(raw_columns):
+    """Normalize column arguments from string or list form into a stable list."""
+    if isinstance(raw_columns, list):
+        candidate_columns = raw_columns
+    elif isinstance(raw_columns, str):
+        candidate_columns = raw_columns.split(',')
+    else:
+        return []
+
+    normalized_columns = []
+    seen_columns = set()
+    for candidate_column in candidate_columns:
+        normalized_column = str(candidate_column or '').strip()
+        if not normalized_column:
+            continue
+
+        lowered_column = normalized_column.casefold()
+        if lowered_column in seen_columns:
+            continue
+
+        seen_columns.add(lowered_column)
+        normalized_columns.append(normalized_column)
+
+    return normalized_columns
+
+
+def tabular_value_looks_url_like(value):
+    """Return True when a scalar cell value looks like a URL or site path."""
+    rendered_value = normalize_tabular_row_text(value)
+    if not rendered_value:
+        return False
+
+    return (
+        'http://' in rendered_value
+        or 'https://' in rendered_value
+        or 'sharepoint.com' in rendered_value
+        or '/sites/' in rendered_value
+    )
+
+
+def tabular_result_payload_contains_url_like_content(result_payload):
+    """Return True when a result payload contains URL-like strings."""
+    if not isinstance(result_payload, dict):
+        return False
+
+    candidate_values = []
+    raw_values = result_payload.get('values')
+    if isinstance(raw_values, list):
+        candidate_values.extend(raw_values[:20])
+
+    raw_rows = result_payload.get('data')
+    if isinstance(raw_rows, list):
+        for raw_row in raw_rows[:10]:
+            if not isinstance(raw_row, dict):
+                continue
+            candidate_values.extend(raw_row.values())
+
+    for candidate_value in candidate_values:
+        rendered_candidate = str(candidate_value or '').strip().lower()
+        if not rendered_candidate:
+            continue
+        if (
+            'http://' in rendered_candidate
+            or 'https://' in rendered_candidate
+            or 'sharepoint.com' in rendered_candidate
+            or '/sites/' in rendered_candidate
+        ):
+            return True
+
+    return False
+
+
+def infer_tabular_url_value_column_from_rows(rows, preferred_columns=None):
+    """Infer which returned row column contains URL-like values."""
+    preferred_columns = parse_tabular_column_candidates(preferred_columns)
+    for preferred_column in preferred_columns:
+        if any(
+            isinstance(row, dict) and tabular_value_looks_url_like(row.get(preferred_column))
+            for row in (rows or [])
+        ):
+            return preferred_column
+
+    column_scores = {}
+    for row in rows or []:
+        if not isinstance(row, dict):
+            continue
+
+        for column_name, cell_value in row.items():
+            normalized_column_name = str(column_name or '').strip()
+            if not normalized_column_name or normalized_column_name.startswith('_'):
+                continue
+            if not tabular_value_looks_url_like(cell_value):
+                continue
+
+            column_scores[normalized_column_name] = column_scores.get(normalized_column_name, 0) + 1
+
+    if not column_scores:
+        return None
+
+    return sorted(
+        column_scores.items(),
+        key=lambda item: (-item[1], item[0].casefold()),
+    )[0][0]
+
+
+def infer_tabular_secondary_filter_from_rows(rows, filter_terms, excluded_columns=None):
+    """Infer a likely cohort column/term pair from returned row context."""
+    normalized_excluded_columns = {
+        str(column_name or '').strip().casefold()
+        for column_name in (excluded_columns or [])
+        if str(column_name or '').strip()
+    }
+    normalized_filter_terms = [
+        str(filter_term or '').strip()
+        for filter_term in (filter_terms or [])
+        if str(filter_term or '').strip()
+    ]
+    if not normalized_filter_terms:
+        return None
+
+    candidate_scores = {}
+    for row in rows or []:
+        if not isinstance(row, dict):
+            continue
+
+        for column_name, cell_value in row.items():
+            normalized_column_name = str(column_name or '').strip()
+            if not normalized_column_name or normalized_column_name.startswith('_'):
+                continue
+            if normalized_column_name.casefold() in normalized_excluded_columns:
+                continue
+
+            rendered_cell_value = normalize_tabular_row_text(cell_value)
+            if not rendered_cell_value:
+                continue
+
+            for filter_term in normalized_filter_terms:
+                if str(filter_term).casefold() not in rendered_cell_value:
+                    continue
+
+                score_key = (normalized_column_name, filter_term)
+                candidate_scores[score_key] = candidate_scores.get(score_key, 0) + 1
+
+    if not candidate_scores:
+        return None
+
+    (selected_column, selected_term), match_count = sorted(
+        candidate_scores.items(),
+        key=lambda item: (-item[1], item[0][0].casefold(), item[0][1].casefold()),
+    )[0]
+    return {
+        'column': selected_column,
+        'term': selected_term,
+        'match_count': match_count,
+    }
+
+
+def infer_tabular_url_path_segments(user_question):
+    """Infer URL path truncation when the user is asking about site roots."""
+    normalized_question = re.sub(r'\s+', ' ', str(user_question or '').strip().lower())
+    if not normalized_question:
+        return None
+
+    if 'site' in normalized_question or 'sites' in normalized_question or 'sharepoint' in normalized_question:
+        return '2'
+
+    return None
+
+
+def build_tabular_follow_up_call_signature(function_name, arguments):
+    """Return a stable signature for a follow-up tool call."""
+    normalized_arguments = {}
+    for argument_name, argument_value in (arguments or {}).items():
+        if argument_value in (None, ''):
+            continue
+        normalized_arguments[str(argument_name)] = argument_value
+
+    return f"{function_name}:{json.dumps(normalized_arguments, sort_keys=True, default=str)}"
+
+
+def derive_tabular_follow_up_calls_from_invocations(user_question, invocations):
+    """Derive targeted follow-up calls when initial analytical results are only intermediate."""
+    successful_invocations = [
+        invocation for invocation in (invocations or [])
+        if not get_tabular_invocation_error_message(invocation)
+    ]
+    if not successful_invocations:
+        return []
+
+    wants_distinct_urls = is_tabular_distinct_url_question(user_question)
+    wants_exhaustive_results = question_requests_tabular_exhaustive_results(user_question)
+    wants_row_context = question_requests_tabular_row_context(user_question)
+    search_terms = extract_tabular_high_signal_search_terms(user_question, max_terms=4)
+    primary_search_term = search_terms[0] if search_terms else None
+    secondary_filter_terms = extract_tabular_secondary_filter_terms(
+        user_question,
+        primary_terms=[primary_search_term] if primary_search_term else None,
+        max_terms=3,
+    )
+    has_row_context_tool = any(
+        getattr(invocation, 'function_name', '') in {'search_rows', 'filter_rows', 'query_tabular_data'}
+        for invocation in successful_invocations
+    )
+    has_url_extraction_tool = any(
+        getattr(invocation, 'function_name', '') == 'get_distinct_values'
+        and str(
+            ((getattr(invocation, 'parameters', {}) or {}).get('extract_mode'))
+            or ((get_tabular_invocation_result_payload(invocation) or {}).get('extract_mode'))
+            or ''
+        ).strip().lower() == 'url'
+        for invocation in successful_invocations
+    )
+
+    existing_signatures = {
+        build_tabular_follow_up_call_signature(
+            getattr(invocation, 'function_name', ''),
+            getattr(invocation, 'parameters', {}) or {},
+        )
+        for invocation in successful_invocations
+    }
+    follow_up_calls = []
+
+    for invocation in successful_invocations:
+        function_name = getattr(invocation, 'function_name', '')
+        invocation_parameters = getattr(invocation, 'parameters', {}) or {}
+        result_payload = get_tabular_invocation_result_payload(invocation) or {}
+        filename = str(invocation_parameters.get('filename') or result_payload.get('filename') or '').strip()
+        if not filename:
+            continue
+
+        scope_arguments = {
+            'filename': filename,
+            'source': invocation_parameters.get('source') or 'workspace',
+        }
+        if invocation_parameters.get('group_id'):
+            scope_arguments['group_id'] = invocation_parameters.get('group_id')
+        if invocation_parameters.get('public_workspace_id'):
+            scope_arguments['public_workspace_id'] = invocation_parameters.get('public_workspace_id')
+
+        selected_sheet = get_tabular_invocation_selected_sheet(invocation)
+        if selected_sheet and 'cross-sheet' not in selected_sheet.lower():
+            scope_arguments['sheet_name'] = selected_sheet
+        elif invocation_parameters.get('sheet_name'):
+            scope_arguments['sheet_name'] = invocation_parameters.get('sheet_name')
+        elif invocation_parameters.get('sheet_index') not in (None, ''):
+            scope_arguments['sheet_index'] = invocation_parameters.get('sheet_index')
+
+        if wants_exhaustive_results and function_name in {'search_rows', 'filter_rows', 'query_tabular_data'}:
+            expanded_row_limit = determine_tabular_follow_up_limit(
+                result_payload.get('total_matches'),
+                result_payload.get('returned_rows'),
+            )
+            if expanded_row_limit:
+                expanded_arguments = {
+                    argument_name: argument_value
+                    for argument_name, argument_value in invocation_parameters.items()
+                    if argument_name not in {'user_id', 'conversation_id'} and argument_value not in (None, '')
+                }
+                expanded_arguments.update(scope_arguments)
+                expanded_arguments['max_rows'] = expanded_row_limit
+
+                expanded_signature = build_tabular_follow_up_call_signature(function_name, expanded_arguments)
+                if expanded_signature not in existing_signatures:
+                    follow_up_calls.append({
+                        'function_name': function_name,
+                        'arguments': expanded_arguments,
+                        'reason': 'expand the matching row slice because the user asked for the full result list',
+                    })
+                    existing_signatures.add(expanded_signature)
+
+        if function_name == 'get_distinct_values':
+            target_column = str(invocation_parameters.get('column') or result_payload.get('column') or '').strip()
+            if not target_column:
+                continue
+
+            current_filter_columns = [
+                str(invocation_parameters.get('filter_column') or '').strip(),
+                str(invocation_parameters.get('additional_filter_column') or '').strip(),
+            ]
+            same_column_filter = any(
+                filter_column.casefold() == target_column.casefold()
+                for filter_column in current_filter_columns
+                if filter_column
+            )
+            distinct_count = parse_tabular_result_count(result_payload.get('distinct_count'))
+            returned_values = parse_tabular_result_count(result_payload.get('returned_values'))
+
+            if wants_exhaustive_results:
+                expanded_value_limit = determine_tabular_follow_up_limit(distinct_count, returned_values)
+                if expanded_value_limit:
+                    expanded_arguments = {
+                        argument_name: argument_value
+                        for argument_name, argument_value in invocation_parameters.items()
+                        if argument_name not in {'user_id', 'conversation_id'} and argument_value not in (None, '')
+                    }
+                    expanded_arguments.update(scope_arguments)
+                    expanded_arguments['max_values'] = expanded_value_limit
+
+                    expanded_signature = build_tabular_follow_up_call_signature('get_distinct_values', expanded_arguments)
+                    if expanded_signature not in existing_signatures:
+                        follow_up_calls.append({
+                            'function_name': 'get_distinct_values',
+                            'arguments': expanded_arguments,
+                            'reason': 'expand the returned value list because the user asked for the full result set',
+                        })
+                        existing_signatures.add(expanded_signature)
+
+            needs_broad_row_context = bool(
+                wants_row_context
+                and primary_search_term
+                and not has_row_context_tool
+                and same_column_filter
+                and secondary_filter_terms
+                and distinct_count == 0
+            )
+
+            if wants_row_context and primary_search_term and not has_row_context_tool:
+                row_search_arguments = dict(scope_arguments)
+                row_search_arguments['search_value'] = primary_search_term
+                row_search_arguments['search_columns'] = target_column
+
+                normalize_match_value = invocation_parameters.get('normalize_match')
+                if normalize_match_value not in (None, ''):
+                    row_search_arguments['normalize_match'] = normalize_match_value
+
+                if not needs_broad_row_context:
+                    for argument_name in (
+                        'query_expression',
+                        'filter_column',
+                        'filter_operator',
+                        'filter_value',
+                        'additional_filter_column',
+                        'additional_filter_operator',
+                        'additional_filter_value',
+                    ):
+                        argument_value = invocation_parameters.get(argument_name)
+                        if argument_value in (None, ''):
+                            continue
+                        row_search_arguments[argument_name] = argument_value
+
+                    return_columns = []
+                    for candidate_column in (
+                        invocation_parameters.get('filter_column'),
+                        invocation_parameters.get('additional_filter_column'),
+                        target_column,
+                    ):
+                        normalized_column = str(candidate_column or '').strip()
+                        if not normalized_column or normalized_column in return_columns:
+                            continue
+                        return_columns.append(normalized_column)
+
+                    if return_columns:
+                        row_search_arguments['return_columns'] = ','.join(return_columns)
+
+                row_search_arguments['max_rows'] = '50' if needs_broad_row_context else '25'
+
+                row_search_signature = build_tabular_follow_up_call_signature('search_rows', row_search_arguments)
+                if row_search_signature not in existing_signatures:
+                    follow_up_calls.append({
+                        'function_name': 'search_rows',
+                        'arguments': row_search_arguments,
+                        'reason': (
+                            'collect broad row context for the literal topic before inferring a cohort column'
+                            if needs_broad_row_context else
+                            'collect matching row context for the literal topic before final reasoning'
+                        ),
+                    })
+                    existing_signatures.add(row_search_signature)
+                    has_row_context_tool = True
+
+            if wants_distinct_urls and not str(invocation_parameters.get('extract_mode') or '').strip() and not has_url_extraction_tool:
+                if needs_broad_row_context:
+                    continue
+                if not tabular_result_payload_contains_url_like_content(result_payload):
+                    continue
+
+                extraction_arguments = dict(scope_arguments)
+                extraction_arguments['column'] = target_column
+                for argument_name in (
+                    'query_expression',
+                    'filter_column',
+                    'filter_operator',
+                    'filter_value',
+                    'additional_filter_column',
+                    'additional_filter_operator',
+                    'additional_filter_value',
+                    'normalize_match',
+                    'max_values',
+                ):
+                    argument_value = invocation_parameters.get(argument_name)
+                    if argument_value in (None, ''):
+                        continue
+                    extraction_arguments[argument_name] = argument_value
+
+                extraction_arguments['extract_mode'] = 'url'
+                inferred_path_segments = infer_tabular_url_path_segments(user_question)
+                if inferred_path_segments:
+                    extraction_arguments['url_path_segments'] = inferred_path_segments
+
+                extraction_signature = build_tabular_follow_up_call_signature('get_distinct_values', extraction_arguments)
+                if extraction_signature not in existing_signatures:
+                    follow_up_calls.append({
+                        'function_name': 'get_distinct_values',
+                        'arguments': extraction_arguments,
+                        'reason': 'extract canonical URL or site values from composite text cells',
+                    })
+                    existing_signatures.add(extraction_signature)
+                    has_url_extraction_tool = True
+
+        if function_name == 'search_rows' and wants_distinct_urls and not has_url_extraction_tool:
+            search_rows_result_rows = get_tabular_invocation_data_rows(invocation)
+            if not search_rows_result_rows:
+                continue
+
+            target_column = None
+            searched_columns = parse_tabular_column_candidates(
+                result_payload.get('searched_columns') or invocation_parameters.get('search_columns')
+            )
+            if len(searched_columns) == 1:
+                target_column = searched_columns[0]
+            else:
+                target_column = infer_tabular_url_value_column_from_rows(
+                    search_rows_result_rows,
+                    preferred_columns=searched_columns,
+                )
+
+            if not target_column:
+                continue
+
+            extraction_arguments = dict(scope_arguments)
+            extraction_arguments['column'] = target_column
+
+            inferred_filter = infer_tabular_secondary_filter_from_rows(
+                search_rows_result_rows,
+                secondary_filter_terms,
+                excluded_columns=[target_column],
+            )
+            if inferred_filter:
+                extraction_arguments['filter_column'] = inferred_filter['column']
+                extraction_arguments['filter_operator'] = 'contains'
+                extraction_arguments['filter_value'] = inferred_filter['term']
+            elif not secondary_filter_terms:
+                for argument_name in (
+                    'query_expression',
+                    'filter_column',
+                    'filter_operator',
+                    'filter_value',
+                    'additional_filter_column',
+                    'additional_filter_operator',
+                    'additional_filter_value',
+                ):
+                    argument_value = invocation_parameters.get(argument_name)
+                    if argument_value in (None, ''):
+                        continue
+                    extraction_arguments[argument_name] = argument_value
+            else:
+                continue
+
+            normalize_match_value = invocation_parameters.get('normalize_match')
+            if normalize_match_value not in (None, ''):
+                extraction_arguments['normalize_match'] = normalize_match_value
+
+            extraction_arguments['extract_mode'] = 'url'
+            inferred_path_segments = infer_tabular_url_path_segments(user_question)
+            if inferred_path_segments:
+                extraction_arguments['url_path_segments'] = inferred_path_segments
+
+            expanded_value_limit = None
+            if wants_exhaustive_results:
+                expanded_value_limit = determine_tabular_follow_up_limit(
+                    result_payload.get('total_matches'),
+                    result_payload.get('returned_rows'),
+                )
+            if expanded_value_limit:
+                extraction_arguments['max_values'] = expanded_value_limit
+            elif invocation_parameters.get('max_rows') not in (None, ''):
+                extraction_arguments['max_values'] = invocation_parameters.get('max_rows')
+
+            extraction_signature = build_tabular_follow_up_call_signature('get_distinct_values', extraction_arguments)
+            if extraction_signature not in existing_signatures:
+                follow_up_calls.append({
+                    'function_name': 'get_distinct_values',
+                    'arguments': extraction_arguments,
+                    'reason': 'extract canonical URL or site values after inferring the cohort column from matching rows',
+                })
+                existing_signatures.add(extraction_signature)
+                has_url_extraction_tool = True
+
+        if len(follow_up_calls) >= 2:
+            break
+
+    return follow_up_calls[:2]
+
+
+async def maybe_recover_tabular_analysis_with_llm_reviewer(chat_service, kernel,
+                                                           tabular_plugin, plugin_logger,
+                                                           user_question, schema_context,
+                                                           source_context,
+                                                           analysis_file_contexts,
+                                                           user_id, conversation_id,
+                                                           execution_mode,
+                                                           allowed_function_names,
+                                                           workbook_sheet_hints=None,
+                                                           workbook_related_sheet_hints=None,
+                                                           workbook_cross_sheet_bridge_hints=None,
+                                                           tool_error_messages=None,
+                                                           execution_gap_messages=None,
+                                                           discovery_feedback_messages=None,
+                                                           fallback_source_hint='workspace',
+                                                           fallback_group_id=None,
+                                                           fallback_public_workspace_id=None):
+    """Use an LLM reviewer to choose analytical tool calls when the main SK loop stalls.
+
+    Runs up to three reviewer-planned calls on ``tabular_plugin`` and then up to two rounds of
+    derived follow-up calls. Returns a dict with ``fallback``, ``tool_error_messages`` and
+    ``reviewer_plan_errors`` when computed results exist; otherwise returns ``None``.
+    """
+    reviewer_allowed_function_names = [
+        function_name for function_name in (allowed_function_names or [])
+        if function_name in get_tabular_analysis_function_names()
+    ]  # only names that are also analytical functions may be executed below
+    if not reviewer_allowed_function_names:
+        return None
+
+    reviewer_manifest = {
+        function_name: get_tabular_reviewer_function_manifest().get(function_name, {})
+        for function_name in reviewer_allowed_function_names
+    }
+
+    reviewer_sections = [
+        f"QUESTION:\n{user_question}",
+        f"EXECUTION_MODE: {execution_mode}",
+        f"SOURCE_CONTEXT:\n{source_context}",
+        f"FILE_SCHEMAS:\n{schema_context}",
+        "FUNCTION_MANIFEST:\n" + json.dumps(reviewer_manifest, indent=2, default=str),
+    ]
+    if discovery_feedback_messages:
+        reviewer_sections.append(
+            'WORKBOOK_DISCOVERY_RESULTS:\n' + json.dumps(discovery_feedback_messages, indent=2, default=str)
+        )
+    if tool_error_messages:
+        reviewer_sections.append(
+            'PREVIOUS_TOOL_ERRORS:\n' + json.dumps(tool_error_messages, indent=2, default=str)
+        )
+    if execution_gap_messages:
+        reviewer_sections.append(
+            'PREVIOUS_EXECUTION_GAPS:\n' + json.dumps(execution_gap_messages, indent=2, default=str)
+        )
+    if workbook_sheet_hints:
+        reviewer_sections.append(
+            'LIKELY_WORKSHEET_HINTS:\n' + json.dumps(workbook_sheet_hints, indent=2, default=str)
+        )
+    if workbook_related_sheet_hints:
+        reviewer_sections.append(
+            'QUESTION_RELEVANT_WORKSHEETS:\n' + json.dumps(workbook_related_sheet_hints, indent=2, default=str)
+        )
+    if workbook_cross_sheet_bridge_hints:
+        reviewer_sections.append(
+            'CROSS_SHEET_BRIDGE_HINTS:\n' + json.dumps(workbook_cross_sheet_bridge_hints, indent=2, default=str)
+        )
+
+    review_history = ChatHistory()
+    review_history.add_system_message(
+        "You are a tabular recovery planner. A previous workbook analysis came close but did not reach computed analytical results. "
+        "Choose the next 1-3 analytical tabular calls that should be executed directly. "
+        "Return JSON only with this schema: {\"reasoning_summary\": \"...\", \"calls\": [{\"function\": \"get_distinct_values\", \"arguments\": {...}}]}. "
+        "Rules: Use only the listed analytical functions. Do not return describe_tabular_file. "
+        "Prefer the smallest number of high-confidence calls needed to compute the answer. "
+        "For deterministic how-many, discrete, unique, or canonical-list questions, prefer count_rows or get_distinct_values over sampled-row tools when possible. "
+        "When the user is asking where a topic, phrase, code, path, identifier, or other value appears and the relevant column is unclear, prefer search_rows. Omit search_columns to search all columns, and use return_columns to surface the fields most relevant to the question. "
+        "When the user wants values from a subset or pattern within one column, prefer get_distinct_values with filter_column/filter_operator/filter_value instead of an unfiltered full-column distinct-value call. "
+        "When the answer depends on two literal column conditions, prefer count_rows, get_distinct_values, or filter_rows with filter_column/filter_operator/filter_value plus additional_filter_column/additional_filter_operator/additional_filter_value instead of a broad query_expression call. "
+        "When the user is asking for URLs, sites, links, or regex-like identifiers embedded inside a text cell, prefer get_distinct_values with extract_mode='url' or extract_mode='regex' rather than counting whole-cell strings. Use url_path_segments when you need canonical higher-level URL roots. "
+        "If whether an embedded URL or identifier counts depends on surrounding text in the original cell rather than the extracted value itself, search/filter the original text column first. Prefer filter_rows for that text search when the matching row context matters, and set max_rows high enough to return the full cohort when it is modest. If a prior tool result is limited and the user explicitly asked for the full list, rerun with a higher max_rows or max_values instead of stopping at the preview slice. "
+        "Do not classify extracted URLs solely by whether the URL text itself contains the keyword when the original cell text already defines the category. "
+        "For URLs, links, paths, and literal identifiers, set normalize_match=false unless normalization is clearly necessary. "
+        "Prefer sheet_name when the correct worksheet is evident from the schemas or discovery results. "
+        "Omit sheet_name only for a deliberate cross-sheet analytical search. "
+        "Use filename exactly as listed in FILE_SCHEMAS. "
+        "Do not include user_id or conversation_id in arguments. Do not wrap the JSON in markdown fences."
+    )
+    review_history.add_user_message("\n\n".join(reviewer_sections))
+
+    reviewer_settings = AzureChatPromptExecutionSettings(service_id="tabular-analysis")
+
+    try:
+        reviewer_result = await chat_service.get_chat_message_contents(
+            review_history,
+            reviewer_settings,
+            kernel=kernel,
+        )
+    except Exception as reviewer_error:
+        log_event(
+            f"[Tabular SK Analysis] Reviewer recovery call failed: {reviewer_error}",
+            level=logging.WARNING,
+            exceptionTraceback=True,
+        )
+        return None
+
+    reviewer_text = ''
+    if reviewer_result and reviewer_result[0].content:
+        reviewer_text = reviewer_result[0].content.strip()
+
+    reviewer_calls = parse_tabular_reviewer_plan(reviewer_text)
+    if not reviewer_calls:
+        log_event(
+            '[Tabular SK Analysis] Reviewer recovery did not return an executable analytical plan',
+            extra={'reviewer_output_preview': reviewer_text[:500]},
+            level=logging.WARNING,
+        )
+        return None
+
+    baseline_invocation_count = len(plugin_logger.get_invocations_for_conversation(
+        user_id, conversation_id, limit=1000,
+    ))  # NOTE(review): assumes limit=1000 never truncates the log, else new calls go undetected — confirm
+    executed_function_names = []
+    reviewer_plan_errors = []
+
+    for reviewer_call in reviewer_calls[:3]:  # the prompt asks for 1-3 calls; any extras are ignored
+        function_name = reviewer_call['function_name']
+        if function_name not in reviewer_allowed_function_names:
+            reviewer_plan_errors.append(
+                f"Reviewer selected disallowed function '{function_name}'."
+            )
+            continue
+
+        call_arguments, argument_error = resolve_tabular_reviewer_call_arguments(
+            reviewer_call.get('arguments'),
+            analysis_file_contexts,
+            fallback_source_hint=fallback_source_hint,
+            fallback_group_id=fallback_group_id,
+            fallback_public_workspace_id=fallback_public_workspace_id,
+        )
+        if argument_error:
+            reviewer_plan_errors.append(argument_error)
+            continue
+
+        plugin_function = getattr(tabular_plugin, function_name, None)
+        if plugin_function is None:
+            reviewer_plan_errors.append(
+                f"Reviewer selected unavailable function '{function_name}'."
+            )
+            continue
+
+        function_signature = inspect.signature(plugin_function)
+        executable_arguments = {
+            'user_id': user_id,
+            'conversation_id': conversation_id,
+        }
+        for argument_name, argument_value in call_arguments.items():
+            if argument_name not in function_signature.parameters:
+                continue  # drop arguments the plugin function does not accept
+
+            normalized_argument_value = normalize_tabular_reviewer_argument_value(
+                argument_name,
+                argument_value,
+            )
+            if normalized_argument_value is None:
+                continue  # a None normalization result omits the argument entirely
+
+            executable_arguments[argument_name] = normalized_argument_value
+
+        try:
+            await plugin_function(**executable_arguments)
+            executed_function_names.append(function_name)
+        except Exception as execution_error:
+            reviewer_plan_errors.append(f"{function_name}: {execution_error}")
+
+    initial_reviewer_function_names = list(executed_function_names)  # frozen copy; the list grows per round
+    invocations_after = plugin_logger.get_invocations_for_conversation(
+        user_id, conversation_id, limit=1000,
+    )
+    reviewer_invocations = get_new_plugin_invocations(invocations_after, baseline_invocation_count)
+    successful_analytical_invocations, failed_analytical_invocations = split_tabular_analysis_invocations(
+        reviewer_invocations
+    )
+    for follow_up_round in range(2):  # at most two automatic follow-up rounds
+        follow_up_calls = derive_tabular_follow_up_calls_from_invocations(
+            user_question,
+            successful_analytical_invocations,
+        )
+        if not follow_up_calls:
+            break
+
+        auto_follow_up_names = []
+        for follow_up_call in follow_up_calls:
+            function_name = follow_up_call.get('function_name')
+            if function_name not in reviewer_allowed_function_names:
+                reviewer_plan_errors.append(
+                    f"Auto follow-up selected disallowed function '{function_name}'."
+                )
+                continue
+
+            plugin_function = getattr(tabular_plugin, function_name, None)
+            if plugin_function is None:
+                reviewer_plan_errors.append(
+                    f"Auto follow-up selected unavailable function '{function_name}'."
+                )
+                continue
+
+            function_signature = inspect.signature(plugin_function)
+            executable_arguments = {
+                'user_id': user_id,
+                'conversation_id': conversation_id,
+            }
+            for argument_name, argument_value in (follow_up_call.get('arguments') or {}).items():
+                if argument_name not in function_signature.parameters:
+                    continue
+
+                normalized_argument_value = normalize_tabular_reviewer_argument_value(
+                    argument_name,
+                    argument_value,
+                )
+                if normalized_argument_value is None:
+                    continue
+
+                executable_arguments[argument_name] = normalized_argument_value
+
+            try:
+                await plugin_function(**executable_arguments)
+                auto_follow_up_names.append(function_name)
+            except Exception as execution_error:
+                reviewer_plan_errors.append(f"{function_name}: {execution_error}")
+
+        if not auto_follow_up_names:
+            break  # no follow-up call completed this round
+
+        log_event(
+            '[Tabular SK Analysis] Reviewer recovery executed automatic analytical follow-up calls',
+            extra={
+                'follow_up_functions': auto_follow_up_names,
+                'initial_reviewer_functions': initial_reviewer_function_names,
+                'follow_up_round': follow_up_round + 1,
+            },
+            level=logging.INFO,
+        )
+        executed_function_names.extend(auto_follow_up_names)
+        invocations_after = plugin_logger.get_invocations_for_conversation(
+            user_id, conversation_id, limit=1000,
+        )
+        reviewer_invocations = get_new_plugin_invocations(invocations_after, baseline_invocation_count)
+        successful_analytical_invocations, failed_analytical_invocations = split_tabular_analysis_invocations(
+            reviewer_invocations
+        )
+
+    fallback = build_tabular_analysis_fallback_from_invocations(successful_analytical_invocations)
+    failed_tool_error_messages = summarize_tabular_invocation_errors(failed_analytical_invocations)
+
+    if fallback:
+        log_event(
+            '[Tabular SK Analysis] Reviewer recovery produced computed analytical tool results',
+            extra={
+                'reviewer_functions': executed_function_names,
+                'successful_tool_count': len(successful_analytical_invocations),
+                'failed_tool_count': len(failed_analytical_invocations),
+            },
+            level=logging.INFO,
+        )
+        return {
+            'fallback': fallback,
+            'tool_error_messages': failed_tool_error_messages,
+            'reviewer_plan_errors': reviewer_plan_errors,
+        }
+
+    if reviewer_plan_errors or failed_tool_error_messages:
+        log_event(
+            '[Tabular SK Analysis] Reviewer recovery executed but did not produce usable analytical results',
+            extra={
+                'reviewer_functions': executed_function_names,
+                'reviewer_plan_errors': reviewer_plan_errors[:5],
+                'tool_errors': failed_tool_error_messages[:5],
+                'reviewer_output_preview': reviewer_text[:500],
+            },
+            level=logging.WARNING,
+        )
+
+    return None
+
+
+def filter_tabular_citation_invocations(invocations):
+    """Pick the invocations worth citing, dropping discovery noise when analysis succeeded.
+
+    Successful analytical invocations win outright. Without any, the result falls back to
+    ``describe_tabular_file`` invocations that carry no error message (possibly none at all).
+    """
+    if not invocations:
+        return []
+
+    analytical_hits, _unused_failures = split_tabular_analysis_invocations(invocations)
+    if analytical_hits:
+        return analytical_hits
+
+    # Schema summaries are only returned when no analytical call produced a result.
+    schema_summaries = [
+        candidate
+        for candidate in invocations
+        if getattr(candidate, 'function_name', '') == 'describe_tabular_file'
+        and not get_tabular_invocation_error_message(candidate)
+    ]
+    return schema_summaries
+
+
+def format_tabular_thought_parameter_value(value):
+    """Stringify a parameter for thought details, capped at 120 characters.
+
+    Dicts, lists and tuples are JSON-encoded (``default=str``); other values go through
+    ``str``. ``None`` and values that render to an empty string yield ``None``.
+    """
+    if value is None:
+        return None
+
+    is_container = isinstance(value, (dict, list, tuple))
+    text = json.dumps(value, default=str) if is_container else str(value)
+
+    if not text:
+        return None
+
+    # Keep 117 characters plus the ellipsis so the result never exceeds 120.
+    return text if len(text) <= 120 else text[:117] + '...'
+
+
+def get_tabular_tool_thought_payloads(invocations):
+    """Convert tabular plugin invocations into user-visible ``(content, detail)`` thought payloads.
+
+    ``content`` names the tool, target file/sheet and duration; ``detail`` joins the
+    non-excluded parameters, any error message and a ``success=`` flag with ``"; "``.
+    """
+    thought_payloads = []
+    excluded_parameter_names = get_tabular_thought_excluded_parameter_names()  # loop-invariant, resolved once
+
+    for invocation in invocations or []:
+        function_name = getattr(invocation, 'function_name', 'unknown_tool')
+        duration_ms = getattr(invocation, 'duration_ms', None)
+        error_message = get_tabular_invocation_error_message(invocation)
+        success = getattr(invocation, 'success', True) and not error_message
+        parameters = getattr(invocation, 'parameters', {}) or {}
+
+        filename = parameters.get('filename')
+        sheet_name = parameters.get('sheet_name')
+        duration_suffix = f" ({int(duration_ms)}ms)" if duration_ms else ""
+        content = f"Tabular tool {function_name}{duration_suffix}"
+        if filename:
+            content = f"Tabular tool {function_name} on {filename}{duration_suffix}"
+        if filename and sheet_name:
+            content = f"Tabular tool {function_name} on {filename} [{sheet_name}]{duration_suffix}"
+        if not success:
+            content = f"{content} failed"
+
+        detail_parts = []
+        for parameter_name, parameter_value in parameters.items():
+            if parameter_name in excluded_parameter_names:
+                continue
+            rendered_value = format_tabular_thought_parameter_value(parameter_value)
+            if rendered_value is not None:
+                detail_parts.append(f"{parameter_name}={rendered_value}")
+        rendered_error_message = format_tabular_thought_parameter_value(error_message)
+        if rendered_error_message:
+            detail_parts.append(f"error={rendered_error_message}")
+
+        detail_parts.append(f"success={success}")  # always present, so detail is never empty
+        thought_payloads.append((content, "; ".join(detail_parts)))
+
+    return thought_payloads
+
+
+def get_tabular_status_thought_payloads(invocations, analysis_succeeded):
+    """Describe how tabular analysis coped with failed analytical tool calls.
+
+    Returns an empty list when no analytical invocation failed; otherwise a single
+    ``(headline, detail)`` tuple whose detail joins the summarized errors with ``"; "``.
+    """
+    succeeded_calls, failed_calls = split_tabular_analysis_invocations(invocations)
+    if not failed_calls:
+        return []
+
+    summarized_errors = summarize_tabular_invocation_errors(failed_calls)
+    # detail stays None when the error summary is empty.
+    detail = "; ".join(summarized_errors) if summarized_errors else None
+
+    if not analysis_succeeded:
+        headline = "Tabular analysis encountered tool errors before fallback"
+    elif succeeded_calls:
+        # Some analytical calls did succeed despite the failures.
+        headline = "Tabular analysis recovered after retrying tool errors"
+    else:
+        # No analytical call succeeded, yet the caller reports overall success.
+        headline = "Tabular analysis recovered via internal fallback after tool errors"
+
+    return [(headline, detail)]
+
+
+
+def _normalize_tabular_sheet_token(token):
+    """Lower-case a token, drop non-alphanumerics and strip a simple plural suffix ('ies' or 's')."""
+    cleaned = re.sub(r'[^a-z0-9]+', '', str(token or '').lower())
+    size = len(cleaned)
+    if size > 4 and cleaned[-3:] == 'ies':
+        return cleaned[:-3] + 'y'
+    strips_plural_s = size > 3 and cleaned[-1] == 's' and cleaned[-2:] != 'ss'
+    return cleaned[:-1] if strips_plural_s else cleaned
+
+
+def _tokenize_tabular_sheet_text(text):
+    """Tokenize free text into normalized, de-duplicated sheet-matching tokens in first-seen order."""
+    # Canonicalize "W-2"/"W 2"/"W_2" (or a camel-cased "FormW2") to "w2". The lookarounds stop the
+    # rewrite from firing inside ordinary words and numbers, e.g. "new 2024" or "show 2 rows".
+    original_text = re.sub(r'(?:(?<![A-Za-z0-9])[wW]|(?<=[a-z])W)[\s\-_]*2(?![0-9])', ' w2 ', str(text or ''))
+    expanded_text = re.sub(r'([a-z])([A-Z])', r'\1 \2', original_text)
+    expanded_text = re.sub(r'([A-Za-z])([0-9])', r'\1 \2', expanded_text)
+    expanded_text = re.sub(r'([0-9])([A-Za-z])', r'\1 \2', expanded_text)
+    expanded_text = re.sub(r'[_\-]+', ' ', expanded_text)
+    tokens = []
+    seen_tokens = set()
+
+    for raw_text in (original_text, expanded_text):
+        for raw_token in re.split(r'[^a-z0-9]+', raw_text.lower()):
+            normalized_token = _normalize_tabular_sheet_token(raw_token)
+            if len(normalized_token) <= 1 or normalized_token in seen_tokens:
+                continue
+            seen_tokens.add(normalized_token)
+            tokens.append(normalized_token)
+
+    return tokens
+
+
+def _coerce_citation_sort_number(value):
+    """Return ``value`` as a float usable in a citation sort key, or ``None`` when it is not one.
+
+    ``None``, booleans, blank or non-numeric text, NaN and ints too large for a float give ``None``.
+    """
+    # bool is an int subclass, so it has to be rejected before the numeric conversion.
+    if value is None or isinstance(value, bool):
+        return None
+
+    try:
+        number = float(value if isinstance(value, (int, float)) else str(value).strip())
+    except (TypeError, ValueError, OverflowError):
+        return None
+
+    # NaN never compares equal to itself; inside a sort key it would make the ordering arbitrary.
+    return None if number != number else number
+
+
+def _build_hybrid_citation_sort_key(citation):
+    """Build a five-part tuple sort key that keeps mixed citation shapes comparable.
+
+    Layout: ``(tier, primary, secondary, page_label, metadata_type)``. Tier 2 is a numeric
+    page (primary=page, secondary=chunk sequence or -1.0), tier 1 has only a numeric chunk
+    sequence, and tier 0 (non-dict input included) carries -1.0 placeholders.
+    """
+    if not isinstance(citation, dict):
+        return (0, -1.0, -1.0, '', '')
+
+    raw_page = citation.get('page_number')
+    label = str(raw_page or '').strip().lower()
+    kind = str(citation.get('metadata_type') or '').strip().lower()
+    page = _coerce_citation_sort_number(raw_page)
+    sequence = _coerce_citation_sort_number(citation.get('chunk_sequence'))
+
+    if page is None and sequence is None:
+        tier, primary, secondary = 0, -1.0, -1.0
+    elif page is None:
+        tier, primary, secondary = 1, sequence, -1.0
+    else:
+        tier, primary, secondary = 2, page, -1.0 if sequence is None else sequence
+
+    return (tier, primary, secondary, label, kind)
+
+
+def _extract_tabular_entity_anchor_terms(question_text):
+    """Extract likely primary-entity terms from an entity lookup question."""
+    normalized_question = str(question_text or '').strip().lower()
+    if not normalized_question:
+        return []
+
+    stopwords = {
+        'and',
+        'any',
+        'by',
+        'detail',
         'details',
         'exact',
         'explain',
@@ -1642,7 +3335,8 @@ async def run_tabular_sk_analysis(user_question, tabular_filenames, user_id,
                                    conversation_id, gpt_model, settings,
                                    source_hint="workspace", group_id=None,
                                    public_workspace_id=None,
-                                   execution_mode='analysis'):
+                                   execution_mode='analysis',
+                                   tabular_file_contexts=None):
     """Run lightweight SK with TabularProcessingPlugin to analyze tabular data.
 
     Creates a temporary Kernel with only the TabularProcessingPlugin, uses the
@@ -1661,8 +3355,16 @@ async def run_tabular_sk_analysis(user_question, tabular_filenames, user_id,
         execution_mode = execution_mode if execution_mode in {'analysis', 'schema_summary', 'entity_lookup'} else 'analysis'
         schema_summary_mode = execution_mode == 'schema_summary'
         entity_lookup_mode = execution_mode == 'entity_lookup'
+        analysis_file_contexts = normalize_tabular_file_contexts_for_analysis(
+            tabular_filenames=tabular_filenames,
+            tabular_file_contexts=tabular_file_contexts,
+            fallback_source_hint=source_hint,
+            fallback_group_id=group_id,
+            fallback_public_workspace_id=public_workspace_id,
+        )
+        analysis_filenames = [file_context['file_name'] for file_context in analysis_file_contexts]
         log_event(
-            f"[Tabular SK Analysis] Starting {execution_mode} analysis for files: {tabular_filenames}",
+            f"[Tabular SK Analysis] Starting {execution_mode} analysis for files: {analysis_filenames}",
             level=logging.INFO,
         )
 
@@ -1703,11 +3405,12 @@ async def run_tabular_sk_analysis(user_question, tabular_filenames, user_id,
         kernel.add_service(chat_service)
 
         # 3. Pre-dispatch: load file schemas to eliminate discovery LLM rounds
-        source_context = f"source='{source_hint}'"
-        if group_id:
-            source_context += f", group_id='{group_id}'"
-        if public_workspace_id:
-            source_context += f", public_workspace_id='{public_workspace_id}'"
+        source_context = build_tabular_analysis_source_context(
+            analysis_file_contexts,
+            fallback_source_hint=source_hint,
+            fallback_group_id=group_id,
+            fallback_public_workspace_id=public_workspace_id,
+        )
 
         schema_parts = []
         workbook_sheet_hints = {}
@@ -1716,22 +3419,28 @@ async def run_tabular_sk_analysis(user_question, tabular_filenames, user_id,
         workbook_blob_locations = {}
         retry_sheet_overrides = {}
         previous_failed_call_parameters = []  # entity lookup: concrete failed call params for retry hints
+        has_multi_sheet_workbook = False
         sheet_score_match_fn = _score_tabular_entity_sheet_match if entity_lookup_mode else _score_tabular_sheet_match
-        allowed_function_filters = {
-            'included_functions': [
-                f"tabular_processing-{function_name}"
-                for function_name in (
-                    ['describe_tabular_file']
-                    if schema_summary_mode else
-                    sorted(get_tabular_analysis_function_names())
-                )
-            ]
-        }
-        for fname in tabular_filenames:
+        for file_context in analysis_file_contexts:
+            fname = file_context['file_name']
+            file_source_hint = file_context.get('source_hint', source_hint)
+            file_group_id = file_context.get('group_id')
+            file_public_workspace_id = file_context.get('public_workspace_id')
+            schema_source_context = {'source': file_source_hint}
+            if file_group_id:
+                schema_source_context['group_id'] = file_group_id
+            if file_public_workspace_id:
+                schema_source_context['public_workspace_id'] = file_public_workspace_id
             try:
                 container, blob_path = tabular_plugin._resolve_blob_location_with_fallback(
-                    user_id, conversation_id, fname, source_hint,
-                    group_id=group_id, public_workspace_id=public_workspace_id
+                    user_id, conversation_id, fname, file_source_hint,
+                    group_id=file_group_id, public_workspace_id=file_public_workspace_id
+                )
+                tabular_plugin.remember_resolved_blob_location(
+                    file_source_hint,
+                    fname,
+                    container,
+                    blob_path,
                 )
                 schema_info = tabular_plugin._build_workbook_schema_summary(
                     container,
@@ -1742,6 +3451,7 @@ async def run_tabular_sk_analysis(user_question, tabular_filenames, user_id,
                 workbook_blob_locations[fname] = (container, blob_path)
 
                 if schema_info.get('is_workbook') and schema_info.get('sheet_count', 0) > 1:
+                    has_multi_sheet_workbook = True
                     # Build a compact sheet directory so the model can pick the
                     # relevant sheet itself instead of us guessing.
                     per_sheet = schema_info.get('per_sheet_schemas', {})
@@ -1798,6 +3508,7 @@ async def run_tabular_sk_analysis(user_question, tabular_filenames, user_id,
                         })
                     directory_schema = {
                         'filename': fname,
+                        'source_context': schema_source_context,
                         'is_workbook': True,
                         'sheet_count': schema_info.get('sheet_count', 0),
                         'likely_sheet': likely_sheet,
@@ -1813,7 +3524,9 @@ async def run_tabular_sk_analysis(user_question, tabular_filenames, user_id,
                         level=logging.DEBUG,
                     )
                 else:
-                    schema_parts.append(json.dumps(schema_info, indent=2, default=str))
+                    schema_with_context = dict(schema_info)
+                    schema_with_context['source_context'] = schema_source_context
+                    schema_parts.append(json.dumps(schema_with_context, indent=2, default=str))
                     if schema_info.get('is_workbook'):
                         # Single-sheet workbook — set default so the model needs no sheet arg
                         single_sheet = (schema_info.get('sheet_names') or [None])[0]
@@ -1822,12 +3535,31 @@ async def run_tabular_sk_analysis(user_question, tabular_filenames, user_id,
                     df = tabular_plugin._read_tabular_blob_to_dataframe(container, blob_path)
                     log_event(f"[Tabular SK Analysis] Pre-loaded schema for {fname} ({len(df)} rows)", level=logging.DEBUG)
             except Exception as e:
-                log_event(f"[Tabular SK Analysis] Failed to pre-load schema for {fname}: {e}", level=logging.WARNING)
-                schema_parts.append(json.dumps({"filename": fname, "error": f"Could not pre-load: {str(e)}"}))
+                log_event(
+                    f"[Tabular SK Analysis] Failed to pre-load schema for {fname} "
+                    f"(source={file_source_hint}, group_id={file_group_id}, public_workspace_id={file_public_workspace_id}): {e}",
+                    level=logging.WARNING,
+                )
+                schema_parts.append(json.dumps({
+                    "filename": fname,
+                    "source_context": schema_source_context,
+                    "error": f"Could not pre-load: {str(e)}",
+                }))
 
         schema_context = "\n".join(schema_parts)
+        allow_multi_sheet_discovery = has_multi_sheet_workbook and not schema_summary_mode
+        allowed_function_names = ['describe_tabular_file'] if schema_summary_mode else sorted(get_tabular_analysis_function_names())
+        if allow_multi_sheet_discovery:
+            allowed_function_names = ['describe_tabular_file'] + allowed_function_names
+        allowed_function_filters = {
+            'included_functions': [
+                f"tabular_processing-{function_name}"
+                for function_name in allowed_function_names
+            ]
+        }
 
-        def build_system_prompt(force_tool_use=False, tool_error_messages=None, execution_gap_messages=None):
+        def build_system_prompt(force_tool_use=False, tool_error_messages=None,
+                                execution_gap_messages=None, discovery_feedback_messages=None):
             if schema_summary_mode:
                 retry_prefix = ""
                 if force_tool_use:
@@ -1898,6 +3630,17 @@ def build_system_prompt(force_tool_use=False, tool_error_messages=None, executio
                     "Correct the analysis plan and query the missing related worksheets before answering.\n\n"
                 )
 
+            discovery_feedback = ""
+            if discovery_feedback_messages:
+                rendered_discovery_feedback = "\n".join(
+                    f"- {message}" for message in discovery_feedback_messages
+                )
+                discovery_feedback = (
+                    "WORKBOOK DISCOVERY RESULTS:\n"
+                    f"{rendered_discovery_feedback}\n"
+                    "Use these discovery results to choose the next analytical tool calls. Discovery alone does not answer the question.\n\n"
+                )
+
             missing_sheet_feedback = ""
             if tool_error_messages and any(
                 'Specify sheet_name or sheet_index on analytical calls.' in error_message
@@ -1976,6 +3719,13 @@ def build_system_prompt(force_tool_use=False, tool_error_messages=None, executio
                     "These recovery hints override the original likely-sheet guess when the previous tool call failed on the wrong worksheet.\n\n"
                 )
 
+            discovery_step_feedback = ""
+            if allow_multi_sheet_discovery:
+                discovery_step_feedback = (
+                    "MULTI-SHEET DISCOVERY:\n"
+                    "If the right worksheet or columns are unclear, call describe_tabular_file without sheet_name as an exploration step, then continue with one or more analytical tool calls. You may need multiple tool rounds.\n\n"
+                )
+
             related_sheet_feedback = ""
             if workbook_related_sheet_hints:
                 rendered_related_sheet_hints = "\n".join(
@@ -2027,30 +3777,38 @@ def build_system_prompt(force_tool_use=False, tool_error_messages=None, executio
                     f"{entity_retry_prefix}"
                     f"{tool_error_feedback}"
                     f"{execution_gap_feedback}"
+                    f"{discovery_feedback}"
                     f"{recovery_sheet_feedback}"
                     f"{sheet_hint_feedback}"
                     f"{related_sheet_feedback}"
+                    f"{discovery_step_feedback}"
                     f"{missing_sheet_feedback}"
                     f"FILE SCHEMAS:\n"
                     f"{schema_context}\n\n"
-                    "AVAILABLE FUNCTIONS: filter_rows, query_tabular_data, lookup_value, get_distinct_values, count_rows, "
-                    "filter_rows_by_related_values, count_rows_by_related_values, aggregate_column, group_by_aggregate, and group_by_datetime_component.\n\n"
-                    "Discovery functions are not available in this analysis run because schema context is already pre-loaded.\n\n"
+                    f"AVAILABLE FUNCTIONS: {', '.join(allowed_function_names)}.\n\n"
+                    + (
+                        "Workbook discovery is available through describe_tabular_file. Discovery-only results do NOT complete the analysis. After exploration, continue with analytical functions before answering.\n\n"
+                        if allow_multi_sheet_discovery else
+                        "Discovery functions are not available in this analysis run because schema context is already pre-loaded.\n\n"
+                    )
+                    +
                     "IMPORTANT:\n"
-                    "1. If the question includes an exact identifier or exact entity name and the correct starting worksheet is unclear, begin with filter_rows or query_tabular_data without sheet_name so the plugin can perform a cross-sheet discovery search.\n"
-                    "2. After the first discovery step, pass sheet_name='<name>' on follow-up analytical calls for multi-sheet workbooks. Do not rely on a default sheet for cross-sheet entity lookups.\n"
-                    "3. Use filter_rows or query_tabular_data first when you need full matching rows. Use lookup_value only when you already know the exact worksheet and target column.\n"
-                    "4. Do not start with aggregate_column, group_by_aggregate, or group_by_datetime_component until you have located the relevant entity rows.\n"
-                    "5. When using query_tabular_data, use simple DataFrame.query() syntax with backticked column names for columns containing spaces. Avoid method calls such as .str.lower() or .astype(...).\n"
-                    "6. Then query other relevant worksheets explicitly to collect related records.\n"
-                    "7. When a retrieved row contains a secondary identifier such as ReturnID, CaseID, AccountID, PaymentID, W2ID, or Form1099ID, reuse it to query dependent worksheets.\n"
-                    "8. Do not stop after the first successful row if the question asks for related records across sheets.\n"
-                    "9. If a requested record type has no corresponding worksheet in the workbook, say that the workbook does not contain that record type.\n"
-                    "10. Clearly distinguish between no matching rows and no corresponding worksheet.\n"
-                    "11. Summarize concrete found records sheet-by-sheet using the tool results, not schema placeholders.\n"
-                    "12. For count or percentage questions involving a cohort defined on one sheet and facts on another, prefer get_distinct_values, count_rows, filter_rows_by_related_values, or count_rows_by_related_values over manually counting sampled rows.\n"
-                    "13. Use normalize_match=true when matching names, owners, assignees, engineers, or similar entity-text columns across worksheets.\n"
-                    "14. Do not mention hypothetical follow-up analyses, parser errors, or failed attempts unless the user explicitly asked about failures and you have actual tool error output to report."
+                    "0. Use the source_context listed in FILE SCHEMAS for the matching filename when calling tabular_processing functions.\n"
+                    "1. If the right worksheet is unclear on a multi-sheet workbook, you may call describe_tabular_file without sheet_name first, then continue with analytical tool calls.\n"
+                    "2. If the question includes an exact identifier, exact entity name, or asks where a topic or value appears and the correct starting worksheet or column is unclear, begin with search_rows, filter_rows, or query_tabular_data without sheet_name so the plugin can perform a cross-sheet discovery search. Omit search_columns on search_rows to search all columns, and use return_columns to surface the fields most relevant to the lookup.\n"
+                    "3. After the first discovery step, pass sheet_name='<name>' on follow-up analytical calls for multi-sheet workbooks. Do not rely on a default sheet for cross-sheet entity lookups.\n"
+                    "4. Use search_rows, filter_rows, or query_tabular_data first when you need full matching rows. Use lookup_value only when you already know the exact worksheet and target column.\n"
+                    "5. Do not start with aggregate_column, group_by_aggregate, or group_by_datetime_component until you have located the relevant entity rows.\n"
+                    "6. When using query_tabular_data, use simple DataFrame.query() syntax with backticked column names for columns containing spaces. Avoid method calls such as .str.lower() or .astype(...).\n"
+                    "7. Then query other relevant worksheets explicitly to collect related records.\n"
+                    "8. When a retrieved row contains a secondary identifier such as ReturnID, CaseID, AccountID, PaymentID, W2ID, or Form1099ID, reuse it to query dependent worksheets.\n"
+                    "9. Do not stop after the first successful row if the question asks for related records across sheets.\n"
+                    "10. If a requested record type has no corresponding worksheet in the workbook, say that the workbook does not contain that record type.\n"
+                    "11. Clearly distinguish between no matching rows and no corresponding worksheet.\n"
+                    "12. Summarize concrete found records sheet-by-sheet using the tool results, not schema placeholders.\n"
+                    "13. For count or percentage questions involving a cohort defined on one sheet and facts on another, prefer get_distinct_values, count_rows, filter_rows_by_related_values, or count_rows_by_related_values over manually counting sampled rows.\n"
+                    "14. Use normalize_match=true when matching names, owners, assignees, engineers, or similar entity-text columns across worksheets.\n"
+                    "15. Do not mention hypothetical follow-up analyses, parser errors, or failed attempts unless the user explicitly asked about failures and you have actual tool error output to report."
                 )
 
             return (
@@ -2062,39 +3820,49 @@ def build_system_prompt(force_tool_use=False, tool_error_messages=None, executio
                 f"{retry_prefix}"
                 f"{tool_error_feedback}"
                 f"{execution_gap_feedback}"
+                f"{discovery_feedback}"
                 f"{recovery_sheet_feedback}"
                 f"{sheet_hint_feedback}"
                 f"{related_sheet_feedback}"
                 f"{cross_sheet_bridge_feedback}"
+                f"{discovery_step_feedback}"
                 f"{missing_sheet_feedback}"
                 f"FILE SCHEMAS:\n"
                 f"{schema_context}\n\n"
-                "AVAILABLE FUNCTIONS: lookup_value, get_distinct_values, count_rows, filter_rows, query_tabular_data, "
-                "filter_rows_by_related_values, count_rows_by_related_values, aggregate_column, group_by_aggregate, and group_by_datetime_component for year/quarter/month/week/day/hour trend analysis.\n\n"
-                "Discovery functions are not available in this analysis run because schema context is already pre-loaded.\n\n"
+                f"AVAILABLE FUNCTIONS: {', '.join(allowed_function_names)} for year/quarter/month/week/day/hour trend analysis.\n\n"
+                + (
+                    "Workbook discovery is available through describe_tabular_file. Discovery-only results do NOT complete the analysis. After exploration, continue with analytical functions before answering.\n\n"
+                    if allow_multi_sheet_discovery else
+                    "Discovery functions are not available in this analysis run because schema context is already pre-loaded.\n\n"
+                )
+                +
                 "IMPORTANT:\n"
-                "1. Use the pre-loaded schema to pick the correct columns, then call the plugin functions.\n"
-                "2. For multi-sheet workbooks, review the sheet_directory to find the most relevant sheet for the question. Pass sheet_name='<name>' in every analytical tool call unless a trustworthy default sheet has already been established. If a CROSS-SHEET BRIDGE PLAN is provided, query the listed worksheets explicitly and do not rely on a default sheet.\n"
-                "3. If a previous tool error says a requested column is missing on the current sheet and suggests candidate sheets, switch to one of those candidate sheets immediately.\n"
-                "4. For account/category lookup questions at a specific period or metric, use lookup_value first. Provide lookup_column, lookup_value, and target_column.\n"
-                "5. If lookup_value is not sufficient, use filter_rows or query_tabular_data on the label column, then read the requested period column.\n"
-                "6. For deterministic how-many questions, use count_rows instead of estimating counts from partial returned rows.\n"
-                "7. For cohort, membership, ownership-share, or percentage questions where one sheet defines the group and another sheet contains the fact rows, use get_distinct_values, filter_rows_by_related_values, or count_rows_by_related_values.\n"
-                "8. When the question asks for one named member's share within that cohort, prefer count_rows_by_related_values and either read source_value_match_counts from the helper result or rerun count_rows_by_related_values with source_filter_column/source_filter_value on the reference sheet. Do not fall back to query_tabular_data or filter_rows on the fact sheet with a guessed exact text value unless the workbook already exposed that canonical target value.\n"
-                "9. Use normalize_match=true when matching names, owners, assignees, engineers, or similar entity-text columns across worksheets.\n"
-                "10. Only use aggregate_column when the user explicitly asks for a sum, average, min, max, or count across rows and count_rows is not the simpler deterministic option.\n"
-                "11. For time-based questions on datetime columns, use group_by_datetime_component.\n"
-                "12. For threshold, ranking, comparison, or correlation-like questions, first filter/query the relevant rows, then compute grouped metrics.\n"
-                "13. When the question asks for grouped results for each entity or category and a cross-sheet bridge plan or relationship hint is available, use the reference worksheet to identify the canonical entities or categories and the fact worksheet to compute the metric. Do not answer 'each X' by grouping a yes/no, boolean, or membership-flag column unless the user explicitly asked about that flag.\n"
-                "14. When the question asks for rows satisfying multiple conditions, prefer one combined query_expression using and/or instead of separate broad queries that you plan to intersect later.\n"
-                "15. Batch multiple independent function calls in a SINGLE response whenever possible.\n"
-                "16. Keep max_rows as small as possible. Only increase it when the user explicitly asked for an exhaustive row list or export; otherwise return total_matches plus representative rows.\n"
-                "17. For analytical questions, prefer deterministic counts plus lookup/filter/query/grouped computations over raw row or preview output.\n"
-                "18. For identifier-based workbook questions, locate the identifier on the correct sheet before explaining downstream calculations.\n"
-                "19. For peak, busiest, highest, or lowest questions, use grouped functions and inspect the highest_group, highest_value, lowest_group, and lowest_value summary fields.\n"
-                "20. Return only computed findings and name the strongest drivers clearly.\n"
-                "21. Do not mention hypothetical follow-up analyses, parser errors, or failed attempts unless the user explicitly asked about failures and you have actual tool error output to report.\n"
-                "22. When using query_tabular_data, use simple DataFrame.query() syntax with backticked column names for columns containing spaces. Avoid method calls such as .str.lower(), .astype(...), or other Python expressions that DataFrame.query() may reject."
+                "1. Use the pre-loaded schema to pick the correct columns, then call the plugin functions. Use the source_context listed in FILE SCHEMAS for the matching filename.\n"
+                "2. For multi-sheet workbooks, review the sheet_directory to find the most relevant sheet for the question. If the right worksheet is still unclear, call describe_tabular_file without sheet_name, then continue with analytical calls. Pass sheet_name='<name>' in follow-up analytical tool calls unless a trustworthy default sheet has already been established or you are intentionally doing an initial cross-sheet discovery step. If a CROSS-SHEET BRIDGE PLAN is provided, query the listed worksheets explicitly and do not rely on a default sheet.\n"
+                "3. If the question includes an exact identifier or asks where a topic, phrase, path, code, or other value appears and the correct starting worksheet or column is unclear, begin with search_rows, filter_rows, or query_tabular_data without sheet_name so the plugin can perform a cross-sheet discovery search. Omit search_columns on search_rows to search all columns, and use return_columns to surface the columns most relevant to the question.\n"
+                "4. If a previous tool error says a requested column is missing on the current sheet and suggests candidate sheets, switch to one of those candidate sheets immediately.\n"
+                "5. For account/category lookup questions at a specific period or metric, use lookup_value first. Provide lookup_column, lookup_value, and target_column.\n"
+                "6. If lookup_value is not sufficient, use search_rows, filter_rows, or query_tabular_data on the relevant label or text columns, then read the requested period or target column.\n"
+                "7. For deterministic how-many questions, use count_rows instead of estimating counts from partial returned rows. Use get_distinct_values when the answer depends on the unique values present in a column. When the cohort is defined by two literal conditions on different columns, prefer count_rows, get_distinct_values, or filter_rows with filter_column/filter_operator/filter_value plus additional_filter_column/additional_filter_operator/additional_filter_value instead of a broad query_tabular_data call.\n"
+                "8. When URLs, links, sites, or regex-like identifiers are embedded inside a text column, prefer get_distinct_values with extract_mode='url' or extract_mode='regex' after filtering the relevant cohort. Use url_path_segments when the question asks for higher-level URL roots rather than full page paths.\n"
+                "9. If whether an embedded URL, site, link, or identifier counts depends on surrounding text in the original cell rather than the extracted value itself, search/filter the original text column first. Prefer filter_rows when the matching row context matters, and return the full matching rows when the cohort is modest enough to fit comfortably.\n"
+                "10. Do not classify extracted URLs solely by whether the URL text itself contains the keyword when the original cell text already defines the category.\n"
+                "11. For cohort, membership, ownership-share, or percentage questions where one sheet defines the group and another sheet contains the fact rows, use get_distinct_values, filter_rows_by_related_values, or count_rows_by_related_values.\n"
+                "12. When the question asks for one named member's share within that cohort, prefer count_rows_by_related_values and either read source_value_match_counts from the helper result or rerun count_rows_by_related_values with source_filter_column/source_filter_value on the reference sheet. Do not fall back to query_tabular_data or filter_rows on the fact sheet with a guessed exact text value unless the workbook already exposed that canonical target value.\n"
+                "13. Use normalize_match=true when matching names, owners, assignees, engineers, or similar entity-text columns across worksheets.\n"
+                "14. Only use aggregate_column when the user explicitly asks for a sum, average, min, max, or count across rows and count_rows is not the simpler deterministic option.\n"
+                "15. For time-based questions on datetime columns, use group_by_datetime_component.\n"
+                "16. For threshold, ranking, comparison, or correlation-like questions, first filter/query the relevant rows, then compute grouped metrics.\n"
+                "17. When the question asks for grouped results for each entity or category and a cross-sheet bridge plan or relationship hint is available, use the reference worksheet to identify the canonical entities or categories and the fact worksheet to compute the metric. Do not answer 'each X' by grouping a yes/no, boolean, or membership-flag column unless the user explicitly asked about that flag.\n"
+                "18. When the question asks for rows satisfying multiple conditions, prefer one combined query_expression using and/or instead of separate broad queries that you plan to intersect later.\n"
+                "19. Batch multiple independent function calls in a SINGLE response whenever possible.\n"
+                "20. Keep max_rows as small as possible. Only increase it when the user explicitly asked for an exhaustive row list or export, or when the full matching row context is required and the cohort is modest; otherwise return total_matches plus representative rows. If a prior result reports total_matches > returned_rows or distinct_count > returned_values for a full-list question, rerun with a higher max_rows or max_values before answering.\n"
+                "21. For analytical questions, prefer deterministic counts plus lookup/filter/query/grouped computations over raw row or preview output.\n"
+                "22. For identifier-based workbook questions, locate the identifier on the correct sheet before explaining downstream calculations.\n"
+                "23. For peak, busiest, highest, or lowest questions, use grouped functions and inspect the highest_group, highest_value, lowest_group, and lowest_value summary fields.\n"
+                "24. Return only computed findings and name the strongest drivers clearly.\n"
+                "25. Do not mention hypothetical follow-up analyses, parser errors, or failed attempts unless the user explicitly asked about failures and you have actual tool error output to report.\n"
+                "26. When using query_tabular_data, use simple DataFrame.query() syntax with backticked column names for columns containing spaces. Avoid method calls such as .str.lower(), .astype(...), or other Python expressions that DataFrame.query() may reject."
             )
 
         baseline_invocations = plugin_logger.get_invocations_for_conversation(
@@ -2105,20 +3873,24 @@ def build_system_prompt(force_tool_use=False, tool_error_messages=None, executio
         baseline_invocation_count = len(baseline_invocations)
         previous_tool_error_messages = []
         previous_execution_gap_messages = []
+        previous_discovery_feedback_messages = []
+        analysis_requires_immediate_tool_choice = has_multi_sheet_workbook and not schema_summary_mode
 
         for attempt_number in range(1, 4):
-            force_tool_use = attempt_number > 1
+            force_tool_use = attempt_number > 1 or (attempt_number == 1 and analysis_requires_immediate_tool_choice)
             # 4. Build chat history with pre-loaded schemas
             chat_history = SKChatHistory()
             chat_history.add_system_message(build_system_prompt(
                 force_tool_use=force_tool_use,
                 tool_error_messages=previous_tool_error_messages,
                 execution_gap_messages=previous_execution_gap_messages,
+                discovery_feedback_messages=previous_discovery_feedback_messages,
             ))
 
             chat_history.add_user_message(
                 f"Analyze the tabular data to answer: {user_question}\n"
-                f"Use user_id='{user_id}', conversation_id='{conversation_id}', {source_context}."
+                f"Use user_id='{user_id}', conversation_id='{conversation_id}'.\n"
+                f"{source_context}"
             )
 
             # 5. Execute with auto function calling
@@ -2249,6 +4021,7 @@ def build_system_prompt(force_tool_use=False, tool_error_messages=None, executio
                     if successful_analytical_invocations:
                         previous_tool_error_messages = []
                         previous_failed_call_parameters = []
+                        previous_discovery_feedback_messages = []
 
                         if entity_lookup_mode:
                             selected_sheets = get_tabular_invocation_selected_sheets(successful_analytical_invocations)
@@ -2363,7 +4136,12 @@ def build_system_prompt(force_tool_use=False, tool_error_messages=None, executio
                             level=logging.WARNING
                         )
                     elif discovery_invocations:
-                        previous_execution_gap_messages = []
+                        previous_discovery_feedback_messages = summarize_tabular_discovery_invocations(
+                            successful_schema_summary_invocations or discovery_invocations,
+                        )
+                        previous_execution_gap_messages = [
+                            'Previous attempt explored workbook structure but did not execute analytical functions. Continue with analytical tool calls now.'
+                        ]
                         discovery_function_names = sorted({
                             invocation.function_name for invocation in discovery_invocations
                         })
@@ -2372,13 +4150,19 @@ def build_system_prompt(force_tool_use=False, tool_error_messages=None, executio
                             level=logging.WARNING
                         )
                     elif new_invocation_count > 0:
+                        previous_discovery_feedback_messages = []
                         previous_execution_gap_messages = []
                         log_event(
                             f"[Tabular SK Analysis] Attempt {attempt_number} used unsupported tool(s) without computed analysis; retrying",
                             level=logging.WARNING
                         )
                     else:
-                        previous_execution_gap_messages = []
+                        previous_discovery_feedback_messages = []
+                        previous_execution_gap_messages = (
+                            ['Previous attempt did not use any tools. Start with workbook discovery if the right worksheet is unclear, then continue with analytical tool calls.']
+                            if allow_multi_sheet_discovery else
+                            []
+                        )
                         log_event(
                             f"[Tabular SK Analysis] Attempt {attempt_number} returned narrative without tool use; retrying",
                             level=logging.WARNING
@@ -2397,6 +4181,7 @@ def build_system_prompt(force_tool_use=False, tool_error_messages=None, executio
                     )
                 elif failed_analytical_invocations:
                     previous_tool_error_messages = summarize_tabular_invocation_errors(failed_analytical_invocations)
+                    previous_discovery_feedback_messages = []
                     previous_execution_gap_messages = []
                     log_event(
                         f"[Tabular SK Analysis] Attempt {attempt_number} returned no content after tool errors; retrying",
@@ -2414,6 +4199,34 @@ def build_system_prompt(force_tool_use=False, tool_error_messages=None, executio
 
             baseline_invocation_count = len(invocations_after)
 
+        reviewer_recovery = None
+        if has_multi_sheet_workbook and not schema_summary_mode:
+            reviewer_recovery = await maybe_recover_tabular_analysis_with_llm_reviewer(
+                chat_service=chat_service,
+                kernel=kernel,
+                tabular_plugin=tabular_plugin,
+                plugin_logger=plugin_logger,
+                user_question=user_question,
+                schema_context=schema_context,
+                source_context=source_context,
+                analysis_file_contexts=analysis_file_contexts,
+                user_id=user_id,
+                conversation_id=conversation_id,
+                execution_mode=execution_mode,
+                allowed_function_names=allowed_function_names,
+                workbook_sheet_hints=workbook_sheet_hints,
+                workbook_related_sheet_hints=workbook_related_sheet_hints,
+                workbook_cross_sheet_bridge_hints=workbook_cross_sheet_bridge_hints,
+                tool_error_messages=previous_tool_error_messages,
+                execution_gap_messages=previous_execution_gap_messages,
+                discovery_feedback_messages=previous_discovery_feedback_messages,
+                fallback_source_hint=source_hint,
+                fallback_group_id=group_id,
+                fallback_public_workspace_id=public_workspace_id,
+            )
+            if reviewer_recovery and reviewer_recovery.get('fallback'):
+                return reviewer_recovery['fallback']
+
         log_event("[Tabular SK Analysis] Unable to obtain computed tool-backed results", level=logging.WARNING)
         return None
 
@@ -2515,17 +4328,125 @@ def get_document_container_for_scope(document_scope):
     return cosmos_user_documents_container
 
 
-def get_selected_workspace_tabular_filenames(selected_document_ids=None, selected_document_id=None, document_scope='personal'):
-    """Resolve explicitly selected workspace documents and return tabular filenames."""
+def get_document_containers_for_scope(document_scope):
+    """List the (source_hint, container) pairs to query for a document scope."""
+    # Order matters for 'all': personal workspace first, then group, then public.
+    scope_pairs = [
+        ('workspace', cosmos_user_documents_container),
+        ('group', cosmos_group_documents_container),
+        ('public', cosmos_public_documents_container),
+    ]
+    if document_scope == 'all':
+        return scope_pairs
+    # 'group' / 'public' select their own pair; any other scope uses the workspace pair.
+    selected = [pair for pair in scope_pairs[1:] if pair[0] == document_scope]
+    return selected or scope_pairs[:1]
+
+
+def build_tabular_file_context(file_name, source_hint='workspace', group_id=None, public_workspace_id=None):
+    """Return a normalized source-context dict for a tabular file, or None.
+
+    None is returned when is_tabular_filename() rejects the stripped file name.
+    The result always has 'file_name' and 'source_hint'; 'group_id' or
+    'public_workspace_id' is added only for the matching hint. 'personal',
+    unknown hints, and group/public hints lacking their ID become 'workspace'.
+    """
+    cleaned_name = str(file_name or '').strip()
+    if not is_tabular_filename(cleaned_name):
+        return None
+
+    hint = str(source_hint or 'workspace').strip().lower()
+    if hint not in {'chat', 'group', 'public'}:
+        # Covers 'workspace', its alias 'personal', and anything unrecognized.
+        hint = 'workspace'
+
+    # Each scoped hint needs its own identifier; blank values count as missing.
+    scope_ids = {
+        'group': ('group_id', str(group_id or '').strip()),
+        'public': ('public_workspace_id', str(public_workspace_id or '').strip()),
+    }
+    scope_key, scope_value = scope_ids.get(hint, (None, ''))
+    if scope_key and not scope_value:
+        return {'file_name': cleaned_name, 'source_hint': 'workspace'}
+    context = {'file_name': cleaned_name, 'source_hint': hint}
+    if scope_key:
+        context[scope_key] = scope_value
+    return context
+
+
+def dedupe_tabular_file_contexts(file_contexts=None):
+    """Drop duplicate tabular file contexts, keeping the first of each kind.
+
+    Contexts are compared on stripped file name, lower-cased source hint
+    (default 'workspace'), group ID, and public workspace ID. Non-mapping
+    entries and entries with a blank file name are skipped. Survivors are
+    returned as shallow dict copies in their original order.
+    """
+    def _clean(entry, field, fallback=''):
+        return str(entry.get(field) or fallback).strip()
+
+    first_by_identity = {}
+    for candidate in file_contexts or []:
+        if not isinstance(candidate, Mapping):
+            continue
+        name = _clean(candidate, 'file_name')
+        hint = _clean(candidate, 'source_hint', 'workspace').lower()
+        identity = (name, hint, _clean(candidate, 'group_id'), _clean(candidate, 'public_workspace_id'))
+        if name and identity not in first_by_identity:
+            # dicts keep insertion order, so first-seen order is preserved.
+            first_by_identity[identity] = dict(candidate)
+    return list(first_by_identity.values())
+
+
+def infer_tabular_source_context_from_document(source_doc, document_scope='personal',
+                                              active_group_id=None, active_public_workspace_id=None):
+    """Derive a tabular file context from a search-result or citation mapping.
+
+    Scope is resolved in priority order:
+      1. a non-blank 'public_workspace_id' on the document -> public
+      2. a non-blank 'group_id' on the document -> group
+      3. document_scope 'group' -> group, using active_group_id
+      4. document_scope 'public' -> public, using active_public_workspace_id
+      5. anything else -> workspace
+
+    Returns whatever build_tabular_file_context() returns for the document's
+    'file_name' and the resolved scope, or None when source_doc is not a
+    mapping.
+    """
+    if not isinstance(source_doc, Mapping):
+        return None
+
+    def _own(field):
+        # Blank or missing identifiers on the document collapse to None.
+        return str(source_doc.get(field) or '').strip() or None
+
+    file_name = source_doc.get('file_name')
+    own_group_id, own_public_id = _own('group_id'), _own('public_workspace_id')
+    if own_public_id:
+        scope = {'source_hint': 'public', 'public_workspace_id': own_public_id}
+    elif own_group_id:
+        scope = {'source_hint': 'group', 'group_id': own_group_id}
+    elif document_scope == 'group':
+        scope = {'source_hint': 'group', 'group_id': active_group_id}
+    elif document_scope == 'public':
+        scope = {'source_hint': 'public', 'public_workspace_id': active_public_workspace_id}
+    else:
+        scope = {'source_hint': 'workspace'}
+    return build_tabular_file_context(file_name, **scope)
+
+
+def get_selected_workspace_tabular_file_contexts(selected_document_ids=None, selected_document_id=None,
+                                                 document_scope='personal', active_group_id=None,
+                                                 active_public_workspace_id=None):
+    """Resolve explicitly selected workspace documents and return tabular source contexts."""
     selected_ids = list(selected_document_ids or [])
     if not selected_ids and selected_document_id and selected_document_id != 'all':
         selected_ids = [selected_document_id]
 
     if not selected_ids:
-        return set()
+        return []
 
-    cosmos_container = get_document_container_for_scope(document_scope)
-    tabular_filenames = set()
+    tabular_file_contexts = []
 
     for doc_id in selected_ids:
         if not doc_id or doc_id == 'all':
@@ -2533,58 +4454,337 @@ def get_selected_workspace_tabular_filenames(selected_document_ids=None, selecte
 
         try:
             doc_query = (
-                "SELECT TOP 1 c.file_name, c.title "
+                "SELECT TOP 1 c.file_name, c.title, c.group_id, c.public_workspace_id "
                 "FROM c WHERE c.id = @doc_id "
                 "ORDER BY c.version DESC"
             )
-            doc_params = [{"name": "@doc_id", "value": doc_id}]
-            doc_results = list(cosmos_container.query_items(
-                query=doc_query,
-                parameters=doc_params,
-                enable_cross_partition_query=True
-            ))
+            doc_params = [{"name": "@doc_id", "value": doc_id}]
+
+            for source_hint, cosmos_container in get_document_containers_for_scope(document_scope):
+                doc_results = list(cosmos_container.query_items(
+                    query=doc_query,
+                    parameters=doc_params,
+                    enable_cross_partition_query=True
+                ))
+
+                if not doc_results:
+                    continue
+
+                doc_info = doc_results[0]
+                file_context = build_tabular_file_context(
+                    doc_info.get('file_name') or doc_info.get('title'),
+                    source_hint=source_hint,
+                    group_id=doc_info.get('group_id') or active_group_id,
+                    public_workspace_id=doc_info.get('public_workspace_id') or active_public_workspace_id,
+                )
+                if file_context:
+                    tabular_file_contexts.append(file_context)
+                break
+        except Exception as e:
+            log_event(
+                f"[Tabular SK Analysis] Failed to resolve selected document '{doc_id}': {e}",
+                level=logging.WARNING
+            )
+
+    return dedupe_tabular_file_contexts(tabular_file_contexts)
+
+
+def collect_workspace_tabular_file_contexts(combined_documents=None, selected_document_ids=None,
+                                            selected_document_id=None, document_scope='personal',
+                                            active_group_id=None, active_public_workspace_id=None):
+    """Collect tabular source contexts from search results and explicit workspace selection."""
+    tabular_file_contexts = []
+
+    for source_doc in combined_documents or []:
+        file_context = infer_tabular_source_context_from_document(
+            source_doc,
+            document_scope=document_scope,
+            active_group_id=active_group_id,
+            active_public_workspace_id=active_public_workspace_id,
+        )
+        if file_context:
+            tabular_file_contexts.append(file_context)
+
+    tabular_file_contexts.extend(get_selected_workspace_tabular_file_contexts(
+        selected_document_ids=selected_document_ids,
+        selected_document_id=selected_document_id,
+        document_scope=document_scope,
+        active_group_id=active_group_id,
+        active_public_workspace_id=active_public_workspace_id,
+    ))
+
+    return dedupe_tabular_file_contexts(tabular_file_contexts)
+
+
+def collect_workspace_tabular_filenames(combined_documents=None, selected_document_ids=None,
+                                        selected_document_id=None, document_scope='personal',
+                                        active_group_id=None, active_public_workspace_id=None):
+    """Collect unique tabular filenames from search results and explicit workspace selection."""
+    tabular_file_contexts = collect_workspace_tabular_file_contexts(
+        combined_documents=combined_documents,
+        selected_document_ids=selected_document_ids,
+        selected_document_id=selected_document_id,
+        document_scope=document_scope,
+        active_group_id=active_group_id,
+        active_public_workspace_id=active_public_workspace_id,
+    )
+    return {file_context['file_name'] for file_context in tabular_file_contexts}
+
+
+def normalize_tabular_file_contexts_for_analysis(tabular_filenames=None, tabular_file_contexts=None,
+                                                 fallback_source_hint='workspace', fallback_group_id=None,
+                                                 fallback_public_workspace_id=None):
+    """Return per-file tabular source contexts, defaulting to a shared fallback only when needed."""
+    normalized_contexts = dedupe_tabular_file_contexts(tabular_file_contexts)
+    if normalized_contexts:
+        return normalized_contexts
+
+    fallback_contexts = []
+    for file_name in tabular_filenames or []:
+        fallback_context = build_tabular_file_context(
+            file_name,
+            source_hint=fallback_source_hint,
+            group_id=fallback_group_id,
+            public_workspace_id=fallback_public_workspace_id,
+        )
+        if fallback_context:
+            fallback_contexts.append(fallback_context)
+
+    return dedupe_tabular_file_contexts(fallback_contexts)
+
+
+def build_tabular_analysis_source_context(tabular_file_contexts=None, fallback_source_hint='workspace',
+                                          fallback_group_id=None, fallback_public_workspace_id=None):
+    """Build prompt instructions for per-file tabular source metadata."""
+    normalized_contexts = dedupe_tabular_file_contexts(tabular_file_contexts)
+    if normalized_contexts:
+        lines = [
+            "Use the following per-file source metadata on tabular_processing tool calls. "
+            "Do not substitute a different source for a listed file:",
+        ]
+        for file_context in normalized_contexts:
+            context_parts = [f"source='{file_context.get('source_hint', 'workspace')}'"]
+            if file_context.get('group_id'):
+                context_parts.append(f"group_id='{file_context['group_id']}'")
+            if file_context.get('public_workspace_id'):
+                context_parts.append(f"public_workspace_id='{file_context['public_workspace_id']}'")
+            lines.append(f"- {file_context['file_name']}: {', '.join(context_parts)}")
+        return "\n".join(lines)
+
+    fallback_parts = [f"source='{fallback_source_hint}'"]
+    if fallback_source_hint == 'group' and fallback_group_id:
+        fallback_parts.append(f"group_id='{fallback_group_id}'")
+    if fallback_source_hint == 'public' and fallback_public_workspace_id:
+        fallback_parts.append(f"public_workspace_id='{fallback_public_workspace_id}'")
+    return f"Use {', '.join(fallback_parts)} on tabular_processing tool calls."
+
+
+def determine_tabular_source_hint(document_scope, active_group_id=None, active_public_workspace_id=None):
+    """Map workspace scope metadata to the tabular plugin source hint."""
+    if document_scope == 'group' and active_group_id:
+        return 'group'
+    if document_scope == 'public' and active_public_workspace_id:
+        return 'public'
+    return 'workspace'
+
+
+async def run_multi_file_tabular_distinct_url_analysis(user_question, analysis_file_contexts,
+                                                       user_id, conversation_id):
+    """Run deterministic per-file URL extraction and union the distinct results in Python."""
+    from semantic_kernel_plugins.tabular_processing_plugin import TabularProcessingPlugin
+
+    del user_question
+    normalized_contexts = dedupe_tabular_file_contexts(analysis_file_contexts)
+    if len(normalized_contexts) <= 1:
+        return None
+
+    tabular_plugin = TabularProcessingPlugin()
+    successful_results = []
+    fatal_failures = []
+
+    for file_context in normalized_contexts:
+        filename = file_context['file_name']
+        source_hint = file_context.get('source_hint', 'workspace')
+        group_id = file_context.get('group_id')
+        public_workspace_id = file_context.get('public_workspace_id')
+
+        try:
+            container_name, blob_name = tabular_plugin._resolve_blob_location_with_fallback(
+                user_id,
+                conversation_id,
+                filename,
+                source_hint,
+                group_id=group_id,
+                public_workspace_id=public_workspace_id,
+            )
+            tabular_plugin.remember_resolved_blob_location(
+                source_hint,
+                filename,
+                container_name,
+                blob_name,
+            )
+            schema_info = tabular_plugin._build_workbook_schema_summary(
+                container_name,
+                blob_name,
+                filename,
+                preview_rows=2,
+            )
+        except Exception as exc:
+            fatal_failures.append({
+                'filename': filename,
+                'source': source_hint,
+                'error': f'Could not load workbook schema: {exc}',
+            })
+            continue
 
-            if not doc_results:
-                continue
+        selected_sheet, selected_column = select_tabular_distinct_url_sheet_and_column(schema_info)
+        if not selected_column:
+            fatal_failures.append({
+                'filename': filename,
+                'source': source_hint,
+                'error': 'Could not identify a URL/location-style column from workbook schema.',
+            })
+            continue
 
-            file_name = doc_results[0].get('file_name') or doc_results[0].get('title')
-            if is_tabular_filename(file_name):
-                tabular_filenames.add(file_name)
-        except Exception as e:
-            log_event(
-                f"[Tabular SK Analysis] Failed to resolve selected document '{doc_id}': {e}",
-                level=logging.WARNING
-            )
+        base_arguments = {
+            'user_id': user_id,
+            'conversation_id': conversation_id,
+            'filename': filename,
+            'column': selected_column,
+            'extract_mode': 'regex',
+            'extract_pattern': MULTI_FILE_TABULAR_DISTINCT_URL_EXTRACT_PATTERN,
+            'normalize_match': 'false',
+            'max_values': '10000',
+            'source': source_hint,
+        }
+        if group_id:
+            base_arguments['group_id'] = group_id
+        if public_workspace_id:
+            base_arguments['public_workspace_id'] = public_workspace_id
+
+        attempt_arguments = []
+        primary_arguments = dict(base_arguments)
+        if selected_sheet:
+            primary_arguments['sheet_name'] = selected_sheet
+        attempt_arguments.append(primary_arguments)
+
+        if (
+            selected_sheet
+            and schema_info.get('is_workbook')
+            and int(schema_info.get('sheet_count', 0) or 0) > 1
+        ):
+            attempt_arguments.append(dict(base_arguments))
 
-    return tabular_filenames
+        best_result_payload = None
+        best_result_counts = None
+        last_error_message = None
+        for current_arguments in attempt_arguments:
+            raw_result = await tabular_plugin.get_distinct_values(**current_arguments)
+            try:
+                result_payload = json.loads(raw_result)
+            except (TypeError, ValueError):
+                last_error_message = 'get_distinct_values returned a non-JSON payload.'
+                continue
 
+            if result_payload.get('error'):
+                last_error_message = str(result_payload.get('error')).strip()
+                continue
 
-def collect_workspace_tabular_filenames(combined_documents=None, selected_document_ids=None,
-                                        selected_document_id=None, document_scope='personal'):
-    """Collect tabular filenames from search results and explicit workspace selection."""
-    tabular_filenames = set()
+            distinct_count = parse_tabular_result_count(result_payload.get('distinct_count')) or 0
+            returned_values = parse_tabular_result_count(result_payload.get('returned_values')) or 0
+            comparison_key = (distinct_count, returned_values)
+            if best_result_counts is None or comparison_key > best_result_counts:
+                best_result_payload = result_payload
+                best_result_counts = comparison_key
+
+        if best_result_payload is None:
+            fatal_failures.append({
+                'filename': filename,
+                'source': source_hint,
+                'error': last_error_message or 'Distinct URL extraction failed for this file.',
+            })
+            continue
 
-    for source_doc in combined_documents or []:
-        file_name = source_doc.get('file_name', '')
-        if is_tabular_filename(file_name):
-            tabular_filenames.add(file_name)
+        successful_results.append(best_result_payload)
 
-    tabular_filenames.update(get_selected_workspace_tabular_filenames(
-        selected_document_ids=selected_document_ids,
-        selected_document_id=selected_document_id,
-        document_scope=document_scope,
-    ))
+    if fatal_failures:
+        log_event(
+            '[Tabular Multi-File] Deterministic distinct URL analysis could not cover every file; falling back to SK orchestration.',
+            extra={
+                'conversation_id': conversation_id,
+                'file_count': len(normalized_contexts),
+                'fatal_failures': fatal_failures[:5],
+            },
+            level=logging.WARNING,
+        )
+        return None
 
-    return tabular_filenames
+    combined_analysis = build_multi_file_tabular_distinct_value_analysis(successful_results)
+    if combined_analysis:
+        log_event(
+            '[Tabular Multi-File] Deterministic distinct URL analysis completed.',
+            extra={
+                'conversation_id': conversation_id,
+                'file_count': len(normalized_contexts),
+                'matched_file_count': len(successful_results),
+            },
+            level=logging.INFO,
+        )
 
+    return combined_analysis
+
+
+async def run_tabular_analysis_with_multi_file_support(user_question, tabular_filenames, user_id,
+                                                       conversation_id, gpt_model, settings,
+                                                       source_hint='workspace', group_id=None,
+                                                       public_workspace_id=None,
+                                                       execution_mode='analysis',
+                                                       tabular_file_contexts=None):
+    """Run deterministic multi-file helpers first, then fall back to the SK planner."""
+    analysis_file_contexts = normalize_tabular_file_contexts_for_analysis(
+        tabular_filenames=tabular_filenames,
+        tabular_file_contexts=tabular_file_contexts,
+        fallback_source_hint=source_hint,
+        fallback_group_id=group_id,
+        fallback_public_workspace_id=public_workspace_id,
+    )
+    multi_file_mode = get_multi_file_tabular_analysis_mode(
+        user_question,
+        execution_mode=execution_mode,
+        analysis_file_contexts=analysis_file_contexts,
+    )
 
-def determine_tabular_source_hint(document_scope, active_group_id=None, active_public_workspace_id=None):
-    """Map workspace scope metadata to the tabular plugin source hint."""
-    if document_scope == 'group' and active_group_id:
-        return 'group'
-    if document_scope == 'public' and active_public_workspace_id:
-        return 'public'
-    return 'workspace'
+    if multi_file_mode == 'distinct_url_union':
+        log_event(
+            '[Tabular Multi-File] Starting deterministic distinct URL union analysis.',
+            extra={
+                'conversation_id': conversation_id,
+                'file_names': [file_context['file_name'] for file_context in analysis_file_contexts],
+            },
+            level=logging.INFO,
+        )
+        deterministic_analysis = await run_multi_file_tabular_distinct_url_analysis(
+            user_question,
+            analysis_file_contexts,
+            user_id,
+            conversation_id,
+        )
+        if deterministic_analysis:
+            return deterministic_analysis
+
+    return await run_tabular_sk_analysis(
+        user_question=user_question,
+        tabular_filenames=tabular_filenames,
+        tabular_file_contexts=analysis_file_contexts,
+        user_id=user_id,
+        conversation_id=conversation_id,
+        gpt_model=gpt_model,
+        settings=settings,
+        source_hint=source_hint,
+        group_id=group_id,
+        public_workspace_id=public_workspace_id,
+        execution_mode=execution_mode,
+    )
 
 
 def resolve_foundry_scope_for_auth(auth_settings, endpoint=None):
@@ -2988,6 +5188,51 @@ def consume_stream():
             }
         )
 
+    def get_facts_for_context(scope_id, scope_type, conversation_id: str = None, agent_id: str = None):
+        if not scope_id or not scope_type:
+            return ""
+        fact_store = FactMemoryStore()
+        kwargs = dict(
+            scope_type=scope_type,
+            scope_id=scope_id,
+        )
+        if agent_id:
+            kwargs['agent_id'] = agent_id
+        if conversation_id:
+            kwargs['conversation_id'] = conversation_id
+        facts = fact_store.get_facts(**kwargs)
+        if not facts:
+            return ""
+        fact_lines = []
+        for fact in facts:
+            value = str(fact.get('value') or '').strip()
+            if value:
+                fact_lines.append(f"- {value}")
+        if not fact_lines:
+            return ""
+        fact_lines.append(f"- agent_id: {agent_id or 'None'}")
+        fact_lines.append(f"- scope_type: {scope_type}")
+        fact_lines.append(f"- scope_id: {scope_id}")
+        fact_lines.append(f"- conversation_id: {conversation_id or 'None'}")
+        return "\n".join(fact_lines)
+
+    def inject_fact_memory_context(conversation_history, scope_id, scope_type, conversation_id: str = None, agent_id: str = None):
+        facts = get_facts_for_context(
+            scope_id=scope_id,
+            scope_type=scope_type,
+            conversation_id=conversation_id,
+            agent_id=agent_id,
+        )
+        if facts:
+            conversation_history.insert(0, {
+                "role": "system",
+                "content": f"<Fact Memory>\n{facts}\n</Fact Memory>"
+            })
+        conversation_history.insert(0, {
+            "role": "system",
+            "content": f"""<Conversation Metadata>\n<Scope ID: {scope_id}>\n<Scope Type: {scope_type}>\n<Conversation ID: {conversation_id}>\n<Agent ID: {agent_id}>\n</Conversation Metadata>"""
+        })
+
     @app.route('/api/chat', methods=['POST'])
     @swagger_route(security=get_auth_security())
     @login_required
@@ -3158,6 +5403,18 @@ def result_requires_message_reload(result: Any) -> bool:
             if isinstance(image_gen_enabled, str):
                 image_gen_enabled = image_gen_enabled.lower() == 'true'
 
+            original_hybrid_search_enabled = bool(hybrid_search_enabled)
+            history_grounded_search_used = False
+            history_only_answerability = None
+            prior_grounded_document_refs = []
+            effective_document_scope = document_scope
+            effective_selected_document_ids = list(selected_document_ids or [])
+            effective_selected_document_id = selected_document_id
+            effective_active_group_ids = list(active_group_ids or [])
+            effective_active_group_id = active_group_id
+            effective_active_public_workspace_ids = list(active_public_workspace_ids or [])
+            effective_active_public_workspace_id = active_public_workspace_id
+
             # GPT & Image generation APIM or direct
             gpt_model = ""
             gpt_client = None
@@ -3790,16 +6047,127 @@ def result_requires_message_reload(result: Any) -> bool:
                     debug_print(f"[Content Safety Error] {e}")
                 except Exception as ex:
                     debug_print(f"[Content Safety] Unexpected error: {ex}")
+
+            if not original_hybrid_search_enabled:
+                prior_grounded_document_refs = _normalize_prior_grounded_document_refs(conversation_item)
+                if prior_grounded_document_refs:
+                    thought_tracker.add_thought(
+                        'history_context',
+                        'Checking whether prior conversation context already answers the question',
+                        detail=f"grounded_documents={len(prior_grounded_document_refs)}"
+                    )
+                    try:
+                        preflight_messages_query = (
+                            "SELECT * FROM c WHERE c.conversation_id = @conv_id ORDER BY c.timestamp ASC"
+                        )
+                        preflight_messages_params = [{"name": "@conv_id", "value": conversation_id}]
+                        preflight_messages = list(cosmos_messages_container.query_items(
+                            query=preflight_messages_query,
+                            parameters=preflight_messages_params,
+                            partition_key=conversation_id,
+                            enable_cross_partition_query=True,
+                        ))
+                        preflight_history_segments = build_conversation_history_segments(
+                            all_messages=preflight_messages,
+                            conversation_history_limit=conversation_history_limit,
+                            enable_summarize_older_messages=enable_summarize_content_history_beyond_conversation_history_limit,
+                            gpt_client=gpt_client,
+                            gpt_model=gpt_model,
+                            user_message_id=user_message_id,
+                            fallback_user_message=user_message,
+                        )
+                        history_only_answerability = assess_history_only_answerability(
+                            gpt_client,
+                            gpt_model,
+                            build_history_only_assessment_messages(
+                                preflight_history_segments,
+                                settings.get('default_system_prompt', '').strip(),
+                            ),
+                        )
+                    except Exception as assessment_error:
+                        debug_print(
+                            f"[History Fallback] History-only sufficiency assessment failed: {assessment_error}"
+                        )
+
+                    if history_only_answerability and history_only_answerability.get('can_answer_from_history'):
+                        thought_tracker.add_thought(
+                            'history_context',
+                            'Prior conversation context appears sufficient without new document retrieval',
+                            detail=history_only_answerability.get('reason') or None,
+                        )
+                    else:
+                        fallback_search_parameters = build_prior_grounded_document_search_parameters(
+                            prior_grounded_document_refs
+                        )
+                        if fallback_search_parameters.get('document_ids'):
+                            history_grounded_search_used = True
+                            effective_document_scope = fallback_search_parameters.get('doc_scope') or 'all'
+                            effective_selected_document_ids = list(
+                                fallback_search_parameters.get('document_ids') or []
+                            )
+                            effective_selected_document_id = (
+                                effective_selected_document_ids[0]
+                                if len(effective_selected_document_ids) == 1
+                                else None
+                            )
+                            effective_active_group_ids = list(
+                                fallback_search_parameters.get('active_group_ids') or []
+                            )
+                            effective_active_group_id = fallback_search_parameters.get('active_group_id')
+                            effective_active_public_workspace_ids = list(
+                                fallback_search_parameters.get('active_public_workspace_ids') or []
+                            )
+                            effective_active_public_workspace_id = fallback_search_parameters.get(
+                                'active_public_workspace_id'
+                            )
+
+                            rewritten_search_query = ''
+                            if history_only_answerability:
+                                rewritten_search_query = str(
+                                    history_only_answerability.get('search_query') or ''
+                                ).strip()
+                            if rewritten_search_query:
+                                search_query = rewritten_search_query
+
+                            fallback_detail_parts = [
+                                f"documents={len(effective_selected_document_ids)}",
+                                f"scope={effective_document_scope or 'all'}",
+                            ]
+                            if history_only_answerability and history_only_answerability.get('reason'):
+                                fallback_detail_parts.append(
+                                    f"reason={history_only_answerability['reason']}"
+                                )
+                            thought_tracker.add_thought(
+                                'search',
+                                'Conversation context alone was insufficient; searching previously grounded documents',
+                                detail=' | '.join(fallback_detail_parts),
+                            )
+
+                            user_metadata.setdefault('workspace_search', {})[
+                                'history_grounded_fallback'
+                            ] = {
+                                'used': True,
+                                'document_scope': effective_document_scope,
+                                'document_count': len(effective_selected_document_ids),
+                                'search_query': search_query,
+                            }
+                            user_message_doc['metadata'] = user_metadata
+                            cosmos_messages_container.upsert_item(user_message_doc)
+                else:
+                    thought_tracker.add_thought(
+                        'history_context',
+                        'No prior grounded documents were available; using conversation history only'
+                    )
         # region 4 - Augmentation
             # ---------------------------------------------------------------------
             # 4) Augmentation (Search, etc.) - Run *before* final history prep
             # ---------------------------------------------------------------------
             
             # Hybrid Search
-            if hybrid_search_enabled:
+            if hybrid_search_enabled or history_grounded_search_used:
                 
                 # Optional: Summarize recent history *for search* (uses its own limit)
-                if enable_summarize_content_history_for_search:
+                if hybrid_search_enabled and enable_summarize_content_history_for_search:
                     # Fetch last N messages for search context
                     limit_n_search = number_of_historical_messages_to_summarize * 2
                     query_search = f"SELECT TOP {limit_n_search} * FROM c WHERE c.conversation_id = @conv_id ORDER BY c.timestamp DESC"
@@ -3852,7 +6220,16 @@ def result_requires_message_reload(result: Any) -> bool:
 
 
                 # Perform the search
-                thought_tracker.add_thought('search', f"Searching {document_scope or 'personal'} workspace documents for '{(search_query or user_message)[:50]}'")
+                if history_grounded_search_used and not hybrid_search_enabled:
+                    thought_tracker.add_thought(
+                        'search',
+                        f"Searching {len(effective_selected_document_ids)} previously grounded document(s) for '{(search_query or user_message)[:50]}'"
+                    )
+                else:
+                    thought_tracker.add_thought(
+                        'search',
+                        f"Searching {effective_document_scope or 'personal'} workspace documents for '{(search_query or user_message)[:50]}'"
+                    )
                 try:
                     # Prepare search arguments
                     # Set default and maximum values for top_n
@@ -3878,25 +6255,31 @@ def result_requires_message_reload(result: Any) -> bool:
                         "query": search_query,
                         "user_id": user_id,
                         "top_n": top_n,
-                        "doc_scope": document_scope,
+                        "doc_scope": effective_document_scope,
                     }
                     
                     # Add active_group_ids when:
                     # 1. Document scope is 'group' or chat_type is 'group', OR
                     # 2. Document scope is 'all' and groups are enabled (so group search can be included)
-                    if active_group_ids and (document_scope == 'group' or document_scope == 'all' or chat_type == 'group'):
-                        search_args["active_group_ids"] = active_group_ids
+                    if effective_active_group_ids and (
+                        effective_document_scope == 'group'
+                        or effective_document_scope == 'all'
+                        or chat_type == 'group'
+                    ):
+                        search_args["active_group_ids"] = effective_active_group_ids
     
                     # Add active_public_workspace_id when:
                     # 1. Document scope is 'public' or
                     # 2. Document scope is 'all' and public workspaces are enabled
-                    if active_public_workspace_id and (document_scope == 'public' or document_scope == 'all'):
-                        search_args["active_public_workspace_id"] = active_public_workspace_id
+                    if effective_active_public_workspace_id and (
+                        effective_document_scope == 'public' or effective_document_scope == 'all'
+                    ):
+                        search_args["active_public_workspace_id"] = effective_active_public_workspace_id
                         
-                    if selected_document_ids:
-                        search_args["document_ids"] = selected_document_ids
-                    elif selected_document_id:
-                        search_args["document_id"] = selected_document_id
+                    if effective_selected_document_ids:
+                        search_args["document_ids"] = effective_selected_document_ids
+                    elif effective_selected_document_id:
+                        search_args["document_id"] = effective_selected_document_id
                     
                     # Add tags filter if provided
                     if tags_filter and isinstance(tags_filter, list) and len(tags_filter) > 0:
@@ -3930,10 +6313,18 @@ def result_requires_message_reload(result: Any) -> bool:
                         chunk_sequence = doc.get('chunk_sequence', 0) # Add default
                         page_number = doc.get('page_number') or chunk_sequence or 1 # Ensure a fallback page
                         citation_id = doc.get('id', str(uuid.uuid4())) # Ensure ID exists
+                        document_id = str(doc.get('document_id') or '').strip()
+                        if not document_id:
+                            document_id = (
+                                '_'.join(str(citation_id).split('_')[:-1])
+                                if '_' in str(citation_id)
+                                else str(citation_id)
+                            )
                         classification = doc.get('document_classification')
                         chunk_id = doc.get('chunk_id', str(uuid.uuid4())) # Ensure ID exists
                         score = doc.get('score', 0.0) # Add default score
                         group_id = doc.get('group_id', None) # Add default group ID
+                        doc_public_workspace_id = doc.get('public_workspace_id', None)
                         sheet_name = doc.get('sheet_name')
                         location_label, location_value = get_citation_location(
                             file_name,
@@ -3946,6 +6337,7 @@ def result_requires_message_reload(result: Any) -> bool:
                         retrieved_texts.append(f"{chunk_text}\n{citation}")
                         combined_documents.append({
                             "file_name": file_name, 
+                            "document_id": document_id,
                             "citation_id": citation_id, 
                             "page_number": page_number,
                             "sheet_name": sheet_name,
@@ -3958,6 +6350,7 @@ def result_requires_message_reload(result: Any) -> bool:
                             "chunk_id": chunk_id,
                             "score": score,
                             "group_id": group_id,
+                            "public_workspace_id": doc_public_workspace_id,
                         })
                         if classification:
                             classifications_found.add(classification)
@@ -3979,12 +6372,14 @@ def result_requires_message_reload(result: Any) -> bool:
                         #    in the citation itself, as it can be large. The citation points *to* the chunk.
                         citation_data = {
                             "file_name": source_doc.get("file_name"),
+                            "document_id": source_doc.get("document_id"),
                             "citation_id": source_doc.get("citation_id"), # Seems like a useful identifier
                             "page_number": source_doc.get("page_number"),
                             "chunk_id": source_doc.get("chunk_id"), # Specific chunk identifier
                             "chunk_sequence": source_doc.get("chunk_sequence"), # Order within document/group
                             "score": source_doc.get("score"), # Relevance score from search
                             "group_id": source_doc.get("group_id"), # Grouping info if used
+                            "public_workspace_id": source_doc.get("public_workspace_id"),
                             "version": source_doc.get("version"), # Document version
                             "classification": source_doc.get("classification") # Document classification
                             # Add any other relevant metadata fields from source_doc here
@@ -3992,8 +6387,7 @@ def result_requires_message_reload(result: Any) -> bool:
                         # Using .get() provides None if a key is missing, preventing KeyErrors
                         hybrid_citations_list.append(citation_data)
 
-                    # Reorder hybrid citations list in descending order based on page_number
-                    hybrid_citations_list.sort(key=lambda x: x.get('page_number', 0), reverse=True)
+                    hybrid_citations_list.sort(key=_build_hybrid_citation_sort_key, reverse=True)
 
                     # --- NEW: Extract metadata (keywords/abstract) for additional citations ---
                     # Only if extract_metadata is enabled
@@ -4006,7 +6400,10 @@ def result_requires_message_reload(result: Any) -> bool:
                         for doc in search_results:
                             # Get document ID (from the chunk's document reference)
                             # AI Search chunks contain references to their parent document
-                            doc_id = doc.get('id', '').split('_')[0] if doc.get('id') else None
+                            doc_id = str(doc.get('document_id') or '').strip()
+                            if not doc_id and doc.get('id'):
+                                raw_doc_id = str(doc.get('id') or '').strip()
+                                doc_id = '_'.join(raw_doc_id.split('_')[:-1]) if '_' in raw_doc_id else raw_doc_id
 
                             # Skip if we've already processed this document
                             if not doc_id or doc_id in processed_doc_ids:
@@ -4043,6 +6440,7 @@ def result_requires_message_reload(result: Any) -> bool:
                                     
                                     keywords_citation = {
                                         "file_name": file_name,
+                                        "document_id": doc_id,
                                         "citation_id": keywords_citation_id,
                                         "page_number": "Metadata",  # Special page identifier
                                         "chunk_id": keywords_citation_id,
@@ -4076,6 +6474,7 @@ def result_requires_message_reload(result: Any) -> bool:
                                     
                                     abstract_citation = {
                                         "file_name": file_name,
+                                        "document_id": doc_id,
                                         "citation_id": abstract_citation_id,
                                         "page_number": "Metadata",  # Special page identifier
                                         "chunk_id": abstract_citation_id,
@@ -4119,6 +6518,7 @@ def result_requires_message_reload(result: Any) -> bool:
                                     
                                     vision_citation = {
                                         "file_name": file_name,
+                                        "document_id": doc_id,
                                         "citation_id": vision_citation_id,
                                         "page_number": "AI Vision",  # Special page identifier
                                         "chunk_id": vision_citation_id,
@@ -4152,18 +6552,23 @@ def result_requires_message_reload(result: Any) -> bool:
                     if list(classifications_found) != conversation_item.get('classification', []):
                         conversation_item['classification'] = list(classifications_found)
                         # No need to upsert item here, will be updated later
+                elif history_grounded_search_used:
+                    thought_tracker.add_thought(
+                        'search',
+                        'No matching excerpts were found in the previously grounded documents'
+                    )
 
             # Update message-level chat_type based on actual document usage for this message
             # This must happen after document search is completed so search_results is populated
             message_chat_type = None
-            if hybrid_search_enabled and search_results and len(search_results) > 0:
+            if (hybrid_search_enabled or history_grounded_search_used) and search_results and len(search_results) > 0:
                 # Documents were actually used for this message
-                if document_scope == 'group':
+                if effective_document_scope == 'group':
                     message_chat_type = 'group'
-                elif document_scope == 'public':
+                elif effective_document_scope == 'public':
                     message_chat_type = 'public'  
                 else:
-                        message_chat_type = 'personal_single_user'
+                    message_chat_type = 'personal_single_user'
             else:
                 # No documents used for this message - only model knowledge
                 message_chat_type = 'Model'
@@ -4171,19 +6576,22 @@ def result_requires_message_reload(result: Any) -> bool:
             # Update the message-level chat_type in user_metadata
             user_metadata['chat_context']['chat_type'] = message_chat_type
             debug_print(f"Set message-level chat_type to: {message_chat_type}")
-            debug_print(f"hybrid_search_enabled: {hybrid_search_enabled}, search_results count: {len(search_results) if search_results else 0}")
+            debug_print(
+                f"hybrid_search_enabled: {hybrid_search_enabled}, history_grounded_search_used: {history_grounded_search_used}, "
+                f"search_results count: {len(search_results) if search_results else 0}"
+            )
             
             # Add context-specific information based on message chat type
-            if message_chat_type == 'group' and active_group_id:
-                user_metadata['chat_context']['group_id'] = active_group_id
+            if message_chat_type == 'group' and effective_active_group_id:
+                user_metadata['chat_context']['group_id'] = effective_active_group_id
                 # We may have already fetched this in workspace_search section
                 if 'workspace_search' in user_metadata and user_metadata['workspace_search'].get('group_name'):
                     user_metadata['chat_context']['group_name'] = user_metadata['workspace_search']['group_name']
                     debug_print(f"Chat context - using group_name from workspace_search: {user_metadata['workspace_search']['group_name']}")
                 else:
                     try:
-                        debug_print(f"Chat context - looking up group for id: {active_group_id}")
-                        group_doc = find_group_by_id(active_group_id)
+                        debug_print(f"Chat context - looking up group for id: {effective_active_group_id}")
+                        group_doc = find_group_by_id(effective_active_group_id)
                         debug_print(f"Chat context group lookup result: {group_doc}")
                         
                         if group_doc and group_doc.get('name'):
@@ -4191,7 +6599,7 @@ def result_requires_message_reload(result: Any) -> bool:
                             user_metadata['chat_context']['group_name'] = group_title
                             debug_print(f"Chat context - set group_name to: {group_title}")
                         else:
-                            debug_print(f"Chat context - no group found or no name for id: {active_group_id}")
+                            debug_print(f"Chat context - no group found or no name for id: {effective_active_group_id}")
                             user_metadata['chat_context']['group_name'] = None
                             
                     except Exception as e:
@@ -4495,20 +6903,26 @@ def result_requires_message_reload(result: Any) -> bool:
                         'error': user_friendly_message
                     }), status_code
 
+            workspace_tabular_file_contexts = []
             workspace_tabular_files = set()
-            if hybrid_search_enabled and is_tabular_processing_enabled(settings):
-                workspace_tabular_files = collect_workspace_tabular_filenames(
+            if (hybrid_search_enabled or history_grounded_search_used) and is_tabular_processing_enabled(settings):
+                workspace_tabular_file_contexts = collect_workspace_tabular_file_contexts(
                     combined_documents=combined_documents,
-                    selected_document_ids=selected_document_ids,
-                    selected_document_id=selected_document_id,
-                    document_scope=document_scope,
+                    selected_document_ids=effective_selected_document_ids,
+                    selected_document_id=effective_selected_document_id,
+                    document_scope=effective_document_scope,
+                    active_group_id=effective_active_group_id,
+                    active_public_workspace_id=effective_active_public_workspace_id,
                 )
+                workspace_tabular_files = {
+                    file_context['file_name'] for file_context in workspace_tabular_file_contexts
+                }
 
-            if hybrid_search_enabled and workspace_tabular_files and is_tabular_processing_enabled(settings):
+            if (hybrid_search_enabled or history_grounded_search_used) and workspace_tabular_files and is_tabular_processing_enabled(settings):
                 tabular_source_hint = determine_tabular_source_hint(
-                    document_scope,
-                    active_group_id=active_group_id,
-                    active_public_workspace_id=active_public_workspace_id,
+                    effective_document_scope,
+                    active_group_id=effective_active_group_id,
+                    active_public_workspace_id=effective_active_public_workspace_id,
                 )
                 tabular_execution_mode = get_tabular_execution_mode(user_message)
                 tabular_filenames_str = ", ".join(sorted(workspace_tabular_files))
@@ -4517,16 +6931,17 @@ def result_requires_message_reload(result: Any) -> bool:
                     plugin_logger.get_invocations_for_conversation(user_id, conversation_id, limit=1000)
                 )
 
-                tabular_analysis = asyncio.run(run_tabular_sk_analysis(
+                tabular_analysis = asyncio.run(run_tabular_analysis_with_multi_file_support(
                     user_question=user_message,
                     tabular_filenames=workspace_tabular_files,
+                    tabular_file_contexts=workspace_tabular_file_contexts,
                     user_id=user_id,
                     conversation_id=conversation_id,
                     gpt_model=gpt_model,
                     settings=settings,
                     source_hint=tabular_source_hint,
-                    group_id=active_group_id if tabular_source_hint == 'group' else None,
-                    public_workspace_id=active_public_workspace_id if tabular_source_hint == 'public' else None,
+                    group_id=effective_active_group_id if tabular_source_hint == 'group' else None,
+                    public_workspace_id=effective_active_public_workspace_id if tabular_source_hint == 'public' else None,
                     execution_mode=tabular_execution_mode,
                 ))
                 tabular_invocations = get_new_plugin_invocations(
@@ -4596,6 +7011,8 @@ def result_requires_message_reload(result: Any) -> bool:
             # ---------------------------------------------------------------------
             conversation_history_for_api = []
             summary_of_older = ""
+            history_debug_info = {}
+            final_api_source_refs = []
 
 
             try:
@@ -4605,66 +7022,18 @@ def result_requires_message_reload(result: Any) -> bool:
                 all_messages = list(cosmos_messages_container.query_items(
                     query=all_messages_query, parameters=params_all, partition_key=conversation_id, enable_cross_partition_query=True
                 ))
-                all_messages = filter_assistant_artifact_items(all_messages)
-
-                # Sort messages using threading logic
-                all_messages = sort_messages_by_thread(all_messages)
-
-                total_messages = len(all_messages)
-
-                # Determine which messages are "recent" and which are "older"
-                # `conversation_history_limit` includes the *current* user message
-                num_recent_messages = min(total_messages, conversation_history_limit)
-                num_older_messages = total_messages - num_recent_messages
-
-                recent_messages = all_messages[-num_recent_messages:] # Last N messages
-                older_messages_to_summarize = all_messages[:num_older_messages] # Messages before the recent ones
-
-                # Summarize older messages if needed and present
-                if enable_summarize_content_history_beyond_conversation_history_limit and older_messages_to_summarize:
-                    debug_print(f"Summarizing {len(older_messages_to_summarize)} older messages for conversation {conversation_id}")
-                    summary_prompt_older = (
-                        "Summarize the following conversation history concisely (around 50-100 words), "
-                        "focusing on key facts, decisions, or context that might be relevant for future turns. "
-                        "Do not add any introductory phrases like 'Here is a summary'.\n\n"
-                        "Conversation History:\n"
-                    )
-                    message_texts_older = []
-                    for msg in older_messages_to_summarize:
-                        role = msg.get('role', 'user')
-                        metadata = msg.get('metadata', {})
-                        
-                        # Check active_thread flag - skip messages with active_thread=False
-                        thread_info = metadata.get('thread_info', {})
-                        active_thread = thread_info.get('active_thread')
-                        
-                        # Exclude content when active_thread is explicitly False
-                        if active_thread is False:
-                            debug_print(f"[THREAD] Skipping inactive thread message {msg.get('id')} from summary")
-                            continue
-                        
-                        # Skip roles that shouldn't be in summary (adjust as needed)
-                        if role in ['system', 'safety', 'blocked', 'image', 'file']: continue
-                        content = msg.get('content', '')
-                        message_texts_older.append(f"{role.upper()}: {content}")
-
-                    if message_texts_older: # Only summarize if there's content to summarize
-                        summary_prompt_older += "\n".join(message_texts_older)
-                        try:
-                            # Use the already initialized client and model
-                            summary_response_older = gpt_client.chat.completions.create(
-                                model=gpt_model,
-                                messages=[{"role": "system", "content": summary_prompt_older}],
-                                max_tokens=150, # Adjust token limit for summary
-                                temperature=0.3 # Lower temp for factual summary
-                            )
-                            summary_of_older = summary_response_older.choices[0].message.content.strip()
-                            debug_print(f"Generated summary: {summary_of_older}")
-                        except Exception as e:
-                            debug_print(f"Error summarizing older conversation history: {e}")
-                            summary_of_older = "" # Failed, proceed without summary
-                    else:
-                        debug_print("No summarizable content found in older messages.")
+                history_segments = build_conversation_history_segments(
+                    all_messages=all_messages,
+                    conversation_history_limit=conversation_history_limit,
+                    enable_summarize_older_messages=enable_summarize_content_history_beyond_conversation_history_limit,
+                    gpt_client=gpt_client,
+                    gpt_model=gpt_model,
+                    user_message_id=user_message_id,
+                    fallback_user_message=user_message,
+                )
+                summary_of_older = history_segments['summary_of_older']
+                chat_tabular_files = history_segments['chat_tabular_files']
+                history_debug_info = history_segments.get('debug_info', {})
 
 
                 # Construct the final history for the API call
@@ -4674,6 +7043,7 @@ def result_requires_message_reload(result: Any) -> bool:
                         "role": "system",
                         "content": f"<Summary of previous conversation context>\n{summary_of_older}\n</Summary of previous conversation context>"
                     })
+                    final_api_source_refs.append('system:summary_of_older')
 
                 # Add augmentation system messages (search, agents) next
                 # **Important**: Decide if you want these saved. If so, you need to upsert them now.
@@ -4721,6 +7091,7 @@ def result_requires_message_reload(result: Any) -> bool:
                     }
                     cosmos_messages_container.upsert_item(system_doc)
                     conversation_history_for_api.append(aug_msg) # Add to API context
+                    final_api_source_refs.append(f"system:augmentation:{len(final_api_source_refs) + 1}")
                     # System message shares the same thread as user message, no thread update needed
 
                     # --- NEW: Save plugin output as agent citation ---
@@ -4731,141 +7102,8 @@ def result_requires_message_reload(result: Any) -> bool:
                         "timestamp": datetime.utcnow().isoformat()
                     })
 
-
-                # Add the recent messages (user, assistant, relevant system/file messages)
-                allowed_roles_in_history = ['user', 'assistant'] # Add 'system' if you PERSIST general system messages not related to augmentation
-                max_file_content_length_in_history = 50000 # Increased limit for all file content in history
-                max_tabular_content_length_in_history = 50000 # Same limit for tabular data consistency
-                chat_tabular_files = set()  # Track tabular files uploaded directly to chat
-
-                for message in recent_messages:
-                    role = message.get('role')
-                    content = message.get('content')
-                    metadata = message.get('metadata', {})
-                    
-                    # Check active_thread flag - skip messages with active_thread=False
-                    # This handles both threaded messages and legacy messages with the flag set
-                    thread_info = metadata.get('thread_info', {})
-                    active_thread = thread_info.get('active_thread')
-                    
-                    # Exclude content when active_thread is explicitly False
-                    # Include when: active_thread is True, None, or not present (legacy messages)
-                    if active_thread is False:
-                        debug_print(f"[THREAD] Skipping inactive thread message {message.get('id')} (thread_id: {thread_info.get('thread_id')}, attempt: {thread_info.get('thread_attempt')})")
-                        continue
-                    
-                    # Check if message is fully masked - skip it entirely
-                    if metadata.get('masked', False):
-                        debug_print(f"[MASK] Skipping fully masked message {message.get('id')}")
-                        continue
-                    
-                    # Check for partially masked content
-                    masked_ranges = metadata.get('masked_ranges', [])
-                    if masked_ranges and content:
-                        # Remove masked portions from content
-                        content = remove_masked_content(content, masked_ranges)
-                        debug_print(f"[MASK] Applied {len(masked_ranges)} masked ranges to message {message.get('id')}")
-
-                    if role in allowed_roles_in_history:
-                        conversation_history_for_api.append({"role": role, "content": content})
-                    elif role == 'file': # Handle file content inclusion (simplified)
-                        filename = message.get('filename', 'uploaded_file')
-                        file_content = message.get('file_content', '') # Assuming file content is stored
-                        is_table = message.get('is_table', False)
-                        file_content_source = message.get('file_content_source', '')
-
-                        # Tabular files stored in blob (enhanced citations enabled) - reference plugin
-                        if is_table and file_content_source == 'blob':
-                            chat_tabular_files.add(filename)  # Track for mini SK analysis
-                            conversation_history_for_api.append({
-                                'role': 'system',
-                                'content': f"[User uploaded a tabular data file named '{filename}'. "
-                                    f"The file is stored in blob storage and available for analysis. "
-                                    f"Use the tabular_processing plugin functions (list_tabular_files, describe_tabular_file, "
-                                    f"aggregate_column, filter_rows, query_tabular_data, group_by_aggregate, group_by_datetime_component) to analyze this data. "
-                                    f"The file source is 'chat'.]"
-                            })
-                        else:
-                            # Use higher limit for tabular data that needs complete analysis
-                            content_limit = max_tabular_content_length_in_history if is_table else max_file_content_length_in_history
-
-                            display_content = file_content[:content_limit]
-                            if len(file_content) > content_limit:
-                                display_content += "..."
-
-                            # Enhanced message for tabular data
-                            if is_table:
-                                conversation_history_for_api.append({
-                                    'role': 'system', # Represent file as system info
-                                    'content': f"[User uploaded a tabular data file named '{filename}'. This is CSV format data for analysis:\n{display_content}]\nThis is complete tabular data in CSV format. You can perform calculations, analysis, and data operations on this dataset."
-                                })
-                            else:
-                                conversation_history_for_api.append({
-                                    'role': 'system', # Represent file as system info
-                                    'content': f"[User uploaded a file named '{filename}'. Content preview:\n{display_content}]\nUse this file context if relevant."
-                                })
-                    elif role == 'image': # Handle image uploads with extracted text and vision analysis
-                        filename = message.get('filename', 'uploaded_image')
-                        is_user_upload = message.get('metadata', {}).get('is_user_upload', False)
-                        
-                        if is_user_upload:
-                            # This is a user-uploaded image with extracted text and vision analysis
-                            # IMPORTANT: Do NOT include message.get('content') as it contains base64 image data
-                            # which would consume excessive tokens. Only use extracted_text and vision_analysis.
-                            extracted_text = message.get('extracted_text', '')
-                            vision_analysis = message.get('vision_analysis', {})
-                            
-                            # Build comprehensive context from OCR and vision analysis (NO BASE64!)
-                            image_context_parts = [f"[User uploaded an image named '{filename}'.]"]
-                            
-                            if extracted_text:
-                                # Include OCR text from Document Intelligence
-                                extracted_preview = extracted_text[:max_file_content_length_in_history]
-                                if len(extracted_text) > max_file_content_length_in_history:
-                                    extracted_preview += "..."
-                                image_context_parts.append(f"\n\nExtracted Text (OCR):\n{extracted_preview}")
-                            
-                            if vision_analysis:
-                                # Include AI vision analysis
-                                image_context_parts.append("\n\nAI Vision Analysis:")
-                                
-                                if vision_analysis.get('description'):
-                                    image_context_parts.append(f"\nDescription: {vision_analysis['description']}")
-                                
-                                if vision_analysis.get('objects'):
-                                    objects_str = ', '.join(vision_analysis['objects'])
-                                    image_context_parts.append(f"\nObjects detected: {objects_str}")
-                                
-                                if vision_analysis.get('text'):
-                                    image_context_parts.append(f"\nText visible in image: {vision_analysis['text']}")
-                                
-                                if vision_analysis.get('contextual_analysis'):
-                                    image_context_parts.append(f"\nContextual analysis: {vision_analysis['contextual_analysis']}")
-                            
-                            image_context_content = ''.join(image_context_parts) + "\n\nUse this image information to answer questions about the uploaded image."
-                            
-                            # Verify we're not accidentally including base64 data
-                            if 'data:image/' in image_context_content or ';base64,' in image_context_content:
-                                debug_print(f"WARNING: Base64 image data detected in chat history for {filename}! Removing to save tokens.")
-                                # This should never happen, but safety check just in case
-                                image_context_content = f"[User uploaded an image named '{filename}' - image data excluded from chat history to conserve tokens]"
-                            
-                            debug_print(f"[IMAGE_CONTEXT] Adding user-uploaded image to history: {filename}, context length: {len(image_context_content)} chars")
-                            conversation_history_for_api.append({
-                                'role': 'system',
-                                'content': image_context_content
-                            })
-                        else:
-                            # This is a system-generated image (DALL-E, etc.)
-                            # Don't include the image data URL in history either
-                            prompt = message.get('prompt', 'User requested image generation.')
-                            debug_print(f"[IMAGE_CONTEXT] Adding system-generated image to history: {prompt[:100]}...")
-                            conversation_history_for_api.append({
-                                'role': 'system',
-                                'content': f"[Assistant generated an image based on the prompt: '{prompt}']"
-                            })
-
-                    # Ignored roles: 'safety', 'blocked', 'system' (if they are only for augmentation/summary)
+                conversation_history_for_api.extend(history_segments['history_messages'])
+                final_api_source_refs.extend(history_debug_info.get('history_message_source_refs', []))
 
                 # --- Mini SK analysis for tabular files uploaded directly to chat ---
                 if chat_tabular_files and is_tabular_processing_enabled(settings):
@@ -4880,7 +7118,7 @@ def result_requires_message_reload(result: Any) -> bool:
                         plugin_logger.get_invocations_for_conversation(user_id, conversation_id, limit=1000)
                     )
 
-                    chat_tabular_analysis = asyncio.run(run_tabular_sk_analysis(
+                    chat_tabular_analysis = asyncio.run(run_tabular_analysis_with_multi_file_support(
                         user_question=user_message,
                         tabular_filenames=chat_tabular_files,
                         user_id=user_id,
@@ -4913,6 +7151,7 @@ def result_requires_message_reload(result: Any) -> bool:
                                 chat_tabular_analysis,
                             )
                         })
+                        final_api_source_refs.append('system:tabular_results')
 
                         # Collect tool execution citations from SK tabular analysis
                         chat_tabular_sk_citations = collect_tabular_sk_citations(user_id, conversation_id)
@@ -4928,20 +7167,6 @@ def result_requires_message_reload(result: Any) -> bool:
                         )
                         debug_print("[Chat Tabular SK] Analysis returned None, relying on existing file context messages")
 
-                # Ensure the very last message is the current user's message (it should be if fetched correctly)
-                if not conversation_history_for_api or conversation_history_for_api[-1]['role'] != 'user':
-                    debug_print("Warning: Last message in history is not the user's current message. Appending.")
-                    # This might happen if 'recent_messages' somehow didn't include the latest user message saved in step 2
-                    # Or if the last message had an ignored role. Find the actual user message:
-                    user_msg_found = False
-                    for msg in reversed(recent_messages):
-                        if msg['role'] == 'user' and msg['id'] == user_message_id:
-                            conversation_history_for_api.append({"role": "user", "content": msg['content']})
-                            user_msg_found = True
-                            break
-                    if not user_msg_found: # Still not found? Append the original input as fallback
-                        conversation_history_for_api.append({"role": "user", "content": user_message})
-
             except Exception as e:
                 debug_print(f"Error preparing conversation history: {e}")
                 return jsonify({'error': f'Error preparing conversation history: {str(e)}'}), 500
@@ -4951,6 +7176,7 @@ def result_requires_message_reload(result: Any) -> bool:
             # 6) Final GPT Call
             # ---------------------------------------------------------------------
             default_system_prompt = settings.get('default_system_prompt', '').strip()
+            default_system_prompt_inserted = False
             # Only add if non-empty and not already present (excluding summary/augmentation system messages)
             if default_system_prompt:
                 # Find if any system message (not summary or augmentation) is present
@@ -4970,6 +7196,43 @@ def result_requires_message_reload(result: Any) -> bool:
                         "role": "system",
                         "content": default_system_prompt
                     })
+                    final_api_source_refs.insert(insert_idx, 'system:default_prompt')
+                    default_system_prompt_inserted = True
+
+            if not original_hybrid_search_enabled:
+                history_grounding_message = build_history_grounding_system_message()
+                insert_idx = 0
+                if (
+                    conversation_history_for_api
+                    and conversation_history_for_api[0].get('role') == 'system'
+                    and conversation_history_for_api[0].get('content', '').startswith(
+                        '<Summary of previous conversation context>'
+                    )
+                ):
+                    insert_idx = 1
+                if default_system_prompt_inserted:
+                    insert_idx += 1
+                conversation_history_for_api.insert(insert_idx, history_grounding_message)
+                final_api_source_refs.insert(insert_idx, 'system:history_grounding')
+
+            history_debug_info = enrich_history_context_debug_info(
+                history_debug_info,
+                conversation_history_for_api,
+                final_api_source_refs,
+                path_label='standard',
+                augmentation_message_count=len(system_messages_for_augmentation),
+                default_system_prompt_inserted=default_system_prompt_inserted,
+            )
+            emit_history_context_debug(history_debug_info, conversation_id)
+            thought_tracker.add_thought(
+                'history_context',
+                build_history_context_thought_content(history_debug_info),
+                build_history_context_thought_detail(history_debug_info),
+            )
+            if settings.get('enable_debug_logging', False):
+                agent_citations_list.append(
+                    build_history_context_debug_citation(history_debug_info, 'standard')
+                )
 
             # --- DRY Fallback Chain Helper ---
             def try_fallback_chain(steps):
@@ -4996,38 +7259,6 @@ def try_fallback_chain(steps):
                 # If all fail, return default error
                 return ("Sorry, I encountered an error.", gpt_model, None, None)
 
-            # --- Inject facts as a system message at the top of conversation_history_for_api ---
-            def get_facts_for_context(scope_id, scope_type, conversation_id: str = None, agent_id: str = None):
-                settings = get_settings()
-                agents = settings.get('semantic_kernel_agents', [])
-                default_agent = next((a for a in agents if a.get('default_agent')), None)
-                agent_dict = default_agent or (agents[0] if agents else None)
-                agent_id = agent_dict.get('id') if agent_dict else None
-                if not scope_id or not scope_type:
-                    return ""
-                fact_store = FactMemoryStore()
-                kwargs = dict(
-                    scope_type=scope_type,
-                    scope_id=scope_id,
-                )
-                if agent_id:
-                    kwargs['agent_id'] = agent_id
-                if conversation_id:
-                    kwargs['conversation_id'] = conversation_id
-                facts = fact_store.get_facts(**kwargs)
-                if not facts:
-                    return ""
-                fact_lines = []
-                for fact in facts:
-                    value = fact.get('value', '')
-                    if value:
-                        fact_lines.append(f"- {value}")
-                fact_lines.append(f"- agent_id: {agent_id}")
-                fact_lines.append(f"- scope_type: {scope_type}")
-                fact_lines.append(f"- scope_id: {scope_id}")
-                fact_lines.append(f"- conversation_id: {conversation_id}")
-                return "\n".join(fact_lines)
-
             async def run_sk_call(callable_obj, *args, **kwargs):
                 log_event(
                     f"Running Semantic Kernel callable: {callable_obj.__name__}",
@@ -5225,19 +7456,13 @@ async def run_sk_call(callable_obj, *args, **kwargs):
 
                 # Add additional metadata here to scope the facts to be returned
                 # Allows for additional per agent and per conversation scoping.
-                facts = get_facts_for_context(
+                inject_fact_memory_context(
+                    conversation_history=conversation_history_for_api,
                     scope_id=scope_id,
-                    scope_type=scope_type
+                    scope_type=scope_type,
+                    conversation_id=conversation_id,
+                    agent_id=agent_id,
                 )
-                if facts:
-                    conversation_history_for_api.insert(0, {
-                        "role": "system",
-                        "content": f"<Fact Memory>\n{facts}\n</Fact Memory>"
-                    })
-                conversation_history_for_api.insert(0, {
-                    "role": "system",
-                    "content": f"""<Conversation Metadata>\n<Scope ID: {scope_id}>\n<Scope Type: {scope_type}>\n<Conversation ID: {conversation_id}>\n<Agent ID: {agent_id}>\n</Conversation Metadata>"""
-                })
 
                 agent_message_history = [
                     ChatMessageContent(
@@ -5791,7 +8016,7 @@ def gpt_error(e):
                 'augmented': bool(system_messages_for_augmentation),
                 'hybrid_citations': hybrid_citations_list, # <--- SIMPLIFIED: Directly use the list
                 'web_search_citations': web_search_citations_list,
-                'hybridsearch_query': search_query if hybrid_search_enabled and search_results else None, # Log query only if hybrid search ran and found results
+                'hybridsearch_query': search_query if search_results else None, # Log query when any bounded document retrieval produced results
                 'agent_citations': prepared_agent_citations,
                 'model_deployment_name': actual_model_used,
                 'agent_display_name': agent_display_name,
@@ -5799,6 +8024,7 @@ def gpt_error(e):
                 'metadata': {
                     'user_info': user_info_for_assistant,  # Track which user created this assistant message
                     'reasoning_effort': reasoning_effort,
+                    'history_context': history_debug_info,
                     'thread_info': {
                         'thread_id': user_thread_id,  # Same thread as user message
                         'previous_thread_id': user_previous_thread_id,  # Same previous_thread_id as user message
@@ -5824,9 +8050,9 @@ def gpt_error(e):
                     
                     # Determine workspace type based on active group/public workspace
                     workspace_type = 'personal'
-                    if active_public_workspace_id:
+                    if effective_active_public_workspace_id:
                         workspace_type = 'public'
-                    elif active_group_id:
+                    elif effective_active_group_id:
                         workspace_type = 'group'
                     
                     log_token_usage(
@@ -5839,8 +8065,8 @@ def gpt_error(e):
                         completion_tokens=token_usage_data.get('completion_tokens'),
                         conversation_id=conversation_id,
                         message_id=assistant_message_id,
-                        group_id=active_group_id,
-                        public_workspace_id=active_public_workspace_id,
+                        group_id=effective_active_group_id,
+                        public_workspace_id=effective_active_public_workspace_id,
                         additional_context={
                             'agent_name': agent_name,
                             'augmented': bool(system_messages_for_augmentation),
@@ -5882,20 +8108,20 @@ def gpt_error(e):
                     user_message=user_message,
                     conversation_id=conversation_id,
                     user_id=user_id,
-                    active_group_id=active_group_id,
-                    active_group_ids=active_group_ids,
-                    document_scope=document_scope,
-                    selected_document_id=selected_document_id,
+                    active_group_id=effective_active_group_id,
+                    active_group_ids=effective_active_group_ids,
+                    document_scope=effective_document_scope,
+                    selected_document_id=effective_selected_document_id,
                     model_deployment=actual_model_used,
-                    hybrid_search_enabled=hybrid_search_enabled,
+                    hybrid_search_enabled=hybrid_search_enabled or history_grounded_search_used,
                     image_gen_enabled=image_gen_enabled,
                     selected_documents=combined_documents if 'combined_documents' in locals() else None,
                     selected_agent=selected_agent_name,
                     selected_agent_details=user_metadata.get('agent_selection'),
                     search_results=search_results if 'search_results' in locals() else None,
                     conversation_item=conversation_item,
-                    active_public_workspace_id=active_public_workspace_id,
-                    active_public_workspace_ids=active_public_workspace_ids
+                    active_public_workspace_id=effective_active_public_workspace_id,
+                    active_public_workspace_ids=effective_active_public_workspace_ids
                 )
             except Exception as e:
                 debug_print(f"Error collecting conversation metadata: {e}")
@@ -6224,6 +8450,8 @@ def generate(publish_background_event=None):
                 # Validate chat_type
                 if chat_type not in ('user', 'group'):
                     chat_type = 'user'
+                scope_id = active_group_id if chat_type == 'group' else user_id
+                scope_type = 'group' if chat_type == 'group' else 'user'
                 
                 # Initialize variables
                 search_query = user_message
@@ -6239,12 +8467,27 @@ def generate(publish_background_event=None):
                 conversation_history_limit = math.ceil(raw_conversation_history_limit)
                 if conversation_history_limit % 2 != 0:
                     conversation_history_limit += 1
+                enable_summarize_content_history_beyond_conversation_history_limit = settings.get(
+                    'enable_summarize_content_history_beyond_conversation_history_limit',
+                    True,
+                )
                 
                 # Convert toggles
                 if isinstance(hybrid_search_enabled, str):
                     hybrid_search_enabled = hybrid_search_enabled.lower() == 'true'
                 if isinstance(web_search_enabled, str):
                     web_search_enabled = web_search_enabled.lower() == 'true'
+                original_hybrid_search_enabled = bool(hybrid_search_enabled)
+                history_grounded_search_used = False
+                history_only_answerability = None
+                prior_grounded_document_refs = []
+                effective_document_scope = document_scope
+                effective_selected_document_ids = list(selected_document_ids or [])
+                effective_selected_document_id = selected_document_id
+                effective_active_group_ids = list(active_group_ids or [])
+                effective_active_group_id = active_group_id
+                effective_active_public_workspace_ids = list(active_public_workspace_ids or [])
+                effective_active_public_workspace_id = active_public_workspace_id
                 debug_print(
                     "[Streaming] Normalized toggles | "
                     f"hybrid_search={hybrid_search_enabled} | "
@@ -6709,36 +8952,162 @@ def publish_live_plugin_thought(thought_payload):
                     except Exception as ex:
                         debug_print(f"[Content Safety - Streaming] Unexpected error: {ex}")
 
+                if not original_hybrid_search_enabled:
+                    prior_grounded_document_refs = _normalize_prior_grounded_document_refs(conversation_item)
+                    if prior_grounded_document_refs:
+                        yield emit_thought(
+                            'history_context',
+                            'Checking whether prior conversation context already answers the question',
+                            detail=f"grounded_documents={len(prior_grounded_document_refs)}"
+                        )
+                        try:
+                            preflight_messages_query = (
+                                "SELECT * FROM c WHERE c.conversation_id = @conv_id ORDER BY c.timestamp ASC"
+                            )
+                            preflight_messages_params = [{"name": "@conv_id", "value": conversation_id}]
+                            preflight_messages = list(cosmos_messages_container.query_items(
+                                query=preflight_messages_query,
+                                parameters=preflight_messages_params,
+                                partition_key=conversation_id,
+                                enable_cross_partition_query=True,
+                            ))
+                            preflight_history_segments = build_conversation_history_segments(
+                                all_messages=preflight_messages,
+                                conversation_history_limit=conversation_history_limit,
+                                enable_summarize_older_messages=enable_summarize_content_history_beyond_conversation_history_limit,
+                                gpt_client=gpt_client,
+                                gpt_model=gpt_model,
+                                user_message_id=user_message_id,
+                                fallback_user_message=user_message,
+                            )
+                            history_only_answerability = assess_history_only_answerability(
+                                gpt_client,
+                                gpt_model,
+                                build_history_only_assessment_messages(
+                                    preflight_history_segments,
+                                    settings.get('default_system_prompt', '').strip(),
+                                ),
+                            )
+                        except Exception as assessment_error:
+                            debug_print(
+                                f"[Streaming][History Fallback] History-only sufficiency assessment failed: {assessment_error}"
+                            )
+
+                        if history_only_answerability and history_only_answerability.get('can_answer_from_history'):
+                            yield emit_thought(
+                                'history_context',
+                                'Prior conversation context appears sufficient without new document retrieval',
+                                detail=history_only_answerability.get('reason') or None,
+                            )
+                        else:
+                            fallback_search_parameters = build_prior_grounded_document_search_parameters(
+                                prior_grounded_document_refs
+                            )
+                            if fallback_search_parameters.get('document_ids'):
+                                history_grounded_search_used = True
+                                effective_document_scope = fallback_search_parameters.get('doc_scope') or 'all'
+                                effective_selected_document_ids = list(
+                                    fallback_search_parameters.get('document_ids') or []
+                                )
+                                effective_selected_document_id = (
+                                    effective_selected_document_ids[0]
+                                    if len(effective_selected_document_ids) == 1
+                                    else None
+                                )
+                                effective_active_group_ids = list(
+                                    fallback_search_parameters.get('active_group_ids') or []
+                                )
+                                effective_active_group_id = fallback_search_parameters.get('active_group_id')
+                                effective_active_public_workspace_ids = list(
+                                    fallback_search_parameters.get('active_public_workspace_ids') or []
+                                )
+                                effective_active_public_workspace_id = fallback_search_parameters.get(
+                                    'active_public_workspace_id'
+                                )
+
+                                rewritten_search_query = ''
+                                if history_only_answerability:
+                                    rewritten_search_query = str(
+                                        history_only_answerability.get('search_query') or ''
+                                    ).strip()
+                                if rewritten_search_query:
+                                    search_query = rewritten_search_query
+
+                                fallback_detail_parts = [
+                                    f"documents={len(effective_selected_document_ids)}",
+                                    f"scope={effective_document_scope or 'all'}",
+                                ]
+                                if history_only_answerability and history_only_answerability.get('reason'):
+                                    fallback_detail_parts.append(
+                                        f"reason={history_only_answerability['reason']}"
+                                    )
+                                yield emit_thought(
+                                    'search',
+                                    'Conversation context alone was insufficient; searching previously grounded documents',
+                                    detail=' | '.join(fallback_detail_parts),
+                                )
+
+                                user_metadata.setdefault('workspace_search', {})[
+                                    'history_grounded_fallback'
+                                ] = {
+                                    'used': True,
+                                    'document_scope': effective_document_scope,
+                                    'document_count': len(effective_selected_document_ids),
+                                    'search_query': search_query,
+                                }
+                                user_message_doc['metadata'] = user_metadata
+                                cosmos_messages_container.upsert_item(user_message_doc)
+                    else:
+                        yield emit_thought(
+                            'history_context',
+                            'No prior grounded documents were available; using conversation history only'
+                        )
+
                 # Hybrid search (if enabled)
                 combined_documents = []
-                if hybrid_search_enabled:
+                if hybrid_search_enabled or history_grounded_search_used:
                     debug_print(
                         "[Streaming] Starting hybrid search | "
-                        f"conversation_id={conversation_id} | doc_scope={document_scope} | "
-                        f"selected_document_ids={len(selected_document_ids)} | tags={len(tags_filter) if isinstance(tags_filter, list) else 0}"
+                        f"conversation_id={conversation_id} | doc_scope={effective_document_scope} | "
+                        f"selected_document_ids={len(effective_selected_document_ids)} | tags={len(tags_filter) if isinstance(tags_filter, list) else 0}"
                     )
-                    yield emit_thought('search', f"Searching {document_scope or 'personal'} workspace documents for '{(search_query or user_message)[:50]}'")
+                    if history_grounded_search_used and not hybrid_search_enabled:
+                        yield emit_thought(
+                            'search',
+                            f"Searching {len(effective_selected_document_ids)} previously grounded document(s) for '{(search_query or user_message)[:50]}'"
+                        )
+                    else:
+                        yield emit_thought(
+                            'search',
+                            f"Searching {effective_document_scope or 'personal'} workspace documents for '{(search_query or user_message)[:50]}'"
+                        )
                     try:
                         search_args = {
                             "query": search_query,
                             "user_id": user_id,
                             "top_n": 12,
-                            "doc_scope": document_scope,
+                            "doc_scope": effective_document_scope,
                         }
                         
-                        if active_group_ids and (document_scope == 'group' or document_scope == 'all' or chat_type == 'group'):
-                            search_args['active_group_ids'] = active_group_ids
+                        if effective_active_group_ids and (
+                            effective_document_scope == 'group'
+                            or effective_document_scope == 'all'
+                            or chat_type == 'group'
+                        ):
+                            search_args['active_group_ids'] = effective_active_group_ids
                         
                         # Add active_public_workspace_id when:
                         # 1. Document scope is 'public' or
                         # 2. Document scope is 'all' and public workspaces are enabled
-                        if active_public_workspace_id and (document_scope == 'public' or document_scope == 'all'):
-                            search_args['active_public_workspace_id'] = active_public_workspace_id
+                        if effective_active_public_workspace_id and (
+                            effective_document_scope == 'public' or effective_document_scope == 'all'
+                        ):
+                            search_args['active_public_workspace_id'] = effective_active_public_workspace_id
                         
-                        if selected_document_ids:
-                            search_args['document_ids'] = selected_document_ids
-                        elif selected_document_id:
-                            search_args['document_id'] = selected_document_id
+                        if effective_selected_document_ids:
+                            search_args['document_ids'] = effective_selected_document_ids
+                        elif effective_selected_document_id:
+                            search_args['document_id'] = effective_selected_document_id
                         
                         # Add tags filter if provided
                         if tags_filter and isinstance(tags_filter, list) and len(tags_filter) > 0:
@@ -6763,10 +9132,18 @@ def publish_live_plugin_thought(thought_payload):
                             chunk_sequence = doc.get('chunk_sequence', 0)
                             page_number = doc.get('page_number') or chunk_sequence or 1
                             citation_id = doc.get('id', str(uuid.uuid4()))
+                            document_id = str(doc.get('document_id') or '').strip()
+                            if not document_id:
+                                document_id = (
+                                    '_'.join(str(citation_id).split('_')[:-1])
+                                    if '_' in str(citation_id)
+                                    else str(citation_id)
+                                )
                             classification = doc.get('document_classification')
                             chunk_id = doc.get('chunk_id', str(uuid.uuid4()))
                             score = doc.get('score', 0.0)
                             group_id = doc.get('group_id', None)
+                            doc_public_workspace_id = doc.get('public_workspace_id', None)
                             sheet_name = doc.get('sheet_name')
                             location_label, location_value = get_citation_location(
                                 file_name,
@@ -6780,6 +9157,7 @@ def publish_live_plugin_thought(thought_payload):
                             
                             combined_documents.append({
                                 "file_name": file_name,
+                                "document_id": document_id,
                                 "citation_id": citation_id,
                                 "page_number": page_number,
                                 "sheet_name": sheet_name,
@@ -6792,17 +9170,20 @@ def publish_live_plugin_thought(thought_payload):
                                 "chunk_id": chunk_id,
                                 "score": score,
                                 "group_id": group_id,
+                                "public_workspace_id": doc_public_workspace_id,
                             })
                             
                             # Build citation data to match non-streaming format
                             citation_data = {
                                 "file_name": file_name,
+                                "document_id": document_id,
                                 "citation_id": citation_id,
                                 "page_number": page_number,
                                 "chunk_id": chunk_id,
                                 "chunk_sequence": chunk_sequence,
                                 "score": score,
                                 "group_id": group_id,
+                                "public_workspace_id": doc_public_workspace_id,
                                 "version": version,
                                 "classification": classification
                             }
@@ -6815,7 +9196,10 @@ def publish_live_plugin_thought(thought_payload):
                             processed_doc_ids = set()
                             
                             for doc in search_results:
-                                doc_id = doc.get('document_id') or doc.get('id')
+                                doc_id = str(doc.get('document_id') or '').strip()
+                                if not doc_id and doc.get('id'):
+                                    raw_doc_id = str(doc.get('id') or '').strip()
+                                    doc_id = '_'.join(raw_doc_id.split('_')[:-1]) if '_' in raw_doc_id else raw_doc_id
                                 if not doc_id or doc_id in processed_doc_ids:
                                     continue
                                 
@@ -6826,10 +9210,10 @@ def publish_live_plugin_thought(thought_payload):
                                 
                                 # Map document_scope to correct parameter names for the function
                                 metadata_params = {'user_id': user_id}
-                                if document_scope == 'group':
-                                    metadata_params['group_id'] = active_group_id
-                                elif document_scope == 'public':
-                                    metadata_params['public_workspace_id'] = active_public_workspace_id
+                                if effective_document_scope == 'group':
+                                    metadata_params['group_id'] = effective_active_group_id
+                                elif effective_document_scope == 'public':
+                                    metadata_params['public_workspace_id'] = effective_active_public_workspace_id
                                 
                                 metadata = get_document_metadata_for_citations(
                                     doc_id, 
@@ -6846,6 +9230,7 @@ def publish_live_plugin_thought(thought_payload):
                                         
                                         keywords_citation = {
                                             "file_name": file_name,
+                                            "document_id": doc_id,
                                             "citation_id": keywords_citation_id,
                                             "page_number": "Metadata",
                                             "chunk_id": keywords_citation_id,
@@ -6868,6 +9253,7 @@ def publish_live_plugin_thought(thought_payload):
                                         
                                         abstract_citation = {
                                             "file_name": file_name,
+                                            "document_id": doc_id,
                                             "citation_id": abstract_citation_id,
                                             "page_number": "Metadata",
                                             "chunk_id": abstract_citation_id,
@@ -6903,6 +9289,7 @@ def publish_live_plugin_thought(thought_payload):
                                         
                                         vision_citation = {
                                             "file_name": file_name,
+                                            "document_id": doc_id,
                                             "citation_id": vision_citation_id,
                                             "page_number": "AI Vision",
                                             "chunk_id": vision_citation_id,
@@ -6929,23 +9316,33 @@ def publish_live_plugin_thought(thought_payload):
                             'documents': combined_documents
                         })
 
-                        # Reorder hybrid citations list in descending order based on page_number
-                        hybrid_citations_list.sort(key=lambda x: x.get('page_number', 0), reverse=True)
+                        hybrid_citations_list.sort(key=_build_hybrid_citation_sort_key, reverse=True)
+                    elif history_grounded_search_used:
+                        yield emit_thought(
+                            'search',
+                            'No matching excerpts were found in the previously grounded documents'
+                        )
                 
+                workspace_tabular_file_contexts = []
                 workspace_tabular_files = set()
-                if hybrid_search_enabled and is_tabular_processing_enabled(settings):
-                    workspace_tabular_files = collect_workspace_tabular_filenames(
+                if (hybrid_search_enabled or history_grounded_search_used) and is_tabular_processing_enabled(settings):
+                    workspace_tabular_file_contexts = collect_workspace_tabular_file_contexts(
                         combined_documents=combined_documents,
-                        selected_document_ids=selected_document_ids,
-                        selected_document_id=selected_document_id,
-                        document_scope=document_scope,
+                        selected_document_ids=effective_selected_document_ids,
+                        selected_document_id=effective_selected_document_id,
+                        document_scope=effective_document_scope,
+                        active_group_id=effective_active_group_id,
+                        active_public_workspace_id=effective_active_public_workspace_id,
                     )
+                    workspace_tabular_files = {
+                        file_context['file_name'] for file_context in workspace_tabular_file_contexts
+                    }
 
-                if hybrid_search_enabled and workspace_tabular_files and is_tabular_processing_enabled(settings):
+                if (hybrid_search_enabled or history_grounded_search_used) and workspace_tabular_files and is_tabular_processing_enabled(settings):
                     tabular_source_hint = determine_tabular_source_hint(
-                        document_scope,
-                        active_group_id=active_group_id,
-                        active_public_workspace_id=active_public_workspace_id,
+                        effective_document_scope,
+                        active_group_id=effective_active_group_id,
+                        active_public_workspace_id=effective_active_public_workspace_id,
                     )
                     tabular_execution_mode = get_tabular_execution_mode(user_message)
                     tabular_filenames_str = ", ".join(sorted(workspace_tabular_files))
@@ -6956,19 +9353,21 @@ def publish_live_plugin_thought(thought_payload):
                     debug_print(
                         "[Streaming][Tabular SK] Starting workspace tabular analysis | "
                         f"files={sorted(workspace_tabular_files)} | source_hint={tabular_source_hint} | "
+                        f"file_contexts={workspace_tabular_file_contexts} | "
                         f"execution_mode={tabular_execution_mode} | baseline_invocations={baseline_tabular_invocation_count}"
                     )
 
-                    tabular_analysis = asyncio.run(run_tabular_sk_analysis(
+                    tabular_analysis = asyncio.run(run_tabular_analysis_with_multi_file_support(
                         user_question=user_message,
                         tabular_filenames=workspace_tabular_files,
+                        tabular_file_contexts=workspace_tabular_file_contexts,
                         user_id=user_id,
                         conversation_id=conversation_id,
                         gpt_model=gpt_model,
                         settings=settings,
                         source_hint=tabular_source_hint,
-                        group_id=active_group_id if tabular_source_hint == 'group' else None,
-                        public_workspace_id=active_public_workspace_id if tabular_source_hint == 'public' else None,
+                        group_id=effective_active_group_id if tabular_source_hint == 'group' else None,
+                        public_workspace_id=effective_active_public_workspace_id if tabular_source_hint == 'public' else None,
                         execution_mode=tabular_execution_mode,
                     ))
                     tabular_invocations = get_new_plugin_invocations(
@@ -7044,10 +9443,10 @@ def publish_live_plugin_thought(thought_payload):
 
                 # Update message chat type
                 message_chat_type = None
-                if hybrid_search_enabled and search_results and len(search_results) > 0:
-                    if document_scope == 'group':
+                if (hybrid_search_enabled or history_grounded_search_used) and search_results and len(search_results) > 0:
+                    if effective_document_scope == 'group':
                         message_chat_type = 'group'
-                    elif document_scope == 'public':
+                    elif effective_document_scope == 'public':
                         message_chat_type = 'public'
                     else:
                         message_chat_type = 'personal_single_user'
@@ -7060,6 +9459,8 @@ def publish_live_plugin_thought(thought_payload):
                 
                 # Prepare conversation history
                 conversation_history_for_api = []
+                history_debug_info = {}
+                final_api_source_refs = []
                 
                 try:
                     all_messages_query = "SELECT * FROM c WHERE c.conversation_id = @conv_id ORDER BY c.timestamp ASC"
@@ -7068,85 +9469,38 @@ def publish_live_plugin_thought(thought_payload):
                         query=all_messages_query, parameters=params_all, 
                         partition_key=conversation_id, enable_cross_partition_query=True
                     ))
-                    all_messages = filter_assistant_artifact_items(all_messages)
-                    
-                    # Sort messages using threading logic
-                    all_messages = sort_messages_by_thread(all_messages)
-                    
-                    total_messages = len(all_messages)
-                    num_recent_messages = min(total_messages, conversation_history_limit)
-                    recent_messages = all_messages[-num_recent_messages:]
-                    
-                    # Add augmentation messages
-                    for aug_msg in system_messages_for_augmentation:
-                        conversation_history_for_api.append({
-                            'role': aug_msg['role'],
-                            'content': aug_msg['content']
-                        })
-                    
-                    # Add recent messages (with file role handling)
-                    allowed_roles_in_history = ['user', 'assistant']
-                    max_file_content_length_in_history = 50000
-                    max_tabular_content_length_in_history = 50000
-                    chat_tabular_files = set()  # Track tabular files uploaded directly to chat
-
-                    for message in recent_messages:
-                        role = message.get('role')
-                        content = message.get('content', '')
+                    history_segments = build_conversation_history_segments(
+                        all_messages=all_messages,
+                        conversation_history_limit=conversation_history_limit,
+                        enable_summarize_older_messages=enable_summarize_content_history_beyond_conversation_history_limit,
+                        gpt_client=gpt_client,
+                        gpt_model=gpt_model,
+                        user_message_id=user_message_id,
+                        fallback_user_message=user_message,
+                    )
+                    summary_of_older = history_segments['summary_of_older']
+                    chat_tabular_files = history_segments['chat_tabular_files']
+                    history_debug_info = history_segments.get('debug_info', {})
 
-                        if role in allowed_roles_in_history:
-                            conversation_history_for_api.append({
-                                'role': role,
-                                'content': content
-                            })
-                        elif role == 'file':
-                            filename = message.get('filename', 'uploaded_file')
-                            file_content = message.get('file_content', '')
-                            is_table = message.get('is_table', False)
-                            file_content_source = message.get('file_content_source', '')
-
-                            # Tabular files stored in blob - track for mini SK analysis
-                            if is_table and file_content_source == 'blob':
-                                chat_tabular_files.add(filename)
-                                conversation_history_for_api.append({
-                                    'role': 'system',
-                                    'content': (
-                                        f"[User uploaded a tabular data file named '{filename}'. "
-                                        f"The file is stored in blob storage and available for analysis. "
-                                        f"Use the tabular_processing plugin functions (list_tabular_files, "
-                                        f"describe_tabular_file, aggregate_column, filter_rows, "
-                                        f"query_tabular_data, group_by_aggregate, group_by_datetime_component) to analyze this data. "
-                                        f"The file source is 'chat'.]"
-                                    )
-                                })
-                            else:
-                                content_limit = (
-                                    max_tabular_content_length_in_history if is_table
-                                    else max_file_content_length_in_history
-                                )
-                                display_content = file_content[:content_limit]
-                                if len(file_content) > content_limit:
-                                    display_content += "..."
-
-                                if is_table:
-                                    conversation_history_for_api.append({
-                                        'role': 'system',
-                                        'content': (
-                                            f"[User uploaded a tabular data file named '{filename}'. "
-                                            f"This is CSV format data for analysis:\n{display_content}]\n"
-                                            f"This is complete tabular data in CSV format. You can perform "
-                                            f"calculations, analysis, and data operations on this dataset."
-                                        )
-                                    })
-                                else:
-                                    conversation_history_for_api.append({
-                                        'role': 'system',
-                                        'content': (
-                                            f"[User uploaded a file named '{filename}'. "
-                                            f"Content preview:\n{display_content}]\n"
-                                            f"Use this file context if relevant."
-                                        )
-                                    })
+                    if summary_of_older:
+                        conversation_history_for_api.append({
+                            'role': 'system',
+                            'content': (
+                                f"<Summary of previous conversation context>\n{summary_of_older}\n"
+                                "</Summary of previous conversation context>"
+                            )
+                        })
+                        final_api_source_refs.append('system:summary_of_older')
+
+                    # Add augmentation messages
+                    for aug_msg in system_messages_for_augmentation:
+                        conversation_history_for_api.append({
+                            'role': aug_msg['role'],
+                            'content': aug_msg['content']
+                        })
+                        final_api_source_refs.append(f"system:augmentation:{len(final_api_source_refs) + 1}")
+                    conversation_history_for_api.extend(history_segments['history_messages'])
+                    final_api_source_refs.extend(history_debug_info.get('history_message_source_refs', []))
 
                     # --- Mini SK analysis for tabular files uploaded directly to chat ---
                     if chat_tabular_files and is_tabular_processing_enabled(settings):
@@ -7166,7 +9520,7 @@ def publish_live_plugin_thought(thought_payload):
                             f"baseline_invocations={baseline_tabular_invocation_count}"
                         )
 
-                        chat_tabular_analysis = asyncio.run(run_tabular_sk_analysis(
+                        chat_tabular_analysis = asyncio.run(run_tabular_analysis_with_multi_file_support(
                             user_question=user_message,
                             tabular_filenames=chat_tabular_files,
                             user_id=user_id,
@@ -7202,6 +9556,7 @@ def publish_live_plugin_thought(thought_payload):
                                     chat_tabular_analysis,
                                 )
                             })
+                            final_api_source_refs.append('system:tabular_results')
 
                             # Collect tool execution citations
                             chat_tabular_sk_citations = collect_tabular_sk_citations(user_id, conversation_id)
@@ -7223,18 +9578,66 @@ def publish_live_plugin_thought(thought_payload):
                 
                 # Add system prompt
                 default_system_prompt = settings.get('default_system_prompt', '').strip()
+                default_system_prompt_inserted = False
                 if default_system_prompt:
                     has_general_system_prompt = any(
                         msg.get('role') == 'system' and not (
+                            msg.get('content', '').startswith('<Summary of previous conversation context>') or
                             "retrieved document excerpts" in msg.get('content', '')
                         )
                         for msg in conversation_history_for_api
                     )
                     if not has_general_system_prompt:
-                        conversation_history_for_api.insert(0, {
+                        insert_idx = 0
+                        if (
+                            conversation_history_for_api
+                            and conversation_history_for_api[0].get('role') == 'system'
+                            and conversation_history_for_api[0].get('content', '').startswith(
+                                '<Summary of previous conversation context>'
+                            )
+                        ):
+                            insert_idx = 1
+                        conversation_history_for_api.insert(insert_idx, {
                             'role': 'system',
                             'content': default_system_prompt
                         })
+                        final_api_source_refs.insert(insert_idx, 'system:default_prompt')
+                        default_system_prompt_inserted = True
+
+                if not original_hybrid_search_enabled:
+                    history_grounding_message = build_history_grounding_system_message()
+                    insert_idx = 0
+                    if (
+                        conversation_history_for_api
+                        and conversation_history_for_api[0].get('role') == 'system'
+                        and conversation_history_for_api[0].get('content', '').startswith(
+                            '<Summary of previous conversation context>'
+                        )
+                    ):
+                        insert_idx = 1
+                    if default_system_prompt_inserted:
+                        insert_idx += 1
+                    conversation_history_for_api.insert(insert_idx, history_grounding_message)
+                    final_api_source_refs.insert(insert_idx, 'system:history_grounding')
+
+                history_debug_info = enrich_history_context_debug_info(
+                    history_debug_info,
+                    conversation_history_for_api,
+                    final_api_source_refs,
+                    path_label='streaming',
+                    augmentation_message_count=len(system_messages_for_augmentation),
+                    default_system_prompt_inserted=default_system_prompt_inserted,
+                )
+                emit_history_context_debug(history_debug_info, conversation_id)
+                yield emit_thought(
+                    'history_context',
+                    build_history_context_thought_content(history_debug_info),
+                    build_history_context_thought_detail(history_debug_info),
+                )
+                if settings.get('enable_debug_logging', False):
+                    agent_citations_list.append(
+                        build_history_context_debug_citation(history_debug_info, 'streaming')
+                    )
                 
                 # Check if agents are enabled and should be used
                 selected_agent = None
@@ -7324,6 +9727,14 @@ def publish_live_plugin_thought(thought_payload):
                             debug_print(f"--- Streaming from Agent: {agent_name_used} (model: {actual_model_used}) ---")
                         else:
                             debug_print(f"[Streaming] ⚠️ No agent selected, falling back to GPT")
+
+                    inject_fact_memory_context(
+                        conversation_history=conversation_history_for_api,
+                        scope_id=scope_id,
+                        scope_type=scope_type,
+                        conversation_id=conversation_id,
+                        agent_id=getattr(selected_agent, 'id', None),
+                    )
                 
                 # Stream the response
                 accumulated_content = ""
@@ -7703,13 +10114,14 @@ def make_json_serializable(obj):
                         'augmented': bool(system_messages_for_augmentation),
                         'hybrid_citations': hybrid_citations_list,
                         'web_search_citations': web_search_citations_list,
-                        'hybridsearch_query': search_query if hybrid_search_enabled and search_results else None,
+                        'hybridsearch_query': search_query if search_results else None,
                         'agent_citations': prepared_agent_citations,
                         'model_deployment_name': final_model_used if use_agent_streaming else gpt_model,
                         'agent_display_name': agent_display_name_used if use_agent_streaming else None,
                         'agent_name': agent_name_used if use_agent_streaming else None,
                         'metadata': {
                             'reasoning_effort': reasoning_effort,
+                            'history_context': history_debug_info,
                             'thread_info': {
                                 'thread_id': user_thread_id,
                                 'previous_thread_id': user_previous_thread_id,
@@ -7728,9 +10140,9 @@ def make_json_serializable(obj):
                             
                             # Determine workspace type based on active group/public workspace
                             workspace_type = 'personal'
-                            if active_public_workspace_id:
+                            if effective_active_public_workspace_id:
                                 workspace_type = 'public'
-                            elif active_group_id:
+                            elif effective_active_group_id:
                                 workspace_type = 'group'
                             
                             log_token_usage(
@@ -7743,8 +10155,8 @@ def make_json_serializable(obj):
                                 completion_tokens=token_usage_data.get('completion_tokens'),
                                 conversation_id=conversation_id,
                                 message_id=assistant_message_id,
-                                group_id=active_group_id,
-                                public_workspace_id=active_public_workspace_id,
+                                group_id=effective_active_group_id,
+                                public_workspace_id=effective_active_public_workspace_id,
                                 additional_context={
                                     'agent_name': agent_name_used if use_agent_streaming else None,
                                     'augmented': bool(system_messages_for_augmentation),
@@ -7764,20 +10176,20 @@ def make_json_serializable(obj):
                             user_message=user_message,
                             conversation_id=conversation_id,
                             user_id=user_id,
-                            active_group_id=active_group_id,
-                            active_group_ids=active_group_ids,
-                            document_scope=document_scope,
-                            selected_document_id=selected_document_id,
+                            active_group_id=effective_active_group_id,
+                            active_group_ids=effective_active_group_ids,
+                            document_scope=effective_document_scope,
+                            selected_document_id=effective_selected_document_id,
                             model_deployment=gpt_model,
-                            hybrid_search_enabled=hybrid_search_enabled,
+                            hybrid_search_enabled=hybrid_search_enabled or history_grounded_search_used,
                             image_gen_enabled=False,
                             selected_documents=combined_documents if combined_documents else None,
                             selected_agent=agent_name_used if use_agent_streaming else None,
                             selected_agent_details=selected_agent_metadata if use_agent_streaming else None,
                             search_results=search_results if search_results else None,
                             conversation_item=conversation_item,
-                            active_public_workspace_id=active_public_workspace_id,
-                            active_public_workspace_ids=active_public_workspace_ids
+                            active_public_workspace_id=effective_active_public_workspace_id,
+                            active_public_workspace_ids=effective_active_public_workspace_ids
                         )
                     except Exception as e:
                         debug_print(f"Error collecting conversation metadata: {e}")
@@ -7872,6 +10284,7 @@ def make_json_serializable(obj):
                                 'incomplete': True,
                                 'error': error_msg,
                                 'reasoning_effort': reasoning_effort,
+                                'history_context': history_debug_info,
                                 'thread_info': {
                                     'thread_id': user_thread_id,
                                     'previous_thread_id': user_previous_thread_id,
@@ -8145,6 +10558,889 @@ def remove_masked_content(content, masked_ranges):
     return result
 
 
+def _format_history_message_ref(message):
+    """Return a ``role:id`` reference for a message, using 'unknown' for any missing part."""
+    role, message_id = (str((message or {}).get(key) or 'unknown') for key in ('role', 'id'))
+    return f"{role}:{message_id}"
+
+
+def _capture_history_refs(refs, max_items=12):
+    """Return truthy refs as strings (None-safe), capped at ``max_items`` plus a "+N more" marker."""
+    ref_list = [str(ref) for ref in (refs or ()) if ref]
+    if len(ref_list) <= max_items:
+        return ref_list
+    return ref_list[:max_items] + [f"... (+{len(ref_list) - max_items} more)"]
+
+
+def _format_history_refs_for_detail(refs):
+    """Join refs into one comma-separated string, or return 'none' when there are no refs."""
+    # Each ref is passed through str() so non-string entries do not break the join.
+    return ', '.join(map(str, refs)) if refs else 'none'
+
+
+def _truncate_history_citation_text(text, max_chars=1600):
+    """Strip ``text`` and cap it at ``max_chars``, appending a note with the number of chars cut."""
+    cleaned = str(text or '').strip()
+    if not cleaned or len(cleaned) <= max_chars:
+        return cleaned
+    overflow = len(cleaned) - max_chars
+    return f"{cleaned[:max_chars]}... [truncated {overflow} chars]"
+
+
+def _serialize_history_citation_value(value, max_chars=1200):
+    """Render a citation value as compact, single-spaced text capped at ``max_chars``.
+
+    Strings are used as-is; other values are JSON-encoded, falling back to ``str()``.
+    """
+    if value in (None, '', [], {}):
+        return ''
+    serialized = value
+    if not isinstance(value, str):
+        try:
+            serialized = json.dumps(value, default=str, ensure_ascii=False)
+        except Exception:
+            serialized = str(value)
+    return _truncate_history_citation_text(' '.join(serialized.split()), max_chars=max_chars)
+
+
+def _build_agent_citation_history_lines(agent_citations, max_citations=4):  # Returns "- ..." summary lines for up to max_citations citations, plus an overflow line.
+    def parse_citation_payload(value):  # JSON-decode strings starting with '{' or '['; anything else (or invalid JSON) is returned unchanged.
+        if isinstance(value, str):
+            stripped_value = value.strip()
+            if stripped_value[:1] in ('{', '['):
+                try:
+                    return json.loads(stripped_value)
+                except Exception:
+                    return value
+        return value
+    # A citation counts as tabular when its plugin name, tool name, or function name matches the tabular plugin.
+    def is_tabular_citation(citation):
+        if not isinstance(citation, dict):
+            return False
+        tool_name = str(citation.get('tool_name') or '')
+        function_name = str(citation.get('function_name') or '')
+        plugin_name = str(citation.get('plugin_name') or '')
+        return (
+            plugin_name == 'TabularProcessingPlugin'
+            or 'TabularProcessingPlugin.' in tool_name
+            or function_name in {
+                'aggregate_column',
+                'count_rows',
+                'count_rows_by_related_values',
+                'describe_tabular_file',
+                'filter_rows',
+                'filter_rows_by_related_values',
+                'get_distinct_values',
+                'group_by_aggregate',
+                'group_by_datetime_component',
+                'lookup_value',
+                'query_tabular_data',
+            }
+        )
+    # Dedup key: tool name (text before any " [") plus file, column, and the result's values/sample_rows/value.
+    def build_tabular_signature(citation):
+        arguments = parse_citation_payload(citation.get('function_arguments'))
+        result = parse_citation_payload(citation.get('function_result'))
+        if not isinstance(arguments, dict):
+            arguments = {}
+        if not isinstance(result, dict):
+            result = {}
+
+        tool_signature_name = str(citation.get('function_name') or citation.get('tool_name') or '').strip()
+        if ' [' in tool_signature_name:
+            tool_signature_name = tool_signature_name.split(' [', 1)[0]
+
+        signature_payload = {
+            'tool': tool_signature_name,
+            'filename': result.get('filename') or arguments.get('filename'),
+            'column': result.get('column') or arguments.get('column'),
+            'values': result.get('values'),
+            'sample_rows': result.get('sample_rows'),
+            'value': result.get('value'),
+        }
+        try:
+            return json.dumps(signature_payload, sort_keys=True, default=str)
+        except Exception:
+            return str(signature_payload)
+    # Join serialized values with "; ", stopping after max_items entries or once max_chars would be exceeded.
+    def summarize_tabular_values(values, max_chars=2200, max_items=60):
+        if not isinstance(values, list) or not values:
+            return ''
+
+        compact_values = []
+        current_length = 0
+        for index, item in enumerate(values[:max_items]):
+            item_text = _serialize_history_citation_value(item, max_chars=300)
+            if not item_text:
+                continue
+            # Account for the "; " separator that precedes every item except the first.
+            separator_length = 2 if compact_values else 0
+            if current_length + separator_length + len(item_text) > max_chars:
+                remaining = len(values) - index
+                compact_values.append(f"... (+{remaining} more values)")
+                break
+
+            compact_values.append(item_text)
+            current_length += separator_length + len(item_text)
+        # Item cap reached without an overflow marker yet: note how many values were left out.
+        if len(values) > max_items and (not compact_values or not str(compact_values[-1]).startswith('... (+')):
+            compact_values.append(f"... (+{len(values) - max_items} more values)")
+
+        return '; '.join(compact_values)
+    # One bullet per tabular call: tool, file, sheet, column, plus counts and values when the result has them.
+    def build_tabular_line(citation):
+        arguments = parse_citation_payload(citation.get('function_arguments'))
+        result = parse_citation_payload(citation.get('function_result'))
+        if not isinstance(arguments, dict):
+            arguments = {}
+        if not isinstance(result, dict):
+            result = {}
+
+        tool_name = str(citation.get('tool_name') or citation.get('function_name') or 'TabularProcessingPlugin').strip()
+        filename = result.get('filename') or arguments.get('filename') or 'unknown file'
+        selected_sheet = result.get('selected_sheet') or arguments.get('sheet_name') or 'unknown sheet'
+        column = result.get('column') or arguments.get('column') or 'unknown column'
+        distinct_count = result.get('distinct_count')
+        returned_values = result.get('returned_values')
+        values_summary = summarize_tabular_values(result.get('values'))
+
+        line_parts = [
+            tool_name,
+            f"file={filename}",
+            f"sheet={selected_sheet}",
+            f"column={column}",
+        ]
+        if distinct_count not in (None, ''):
+            line_parts.append(f"distinct_count={distinct_count}")
+        if returned_values not in (None, ''):
+            line_parts.append(f"returned_values={returned_values}")
+        if values_summary:
+            line_parts.append(f"values={values_summary}")
+
+        return f"- {' | '.join(str(part) for part in line_parts if part not in (None, ''))}"
+    # Skip '[Debug]' and 'Conversation History' entries and drop tabular citations whose signature was already seen.
+    eligible_citations = []
+    seen_tabular_signatures = set()
+    for citation in agent_citations or []:
+        if isinstance(citation, dict):
+            tool_name = str(citation.get('tool_name') or citation.get('function_name') or '').strip()
+            if tool_name.startswith('[Debug]') or tool_name == 'Conversation History':
+                continue
+            if is_tabular_citation(citation):
+                signature = build_tabular_signature(citation)
+                if signature in seen_tabular_signatures:
+                    continue
+                seen_tabular_signatures.add(signature)
+        eligible_citations.append(citation)
+    # Only the first max_citations eligible entries are rendered; non-dict entries are serialized as-is.
+    lines = []
+    for citation in eligible_citations[:max_citations]:
+        if not isinstance(citation, dict):
+            value_summary = _serialize_history_citation_value(citation, max_chars=800)
+            if value_summary:
+                lines.append(f"- Tool result: {value_summary}")
+            continue
+
+        if is_tabular_citation(citation):
+            lines.append(build_tabular_line(citation))
+            continue
+        # Generic tool call: name plus truncated args/result, and the error text only when success is False.
+        tool_name = str(citation.get('tool_name') or citation.get('function_name') or 'Tool invocation').strip()
+        argument_summary = _serialize_history_citation_value(citation.get('function_arguments'), max_chars=350)
+        result_summary = _serialize_history_citation_value(citation.get('function_result'), max_chars=700)
+        error_summary = ''
+        if citation.get('success') is False:
+            error_summary = _serialize_history_citation_value(citation.get('error_message'), max_chars=400)
+
+        line_parts = [tool_name]
+        if argument_summary:
+            line_parts.append(f"args={argument_summary}")
+        if result_summary:
+            line_parts.append(f"result={result_summary}")
+        if error_summary:
+            line_parts.append(f"error={error_summary}")
+        lines.append(f"- {' | '.join(line_parts)}")
+    # Report how many eligible citations were left out by the max_citations cap.
+    remaining = len(eligible_citations) - min(len(eligible_citations), max_citations)
+    if remaining > 0:
+        lines.append(f"- ... (+{remaining} more prior tool results)")
+
+    return lines
+
+
+def _build_document_citation_history_lines(hybrid_citations, max_citations=5):
+    """Summarize prior document citations as '- file, page N, chunk N, classification' lines.
+
+    Only the first max_citations entries are rendered (non-dict entries among them are
+    skipped); a trailing '... (+N more cited documents)' line reports any overflow.
+    """
+    citations = hybrid_citations or []
+    rendered = []
+    def is_present(value):
+        return value not in (None, '')
+
+    for entry in citations[:max_citations]:
+        if not isinstance(entry, dict):
+            continue
+        descriptors = [str(entry.get('file_name') or 'Document').strip()]
+        page, sequence, chunk_key, label = (
+            entry.get(key) for key in ('page_number', 'chunk_sequence', 'chunk_id', 'classification')
+        )
+        if is_present(page):
+            descriptors.append(f"page {page}")
+        # Prefer the chunk sequence number; fall back to the chunk ID when it is absent.
+        if is_present(sequence) or is_present(chunk_key):
+            descriptors.append(f"chunk {sequence if is_present(sequence) else chunk_key}")
+        if is_present(label):
+            descriptors.append(str(label))
+        rendered.append(f"- {', '.join(descriptors)}")
+
+    overflow = max(0, len(citations) - min(len(citations), max_citations))
+    if overflow > 0:
+        rendered.append(f"- ... (+{overflow} more cited documents)")
+    return rendered
+
+
+def _build_web_citation_history_lines(web_search_citations, max_citations=4):
+    """Summarize prior web citations as '- title (url)' lines plus an overflow marker."""
+    sources = web_search_citations or []
+    rendered = []
+    for source in sources[:max_citations]:
+        if not isinstance(source, dict):
+            continue
+        link = str(source.get('url') or '').strip()
+        # The URL doubles as the title when no title is stored.
+        heading = str(source.get('title') or source.get('url') or 'Web source').strip()
+        # Skip the parenthesised URL when it would merely repeat the heading.
+        show_link = bool(link) and link != heading
+        rendered.append(f"- {heading} ({link})" if show_link else f"- {heading}")
+
+    overflow = max(0, len(sources) - min(len(sources), max_citations))
+    if overflow > 0:
+        rendered.append(f"- ... (+{overflow} more web sources)")
+    return rendered
+
+
+def _parse_json_object_from_text(text):
+    """Extract the first JSON object from a plain text model response.
+
+    The whole stripped text is parsed first; failing that, each '{' is tried as the start
+    of an embedded object so surrounding prose or stray braces do not defeat extraction.
+    Returns the decoded dict, or None when no JSON object is found.
+    """
+    value = str(text or '').strip()
+    if not value:
+        return None
+    try:
+        parsed = json.loads(value)
+        return parsed if isinstance(parsed, dict) else None
+    except Exception:
+        decoder = json.JSONDecoder()  # whole-text parse failed; scan for an embedded object
+    for start_index, character in enumerate(value):
+        if character == '{':
+            try:
+                return decoder.raw_decode(value, start_index)[0]  # decoding from '{' yields a dict
+            except Exception:
+                continue
+    return None
+
+
+def _normalize_prior_grounded_document_refs(conversation_item):
+    """Collect the de-duplicated grounded document refs that a search-disabled follow-up may reuse.
+
+    Entries of 'last_grounded_document_refs' are preferred; document tags on the conversation
+    are consulted only when that list yields no usable ref. Each returned dict carries
+    document_id, scope, scope_id, file_name, classification and one scope-specific ID key.
+    """
+    conversation = conversation_item or {}
+    collected = []
+    known_keys = set()
+    # Candidate keys for the owning scope's ID, in priority order.
+    scope_id_fields = ('scope_id', 'group_id', 'public_workspace_id', 'user_id')
+    owner_field_by_scope = {'group': 'group_id', 'public': 'public_workspace_id'}
+
+    def register(candidate):
+        """Normalize one raw ref and keep it unless it is incomplete or already known."""
+        if not isinstance(candidate, dict):
+            return
+
+        doc_id = str(candidate.get('document_id') or '').strip()
+        scope_name = str(candidate.get('scope') or '').strip().lower()
+        # The first truthy ID field wins, checked in the order listed above.
+        raw_owner = next((candidate.get(f) for f in scope_id_fields if candidate.get(f)), '')
+        owner_id = str(raw_owner).strip()
+        if not (doc_id and scope_name and owner_id):
+            return
+
+        identity = (scope_name, owner_id, doc_id)
+        if identity in known_keys:
+            return
+        known_keys.add(identity)
+
+        entry = {
+            'document_id': doc_id,
+            'scope': scope_name,
+            'scope_id': owner_id,
+            'file_name': candidate.get('file_name') or candidate.get('title'),
+            'classification': candidate.get('classification'),
+        }
+        # Any scope other than group/public is stored under 'user_id'.
+        entry[owner_field_by_scope.get(scope_name, 'user_id')] = owner_id
+        collected.append(entry)
+
+    for stored_ref in conversation.get('last_grounded_document_refs', []) or []:
+        register(stored_ref)
+
+    if collected:
+        return collected
+
+    # Fallback: rebuild refs from document-category tags.
+    for tag in conversation.get('tags', []) or []:
+        if not isinstance(tag, dict) or tag.get('category') != 'document':
+            continue
+
+        tag_scope = tag.get('scope') or {}
+        register({
+            'document_id': tag.get('document_id'),
+            'scope': tag_scope.get('type'),
+            'scope_id': tag_scope.get('id'),
+            'title': tag.get('title'),
+            'classification': tag.get('classification'),
+        })
+
+    return collected
+
+
+def build_prior_grounded_document_search_parameters(grounded_refs):
+    """Derive bounded search parameters (document IDs plus scope filters) from grounded refs.
+
+    Returns a dict with the unique document IDs, the group and public workspace IDs in
+    first-seen order, the sorted scope types, and 'doc_scope': the single scope in use,
+    or 'all' when the refs span several scopes or none.
+    """
+    unique_documents = []
+    unique_groups = []
+    unique_workspaces = []
+    seen_scopes = set()
+
+    def remember(bucket, raw_value):
+        """Append the stripped string form of raw_value unless it is empty or already kept."""
+        cleaned = str(raw_value or '').strip()
+        if cleaned and cleaned not in bucket:
+            bucket.append(cleaned)
+
+    for ref in (r for r in grounded_refs or [] if isinstance(r, dict)):
+        # Document IDs are collected even for refs that carry no scope.
+        remember(unique_documents, ref.get('document_id'))
+
+        scope_name = str(ref.get('scope') or '').strip().lower()
+        if not scope_name:
+            continue
+        seen_scopes.add(scope_name)
+
+        # Only group and public refs contribute scope-specific IDs.
+        if scope_name == 'group':
+            remember(unique_groups, ref.get('group_id') or ref.get('scope_id'))
+        elif scope_name == 'public':
+            remember(unique_workspaces, ref.get('public_workspace_id') or ref.get('scope_id'))
+
+    # A single scope is reported as-is; zero or several scopes widen the search to 'all'.
+    return {
+        'document_ids': unique_documents,
+        'doc_scope': next(iter(seen_scopes)) if len(seen_scopes) == 1 else 'all',
+        'active_group_ids': unique_groups,
+        'active_group_id': unique_groups[0] if unique_groups else None,
+        'active_public_workspace_ids': unique_workspaces,
+        'active_public_workspace_id': unique_workspaces[0] if unique_workspaces else None,
+        'scope_types': sorted(seen_scopes),
+    }
+
+
+def build_history_only_assessment_messages(history_segments, default_system_prompt=''):
+    """Construct the prompt context used to decide whether history alone is sufficient.
+
+    Order: older-history summary (if any), default system prompt (if any), then the
+    'history_messages' list; a missing or None list is treated as empty.
+    """
+    segments = history_segments or {}
+    assessment_messages = []
+    summary_of_older = str(segments.get('summary_of_older') or '').strip()
+    if summary_of_older:
+        assessment_messages.append({
+            'role': 'system',
+            'content': (
+                f"<Summary of previous conversation context>\n{summary_of_older}\n"
+                "</Summary of previous conversation context>"
+            )
+        })
+    normalized_default_system_prompt = str(default_system_prompt or '').strip()
+    if normalized_default_system_prompt:
+        assessment_messages.append({'role': 'system', 'content': normalized_default_system_prompt})
+    assessment_messages.extend(segments.get('history_messages') or [])  # tolerate an explicit None
+    return assessment_messages
+
+
+def assess_history_only_answerability(gpt_client, gpt_model, conversation_history_for_api):
+    """Ask the model whether the latest question is answerable from existing conversation grounding.
+
+    Returns a dict with 'can_answer_from_history' (bool), 'search_query', 'reason', and the
+    unparsed 'raw_response' text.
+    """
+    instructions = (
+        "You are evaluating whether the latest user question can be answered using only the "
+        "existing conversation context already provided. Earlier assistant turns may include "
+        "supporting citation context from previously grounded document answers.\n\n"
+        "Respond with JSON only using this schema:\n"
+        "{\"can_answer_from_history\": true|false, \"search_query\": \"...\", \"reason\": \"...\"}\n\n"
+        "Set can_answer_from_history to true only if the conversation already contains enough "
+        "grounded information to answer confidently without retrieving any new document excerpts. "
+        "If false, produce a concise standalone search_query that resolves pronouns and omitted "
+        "references from the conversation for use against the previously grounded documents. "
+        "Keep reason short."
+    )
+    completion = gpt_client.chat.completions.create(
+        model=gpt_model,
+        messages=[{'role': 'system', 'content': instructions}, *(conversation_history_for_api or [])],
+        max_tokens=180,
+        temperature=0,
+    )
+    raw_text = str(completion.choices[0].message.content or '').strip()
+    verdict = _parse_json_object_from_text(raw_text) or {}
+    flag = verdict.get('can_answer_from_history')
+    # A string verdict counts as True only when it spells "true"; anything else uses truthiness.
+    answerable = flag.strip().lower() == 'true' if isinstance(flag, str) else bool(flag)
+
+    def text_field(field_name):
+        return str(verdict.get(field_name) or '').strip()
+
+    return {
+        'can_answer_from_history': answerable,
+        'search_query': text_field('search_query'),
+        'reason': text_field('reason'),
+        'raw_response': raw_text,
+    }
+
+
+def build_history_grounding_system_message():
+    """Return the system message that confines the answer to already-grounded conversation context."""
+    instruction = (
+        "Workspace search is disabled for this turn. Answer only from the existing conversation "
+        "context and any retrieved document excerpts explicitly provided in this turn. If those "
+        "sources are insufficient, say that you do not have enough grounded information from the "
+        "prior conversation sources and ask the user to select a workspace or document."
+    )
+
+    # A new dict is constructed on every call.
+    return dict(role='system', content=instruction)
+
+
+def build_assistant_history_content_with_citations(message, content):
+    """Append a tagged summary of the turn's tool, document, and web citations to its content.
+
+    Returns content unchanged when the message yields no citation lines; returns only the
+    citation block when the stripped content is empty.
+    """
+    section_sources = (
+        ("Prior tool results:\n", _build_agent_citation_history_lines, 'agent_citations'),
+        ("Prior cited documents:\n", _build_document_citation_history_lines, 'hybrid_citations'),
+        ("Prior cited web sources:\n", _build_web_citation_history_lines, 'web_search_citations'),
+    )
+    sections = []
+    for heading, build_lines, message_key in section_sources:
+        section_lines = build_lines(message.get(message_key, []))
+        if section_lines:
+            sections.append(heading + "\n".join(section_lines))
+
+    if not sections:
+        return content
+
+    wrapped = (
+        "<Supporting citation context from this assistant turn>\n"
+        + "\n\n".join(sections)
+        + "\n</Supporting citation context from this assistant turn>"
+    )
+    # The whole block, tags included, goes through the truncation helper with max_chars=5200.
+    wrapped = _truncate_history_citation_text(wrapped, max_chars=5200)
+
+    body_text = str(content or '').strip()
+    return f"{body_text}\n\n{wrapped}" if body_text else wrapped
+
+
+def build_history_context_thought_content(history_debug_info):
+    """Compose the one-line summary of how the model history for this turn was assembled."""
+    info = history_debug_info or {}
+
+    def read(key, default=0):
+        return info.get(key, default)
+
+    # The note on older messages depends on whether a summary was produced or merely requested.
+    if not read('older_message_count') > 0:
+        older_note = 'no older messages'
+    elif read('summary_used', False):
+        older_note = f"summarized {read('summarized_message_count')} older"
+    elif read('summary_requested', False):
+        older_note = 'older summary unavailable'
+    else:
+        older_note = 'older summary disabled'
+
+    return (
+        f"Prepared {read('final_api_message_count')} model history messages "
+        f"from {read('stored_total_messages')} stored messages "
+        f"(recent={read('recent_message_count')}; {older_note})"
+    )
+
+
+def build_history_context_thought_detail(history_debug_info):
+    """Render the history debug info as newline-separated text: path, counters, then ref lists."""
+    info = history_debug_info or {}
+    counter_fields = (
+        ('stored_total', 'stored_total_messages', 0),
+        ('history_limit', 'history_limit', 0),
+        ('older_count', 'older_message_count', 0),
+        ('recent_count', 'recent_message_count', 0),
+        ('summary_requested', 'summary_requested', False),
+        ('summary_used', 'summary_used', False),
+        ('augmentation_count', 'augmentation_message_count', 0),
+        ('default_system_prompt_inserted', 'default_system_prompt_inserted', False),
+    )
+    ref_fields = (
+        ('older_refs', 'older_message_refs'), ('recent_refs', 'selected_recent_message_refs'),
+        ('summarized_refs', 'summarized_message_refs'),
+        ('skipped_inactive_refs', 'skipped_inactive_message_refs'),
+        ('skipped_masked_refs', 'skipped_masked_message_refs'), ('masked_range_refs', 'masked_range_message_refs'),
+        ('history_segment_refs', 'history_message_source_refs'),
+        ('final_api_roles', 'final_api_message_roles'), ('final_api_refs', 'final_api_source_refs'),
+    )
+    detail = [f"path: {info.get('path', 'unknown')}"]
+    detail.append(', '.join(f"{label}={info.get(key, default)}" for label, key, default in counter_fields))
+    detail.extend(f"{label}: {_format_history_refs_for_detail(info.get(key, []))}" for label, key in ref_fields)
+    return "\n".join(detail)
+
+
+def build_history_context_debug_citation(history_debug_info, path_label):
+    """Package the history debug info as a 'Conversation History' tool-citation dict."""
+    # Work on a copy so the caller's dict does not gain the 'path' key.
+    info = dict(history_debug_info or {})
+    info['path'] = path_label
+    argument_defaults = {
+        'stored_total_messages': 0, 'history_limit': 0, 'older_message_count': 0,
+        'recent_message_count': 0, 'final_api_message_count': 0,
+        'summary_requested': False, 'summary_used': False,
+    }
+    arguments = {'path': path_label}
+    arguments.update((key, info.get(key, default)) for key, default in argument_defaults.items())
+    return {
+        'tool_name': 'Conversation History',
+        'function_arguments': json.dumps(arguments),
+        'function_result': build_history_context_thought_detail(info),
+        'timestamp': datetime.utcnow().isoformat(),
+    }
+
+
+def enrich_history_context_debug_info(
+    history_debug_info,
+    conversation_history_for_api,
+    final_api_source_refs,
+    path_label,
+    augmentation_message_count=0,
+    default_system_prompt_inserted=False,
+):
+    """Return a copy of the debug info extended with details of the final API message list."""
+    enriched = dict(history_debug_info or {})
+    enriched.update({
+        'path': path_label,
+        'augmentation_message_count': augmentation_message_count,
+        'default_system_prompt_inserted': bool(default_system_prompt_inserted),
+        'final_api_message_count': len(conversation_history_for_api or []),
+        'final_api_message_roles': [str((m or {}).get('role') or 'unknown') for m in (conversation_history_for_api or [])],
+        'final_api_source_refs': _capture_history_refs(final_api_source_refs, max_items=20),
+    })
+    return enriched
+
+
+def emit_history_context_debug(history_debug_info, conversation_id):
+    """Send the history debug payload to debug_print as one JSON-serialized line."""
+    payload = history_debug_info or {}
+    path_label = payload.get('path', 'unknown')
+    serialized = json.dumps(payload, default=str)
+    debug_print(f"[History Context][{path_label}] conversation_id={conversation_id} | {serialized}")
+
+
+def build_conversation_history_segments(
+    all_messages,
+    conversation_history_limit,
+    enable_summarize_older_messages=False,
+    gpt_client=None,
+    gpt_model=None,
+    user_message_id=None,
+    fallback_user_message="",
+):
+    """Build shared conversation history segments (older summary, history messages, chat tabular files, debug info) for chat completions."""
+    conversation_history_messages = []
+    summary_of_older = ""
+    chat_tabular_files = set()
+    # Pre-process the stored messages through the artifact, citation-hydration, and thread-ordering helpers.
+    artifact_payload_map = build_message_artifact_payload_map(all_messages or [])
+    filtered_messages = filter_assistant_artifact_items(all_messages or [])
+    filtered_messages = hydrate_agent_citations_from_artifacts(filtered_messages, artifact_payload_map)
+    ordered_messages = sort_messages_by_thread(filtered_messages)
+    # The last `conversation_history_limit` messages are "recent"; everything before them is "older".
+    total_messages = len(ordered_messages)
+    num_recent_messages = min(total_messages, conversation_history_limit)
+    num_older_messages = total_messages - num_recent_messages
+
+    recent_messages = ordered_messages[-num_recent_messages:] if num_recent_messages else []
+    older_messages_to_summarize = ordered_messages[:num_older_messages]
+    # The bookkeeping values below only feed the returned debug_info.
+    summarized_message_refs = []
+    skipped_inactive_message_refs = []
+    skipped_masked_message_refs = []
+    masked_range_message_refs = []
+    history_message_source_refs = []
+    appended_fallback_user_message = False
+    # Older messages are summarized only when enabled, present, and both a client and a model are supplied.
+    if enable_summarize_older_messages and older_messages_to_summarize and gpt_client and gpt_model:
+        debug_print(
+            f"Summarizing {len(older_messages_to_summarize)} older messages for current conversation history"
+        )
+        summary_prompt_older = (
+            "Summarize the following conversation history concisely (around 50-100 words), "
+            "focusing on key facts, decisions, or context that might be relevant for future turns. "
+            "Do not add any introductory phrases like 'Here is a summary'.\n\n"
+            "Conversation History:\n"
+        )
+        message_texts_older = []
+        for message in older_messages_to_summarize:
+            role = message.get('role', 'user')
+            metadata = message.get('metadata', {})
+            thread_info = metadata.get('thread_info', {})
+            active_thread = thread_info.get('active_thread')
+
+            if active_thread is False:
+                debug_print(f"[THREAD] Skipping inactive thread message {message.get('id')} from summary")
+                skipped_inactive_message_refs.append(_format_history_message_ref(message))
+                continue
+            # Messages with these roles are left out of the summary input.
+            if role in ['system', 'safety', 'blocked', 'image', 'file']:
+                continue
+            # NOTE(review): 'masked' / 'masked_ranges' metadata is not checked in this loop, unlike the recent-message loop below — confirm intended.
+            content = message.get('content', '')
+            if role == 'assistant':
+                content = build_assistant_history_content_with_citations(message, content)
+            message_texts_older.append(f"{role.upper()}: {content}")
+            summarized_message_refs.append(_format_history_message_ref(message))
+
+        if message_texts_older:
+            summary_prompt_older += "\n".join(message_texts_older)
+            try:
+                summary_response_older = gpt_client.chat.completions.create(
+                    model=gpt_model,
+                    messages=[{"role": "system", "content": summary_prompt_older}],
+                    max_tokens=150,
+                    temperature=0.3,
+                )
+                summary_of_older = summary_response_older.choices[0].message.content.strip()
+                debug_print(f"Generated summary: {summary_of_older}")
+            except Exception as exc:
+                debug_print(f"Error summarizing older conversation history: {exc}")
+                summary_of_older = ""
+        else:
+            debug_print("No summarizable content found in older messages.")
+    # Recent messages: user/assistant turns pass through; file and image messages become system context messages.
+    allowed_roles_in_history = ['user', 'assistant']
+    max_file_content_length_in_history = 50000
+    max_tabular_content_length_in_history = 50000
+
+    for message in recent_messages:
+        role = message.get('role')
+        content = message.get('content')
+        metadata = message.get('metadata', {})
+
+        thread_info = metadata.get('thread_info', {})
+        active_thread = thread_info.get('active_thread')
+        if active_thread is False:
+            debug_print(
+                f"[THREAD] Skipping inactive thread message {message.get('id')} "
+                f"(thread_id: {thread_info.get('thread_id')}, attempt: {thread_info.get('thread_attempt')})"
+            )
+            skipped_inactive_message_refs.append(_format_history_message_ref(message))
+            continue
+
+        if metadata.get('masked', False):
+            debug_print(f"[MASK] Skipping fully masked message {message.get('id')}")
+            skipped_masked_message_refs.append(_format_history_message_ref(message))
+            continue
+        # Partially masked content is passed through remove_masked_content before it is used.
+        masked_ranges = metadata.get('masked_ranges', [])
+        if masked_ranges and content:
+            content = remove_masked_content(content, masked_ranges)
+            masked_range_message_refs.append(_format_history_message_ref(message))
+            debug_print(f"[MASK] Applied {len(masked_ranges)} masked ranges to message {message.get('id')}")
+
+        if role in allowed_roles_in_history:
+            if role == 'assistant':
+                content = build_assistant_history_content_with_citations(message, content)
+            conversation_history_messages.append({"role": role, "content": content})
+            history_message_source_refs.append(_format_history_message_ref(message))
+        elif role == 'file':
+            filename = message.get('filename', 'uploaded_file')
+            file_content = message.get('file_content', '')
+            is_table = message.get('is_table', False)
+            file_content_source = message.get('file_content_source', '')
+            # Blob-backed tables are referenced by name only; other files are inlined up to the length cap.
+            if is_table and file_content_source == 'blob':
+                chat_tabular_files.add(filename)
+                conversation_history_messages.append({
+                    'role': 'system',
+                    'content': (
+                        f"[User uploaded a tabular data file named '{filename}'. "
+                        f"The file is stored in blob storage and available for analysis. "
+                        f"Use the tabular_processing plugin functions (list_tabular_files, describe_tabular_file, "
+                        f"aggregate_column, filter_rows, query_tabular_data, group_by_aggregate, "
+                        f"group_by_datetime_component) to analyze this data. "
+                        f"The file source is 'chat'.]"
+                    )
+                })
+            else:
+                content_limit = (
+                    max_tabular_content_length_in_history
+                    if is_table else max_file_content_length_in_history
+                )
+                display_content = file_content[:content_limit]
+                if len(file_content) > content_limit:
+                    display_content += "..."
+
+                if is_table:
+                    conversation_history_messages.append({
+                        'role': 'system',
+                        'content': (
+                            f"[User uploaded a tabular data file named '{filename}'. This is CSV format data for analysis:\n"
+                            f"{display_content}]\n"
+                            "This is complete tabular data in CSV format. You can perform calculations, analysis, and "
+                            "data operations on this dataset."
+                        )
+                    })
+                else:
+                    conversation_history_messages.append({
+                        'role': 'system',
+                        'content': (
+                            f"[User uploaded a file named '{filename}'. Content preview:\n{display_content}]\n"
+                            "Use this file context if relevant."
+                        )
+                    })
+            history_message_source_refs.append(f"system:file:{message.get('id', 'unknown')}")
+        elif role == 'image':
+            filename = message.get('filename', 'uploaded_image')
+            is_user_upload = metadata.get('is_user_upload', False)
+
+            if is_user_upload:
+                extracted_text = message.get('extracted_text', '')
+                vision_analysis = message.get('vision_analysis', {})
+                image_context_parts = [f"[User uploaded an image named '{filename}'.]"]
+
+                if extracted_text:
+                    extracted_preview = extracted_text[:max_file_content_length_in_history]
+                    if len(extracted_text) > max_file_content_length_in_history:
+                        extracted_preview += "..."
+                    image_context_parts.append(f"\n\nExtracted Text (OCR):\n{extracted_preview}")
+
+                if vision_analysis:
+                    image_context_parts.append("\n\nAI Vision Analysis:")
+                    if vision_analysis.get('description'):
+                        image_context_parts.append(f"\nDescription: {vision_analysis['description']}")
+                    if vision_analysis.get('objects'):
+                        objects_str = ', '.join(vision_analysis['objects'])
+                        image_context_parts.append(f"\nObjects detected: {objects_str}")
+                    if vision_analysis.get('text'):
+                        image_context_parts.append(f"\nText visible in image: {vision_analysis['text']}")
+                    if vision_analysis.get('contextual_analysis'):
+                        image_context_parts.append(
+                            f"\nContextual analysis: {vision_analysis['contextual_analysis']}"
+                        )
+
+                image_context_content = ''.join(image_context_parts)
+                image_context_content += "\n\nUse this image information to answer questions about the uploaded image."
+                # Guard: swap the context for a short placeholder if it contains inline base64 image data.
+                if 'data:image/' in image_context_content or ';base64,' in image_context_content:
+                    debug_print(
+                        f"WARNING: Base64 image data detected in chat history for {filename}! Removing to save tokens."
+                    )
+                    image_context_content = (
+                        f"[User uploaded an image named '{filename}' - image data excluded from chat history to conserve tokens]"
+                    )
+
+                debug_print(
+                    f"[IMAGE_CONTEXT] Adding user-uploaded image to history: {filename}, "
+                    f"context length: {len(image_context_content)} chars"
+                )
+                conversation_history_messages.append({
+                    'role': 'system',
+                    'content': image_context_content,
+                })
+            else:
+                prompt = message.get('prompt', 'User requested image generation.')
+                debug_print(f"[IMAGE_CONTEXT] Adding system-generated image to history: {prompt[:100]}...")
+                conversation_history_messages.append({
+                    'role': 'system',
+                    'content': f"[Assistant generated an image based on the prompt: '{prompt}']",
+                })
+
+            history_message_source_refs.append(f"system:image:{message.get('id', 'unknown')}")
+    # Make the history end with a user message: re-add a stored user turn, or else the fallback text.
+    if not conversation_history_messages or conversation_history_messages[-1].get('role') != 'user':
+        debug_print("Warning: Last message in history is not the user's current message. Appending.")
+        user_msg_found = False
+        for message in reversed(recent_messages):
+            if message.get('role') != 'user':
+                continue
+            if user_message_id and message.get('id') != user_message_id:
+                continue
+            conversation_history_messages.append({
+                'role': 'user',
+                'content': message.get('content', ''),
+            })
+            history_message_source_refs.append(_format_history_message_ref(message))
+            user_msg_found = True
+            break
+
+        if not user_msg_found and fallback_user_message:
+            conversation_history_messages.append({
+                'role': 'user',
+                'content': fallback_user_message,
+            })
+            history_message_source_refs.append('user:fallback_input')
+            appended_fallback_user_message = True
+
+    debug_info = {
+        'history_limit': conversation_history_limit,
+        'summary_requested': bool(enable_summarize_older_messages),
+        'summary_used': bool(summary_of_older),
+        'stored_total_messages': total_messages,
+        'older_message_count': len(older_messages_to_summarize),
+        'recent_message_count': len(recent_messages),
+        'summarized_message_count': len(summarized_message_refs),
+        'older_message_refs': _capture_history_refs(
+            [_format_history_message_ref(message) for message in older_messages_to_summarize]
+        ),
+        'selected_recent_message_refs': _capture_history_refs(
+            [_format_history_message_ref(message) for message in recent_messages]
+        ),
+        'summarized_message_refs': _capture_history_refs(summarized_message_refs),
+        'skipped_inactive_message_refs': _capture_history_refs(skipped_inactive_message_refs),
+        'skipped_masked_message_refs': _capture_history_refs(skipped_masked_message_refs),
+        'masked_range_message_refs': _capture_history_refs(masked_range_message_refs),
+        'history_message_source_refs': _capture_history_refs(history_message_source_refs, max_items=20),
+        'appended_fallback_user_message': appended_fallback_user_message,
+    }
+
+    return {
+        'summary_of_older': summary_of_older,
+        'history_messages': conversation_history_messages,
+        'chat_tabular_files': chat_tabular_files,
+        'debug_info': debug_info,
+    }
+
+
 def _extract_web_search_citations_from_content(content: str) -> List[Dict[str, str]]:
     if not content:
         return []
diff --git a/application/single_app/route_backend_documents.py b/application/single_app/route_backend_documents.py
index bd4d7e43..b70d9980 100644
--- a/application/single_app/route_backend_documents.py
+++ b/application/single_app/route_backend_documents.py
@@ -4,6 +4,8 @@
 from functions_authentication import *
 from functions_documents import *
 from functions_settings import *
+from functions_group import get_user_groups
+from functions_public_workspaces import get_user_visible_public_workspace_ids_from_settings
 from utils_cache import invalidate_personal_search_cache
 from functions_debug import *
 from functions_activity_logging import log_document_upload, log_document_metadata_update_transaction
@@ -14,6 +16,102 @@
 from swagger_wrapper import swagger_route, get_auth_security
 from functions_debug import debug_print
 
+
+def _extract_citation_document_id(chunk, citation_id):  # Resolve the parent document ID for a cited chunk.
+    document_id = (chunk or {}).get('document_id') if isinstance(chunk, dict) else None
+    if document_id:
+        return str(document_id)  # Prefer the explicit document_id carried by the chunk.
+    # No usable document_id on the chunk: derive one by dropping everything after the last underscore.
+    if citation_id and '_' in citation_id:
+        return citation_id.rsplit('_', 1)[0]
+    # Empty/None citation_id, or one without an underscore, is returned unchanged.
+    return citation_id
+
+
+def _try_get_document_json(user_id, document_id, group_id=None, public_workspace_id=None):  # Return the document payload for a 200 lookup, else None.
+    try:  # Best-effort lookup: any exception raised by get_document is reported as None.
+        doc_response, status_code = get_document(
+            user_id,
+            document_id,
+            group_id=group_id,
+            public_workspace_id=public_workspace_id,
+        )
+    except Exception:
+        return None
+    # Only a 200 status counts as a successful lookup.
+    if status_code != 200:
+        return None
+    # A plain dict response is passed through as-is.
+    if isinstance(doc_response, dict):
+        return doc_response
+    # Otherwise use the object's get_json() when it has one (presumably a Flask response -- TODO confirm).
+    get_json = getattr(doc_response, 'get_json', None)
+    if callable(get_json):
+        return get_json()
+    # Neither a dict nor an object exposing get_json(): nothing usable to return.
+    return None
+
+
+def _find_accessible_citation_document(user_id, document_id, scope_name):  # Scope-aware lookup of a cited document.
+    if not user_id or not document_id:
+        return None
+    # Returns the first successful lookup's JSON, or None when the scope is disabled, unknown, or nothing matches.
+    settings = get_settings()
+    # Personal scope: a single lookup with no group or public workspace id.
+    if scope_name == 'personal':
+        if not settings.get('enable_user_workspace', False):
+            return None
+        return _try_get_document_json(user_id, document_id)
+    # Group scope: probe each group returned for the user until one lookup succeeds.
+    if scope_name == 'group':
+        if not settings.get('enable_group_workspaces', False):
+            return None
+
+        try:
+            user_groups = get_user_groups(user_id)
+        except Exception:  # group lookup failed: report no accessible document instead of raising
+            return None
+
+        for group in user_groups:
+            group_id = group.get('id')
+            if not group_id:
+                continue
+
+            document_json = _try_get_document_json(
+                user_id,
+                document_id,
+                group_id=group_id,
+            )
+            if document_json:
+                return document_json
+
+        return None
+    # Public scope: probe each public workspace id returned for the user until one lookup succeeds.
+    if scope_name == 'public':
+        if not settings.get('enable_public_workspaces', False):
+            return None
+
+        try:
+            workspace_ids = get_user_visible_public_workspace_ids_from_settings(user_id)
+        except Exception:  # workspace lookup failed: report no accessible document instead of raising
+            return None
+
+        for workspace_id in workspace_ids:
+            if not workspace_id:
+                continue
+
+            document_json = _try_get_document_json(
+                user_id,
+                document_id,
+                public_workspace_id=workspace_id,
+            )
+            if document_json:
+                return document_json
+
+        return None
+    # Any other scope_name yields no document.
+    return None
+
 def register_route_backend_documents(app):
     @app.route('/api/get_file_content', methods=['POST'])
     @swagger_route(security=get_auth_security())
@@ -428,48 +526,34 @@ def api_get_user_documents():
         # Combine conditions into the WHERE clause
         where_clause = " AND ".join(query_conditions)
 
-        # --- 3) First query: get total count based on filters ---
-        try:
-            count_query_str = f"SELECT VALUE COUNT(1) FROM c WHERE {where_clause}"
-            # debug_print(f"Count Query: {count_query_str}") # Optional Debugging
-            # debug_print(f"Count Params: {query_params}")    # Optional Debugging
-            count_items = list(cosmos_user_documents_container.query_items(
-                query=count_query_str,
-                parameters=query_params,
-                enable_cross_partition_query=True # May be needed if user_id is not partition key
-            ))
-            total_count = count_items[0] if count_items else 0
-
-        except Exception as e:
-            debug_print(f"Error executing count query: {e}") # Log the error
-            return jsonify({"error": f"Error counting documents: {str(e)}"}), 500
-
-
-        # --- 4) Second query: fetch the page of data based on filters ---
+        # --- 3) Query matching documents, then collapse to current revisions before paginating ---
         try:
             offset = (page - 1) * page_size
             data_query_str = f"""
                 SELECT *
                 FROM c
                 WHERE {where_clause}
-                ORDER BY c.{sort_by} {sort_order}
-                OFFSET {offset} LIMIT {page_size}
             """
-            # debug_print(f"Data Query: {data_query_str}") # Optional Debugging
-            # debug_print(f"Data Params: {query_params}")    # Optional Debugging
-            docs = list(cosmos_user_documents_container.query_items(
+            matching_docs = list(cosmos_user_documents_container.query_items(
                 query=data_query_str,
                 parameters=query_params,
-                enable_cross_partition_query=True # May be needed if user_id is not partition key
+                enable_cross_partition_query=True
             ))
 
+            current_docs = sort_documents(
+                select_current_documents(matching_docs),
+                sort_by=sort_by,
+                sort_order=sort_order,
+            )
+            total_count = len(current_docs)
+            docs = current_docs[offset:offset + page_size]
+
             # Add shared_approval_status and owner_id for each doc
             for doc in docs:
                 doc["owner_id"] = doc.get("user_id")  # Always set owner_id to the original user_id
                 if doc.get("user_id") == user_id:
                     doc["shared_approval_status"] = "owner"
                 else:
-                    # Find entry for this user in shared_user_ids
                     status = None
                     for entry in doc.get("shared_user_ids", []):
                         if entry.startswith(f"{user_id},"):
@@ -477,7 +561,7 @@ def api_get_user_documents():
                             break
                     doc["shared_approval_status"] = status or "none"
         except Exception as e:
-            debug_print(f"Error executing data query: {e}") # Log the error
+            debug_print(f"Error executing data query: {e}")
             return jsonify({"error": f"Error fetching documents: {str(e)}"}), 500
 
         
@@ -673,15 +757,21 @@ def api_delete_user_document(document_id):
         user_id = get_current_user_id()
         if not user_id:
             return jsonify({'error': 'User not authenticated'}), 401
+
+        delete_mode = request.args.get('delete_mode', 'all_versions')
+        if delete_mode not in {'all_versions', 'current_only'}:
+            return jsonify({'error': 'Invalid delete mode'}), 400
         
         try:
-            delete_document(user_id, document_id)
-            delete_document_chunks(document_id)
+            delete_result = delete_document_revision(user_id, document_id, delete_mode=delete_mode)
             
             # Invalidate search cache since document was deleted
             invalidate_personal_search_cache(user_id)
             
-            return jsonify({'message': 'Document deleted successfully'}), 200
+            return jsonify({
+                'message': 'Document deleted successfully',
+                **delete_result,
+            }), 200
         except Exception as e:
             return jsonify({'error': f'Error deleting document: {str(e)}'}), 500
     
@@ -733,53 +823,40 @@ def get_citation():
         if not citation_id:
             return jsonify({"error": "Missing citation_id"}), 400
 
-        try:
-            search_client_user = CLIENTS['search_client_user']
-            chunk = search_client_user.get_document(key=citation_id)
-            
-            # Check if user owns the document or if document is shared with user
-            chunk_user_id = chunk.get("user_id")
-            chunk_shared_user_ids = chunk.get("shared_user_ids", [])
-            
-            # Allow access if user is owner or in shared_user_ids (prefix match)
-            is_shared = any(
-                entry == user_id or entry.startswith(f"{user_id},")
-                for entry in chunk_shared_user_ids
-            )
-            if chunk_user_id != user_id and not is_shared:
-                return jsonify({"error": "Unauthorized access to citation"}), 403
-
+        def build_citation_response(chunk):
             return jsonify({
                 "cited_text": chunk.get("chunk_text", ""),
                 "file_name": chunk.get("file_name", ""),
                 "page_number": chunk.get("chunk_sequence", 0)
             }), 200
 
+        def get_citation_for_scope(search_client, scope_name):  # Fetch the chunk from one index; citation_id and user_id come from the enclosing scope.
+            chunk = search_client.get_document(key=citation_id)  # a ResourceNotFoundError raised here is handled by the calling try/except
+            document_id = _extract_citation_document_id(chunk, citation_id)
+            accessible_document = _find_accessible_citation_document(user_id, document_id, scope_name)
+            # The chunk exists in this index, but no accessible parent document was found: refuse with 403.
+            if not accessible_document:
+                return jsonify({"error": "Unauthorized access to citation"}), 403
+
+            return build_citation_response(chunk)
+
+        try:
+            search_client_user = CLIENTS['search_client_user']
+            return get_citation_for_scope(search_client_user, 'personal')
+
         except ResourceNotFoundError:
             pass
 
         try:
             search_client_group = CLIENTS['search_client_group']
-            group_chunk = search_client_group.get_document(key=citation_id)
-
-            return jsonify({
-                "cited_text": group_chunk.get("chunk_text", ""),
-                "file_name": group_chunk.get("file_name", ""),
-                "page_number": group_chunk.get("chunk_sequence", 0)
-            }), 200
+            return get_citation_for_scope(search_client_group, 'group')
 
         except ResourceNotFoundError:
             pass
         
         try:
             search_client_public = CLIENTS['search_client_public']
-            public_chunk = search_client_public.get_document(key=citation_id)
-
-            return jsonify({
-                "cited_text": public_chunk.get("chunk_text", ""),
-                "file_name": public_chunk.get("file_name", ""),
-                "page_number": public_chunk.get("chunk_sequence", 0)
-            }), 200
+            return get_citation_for_scope(search_client_public, 'public')
         
         except ResourceNotFoundError:
             return jsonify({"error": "Citation not found in user, group, or public docs"}), 404
diff --git a/application/single_app/route_backend_group_documents.py b/application/single_app/route_backend_group_documents.py
index 957c3ee4..d8f00a04 100644
--- a/application/single_app/route_backend_group_documents.py
+++ b/application/single_app/route_backend_group_documents.py
@@ -277,34 +277,26 @@ def api_get_group_documents():
 
         where_clause = " AND ".join(query_conditions)
 
-        # --- 3) Get total count ---
-        try:
-            count_query_str = f"SELECT VALUE COUNT(1) FROM c WHERE {where_clause}"
-            count_items = list(cosmos_group_documents_container.query_items(
-                query=count_query_str,
-                parameters=query_params,
-                enable_cross_partition_query=True
-            ))
-            total_count = count_items[0] if count_items else 0
-        except Exception as e:
-            print(f"Error executing count query for group: {e}")
-            return jsonify({"error": f"Error counting documents: {str(e)}"}), 500
-
-        # --- 4) Get paginated data ---
+        # --- 3) Query matching documents, then collapse to current revisions before paginating ---
         try:
             offset = (page - 1) * page_size
             data_query_str = f"""
                 SELECT *
                 FROM c
                 WHERE {where_clause}
-                ORDER BY c.{sort_by} {sort_order}
-                OFFSET {offset} LIMIT {page_size}
             """
-            docs = list(cosmos_group_documents_container.query_items(
+            matching_docs = list(cosmos_group_documents_container.query_items(
                 query=data_query_str,
                 parameters=query_params,
                 enable_cross_partition_query=True
             ))
+            current_docs = sort_documents(
+                select_current_documents(matching_docs),
+                sort_by=sort_by,
+                sort_order=sort_order,
+            )
+            total_count = len(current_docs)
+            docs = current_docs[offset:offset + page_size]
         except Exception as e:
             print(f"Error fetching group documents: {e}")
             return jsonify({"error": f"Error fetching documents: {str(e)}"}), 500
@@ -570,14 +562,25 @@ def api_delete_group_document(document_id):
         if role not in ["Owner", "Admin", "DocumentManager"]:
             return jsonify({'error': 'You do not have permission to delete documents in this group'}), 403
 
+        delete_mode = request.args.get('delete_mode', 'all_versions')
+        if delete_mode not in {'all_versions', 'current_only'}:
+            return jsonify({'error': 'Invalid delete mode'}), 400
+
         try:
-            delete_document(user_id=user_id, document_id=document_id, group_id=active_group_id)
-            delete_document_chunks(document_id=document_id, group_id=active_group_id)
+            delete_result = delete_document_revision(
+                user_id=user_id,
+                document_id=document_id,
+                delete_mode=delete_mode,
+                group_id=active_group_id,
+            )
             
             # Invalidate group search cache since document was deleted
             invalidate_group_search_cache(active_group_id)
             
-            return jsonify({'message': 'Group document deleted successfully'}), 200
+            return jsonify({
+                'message': 'Group document deleted successfully',
+                **delete_result,
+            }), 200
         except Exception as e:
             return jsonify({'error': f'Error deleting group document: {str(e)}'}), 500
 
diff --git a/application/single_app/route_backend_public_documents.py b/application/single_app/route_backend_public_documents.py
index dab2bdb8..3b7486bd 100644
--- a/application/single_app/route_backend_public_documents.py
+++ b/application/single_app/route_backend_public_documents.py
@@ -207,18 +207,17 @@ def api_list_public_documents():
 
         where = ' AND '.join(conds)
 
-        # count
-        count_q = f'SELECT VALUE COUNT(1) FROM c WHERE {where}'
-        total = list(cosmos_public_documents_container.query_items(
-            query=count_q, parameters=params, enable_cross_partition_query=True
-        ))
-        total_count = total[0] if total else 0
-
-        # data
-        data_q = f'SELECT * FROM c WHERE {where} ORDER BY c.{sort_by} {sort_order} OFFSET {offset} LIMIT {page_size}'
-        docs = list(cosmos_public_documents_container.query_items(
+        data_q = f'SELECT * FROM c WHERE {where}'
+        matching_docs = list(cosmos_public_documents_container.query_items(
             query=data_q, parameters=params, enable_cross_partition_query=True
         ))
+        current_docs = sort_documents(
+            select_current_documents(matching_docs),
+            sort_by=sort_by,
+            sort_order=sort_order,
+        )
+        total_count = len(current_docs)
+        docs = current_docs[offset:offset + page_size]
 
         # legacy
         legacy_q = 'SELECT VALUE COUNT(1) FROM c WHERE c.public_workspace_id = @ws AND NOT IS_DEFINED(c.percentage_complete)'
@@ -284,8 +283,7 @@ def api_list_public_workspace_documents():
             enable_cross_partition_query=True
         ))
 
-        # Limit results to page_size
-        docs = docs[:page_size]
+        docs = sort_documents(select_current_documents(docs))[:page_size]
 
         return jsonify({
             'documents': docs,
@@ -404,14 +402,21 @@ def api_delete_public_document(doc_id):
         role = get_user_role_in_public_workspace(ws_doc, user_id) if ws_doc else None
         if role not in ['Owner','Admin','DocumentManager']:
             return jsonify({'error':'Access denied'}), 403
+        delete_mode = request.args.get('delete_mode', 'all_versions')
+        if delete_mode not in {'all_versions', 'current_only'}:
+            return jsonify({'error': 'Invalid delete mode'}), 400
         try:
-            delete_document(user_id=user_id, document_id=doc_id, public_workspace_id=active_ws)
-            delete_document_chunks(document_id=doc_id, public_workspace_id=active_ws)
+            delete_result = delete_document_revision(
+                user_id=user_id,
+                document_id=doc_id,
+                delete_mode=delete_mode,
+                public_workspace_id=active_ws,
+            )
             
             # Invalidate public workspace search cache since document was deleted
             invalidate_public_workspace_search_cache(active_ws)
             
-            return jsonify({'message':'Deleted'}), 200
+            return jsonify({'message':'Deleted', **delete_result}), 200
         except Exception as e:
             return jsonify({'error':str(e)}), 500
 
diff --git a/application/single_app/route_enhanced_citations.py b/application/single_app/route_enhanced_citations.py
index 60675f41..29de8313 100644
--- a/application/single_app/route_enhanced_citations.py
+++ b/application/single_app/route_enhanced_citations.py
@@ -12,15 +12,98 @@
 
 from functions_authentication import login_required, user_required, get_current_user_id
 from functions_settings import get_settings, enabled_required
-from functions_documents import get_document_metadata
+from functions_documents import get_document_metadata, get_document_blob_storage_info
 from functions_group import get_user_groups
 from functions_public_workspaces import get_user_visible_public_workspace_ids_from_settings
 from swagger_wrapper import swagger_route, get_auth_security
 from config import CLIENTS, storage_account_user_documents_container_name, storage_account_group_documents_container_name, storage_account_public_documents_container_name, storage_account_personal_chat_container_name, IMAGE_EXTENSIONS, VIDEO_EXTENSIONS, AUDIO_EXTENSIONS, TABULAR_EXTENSIONS, cosmos_messages_container, cosmos_conversations_container
 from functions_debug import debug_print
 
+
+def _sanitize_tabular_preview_value(value):
+    """Convert one pandas preview value into a JSON-safe display string ('' for None/NA)."""
+    if hasattr(value, 'item') and not isinstance(value, (str, bytes)):  # presumably unwraps numpy scalars -- TODO confirm
+        try:
+            value = value.item()
+        except (TypeError, ValueError):
+            pass  # keep the original value when .item() cannot convert it
+    # None is rendered as an empty string.
+    if value is None:
+        return ''
+    # Scalar missing values (as judged by pandas.isna) are also rendered as an empty string.
+    if pandas.api.types.is_scalar(value):
+        try:
+            if pandas.isna(value):
+                return ''
+        except (TypeError, ValueError):
+            pass
+    # Bytes are decoded as UTF-8, with undecodable bytes replaced instead of raising.
+    if isinstance(value, bytes):
+        return value.decode('utf-8', errors='replace')
+    # Objects exposing isoformat() are rendered via it (presumably dates/timestamps -- TODO confirm).
+    if hasattr(value, 'isoformat') and not isinstance(value, str):
+        try:
+            return value.isoformat()
+        except TypeError:
+            pass
+    # Everything else falls back to its str() form.
+    return str(value)
+
+
+def _serialize_tabular_preview_table(df_preview):
+    """Return (columns, rows) for df_preview, passing every header and cell through _sanitize_tabular_preview_value."""
+    columns = [
+        _sanitize_tabular_preview_value(column)
+        for column in df_preview.columns.tolist()
+    ]
+    rows = [
+        [_sanitize_tabular_preview_value(cell) for cell in row]  # each row becomes a list of sanitized cells
+        for row in df_preview.itertuples(index=False, name=None)  # plain tuples with the index excluded
+    ]
+    return columns, rows
+
 def register_enhanced_citations_routes(app):
     """Register enhanced citations routes"""
+
+    @app.route("/api/enhanced_citations/document_metadata", methods=["GET"])
+    @swagger_route(security=get_auth_security())
+    @login_required
+    @user_required
+    @enabled_required("enable_enhanced_citations")
+    def get_enhanced_citation_document_metadata():
+        """
+        Return minimal document metadata for an exact historical or current doc_id.
+        This lets the chat UI render enhanced citations even when the cited
+        document revision is not part of the currently loaded workspace list.
+        """
+        doc_id = request.args.get("doc_id")  # read from the query string
+        if not doc_id:
+            return jsonify({"error": "doc_id is required"}), 400
+
+        user_id = get_current_user_id()
+        if not user_id:
+            return jsonify({"error": "User not authenticated"}), 401
+        # NOTE(review): get_document is not among the imports shown in this hunk -- confirm it is defined in this module.
+        try:
+            doc_response, status_code = get_document(user_id, doc_id)
+            if status_code != 200:
+                return doc_response, status_code  # pass the lookup's non-200 response through unchanged
+            # Success: unpack the JSON body and resolve blob storage info; only the blob path is used here.
+            raw_doc = doc_response.get_json()
+            _, blob_path = get_document_blob_storage_info(raw_doc)
+            # "enhanced_citations" is True only when a blob path was resolved for this document.
+            return jsonify({
+                "id": raw_doc.get("id"),
+                "document_id": raw_doc.get("id"),  # same value as "id"
+                "file_name": raw_doc.get("file_name"),
+                "version": raw_doc.get("version"),
+                "is_current_version": raw_doc.get("is_current_version"),
+                "enhanced_citations": bool(blob_path),
+            }), 200
+
+        except Exception as e:  # any failure above is logged and returned as a 500 with the error text
+            debug_print(f"Error getting enhanced citation document metadata: {e}")
+            return jsonify({"error": str(e)}), 500
     
     @app.route("/api/enhanced_citations/image", methods=["GET"])
     @swagger_route(security=get_auth_security())
@@ -435,6 +518,7 @@ def get_enhanced_citation_tabular_preview():
             total_rows = len(df)
             truncated = total_rows > max_rows
             preview = df.head(max_rows)
+            columns, rows = _serialize_tabular_preview_table(preview)
 
             return jsonify({
                 "filename": file_name,
@@ -443,8 +527,8 @@ def get_enhanced_citation_tabular_preview():
                 "sheet_count": len(sheet_names),
                 "total_rows": total_rows if not truncated else None,
                 "total_columns": len(df.columns),
-                "columns": list(df.columns),
-                "rows": preview.values.tolist(),
+                "columns": columns,
+                "rows": rows,
                 "truncated": truncated
             })
 
@@ -513,16 +597,20 @@ def determine_workspace_type_and_container(raw_doc):
     Determine workspace type and appropriate container based on document metadata
     """
     if raw_doc.get('public_workspace_id'):
-        return 'public', storage_account_public_documents_container_name
+        return 'public', raw_doc.get('blob_container') or storage_account_public_documents_container_name
     elif raw_doc.get('group_id'):
-        return 'group', storage_account_group_documents_container_name
+        return 'group', raw_doc.get('blob_container') or storage_account_group_documents_container_name
     else:
-        return 'personal', storage_account_user_documents_container_name
+        return 'personal', raw_doc.get('blob_container') or storage_account_user_documents_container_name
 
 def get_blob_name(raw_doc, workspace_type):
     """
     Determine the correct blob name based on workspace type
     """
+    _, blob_name = get_document_blob_storage_info(raw_doc)
+    if blob_name:
+        return blob_name
+
     if workspace_type == 'public':
         return f"{raw_doc['public_workspace_id']}/{raw_doc['file_name']}"
     elif workspace_type == 'group':
diff --git a/application/single_app/route_external_public_documents.py b/application/single_app/route_external_public_documents.py
index 67bcbafa..88b496cc 100644
--- a/application/single_app/route_external_public_documents.py
+++ b/application/single_app/route_external_public_documents.py
@@ -181,34 +181,22 @@ def external_get_public_documents():
 
         where_clause = " AND ".join(query_conditions)
 
-        # --- 3) Get total count ---
-        try:
-            count_query_str = f"SELECT VALUE COUNT(1) FROM c WHERE {where_clause}"
-            count_items = list(cosmos_public_documents_container.query_items(
-                query=count_query_str,
-                parameters=query_params,
-                enable_cross_partition_query=True
-            ))
-            total_count = count_items[0] if count_items else 0
-        except Exception as e:
-            print(f"Error executing count query for public: {e}")
-            return jsonify({"error": f"Error counting documents: {str(e)}"}), 500
-
-        # --- 4) Get paginated data ---
+        # --- 3) Query matching documents, then collapse to current revisions before paginating ---
         try:
             offset = (page - 1) * page_size
             data_query_str = f"""
                 SELECT *
                 FROM c
                 WHERE {where_clause}
-                ORDER BY c._ts DESC
-                OFFSET {offset} LIMIT {page_size}
             """
-            docs = list(cosmos_public_documents_container.query_items(
+            matching_docs = list(cosmos_public_documents_container.query_items(
                 query=data_query_str,
                 parameters=query_params,
                 enable_cross_partition_query=True
             ))
+            current_docs = sort_documents(select_current_documents(matching_docs))
+            total_count = len(current_docs)
+            docs = current_docs[offset:offset + page_size]
         except Exception as e:
             print(f"Error fetching public documents: {e}")
             return jsonify({"error": f"Error fetching documents: {str(e)}"}), 500
@@ -398,11 +386,22 @@ def external_delete_public_document(document_id):
         """
         user_id = request.args.get('user_id')
         active_workspace_id = request.args.get('active_workspace_id')
+        delete_mode = request.args.get('delete_mode', 'all_versions')
+
+        if delete_mode not in {'all_versions', 'current_only'}:
+            return jsonify({'error': 'Invalid delete mode'}), 400
 
         try:
-            delete_document(user_id=user_id, document_id=document_id, public_workspace_id=active_workspace_id)
-            delete_document_chunks(document_id=document_id, public_workspace_id=active_workspace_id)
-            return jsonify({'message': 'Public document deleted successfully'}), 200
+            delete_result = delete_document_revision(
+                user_id=user_id,
+                document_id=document_id,
+                delete_mode=delete_mode,
+                public_workspace_id=active_workspace_id,
+            )
+            return jsonify({
+                'message': 'Public document deleted successfully',
+                **delete_result,
+            }), 200
         except Exception as e:
             return jsonify({'error': f'Error deleting public document: {str(e)}'}), 500
 
diff --git a/application/single_app/route_frontend_conversations.py b/application/single_app/route_frontend_conversations.py
index 4ffc2371..d2b428fe 100644
--- a/application/single_app/route_frontend_conversations.py
+++ b/application/single_app/route_frontend_conversations.py
@@ -4,7 +4,10 @@
 from functions_authentication import *
 from functions_debug import debug_print
 from functions_chat import sort_messages_by_thread
-from functions_message_artifacts import filter_assistant_artifact_items
+from functions_message_artifacts import (
+    build_message_artifact_payload_map,
+    filter_assistant_artifact_items,
+)
 from swagger_wrapper import swagger_route, get_auth_security
 
 def register_route_frontend_conversations(app):
@@ -193,6 +196,42 @@ def get_conversation_messages(conversation_id):
 
         return jsonify({'messages': messages})
 
+    @app.route('/api/conversation/<conversation_id>/agent-citation/<artifact_id>', methods=['GET'])
+    @swagger_route(security=get_auth_security())
+    @login_required
+    @user_required
+    def get_agent_citation_artifact(conversation_id, artifact_id):  # Return the 'citation' payload of one artifact in a conversation.
+        user_id = get_current_user_id()
+        if not user_id:
+            return jsonify({'error': 'User not authenticated'}), 401
+        # Load the conversation first so ownership is checked before any messages are read.
+        try:
+            conversation = cosmos_conversations_container.read_item(
+                item=conversation_id,
+                partition_key=conversation_id,
+            )
+        except CosmosResourceNotFoundError:
+            return jsonify({'error': 'Conversation not found'}), 404
+        # Only the user recorded on the conversation may read its artifacts.
+        if conversation.get('user_id') != user_id:
+            return jsonify({'error': 'Unauthorized access to conversation'}), 403
+        # Fetch every message of the conversation, then look the artifact up by its string id.
+        conversation_messages = list(cosmos_messages_container.query_items(
+            query="SELECT * FROM c WHERE c.conversation_id = @conversation_id",
+            parameters=[{'name': '@conversation_id', 'value': conversation_id}],
+            partition_key=conversation_id,
+        ))
+        artifact_payload_map = build_message_artifact_payload_map(conversation_messages)
+        artifact_payload = artifact_payload_map.get(str(artifact_id or ''))
+        if not isinstance(artifact_payload, dict):  # missing entry or non-dict payload
+            return jsonify({'error': 'Agent citation artifact not found'}), 404
+        # A payload without a 'citation' entry is reported as its own 404.
+        citation = artifact_payload.get('citation')
+        if citation is None:
+            return jsonify({'error': 'Agent citation payload not found'}), 404
+
+        return jsonify({'citation': citation})
+
     @app.route('/api/message/<message_id>/metadata', methods=['GET'])
     @swagger_route(security=get_auth_security())
     @login_required
diff --git a/application/single_app/semantic_kernel_plugins/plugin_invocation_logger.py b/application/single_app/semantic_kernel_plugins/plugin_invocation_logger.py
index 7dd66517..dea35f22 100644
--- a/application/single_app/semantic_kernel_plugins/plugin_invocation_logger.py
+++ b/application/single_app/semantic_kernel_plugins/plugin_invocation_logger.py
@@ -60,6 +60,102 @@ def to_json(self) -> str:
         return json.dumps(self.to_dict(), default=str, indent=2)
 
 
+def _compact_plugin_log_value(value: Any, max_length: int = 160) -> Any:
+    """Return a bounded, logging-safe copy of value: text cut at max_length, at most 5 list items and 8 dict keys."""
+    if value is None or isinstance(value, (int, float, bool)):
+        return value  # scalars are already compact, pass them through unchanged
+
+    if isinstance(value, str):
+        return value if len(value) <= max_length else f"{value[:max_length]}... [truncated]"
+
+    if isinstance(value, list):
+        compact_items = [_compact_plugin_log_value(item, max_length=max_length) for item in value[:5]]
+        if len(value) > 5:
+            compact_items.append({'remaining_items': len(value) - 5})  # marker entry for the dropped tail
+        return compact_items
+
+    if isinstance(value, dict):
+        compact_mapping = {}
+        for index, (key, item) in enumerate(value.items()):
+            if index >= 8:
+                compact_mapping['remaining_keys'] = len(value) - 8  # number of keys left out
+                break
+            compact_mapping[str(key)] = _compact_plugin_log_value(item, max_length=max_length)
+        return compact_mapping
+    # Any other type (tuple, set, custom object, ...) is stringified, then bounded like ordinary text.
+    return _compact_plugin_log_value(str(value), max_length=max_length)
+
+
+def _build_plugin_result_logging_payload(plugin_name: str, function_name: str, result: Any) -> tuple:
+    """Return (result_preview, result_summary): a 200-char text preview plus an optional dict summary for tabular results."""
+    result_str = str(result)
+    result_preview = result_str[:200] + "..." if len(result_str) > 200 else result_str
+    result_summary = None  # stays None unless a structured summary can be built below
+
+    if plugin_name != 'TabularProcessingPlugin' or result is None:
+        return result_preview, result_summary  # only TabularProcessingPlugin results get a summary
+
+    try:
+        result_payload = json.loads(result) if isinstance(result, str) else result
+    except Exception:
+        return result_preview, result_summary  # non-JSON text: fall back to the preview alone
+
+    if not isinstance(result_payload, dict):
+        return result_preview, result_summary
+
+    summary = {}
+    key_names = (  # payload keys copied into the summary when present
+        'filename',
+        'selected_sheet',
+        'column',
+        'search_value',
+        'search_operator',
+        'searched_columns',
+        'matched_columns',
+        'return_columns',
+        'lookup_column',
+        'target_column',
+        'operation',
+        'filter_applied',
+        'normalize_match',
+        'extract_mode',
+        'extract_pattern',
+        'url_path_segments',
+        'distinct_count',
+        'returned_values',
+        'row_count',
+        'rows_scanned',
+        'total_matches',
+        'returned_rows',
+        'matched_cell_count',
+        'extracted_match_count',
+        'sheets_searched',
+        'sheets_matched',
+        'source_sheet',
+        'target_sheet',
+        'relationship_type',
+        'source_cohort_size',
+        'matched_target_row_count',
+        'result',
+        'error',
+    )
+    for key_name in key_names:
+        if key_name in result_payload:
+            summary[key_name] = _compact_plugin_log_value(result_payload.get(key_name))
+
+    if isinstance(result_payload.get('values'), list):
+        summary['values_sample'] = _compact_plugin_log_value(result_payload['values'][:5])
+        summary['values_sample_limited'] = len(result_payload['values']) > 5  # True when values were left out of the sample
+
+    if isinstance(result_payload.get('data'), list):
+        summary['data_sample_count'] = min(len(result_payload['data']), 5)  # a count only; row contents are not logged here
+
+    if summary:
+        result_summary = summary  # an empty summary is reported as None
+
+    return result_preview, result_summary
+
+
 class PluginInvocationLogger:
     """Centralized logger for all Semantic Kernel plugin invocations."""
     
@@ -127,8 +223,14 @@ def _log_to_terminal(self, invocation: PluginInvocation):
             
             if invocation.success:
                 if invocation.result:
-                    result_str = str(invocation.result)
-                    log_data["result_preview"] = result_str[:200] + "..." if len(result_str) > 200 else result_str
+                    result_preview, result_summary = _build_plugin_result_logging_payload(
+                        invocation.plugin_name,
+                        invocation.function_name,
+                        invocation.result,
+                    )
+                    log_data["result_preview"] = result_preview
+                    if result_summary:
+                        log_data["result_summary"] = result_summary
                     log_data["result_type"] = type(invocation.result).__name__
                 
                 log_event(f"Plugin function executed successfully", 
@@ -175,11 +277,17 @@ def _log_to_appinsights(self, invocation: PluginInvocation):
             
             # Add sanitized result
             if invocation.result is not None:
-                result_str = str(invocation.result)
-                if len(result_str) > 500:
-                    log_data["result_preview"] = f"{result_str[:500]}... [truncated]"
+                result_preview, result_summary = _build_plugin_result_logging_payload(
+                    invocation.plugin_name,
+                    invocation.function_name,
+                    invocation.result,
+                )
+                if len(str(invocation.result)) > 500:
+                    log_data["result_preview"] = f"{result_preview[:500]}... [truncated]"
                 else:
-                    log_data["result_preview"] = result_str
+                    log_data["result_preview"] = result_preview
+                if result_summary:
+                    log_data["result_summary"] = result_summary
             
             log_event(
                 f"[Plugin Invocation] {invocation.plugin_name}.{invocation.function_name}",
@@ -487,13 +595,18 @@ def _log_parameters(function_name: str, parameters: Dict[str, Any]):
             )
 
         def _log_success(function_name: str, result: Any, duration_ms: float):
-            result_preview = str(result)[:200] + "..." if len(str(result)) > 200 else str(result)
+            result_preview, result_summary = _build_plugin_result_logging_payload(
+                plugin_name,
+                function_name,
+                result,
+            )
             log_event(
                 f"[Plugin Function Logger] Function completed successfully",
                 extra={
                     "plugin_name": plugin_name,
                     "function_name": function_name,
                     "result_preview": result_preview,
+                    "result_summary": result_summary,
                     "duration_ms": duration_ms,
                     "full_function_name": f"{plugin_name}.{function_name}"
                 },
diff --git a/application/single_app/semantic_kernel_plugins/tabular_processing_plugin.py b/application/single_app/semantic_kernel_plugins/tabular_processing_plugin.py
index cf7fc663..344d092a 100644
--- a/application/single_app/semantic_kernel_plugins/tabular_processing_plugin.py
+++ b/application/single_app/semantic_kernel_plugins/tabular_processing_plugin.py
@@ -16,6 +16,7 @@
 import warnings
 import pandas
 from typing import Annotated, Dict, List, Optional, Set
+from urllib.parse import urlsplit, urlunsplit
 from semantic_kernel.functions import kernel_function
 from semantic_kernel_plugins.plugin_invocation_logger import plugin_function_logger
 from functions_appinsights import log_event
@@ -43,6 +44,7 @@ class TabularProcessingPlugin:
         'count_rows',
         'aggregate_column',
         'filter_rows',
+        'search_rows',
         'query_tabular_data',
         'filter_rows_by_related_values',
         'count_rows_by_related_values',
@@ -110,6 +112,7 @@ def __init__(self):
         self._blob_data_cache = {}  # Per-instance cache: (container, blob_name) -> raw bytes
         self._workbook_metadata_cache = {}  # Per-instance cache: (container, blob_name) -> workbook metadata
         self._default_sheet_overrides = {}  # (container, blob_name) -> default sheet name
+        self._resolved_blob_location_overrides = {}  # (source, filename) -> (container, blob_name)
 
     @classmethod
     def get_discovery_function_names(cls):
@@ -130,6 +133,53 @@ def set_default_sheet(self, container_name: str, blob_name: str, sheet_name: str
         """Set the default sheet for a workbook so the model doesn't need to specify it."""
         self._default_sheet_overrides[(container_name, blob_name)] = sheet_name
 
+    def remember_resolved_blob_location(self, source: str, filename: str, container_name: str, blob_name: str):
+        """Record where filename lives so later lookups by source and filename can reuse (container_name, blob_name)."""
+        file_key = str(filename or '').strip()
+        if not file_key:
+            return
+
+        blob_location = (container_name, blob_name)
+        explicit_source = str(source or '').strip().lower()
+        inferred_source = self._infer_source_from_container(container_name)
+        # Register under the caller's source label and under the label implied by the container; blank labels are skipped.
+        for source_key in (explicit_source, inferred_source):
+            if source_key:
+                self._resolved_blob_location_overrides[(source_key, file_key)] = blob_location
+
+    def _infer_source_from_container(self, container_name: str) -> Optional[str]:
+        """Map a backing blob container name to its logical source label, or None when it is not recognized."""
+        container_sources = (
+            (storage_account_user_documents_container_name, 'workspace'),
+            (storage_account_personal_chat_container_name, 'chat'),
+            (storage_account_group_documents_container_name, 'group'),
+            (storage_account_public_documents_container_name, 'public'),
+        )
+        # Entries are checked top to bottom and the first equal container name wins.
+        matches = (label for known_name, label in container_sources if container_name == known_name)
+        return next(matches, None)
+
+    def _get_resolved_blob_location_override(self, source: str, filename: str) -> Optional[tuple]:
+        """Return the remembered (container_name, blob_name) for source/filename, or None when unknown or ambiguous."""
+        normalized_filename = str(filename or '').strip()
+        if not normalized_filename:
+            return None
+
+        normalized_source = str(source or '').strip().lower()
+        exact_match = self._resolved_blob_location_overrides.get((normalized_source, normalized_filename))
+        if exact_match:
+            return exact_match
+
+        filename_matches = {  # a set, so one location remembered under several source keys counts once
+            blob_location
+            for (_, override_filename), blob_location in self._resolved_blob_location_overrides.items()
+            if override_filename == normalized_filename
+        }
+        if len(filename_matches) == 1:
+            return next(iter(filename_matches))  # filename maps to exactly one distinct location
+
+        return None
+
     def _get_blob_service_client(self):
         """Get the blob service client from CLIENTS cache."""
         client = CLIENTS.get("storage_account_office_docs_client")
@@ -214,14 +264,12 @@ def _resolve_sheet_selection(
         if not available_sheets:
             raise ValueError(f"Workbook '{blob_name}' does not contain any readable sheets.")
 
+        matched_sheet_name = self._match_workbook_sheet_name(sheet_name, available_sheets)
+        if matched_sheet_name:
+            return matched_sheet_name, workbook_metadata
+
         normalized_sheet_name = (sheet_name or '').strip()
         if normalized_sheet_name:
-            for candidate in available_sheets:
-                if candidate == normalized_sheet_name:
-                    return candidate, workbook_metadata
-            for candidate in available_sheets:
-                if candidate.lower() == normalized_sheet_name.lower():
-                    return candidate, workbook_metadata
             raise ValueError(
                 f"Sheet '{normalized_sheet_name}' was not found in workbook '{blob_name}'. "
                 f"Available sheets: {available_sheets}."
@@ -250,9 +298,9 @@ def _resolve_sheet_selection(
         override_key = (container_name, blob_name)
         if override_key in self._default_sheet_overrides:
             override_sheet = self._default_sheet_overrides[override_key]
-            for candidate in available_sheets:
-                if candidate == override_sheet or candidate.lower() == override_sheet.lower():
-                    return candidate, workbook_metadata
+            matched_override_sheet = self._match_workbook_sheet_name(override_sheet, available_sheets)
+            if matched_override_sheet:
+                return matched_override_sheet, workbook_metadata
 
         if require_explicit_sheet:
             raise ValueError(
@@ -262,6 +310,34 @@ def _resolve_sheet_selection(
 
         return workbook_metadata.get('default_sheet'), workbook_metadata
 
+    def _match_workbook_sheet_name(self, requested_sheet_name: Optional[str], available_sheets: List[str]) -> Optional[str]:
+        """Resolve a requested sheet name to an available sheet, tolerating surrounding whitespace and case differences."""
+        requested_raw = None if requested_sheet_name is None else str(requested_sheet_name)
+        requested_trimmed = (requested_raw or '').strip()
+        if not requested_trimmed:
+            return None
+
+        requested_raw_folded = (requested_raw or '').casefold()
+        requested_trimmed_folded = requested_trimmed.casefold()
+
+        # Comparison tiers, strictest first. Each tier is tried against every sheet before
+        # a looser one is considered, so an exact hit always beats a whitespace- or
+        # case-tolerant hit regardless of sheet order.
+        match_tiers = (
+            lambda name: name == requested_raw,
+            lambda name: name.strip() == requested_trimmed,
+            lambda name: name.casefold() == requested_raw_folded,
+            lambda name: name.strip().casefold() == requested_trimmed_folded,
+        )
+
+        for is_match in match_tiers:
+            for sheet in available_sheets:
+                if is_match(sheet):
+                    return sheet
+
+        # No tier produced a match.
+        return None
+
     def _filter_rows_across_sheets(
         self,
         container_name: str,
@@ -270,6 +346,9 @@ def _filter_rows_across_sheets(
         column: str,
         operator_str: str,
         value: str,
+        additional_filter_column: Optional[str] = None,
+        additional_filter_operator: str = 'equals',
+        additional_filter_value=None,
         normalize_match: bool = False,
         max_rows: int = 100,
     ) -> Optional[str]:
@@ -302,18 +381,23 @@ def _filter_rows_across_sheets(
             if column not in df.columns:
                 continue
 
-            sheets_searched.append(sheet)
             try:
-                mask = self._build_series_match_mask(
-                    df[column],
-                    operator_str,
-                    value,
+                filtered_df, applied_filters = self._apply_optional_dataframe_filters(
+                    df,
+                    filter_column=column,
+                    filter_operator=operator_str,
+                    filter_value=value,
+                    additional_filter_column=additional_filter_column,
+                    additional_filter_operator=additional_filter_operator,
+                    additional_filter_value=additional_filter_value,
                     normalize_match=normalize_match,
                 )
-            except ValueError:
+            except (KeyError, ValueError):
                 continue
 
-            sheet_matches = int(mask.sum())
+            sheets_searched.append(sheet)
+
+            sheet_matches = len(filtered_df)
             if sheet_matches == 0:
                 continue
 
@@ -321,7 +405,7 @@ def _filter_rows_across_sheets(
             total_matches += sheet_matches
             remaining_capacity = max(0, max_rows - len(combined_results))
             if remaining_capacity > 0:
-                filtered = df[mask].head(remaining_capacity)
+                filtered = filtered_df.head(remaining_capacity)
                 for row in filtered.to_dict(orient='records'):
                     row['_sheet'] = sheet
                     combined_results.append(row)
@@ -342,11 +426,164 @@ def _filter_rows_across_sheets(
             "selected_sheet": "ALL (cross-sheet search)",
             "sheets_searched": sheets_searched,
             "sheets_matched": sheets_matched,
+            "filter_applied": applied_filters,
             "total_matches": total_matches,
             "returned_rows": len(combined_results),
             "data": combined_results,
         }, indent=2, default=str)
 
+    def _search_rows_across_sheets(
+        self,
+        container_name: str,
+        blob_name: str,
+        filename: str,
+        search_value: str,
+        search_columns=None,
+        search_operator: str = 'contains',
+        return_columns=None,
+        query_expression: Optional[str] = None,
+        filter_column: Optional[str] = None,
+        filter_operator: str = 'equals',
+        filter_value=None,
+        additional_filter_column: Optional[str] = None,
+        additional_filter_operator: str = 'equals',
+        additional_filter_value=None,
+        normalize_match: bool = False,
+        max_rows: int = 100,
+    ) -> Optional[str]:
+        """Search each worksheet of a multi-sheet workbook; return one JSON string (results or error), or None if not applicable."""
+        workbook_metadata = self._get_workbook_metadata(container_name, blob_name)
+        if not workbook_metadata.get('is_workbook'):
+            return None  # metadata does not flag this blob as a workbook
+
+        available_sheets = workbook_metadata.get('sheet_names', [])
+        if len(available_sheets) <= 1:
+            return None  # zero or one sheet: there is nothing to search across
+
+        requested_search_columns = self._parse_optional_column_list_argument(search_columns)
+        requested_return_columns = self._parse_optional_column_list_argument(return_columns)
+        combined_results = []
+        sheets_searched = []
+        sheets_matched = []
+        total_matches = 0
+        applied_filters = []
+        searched_columns = []
+        seen_searched_columns = set()  # lower-cased names, used to de-duplicate across sheets
+        matched_columns = []
+        seen_matched_columns = set()  # lower-cased names, used to de-duplicate across sheets
+
+        for sheet in available_sheets:
+            df = self._read_tabular_blob_to_dataframe(
+                container_name,
+                blob_name,
+                sheet_name=sheet,
+            )
+            df = self._try_numeric_conversion(df)
+
+            try:
+                filtered_df, sheet_filters = self._apply_optional_dataframe_filters(
+                    df,
+                    query_expression=query_expression,
+                    filter_column=filter_column,
+                    filter_operator=filter_operator,
+                    filter_value=filter_value,
+                    additional_filter_column=additional_filter_column,
+                    additional_filter_operator=additional_filter_operator,
+                    additional_filter_value=additional_filter_value,
+                    normalize_match=normalize_match,
+                )
+            except KeyError:
+                continue  # skip this sheet; presumably a filter column is missing on it (confirm against the helper)
+            except Exception as query_error:
+                return json.dumps({
+                    'error': f"Query/filter error: {query_error}",
+                    'filename': filename,
+                    'selected_sheet': 'ALL (cross-sheet search)',
+                }, indent=2, default=str)
+
+            remaining_capacity = max(0, max_rows - len(combined_results))
+            if remaining_capacity <= 0:
+                break  # row budget used up: this and later sheets are not searched or counted in total_matches
+
+            try:
+                search_result = self._search_dataframe_rows(
+                    filtered_df,
+                    search_value=search_value,
+                    search_columns=requested_search_columns,
+                    search_operator=search_operator,
+                    return_columns=requested_return_columns,
+                    normalize_match=normalize_match,
+                    max_rows=remaining_capacity,
+                )
+            except KeyError:
+                continue  # skip this sheet; presumably a requested column is missing on it (confirm against the helper)
+            except ValueError as search_error:
+                return json.dumps({
+                    'error': str(search_error),
+                    'filename': filename,
+                    'selected_sheet': 'ALL (cross-sheet search)',
+                }, indent=2, default=str)
+
+            sheets_searched.append(sheet)
+            applied_filters = sheet_filters or applied_filters  # keep the most recent non-empty filter description
+            for column_name in search_result['searched_columns']:
+                lowered_name = str(column_name).lower()
+                if lowered_name in seen_searched_columns:
+                    continue
+                seen_searched_columns.add(lowered_name)
+                searched_columns.append(column_name)
+
+            sheet_match_count = int(search_result['total_matches'])
+            total_matches += sheet_match_count
+            if sheet_match_count > 0:
+                sheets_matched.append(sheet)
+
+            for column_name in search_result['matched_columns']:
+                lowered_name = str(column_name).lower()
+                if lowered_name in seen_matched_columns:
+                    continue
+                seen_matched_columns.add(lowered_name)
+                matched_columns.append(column_name)
+
+            for row in search_result['data']:
+                row['_sheet'] = sheet  # tag each returned row with the sheet it came from
+                combined_results.append(row)
+
+        if not sheets_searched:
+            if requested_search_columns:
+                return json.dumps({
+                    'error': 'None of the requested search_columns were found on any worksheet during cross-sheet search.',
+                    'filename': filename,
+                    'selected_sheet': 'ALL (cross-sheet search)',
+                    'search_columns': requested_search_columns,
+                }, indent=2, default=str)
+            return None  # no sheet could be searched and no explicit columns were requested
+
+        log_event(
+            f"[TabularProcessingPlugin] Cross-sheet search_rows: "
+            f"searched {len(sheets_searched)} sheets, "
+            f"matched on {len(sheets_matched)} ({sheets_matched}), "
+            f"total_matches={total_matches}",
+            level=logging.INFO,
+        )
+
+        return json.dumps({
+            'filename': filename,
+            'selected_sheet': 'ALL (cross-sheet search)',
+            'search_value': search_value,
+            'search_operator': search_operator,
+            'searched_columns': searched_columns,
+            'matched_columns': matched_columns,
+            'return_columns': requested_return_columns,
+            'sheets_searched': sheets_searched,
+            'sheets_matched': sheets_matched,
+            'filter_applied': applied_filters,
+            'normalize_match': normalize_match,
+            'total_matches': total_matches,
+            'returned_rows': len(combined_results),
+            'data': combined_results,
+        }, indent=2, default=str)
+
     def _lookup_value_across_sheets(
         self,
         container_name: str,
@@ -485,7 +722,11 @@ def _query_tabular_data_across_sheets(
             df = self._try_numeric_conversion(df)
 
             try:
-                result_df = df.query(query_expression)
+                result_df, _ = self._apply_query_expression_with_fallback(
+                    df,
+                    query_expression=query_expression,
+                    normalize_match=False,
+                )
             except Exception as query_error:
                 query_errors.append({
                     'sheet_name': sheet,
@@ -558,6 +799,9 @@ def _count_rows_across_sheets(
         filter_column: Optional[str] = None,
         filter_operator: str = 'equals',
         filter_value=None,
+        additional_filter_column: Optional[str] = None,
+        additional_filter_operator: str = 'equals',
+        additional_filter_value=None,
         query_expression: Optional[str] = None,
         normalize_match: bool = False,
     ) -> Optional[str]:
@@ -591,6 +835,9 @@ def _count_rows_across_sheets(
                     filter_column=filter_column,
                     filter_operator=filter_operator,
                     filter_value=filter_value,
+                    additional_filter_column=additional_filter_column,
+                    additional_filter_operator=additional_filter_operator,
+                    additional_filter_value=additional_filter_value,
                     normalize_match=normalize_match,
                 )
             except KeyError:
@@ -653,6 +900,12 @@ def _get_distinct_values_across_sheets(
         filter_column: Optional[str] = None,
         filter_operator: str = 'equals',
         filter_value=None,
+        additional_filter_column: Optional[str] = None,
+        additional_filter_operator: str = 'equals',
+        additional_filter_value=None,
+        extract_mode: Optional[str] = None,
+        extract_pattern: Optional[str] = None,
+        url_path_segments: Optional[int] = None,
         normalize_match: bool = False,
         max_values: int = 100,
     ) -> Optional[str]:
@@ -668,6 +921,8 @@ def _get_distinct_values_across_sheets(
         sheets_searched = []
         sheets_matched = []
         distinct_display_values = {}
+        matched_cell_count = 0
+        extracted_match_count = 0
         query_errors = []
         applied_filters = []
 
@@ -687,6 +942,9 @@ def _get_distinct_values_across_sheets(
                     filter_column=filter_column,
                     filter_operator=filter_operator,
                     filter_value=filter_value,
+                    additional_filter_column=additional_filter_column,
+                    additional_filter_operator=additional_filter_operator,
+                    additional_filter_value=additional_filter_value,
                     normalize_match=normalize_match,
                 )
             except KeyError:
@@ -701,20 +959,20 @@ def _get_distinct_values_across_sheets(
 
             sheets_searched.append(sheet)
             applied_filters = sheet_filters or applied_filters
-            for cell_value in filtered_df[column].tolist():
-                display_value = str(cell_value).strip()
-                if not display_value:
-                    continue
-                compare_variants = self._extract_cell_value_variants(
-                    cell_value,
-                    normalize_match=normalize_match,
-                )
-                if not compare_variants:
-                    continue
-                canonical_key = sorted(compare_variants)[0]
+            sheet_distinct_values, sheet_matched_cells, sheet_extracted_matches = self._collect_distinct_display_values(
+                filtered_df[column],
+                normalize_match=normalize_match,
+                extract_mode=extract_mode,
+                extract_pattern=extract_pattern,
+                url_path_segments=url_path_segments,
+            )
+            matched_cell_count += sheet_matched_cells
+            extracted_match_count += sheet_extracted_matches
+            for canonical_key, display_value in sheet_distinct_values.items():
                 distinct_display_values.setdefault(canonical_key, display_value)
 
-            if not filtered_df.empty:
+            sheet_match_count = sheet_matched_cells if extract_mode else len(filtered_df)
+            if sheet_match_count > 0:
                 sheets_matched.append(sheet)
 
         if not sheets_searched:
@@ -741,7 +999,7 @@ def _get_distinct_values_across_sheets(
             return None
 
         ordered_values = sorted(distinct_display_values.values(), key=lambda item: item.casefold())
-        return json.dumps({
+        response_payload = {
             'filename': filename,
             'selected_sheet': 'ALL (cross-sheet search)',
             'column': column,
@@ -753,7 +1011,16 @@ def _get_distinct_values_across_sheets(
             'returned_values': min(len(ordered_values), int(max_values)),
             'values': ordered_values[:int(max_values)],
             'values_limited': len(ordered_values) > int(max_values),
-        }, indent=2, default=str)
+        }
+        if extract_mode:
+            response_payload.update({
+                'extract_mode': extract_mode,
+                'extract_pattern': extract_pattern if extract_mode == 'regex' else None,
+                'url_path_segments': url_path_segments if extract_mode == 'url' else None,
+                'matched_cell_count': matched_cell_count,
+                'extracted_match_count': extracted_match_count,
+            })
+        return json.dumps(response_payload, indent=2, default=str)
 
     def _evaluate_related_value_membership(
         self,
@@ -1119,6 +1386,334 @@ def _extract_cell_value_variants(self, value, normalize_match: bool = False) ->
 
         return variants
 
+    def _normalize_distinct_extraction_arguments(
+        self,
+        extract_mode: Optional[str] = None,
+        extract_pattern: Optional[str] = None,
+        url_path_segments: Optional[str] = None,
+    ) -> tuple:
+        """Validate embedded-extraction arguments and return (mode, pattern, url_path_segments).
+
+        Raises ValueError for an unknown mode, a missing or invalid regex, or a bad segment count."""
+        mode = str(extract_mode or '').strip().lower() or None
+        if mode not in {None, 'url', 'regex'}:
+            raise ValueError("Unsupported extract_mode. Use 'url' or 'regex'.")
+        pattern = str(extract_pattern or '').strip() or None
+        if mode == 'regex' and not pattern:
+            raise ValueError('extract_pattern is required when extract_mode is regex.')
+        if mode == 'regex':
+            try:  # Reject a broken pattern up front instead of failing on the first scanned cell.
+                re.compile(pattern)
+            except re.error as pattern_error:
+                raise ValueError(f'extract_pattern is not a valid regular expression: {pattern_error}') from pattern_error
+        segments = None
+        if url_path_segments not in (None, ''):
+            try:
+                segments = int(url_path_segments)
+            except (TypeError, ValueError) as parse_error:
+                raise ValueError('url_path_segments must be an integer when provided.') from parse_error
+            if segments < 0:
+                raise ValueError('url_path_segments must be zero or greater when provided.')
+        # The pattern only applies to 'regex' mode and the segment count only to 'url' mode.
+        return mode, (pattern if mode == 'regex' else None), (segments if mode == 'url' else None)
+
+    def _normalize_embedded_url_match(self, raw_match, url_path_segments: Optional[int] = None) -> Optional[str]:
+        """Normalize an extracted URL to scheme://netloc[/path] for stable distinct-value analysis.
+
+        Trailing punctuation, the query string and the fragment are dropped; scheme and
+        network location are lower-cased; at most url_path_segments path segments are kept
+        when given. Text that cannot be parsed as an absolute URL is returned trimmed only.
+        """
+        cleaned_match = str(raw_match or '').strip().rstrip('.,;:!?)]}\"\'')
+        if not cleaned_match:
+            return None
+
+        try:
+            parsed_url = urlsplit(cleaned_match)
+        except ValueError:
+            # urlsplit rejects unbalanced IPv6 brackets (e.g. 'http://[::1'); keep the raw text.
+            return cleaned_match
+        if not parsed_url.scheme or not parsed_url.netloc:
+            return cleaned_match
+
+        path_segments = [segment for segment in parsed_url.path.split('/') if segment]
+        if url_path_segments is not None:
+            path_segments = path_segments[:url_path_segments]
+        normalized_path = '/' + '/'.join(path_segments) if path_segments else ''
+
+        return urlunsplit((parsed_url.scheme.lower(), parsed_url.netloc.lower(), normalized_path, '', ''))
+
+    def _extract_embedded_matches_from_text(
+        self,
+        value,
+        extract_mode: Optional[str] = None,
+        extract_pattern: Optional[str] = None,
+        url_path_segments: Optional[int] = None,
+    ) -> List[str]:
+        """Pull embedded URLs or regex hits out of one cell, de-duplicated case-insensitively.
+
+        Missing or blank cells and a falsy extract_mode give an empty list. In 'url'
+        mode every http(s) URL is passed through _normalize_embedded_url_match. In
+        'regex' mode each hit contributes its first non-empty capture group, or the
+        whole match when no group captured text, with trailing punctuation trimmed.
+        Any other mode raises ValueError. First-seen order is preserved.
+        """
+        is_missing = value is None or (not isinstance(value, str) and pandas.isna(value))
+        if is_missing:
+            return []
+
+        cell_text = str(value).strip()
+        if not (cell_text and extract_mode):
+            return []
+
+        # The mode is normalized again here so direct callers may pass mixed case.
+        mode = str(extract_mode or '').strip().lower()
+        if mode == 'url':
+            # An http(s) URL runs until whitespace, a quote, an angle bracket, ']' or ')'.
+            url_hits = re.findall(r'https?://[^\s<>"\'\]\)]+', cell_text, flags=re.IGNORECASE)
+            normalized_hits = (
+                self._normalize_embedded_url_match(hit, url_path_segments=url_path_segments)
+                for hit in url_hits
+            )
+            found = [hit for hit in normalized_hits if hit]
+        elif mode == 'regex':
+            found = []
+            for hit in re.compile(extract_pattern, flags=re.IGNORECASE).finditer(cell_text):
+                # Prefer the first capture group that actually captured text.
+                captured = next((group for group in hit.groups() if group), None) if hit.lastindex else None
+                if captured is None:
+                    captured = hit.group(0)
+                trimmed = str(captured or '').strip().rstrip('.,;:!?)]}\"\'')
+                if trimmed:
+                    found.append(trimmed)
+        else:
+            raise ValueError("Unsupported extract_mode. Use 'url' or 'regex'.")
+
+        # Keep the first spelling seen for each case-folded value.
+        first_seen = {}
+        for hit in found:
+            folded = str(hit).casefold().strip()
+            if folded and folded not in first_seen:
+                first_seen[folded] = str(hit).strip()
+
+        return list(first_seen.values())
+
+    def _collect_distinct_value_candidates(
+        self,
+        value,
+        normalize_match: bool = False,
+        extract_mode: Optional[str] = None,
+        extract_pattern: Optional[str] = None,
+        url_path_segments: Optional[int] = None,
+    ) -> List[dict]:
+        """Turn one cell into a list of {'display_value', 'canonical_key'} candidates.
+
+        With an extract_mode, every embedded match found in the cell becomes a
+        candidate. Without one, the stripped cell text is the single candidate and
+        its key is the first of the cell's comparison variants in sorted order.
+        """
+        mode = str(extract_mode or '').strip().lower() or None
+
+        if mode is None:
+            # Plain mode: the whole cell is the value.
+            if value is None or (not isinstance(value, str) and pandas.isna(value)):
+                return []
+            cell_text = str(value).strip()
+            if not cell_text:
+                return []
+            variants = self._extract_cell_value_variants(
+                value,
+                normalize_match=normalize_match,
+            )
+            if not variants:
+                return []
+            return [{
+                'display_value': cell_text,
+                'canonical_key': sorted(variants)[0],
+            }]
+
+        # Extraction mode: URLs always key on their case-folded text; regex hits use
+        # entity normalization only when normalize_match is requested.
+        use_entity_key = normalize_match and mode != 'url'
+        embedded_matches = self._extract_embedded_matches_from_text(
+            value,
+            extract_mode=mode,
+            extract_pattern=extract_pattern,
+            url_path_segments=url_path_segments,
+        )
+        results = []
+        for embedded_match in embedded_matches:
+            shown = str(embedded_match).strip()
+            if not shown:
+                continue
+            if use_entity_key:
+                key = self._normalize_entity_match_text(shown)
+            else:
+                key = shown.casefold()
+            if key:
+                results.append({
+                    'display_value': shown,
+                    'canonical_key': key,
+                })
+        return results
+
+    def _collect_distinct_display_values(
+        self,
+        series: pandas.Series,
+        normalize_match: bool = False,
+        extract_mode: Optional[str] = None,
+        extract_pattern: Optional[str] = None,
+        url_path_segments: Optional[int] = None,
+    ) -> tuple:
+        """Scan a column and gather its distinct values plus match counters.
+
+        Returns (display value keyed by canonical key, number of cells that yielded
+        at least one candidate, total number of candidates). The first display
+        value seen for a canonical key wins.
+        """
+        first_display_by_key = {}
+        cells_with_candidates = 0
+        candidate_total = 0
+        shared_options = {
+            'normalize_match': normalize_match,
+            'extract_mode': extract_mode,
+            'extract_pattern': extract_pattern,
+            'url_path_segments': url_path_segments,
+        }
+
+        for cell in series.tolist():
+            found = self._collect_distinct_value_candidates(cell, **shared_options)
+            if found:
+                cells_with_candidates += 1
+                candidate_total += len(found)
+                for entry in found:
+                    if entry['canonical_key'] not in first_display_by_key:
+                        first_display_by_key[entry['canonical_key']] = entry['display_value']
+        return first_display_by_key, cells_with_candidates, candidate_total
+
+    def _parse_optional_column_list_argument(self, raw_columns) -> Optional[List[str]]:
+        """Parse an optional column list given as a sequence, JSON array, or delimited string.
+
+        Returns the stripped names in first-seen order with case-insensitive duplicates
+        removed, or None when nothing is given or an 'all columns' wildcard is used.
+        """
+        if raw_columns is None:
+            return None
+        candidate_values = None
+        if isinstance(raw_columns, (list, tuple, set)):
+            candidate_values = list(raw_columns)
+        else:
+            rendered_columns = str(raw_columns).strip()
+            if not rendered_columns:
+                return None
+            if rendered_columns.casefold() in {'*', 'all', 'all_columns', 'all columns'}:
+                return None
+            if rendered_columns.startswith('['):
+                try:
+                    parsed_columns = json.loads(rendered_columns)
+                except (ValueError, RecursionError):  # not JSON (e.g. "[a, b]"): split on delimiters below
+                    parsed_columns = None
+                if isinstance(parsed_columns, list):
+                    candidate_values = parsed_columns
+            if candidate_values is None:
+                candidate_values = re.split(r'[,;|\n]+', rendered_columns)
+
+        normalized_columns = []
+        seen_columns = set()
+        for candidate_value in candidate_values:
+            # Only None is "missing"; a falsy name such as 0 is still a real column label.
+            normalized_column = '' if candidate_value is None else str(candidate_value).strip()
+            lowered_column = normalized_column.casefold()
+            if not normalized_column or lowered_column in seen_columns:
+                continue
+            seen_columns.add(lowered_column)
+            normalized_columns.append(normalized_column)
+
+        return normalized_columns or None
+
+    def _search_dataframe_rows(
+        self,
+        df: pandas.DataFrame,
+        search_value,
+        search_columns=None,
+        search_operator: str = 'contains',
+        return_columns=None,
+        normalize_match: bool = False,
+        max_rows: int = 100,
+    ) -> dict:
+        """Search one or more columns of a DataFrame and return the matching rows with context.
+
+        Requested columns missing from df are ignored, but KeyError is raised when none of the
+        requested search columns exist; with no search_columns every column is searched. At most
+        max_rows rows are returned, each tagged with '_matched_columns' and '_matched_values'.
+        """
+        requested_search_columns = self._parse_optional_column_list_argument(search_columns)
+        requested_return_columns = self._parse_optional_column_list_argument(return_columns)
+
+        if requested_search_columns:
+            resolved_search_columns = [name for name in requested_search_columns if name in df.columns]
+            if not resolved_search_columns:
+                raise KeyError(requested_search_columns[0])
+        else:
+            resolved_search_columns = list(df.columns)
+
+        resolved_return_columns = [name for name in (requested_return_columns or []) if name in df.columns]
+
+        combined_mask = pandas.Series([False] * len(df), index=df.index)
+        column_masks = {}
+        for column_name in resolved_search_columns:
+            column_mask = self._build_series_match_mask(
+                df[column_name],
+                search_operator,
+                search_value,
+                normalize_match=normalize_match,
+            ).fillna(False)
+            column_masks[column_name] = column_mask
+            combined_mask = combined_mask | column_mask
+
+        matched_df = df[combined_mask]
+        returned_df = matched_df.head(int(max_rows))
+        # Per-column hit flags aligned by position with returned_df, so rows are looked up
+        # positionally and a non-unique DataFrame index cannot make the lookup ambiguous.
+        returned_hits = {
+            column_name: column_mask[combined_mask].head(int(max_rows)).tolist()
+            for column_name, column_mask in column_masks.items()
+        }
+
+        matched_columns = []
+        seen_matched_columns = set()
+        result_rows = []
+
+        for position, (_, row) in enumerate(returned_df.iterrows()):
+            row_matched_columns = [
+                column_name for column_name in resolved_search_columns
+                if returned_hits[column_name][position]
+            ]
+            for column_name in row_matched_columns:
+                # Column labels are not always strings (e.g. numeric headers).
+                lowered_column = str(column_name).casefold()
+                if lowered_column not in seen_matched_columns:
+                    seen_matched_columns.add(lowered_column)
+                    matched_columns.append(column_name)
+
+            if resolved_return_columns:
+                row_payload = {name: row.get(name) for name in resolved_return_columns}
+            else:
+                row_payload = {str(key): value for key, value in row.to_dict().items()}
+
+            row_payload['_matched_columns'] = row_matched_columns
+            row_payload['_matched_values'] = {name: row.get(name) for name in row_matched_columns}
+            result_rows.append(row_payload)
+
+        return {
+            'searched_columns': resolved_search_columns,
+            'matched_columns': matched_columns,
+            'return_columns': resolved_return_columns or None,
+            'total_matches': len(matched_df),
+            'returned_rows': len(result_rows),
+            'data': result_rows,
+        }
+
     def _build_series_match_mask(
         self,
         series: pandas.Series,
@@ -1197,6 +1792,213 @@ def _build_series_match_mask(
 
         raise ValueError(f"Unsupported operator: {operator}")
 
+    def _normalize_pseudo_query_column_reference(self, raw_column_name: str) -> str:
+        """Strip whitespace and one pair of enclosing backticks from a query column reference."""
+        reference = str(raw_column_name or '').strip()
+        is_backtick_quoted = reference.startswith('`') and reference.endswith('`')
+        unquoted = reference[1:-1] if is_backtick_quoted else reference
+        return unquoted.strip()
+
+    def _build_pseudo_query_string_method_mask(
+        self,
+        series: pandas.Series,
+        operator: str,
+        value,
+        case_sensitive: bool = False,
+        normalize_match: bool = False,
+    ) -> pandas.Series:
+        """Build a boolean mask for a reviewer-style .str.contains/startswith/endswith clause.
+
+        Case-insensitive clauses are delegated to _build_series_match_mask. Case-sensitive
+        clauses compare each cell's literal text and never match missing cells. Raises
+        ValueError for any other operator.
+        """
+        if not case_sensitive:
+            return self._build_series_match_mask(
+                series,
+                operator,
+                value,
+                normalize_match=bool(normalize_match),
+            )
+
+        text_series = series.astype(str)
+        value_text = str(value)
+        if operator == 'contains':
+            mask = text_series.str.contains(value_text, regex=False, case=True, na=False)
+        elif operator == 'startswith':
+            mask = text_series.str.startswith(value_text, na=False)
+        elif operator == 'endswith':
+            mask = text_series.str.endswith(value_text, na=False)
+        else:
+            raise ValueError(f"Unsupported operator: {operator}")
+
+        # astype(str) renders missing cells as 'nan'/'None'; never let those match.
+        return mask & series.notna()
+
+    def _apply_reviewer_style_query_expression(
+        self,
+        df: pandas.DataFrame,
+        query_expression: str,
+        normalize_match: bool = False,
+    ) -> Optional[pandas.DataFrame]:
+        """Apply limited reviewer-style pseudo-pandas filters; return None when the expression is unsupported."""
+        rendered_query_expression = str(query_expression or '').strip()
+        if not rendered_query_expression:
+            return df
+        # Only conjunctions are supported: ' or ', '||' or '|' anywhere in the text (quoted values included) gives None.
+        lowered_expression = rendered_query_expression.casefold()
+        if ' or ' in lowered_expression or '||' in rendered_query_expression or '|' in rendered_query_expression:
+            return None
+        # Clauses are separated by a whitespace-delimited 'and' (any letter case) or by '&&'.
+        clause_texts = [
+            clause.strip()
+            for clause in re.split(r'\s+(?i:and)\s+|&&', rendered_query_expression)
+            if clause.strip()
+        ]
+        if not clause_texts:
+            return None
+
+        notnull_pattern = re.compile(
+            r"^\s*(?P<column>`[^`]+`|[A-Za-z_][A-Za-z0-9_]*)\s*\.\s*notnull\(\)\s*$",
+            flags=re.IGNORECASE,
+        )
+        isnull_pattern = re.compile(
+            r"^\s*(?P<column>`[^`]+`|[A-Za-z_][A-Za-z0-9_]*)\s*\.\s*isnull\(\)\s*$",
+            flags=re.IGNORECASE,
+        )
+        string_method_pattern = re.compile(
+            r"^\s*(?P<column>`[^`]+`|[A-Za-z_][A-Za-z0-9_]*)"
+            r"(?:\s*\.\s*astype\(\s*str\s*\))?\s*\.\s*str\s*\.\s*"
+            r"(?P<method>contains|startswith|endswith)\(\s*"
+            r"(?P<quote>['\"])(?P<value>.*?)(?P=quote)(?P<args>[^)]*)\)\s*$",
+            flags=re.IGNORECASE,
+        )
+        equality_pattern = re.compile(
+            r"^\s*(?P<column>`[^`]+`|[A-Za-z_][A-Za-z0-9_]*)\s*"
+            r"(?P<operator>==|!=)\s*"
+            r"(?P<quote>['\"])(?P<value>.*?)(?P=quote)\s*$",
+            flags=re.IGNORECASE,
+        )
+        null_literal_pattern = re.compile(
+            r"^\s*(?P<column>`[^`]+`|[A-Za-z_][A-Za-z0-9_]*)\s*"
+            r"(?P<operator>==|!=)\s*"
+            r"(?P<null_literal>null|none|nan)\s*$",
+            flags=re.IGNORECASE,
+        )
+        # Each recognized clause narrows filtered_df further; columns are checked against the current frame.
+        filtered_df = df
+        matched_any_clause = False
+
+        for clause_text in clause_texts:
+            normalized_clause_text = clause_text.strip()
+            while normalized_clause_text.startswith('(') and normalized_clause_text.endswith(')'):  # peel outer '(' ... ')'
+                normalized_clause_text = normalized_clause_text[1:-1].strip()
+            # Clause shapes are tried in a fixed order; a column missing from the frame raises KeyError.
+            match = notnull_pattern.match(normalized_clause_text)
+            if match:
+                column_name = self._normalize_pseudo_query_column_reference(match.group('column'))
+                if column_name not in filtered_df.columns:
+                    raise KeyError(column_name)
+                filtered_df = filtered_df[filtered_df[column_name].notna()]
+                matched_any_clause = True
+                continue
+
+            match = isnull_pattern.match(normalized_clause_text)
+            if match:
+                column_name = self._normalize_pseudo_query_column_reference(match.group('column'))
+                if column_name not in filtered_df.columns:
+                    raise KeyError(column_name)
+                filtered_df = filtered_df[filtered_df[column_name].isna()]
+                matched_any_clause = True
+                continue
+
+            match = string_method_pattern.match(normalized_clause_text)
+            if match:
+                column_name = self._normalize_pseudo_query_column_reference(match.group('column'))
+                if column_name not in filtered_df.columns:
+                    raise KeyError(column_name)
+
+                method_name = str(match.group('method') or '').strip().lower()
+                operator_name = {
+                    'contains': 'contains',
+                    'startswith': 'startswith',
+                    'endswith': 'endswith',
+                }.get(method_name)
+                if not operator_name:
+                    return None
+                # regex=True is not supported; matching is case-insensitive unless case=True is passed.
+                args_text = str(match.group('args') or '').replace(' ', '').casefold()
+                if 'regex=true' in args_text:
+                    return None
+                case_sensitive = 'case=true' in args_text
+
+                mask = self._build_pseudo_query_string_method_mask(
+                    filtered_df[column_name],
+                    operator_name,
+                    match.group('value'),
+                    case_sensitive=case_sensitive,
+                    normalize_match=normalize_match,
+                )
+                filtered_df = filtered_df[mask]
+                matched_any_clause = True
+                continue
+
+            match = equality_pattern.match(normalized_clause_text)
+            if match:
+                column_name = self._normalize_pseudo_query_column_reference(match.group('column'))
+                if column_name not in filtered_df.columns:
+                    raise KeyError(column_name)
+
+                operator_name = 'equals' if match.group('operator') == '==' else '!='
+                mask = self._build_series_match_mask(
+                    filtered_df[column_name],
+                    operator_name,
+                    match.group('value'),
+                    normalize_match=normalize_match,
+                )
+                filtered_df = filtered_df[mask]
+                matched_any_clause = True
+                continue
+
+            match = null_literal_pattern.match(normalized_clause_text)
+            if match:
+                column_name = self._normalize_pseudo_query_column_reference(match.group('column'))
+                if column_name not in filtered_df.columns:
+                    raise KeyError(column_name)
+
+                if match.group('operator') == '==':
+                    filtered_df = filtered_df[filtered_df[column_name].isna()]
+                else:
+                    filtered_df = filtered_df[filtered_df[column_name].notna()]
+                matched_any_clause = True
+                continue
+            # No supported clause shape matched, so the whole expression is treated as unsupported.
+            return None
+
+        return filtered_df if matched_any_clause else None
+
+    def _apply_query_expression_with_fallback(
+        self,
+        df: pandas.DataFrame,
+        query_expression: Optional[str] = None,
+        normalize_match: bool = False,
+    ) -> tuple:
+        """Filter df with DataFrame.query, retrying with the reviewer-style parser on failure.
+
+        Returns (filtered DataFrame, True when the reviewer-style fallback produced it).
+        The original DataFrame.query error is re-raised when the fallback cannot help.
+        """
+        used_fallback = False
+        if query_expression:
+            try:
+                df = df.query(query_expression)
+            except Exception as query_error:
+                df = self._apply_reviewer_style_query_expression(df, query_expression, normalize_match=normalize_match)
+                if df is None:
+                    raise query_error
+                used_fallback = True
+        return df, used_fallback
+
     def _apply_optional_dataframe_filters(
         self,
         df: pandas.DataFrame,
@@ -1204,31 +2006,67 @@ def _apply_optional_dataframe_filters(
         filter_column: Optional[str] = None,
         filter_operator: str = 'equals',
         filter_value=None,
+        additional_filter_column: Optional[str] = None,
+        additional_filter_operator: str = 'equals',
+        additional_filter_value=None,
         normalize_match: bool = False,
     ) -> tuple:
-        """Apply optional query and single-column filters to a DataFrame."""
+        """Apply optional query and up to two single-column filters to a DataFrame."""
         filtered_df = df
         applied_filters = []
 
         if query_expression:
-            filtered_df = filtered_df.query(query_expression)
-            applied_filters.append(f"query_expression={query_expression}")
+            filtered_df, used_reviewer_style_fallback = self._apply_query_expression_with_fallback(
+                filtered_df,
+                query_expression=query_expression,
+                normalize_match=normalize_match,
+            )
+            applied_filters.append(
+                f"query_expression={query_expression}"
+                + (' [reviewer-style fallback]' if used_reviewer_style_fallback else '')
+            )
 
-        if filter_column:
-            if filter_column not in filtered_df.columns:
-                raise KeyError(filter_column)
-            if filter_value is None:
-                raise ValueError('filter_value is required when filter_column is provided.')
+        structured_filters = [
+            {
+                'column': filter_column,
+                'operator': filter_operator,
+                'value': filter_value,
+                'column_argument': 'filter_column',
+                'value_argument': 'filter_value',
+            },
+            {
+                'column': additional_filter_column,
+                'operator': additional_filter_operator,
+                'value': additional_filter_value,
+                'column_argument': 'additional_filter_column',
+                'value_argument': 'additional_filter_value',
+            },
+        ]
+
+        for filter_spec in structured_filters:
+            current_filter_column = filter_spec['column']
+            if not current_filter_column:
+                continue
+
+            if current_filter_column not in filtered_df.columns:
+                raise KeyError(current_filter_column)
+
+            current_filter_value = filter_spec['value']
+            if current_filter_value is None:
+                raise ValueError(
+                    f"{filter_spec['value_argument']} is required when {filter_spec['column_argument']} is provided."
+                )
 
+            current_filter_operator = filter_spec['operator'] or 'equals'
             mask = self._build_series_match_mask(
-                filtered_df[filter_column],
-                filter_operator,
-                filter_value,
+                filtered_df[current_filter_column],
+                current_filter_operator,
+                current_filter_value,
                 normalize_match=normalize_match,
             )
             filtered_df = filtered_df[mask]
             applied_filters.append(
-                f"{filter_column} {filter_operator or 'equals'} {filter_value}"
+                f"{current_filter_column} {current_filter_operator} {current_filter_value}"
                 + (' [normalized]' if normalize_match else '')
             )
 
@@ -1917,6 +2755,10 @@ def _resolve_blob_location_with_fallback(self, user_id: str, conversation_id: st
                                               group_id: str = None, public_workspace_id: str = None) -> tuple:
         """Try primary source first, then fall back to other containers if blob not found."""
         source = source.lower().strip()
+        override = self._get_resolved_blob_location_override(source, filename)
+        if override:
+            return override
+
         attempts = []
 
         # Primary attempt based on specified source
@@ -2254,8 +3096,8 @@ def _sync_work():
 
     @kernel_function(
         description=(
-            "Return deterministic distinct values for a column, with optional query_expression or filter criteria. "
-            "Use this to build a canonical cohort from a worksheet before counting or joining related rows."
+            "Return deterministic distinct values for a column, with optional query_expression, up to two column filters, and optional embedded URL or regex extraction from composite text cells. "
+            "Use this to build a canonical cohort from a worksheet before counting or joining related rows. Narrow the original text column first when category membership depends on surrounding cell context."
         ),
         name="get_distinct_values"
     )
@@ -2270,6 +3112,12 @@ async def get_distinct_values(
         filter_column: Annotated[Optional[str], "Optional column to filter on before collecting distinct values"] = None,
         filter_operator: Annotated[str, "Optional filter operator when filter_column is provided"] = "equals",
         filter_value: Annotated[Optional[str], "Optional filter value when filter_column is provided"] = None,
+        additional_filter_column: Annotated[Optional[str], "Optional second column to filter on before collecting distinct values"] = None,
+        additional_filter_operator: Annotated[str, "Optional filter operator when additional_filter_column is provided"] = "equals",
+        additional_filter_value: Annotated[Optional[str], "Optional filter value when additional_filter_column is provided"] = None,
+        extract_mode: Annotated[Optional[str], "Optional embedded extraction mode: 'url' or 'regex'"] = None,
+        extract_pattern: Annotated[Optional[str], "Optional regex pattern when extract_mode is 'regex'"] = None,
+        url_path_segments: Annotated[Optional[str], "Optional number of URL path segments to keep when extract_mode is 'url'"] = None,
         normalize_match: Annotated[str, "Whether to normalize string/entity matching and deduplication (true/false)"] = "true",
         sheet_name: Annotated[Optional[str], "Optional worksheet name for Excel files. When omitted, the plugin may perform a cross-sheet distinct-value search."] = None,
         sheet_index: Annotated[Optional[str], "Optional zero-based worksheet index for Excel files. Ignored when sheet_name is provided."] = None,
@@ -2282,6 +3130,11 @@ async def get_distinct_values(
         def _sync_work():
             try:
                 normalize_match_flag = self._parse_boolean_argument(normalize_match, default=True)
+                normalized_extract_mode, normalized_extract_pattern, parsed_url_path_segments = self._normalize_distinct_extraction_arguments(
+                    extract_mode=extract_mode,
+                    extract_pattern=extract_pattern,
+                    url_path_segments=url_path_segments,
+                )
                 container, blob_path = self._resolve_blob_location_with_fallback(
                     user_id, conversation_id, filename, source,
                     group_id=group_id, public_workspace_id=public_workspace_id
@@ -2299,6 +3152,12 @@ def _sync_work():
                         filter_column=filter_column,
                         filter_operator=filter_operator,
                         filter_value=filter_value,
+                        additional_filter_column=additional_filter_column,
+                        additional_filter_operator=additional_filter_operator,
+                        additional_filter_value=additional_filter_value,
+                        extract_mode=normalized_extract_mode,
+                        extract_pattern=normalized_extract_pattern,
+                        url_path_segments=parsed_url_path_segments,
                         normalize_match=normalize_match_flag,
                         max_values=int(max_values),
                     )
@@ -2328,7 +3187,10 @@ def _sync_work():
                             workbook_metadata,
                             selected_sheet,
                             column,
-                            related_columns=[filter_column] if filter_column else None,
+                            related_columns=[
+                                candidate_column for candidate_column in (filter_column, additional_filter_column)
+                                if candidate_column
+                            ] or None,
                             available_columns=list(df.columns),
                         )
                     )
@@ -2340,6 +3202,9 @@ def _sync_work():
                         filter_column=filter_column,
                         filter_operator=filter_operator,
                         filter_value=filter_value,
+                        additional_filter_column=additional_filter_column,
+                        additional_filter_operator=additional_filter_operator,
+                        additional_filter_value=additional_filter_value,
                         normalize_match=normalize_match_flag,
                     )
                 except KeyError as missing_column_error:
@@ -2352,7 +3217,10 @@ def _sync_work():
                             workbook_metadata,
                             selected_sheet,
                             missing_column,
-                            related_columns=[column],
+                            related_columns=[
+                                candidate_column for candidate_column in (column, filter_column, additional_filter_column)
+                                if candidate_column
+                            ],
                             available_columns=list(df.columns),
                         )
                     )
@@ -2363,23 +3231,17 @@ def _sync_work():
                         'selected_sheet': selected_sheet if workbook_metadata.get('is_workbook') else None,
                     })
 
-                distinct_display_values = {}
-                for cell_value in filtered_df[column].tolist():
-                    display_value = str(cell_value).strip()
-                    if not display_value:
-                        continue
-                    compare_variants = self._extract_cell_value_variants(
-                        cell_value,
-                        normalize_match=normalize_match_flag,
-                    )
-                    if not compare_variants:
-                        continue
-                    canonical_key = sorted(compare_variants)[0]
-                    distinct_display_values.setdefault(canonical_key, display_value)
+                distinct_display_values, matched_cell_count, extracted_match_count = self._collect_distinct_display_values(
+                    filtered_df[column],
+                    normalize_match=normalize_match_flag,
+                    extract_mode=normalized_extract_mode,
+                    extract_pattern=normalized_extract_pattern,
+                    url_path_segments=parsed_url_path_segments,
+                )
 
                 ordered_values = sorted(distinct_display_values.values(), key=lambda item: item.casefold())
                 limit = int(max_values)
-                return json.dumps({
+                response_payload = {
                     'filename': filename,
                     'selected_sheet': selected_sheet if workbook_metadata.get('is_workbook') else None,
                     'column': column,
@@ -2389,7 +3251,16 @@ def _sync_work():
                     'returned_values': min(len(ordered_values), limit),
                     'values': ordered_values[:limit],
                     'values_limited': len(ordered_values) > limit,
-                }, indent=2, default=str)
+                }
+                if normalized_extract_mode:
+                    response_payload.update({
+                        'extract_mode': normalized_extract_mode,
+                        'extract_pattern': normalized_extract_pattern if normalized_extract_mode == 'regex' else None,
+                        'url_path_segments': parsed_url_path_segments if normalized_extract_mode == 'url' else None,
+                        'matched_cell_count': matched_cell_count,
+                        'extracted_match_count': extracted_match_count,
+                    })
+                return json.dumps(response_payload, indent=2, default=str)
             except Exception as e:
                 log_event(f"[TabularProcessingPlugin] Error getting distinct values: {e}", level=logging.WARNING)
                 return json.dumps({"error": str(e)})
@@ -2398,7 +3269,7 @@ def _sync_work():
 
     @kernel_function(
         description=(
-            "Return a deterministic row count after applying an optional query_expression or filter condition. "
+            "Return a deterministic row count after applying an optional query_expression and up to two filter conditions. "
             "Use this instead of estimating counts from partial returned rows when the user asks how many or what percentage."
         ),
         name="count_rows"
@@ -2413,6 +3284,9 @@ async def count_rows(
         filter_column: Annotated[Optional[str], "Optional column to filter on before counting rows"] = None,
         filter_operator: Annotated[str, "Optional filter operator when filter_column is provided"] = "equals",
         filter_value: Annotated[Optional[str], "Optional filter value when filter_column is provided"] = None,
+        additional_filter_column: Annotated[Optional[str], "Optional second column to filter on before counting rows"] = None,
+        additional_filter_operator: Annotated[str, "Optional filter operator when additional_filter_column is provided"] = "equals",
+        additional_filter_value: Annotated[Optional[str], "Optional filter value when additional_filter_column is provided"] = None,
         normalize_match: Annotated[str, "Whether to normalize string/entity matching for text comparisons (true/false)"] = "false",
         sheet_name: Annotated[Optional[str], "Optional worksheet name for Excel files. When omitted, the plugin may perform a cross-sheet row count."] = None,
         sheet_index: Annotated[Optional[str], "Optional zero-based worksheet index for Excel files. Ignored when sheet_name is provided."] = None,
@@ -2439,6 +3313,9 @@ def _sync_work():
                         filter_column=filter_column,
                         filter_operator=filter_operator,
                         filter_value=filter_value,
+                        additional_filter_column=additional_filter_column,
+                        additional_filter_operator=additional_filter_operator,
+                        additional_filter_value=additional_filter_value,
                         query_expression=query_expression,
                         normalize_match=normalize_match_flag,
                     )
@@ -2467,6 +3344,9 @@ def _sync_work():
                         filter_column=filter_column,
                         filter_operator=filter_operator,
                         filter_value=filter_value,
+                        additional_filter_column=additional_filter_column,
+                        additional_filter_operator=additional_filter_operator,
+                        additional_filter_value=additional_filter_value,
                         normalize_match=normalize_match_flag,
                     )
                 except KeyError as missing_column_error:
@@ -2479,6 +3359,10 @@ def _sync_work():
                             workbook_metadata,
                             selected_sheet,
                             missing_column,
+                            related_columns=[
+                                candidate_column for candidate_column in (filter_column, additional_filter_column)
+                                if candidate_column
+                            ] or None,
                             available_columns=list(df.columns),
                         )
                     )
@@ -2598,7 +3482,8 @@ def _sync_work():
     @kernel_function(
         description=(
             "Filter rows in a tabular file based on conditions and return matching rows. "
-            "Supports operators: ==, !=, >, <, >=, <=, contains, startswith, endswith."
+            "Supports operators: ==, !=, >, <, >=, <=, contains, startswith, endswith. "
+            "A second column filter can be applied for compound text or literal matching. Use this as the text-search tool when the full cell or row context matters."
         ),
         name="filter_rows"
     )
@@ -2611,6 +3496,9 @@ async def filter_rows(
         column: Annotated[str, "The column to filter on"],
         operator: Annotated[str, "Operator: ==, !=, >, <, >=, <=, contains, startswith, endswith"],
         value: Annotated[str, "The value to compare against"],
+        additional_filter_column: Annotated[Optional[str], "Optional second column to filter on"] = None,
+        additional_filter_operator: Annotated[str, "Optional filter operator when additional_filter_column is provided"] = "equals",
+        additional_filter_value: Annotated[Optional[str], "Optional filter value when additional_filter_column is provided"] = None,
         normalize_match: Annotated[str, "Whether to normalize string/entity matching for text comparisons (true/false)"] = "false",
         sheet_name: Annotated[Optional[str], "Optional worksheet name for Excel files. Required for analytical calls on multi-sheet workbooks unless sheet_index is provided."] = None,
         sheet_index: Annotated[Optional[str], "Optional zero-based worksheet index for Excel files. Ignored when sheet_name is provided."] = None,
@@ -2632,7 +3520,15 @@ def _sync_work():
                 normalized_sheet_idx = None if sheet_index is None else str(sheet_index).strip()
                 if not normalized_sheet and normalized_sheet_idx in (None, ''):
                     cross_sheet_result = self._filter_rows_across_sheets(
-                        container, blob_path, filename, column, operator, value,
+                        container,
+                        blob_path,
+                        filename,
+                        column,
+                        operator,
+                        value,
+                        additional_filter_column=additional_filter_column,
+                        additional_filter_operator=additional_filter_operator,
+                        additional_filter_value=additional_filter_value,
                         normalize_match=normalize_match_flag,
                         max_rows=int(max_rows),
                     )
@@ -2662,27 +3558,47 @@ def _sync_work():
                             workbook_metadata,
                             selected_sheet,
                             column,
+                            related_columns=[additional_filter_column] if additional_filter_column else None,
                             available_columns=list(df.columns),
                         )
                     )
 
                 try:
-                    mask = self._build_series_match_mask(
-                        df[column],
-                        operator,
-                        value,
+                    filtered_df, applied_filters = self._apply_optional_dataframe_filters(
+                        df,
+                        filter_column=column,
+                        filter_operator=operator,
+                        filter_value=value,
+                        additional_filter_column=additional_filter_column,
+                        additional_filter_operator=additional_filter_operator,
+                        additional_filter_value=additional_filter_value,
                         normalize_match=normalize_match_flag,
                     )
-                except ValueError:
-                    return json.dumps({"error": f"Unsupported operator: {operator}"})
+                except KeyError as missing_column_error:
+                    missing_column = str(missing_column_error).strip("'")
+                    return json.dumps(
+                        self._build_missing_column_error_payload(
+                            container,
+                            blob_path,
+                            filename,
+                            workbook_metadata,
+                            selected_sheet,
+                            missing_column,
+                            related_columns=[candidate_column for candidate_column in (column, additional_filter_column) if candidate_column],
+                            available_columns=list(df.columns),
+                        )
+                    )
+                except ValueError as filter_error:
+                    return json.dumps({"error": str(filter_error)})
 
                 limit = int(max_rows)
-                filtered = df[mask].head(limit)
+                filtered = filtered_df.head(limit)
                 return json.dumps({
                     "filename": filename,
                     "selected_sheet": selected_sheet if workbook_metadata.get('is_workbook') else None,
+                    "filter_applied": applied_filters,
                     "normalize_match": normalize_match_flag,
-                    "total_matches": int(mask.sum()),
+                    "total_matches": len(filtered_df),
                     "returned_rows": len(filtered),
                     "data": filtered.to_dict(orient='records')
                 }, indent=2, default=str)
@@ -2691,6 +3607,190 @@ def _sync_work():
                 return json.dumps({"error": str(e)})
         return await asyncio.to_thread(_sync_work)
 
+    @kernel_function(
+        description=(
+            "Search one or more columns, or all columns when search_columns is omitted, for a value or phrase and return matching rows with row-context metadata. "
+            "Use this when the relevant column is unclear or when you need to search an entire worksheet or workbook for a topic before deciding which returned content is relevant."
+        ),
+        name="search_rows"
+    )
+    @plugin_function_logger("TabularProcessingPlugin")
+    async def search_rows(
+        self,
+        user_id: Annotated[str, "The user ID (from Scope ID in Conversation Metadata)"],
+        conversation_id: Annotated[str, "The conversation ID (from Conversation Metadata)"],
+        filename: Annotated[str, "The filename of the tabular file"],
+        search_value: Annotated[str, "The text or value to search for"],
+        search_columns: Annotated[Optional[str], "Optional comma-separated columns to search. Omit to search all columns."] = None,
+        search_operator: Annotated[str, "Search operator: equals, contains, startswith, endswith"] = "contains",
+        return_columns: Annotated[Optional[str], "Optional comma-separated columns to include in each result row. Omit to return the full row."] = None,
+        query_expression: Annotated[Optional[str], "Optional pandas DataFrame.query() expression to apply before searching"] = None,
+        filter_column: Annotated[Optional[str], "Optional first column filter to narrow the search cohort"] = None,
+        filter_operator: Annotated[str, "Optional filter operator when filter_column is provided"] = "equals",
+        filter_value: Annotated[Optional[str], "Optional filter value when filter_column is provided"] = None,
+        additional_filter_column: Annotated[Optional[str], "Optional second column filter to narrow the search cohort"] = None,
+        additional_filter_operator: Annotated[str, "Optional filter operator when additional_filter_column is provided"] = "equals",
+        additional_filter_value: Annotated[Optional[str], "Optional filter value when additional_filter_column is provided"] = None,
+        normalize_match: Annotated[str, "Whether to normalize string/entity matching for text comparisons (true/false)"] = "false",
+        sheet_name: Annotated[Optional[str], "Optional worksheet name for Excel files. When omitted, the plugin may perform a cross-sheet search."] = None,
+        sheet_index: Annotated[Optional[str], "Optional zero-based worksheet index for Excel files. Ignored when sheet_name is provided."] = None,
+        source: Annotated[str, "Source: 'workspace', 'chat', 'group', or 'public'"] = "chat",
+        max_rows: Annotated[str, "Maximum matching rows to return"] = "100",
+        group_id: Annotated[Optional[str], "Group ID (for group workspace documents)"] = None,
+        public_workspace_id: Annotated[Optional[str], "Public workspace ID (for public workspace documents)"] = None,
+    ) -> Annotated[str, "JSON result containing matching rows, matched columns, and search metadata"]:
+        """Search rows across one or more columns while preserving row context.
+
+        When neither sheet_name nor sheet_index is supplied, the cross-sheet
+        search helper runs first and its result is returned unless it is None.
+        In every other case one sheet is resolved and loaded, the optional
+        query_expression and up to two column filters narrow the rows, and the
+        remaining rows are searched in search_columns (all columns when that
+        argument is omitted).
+
+        Returns:
+            A JSON string. On success it carries the search metadata, the applied
+            filters, total_matches, returned_rows, and the row data; any exception
+            raised while working is caught and reported as JSON instead of being
+            propagated.
+        """
+        def _sync_work():
+            try:
+                normalize_match_flag = self._parse_boolean_argument(normalize_match, default=False)
+                parsed_search_columns = self._parse_optional_column_list_argument(search_columns)
+                parsed_return_columns = self._parse_optional_column_list_argument(return_columns)
+                container, blob_path = self._resolve_blob_location_with_fallback(
+                    user_id, conversation_id, filename, source,
+                    group_id=group_id, public_workspace_id=public_workspace_id
+                )
+
+                # The same keyword sets feed both the cross-sheet and the single-sheet path.
+                cohort_filters = dict(
+                    query_expression=query_expression,
+                    filter_column=filter_column,
+                    filter_operator=filter_operator,
+                    filter_value=filter_value,
+                    additional_filter_column=additional_filter_column,
+                    additional_filter_operator=additional_filter_operator,
+                    additional_filter_value=additional_filter_value,
+                    normalize_match=normalize_match_flag,
+                )
+                search_options = dict(
+                    search_value=search_value,
+                    search_columns=parsed_search_columns,
+                    search_operator=search_operator,
+                    return_columns=parsed_return_columns,
+                )
+
+                explicit_sheet_name = (sheet_name or '').strip()
+                explicit_sheet_index = None if sheet_index is None else str(sheet_index).strip()
+                if not explicit_sheet_name and explicit_sheet_index in (None, ''):
+                    cross_sheet_result = self._search_rows_across_sheets(
+                        container,
+                        blob_path,
+                        filename,
+                        **search_options,
+                        **cohort_filters,
+                        max_rows=int(max_rows),
+                    )
+                    if cross_sheet_result is not None:
+                        return cross_sheet_result
+
+                selected_sheet, workbook_metadata = self._resolve_sheet_selection(
+                    container,
+                    blob_path,
+                    sheet_name=sheet_name,
+                    sheet_index=sheet_index,
+                    require_explicit_sheet=True,
+                )
+                df = self._read_tabular_blob_to_dataframe(
+                    container,
+                    blob_path,
+                    sheet_name=selected_sheet,
+                    require_explicit_sheet=True,
+                )
+                df = self._try_numeric_conversion(df)
+
+                def _reported_sheet():
+                    # The sheet name is echoed back only when the metadata flags a workbook.
+                    return selected_sheet if workbook_metadata.get('is_workbook') else None
+
+                def _missing_column_response(missing_column_error):
+                    # Shared by the KeyError handlers of the filter step and the search step.
+                    missing_column = str(missing_column_error).strip("'")
+                    requested_columns = (
+                        *(parsed_search_columns or []),
+                        *(parsed_return_columns or []),
+                        filter_column,
+                        additional_filter_column,
+                    )
+                    related = [
+                        name for name in requested_columns
+                        if name and name != missing_column
+                    ]
+                    return json.dumps(
+                        self._build_missing_column_error_payload(
+                            container,
+                            blob_path,
+                            filename,
+                            workbook_metadata,
+                            selected_sheet,
+                            missing_column,
+                            related_columns=related or None,
+                            available_columns=list(df.columns),
+                        )
+                    )
+
+                try:
+                    filtered_df, applied_filters = self._apply_optional_dataframe_filters(
+                        df,
+                        **cohort_filters,
+                    )
+                except KeyError as missing_column_error:
+                    return _missing_column_response(missing_column_error)
+                except Exception as query_error:
+                    return json.dumps({
+                        'error': f"Query/filter error: {query_error}",
+                        'filename': filename,
+                        'selected_sheet': _reported_sheet(),
+                    })
+
+                try:
+                    search_result = self._search_dataframe_rows(
+                        filtered_df,
+                        **search_options,
+                        normalize_match=normalize_match_flag,
+                        max_rows=int(max_rows),
+                    )
+                except KeyError as missing_column_error:
+                    return _missing_column_response(missing_column_error)
+                except ValueError as search_error:
+                    return json.dumps({
+                        'error': str(search_error),
+                        'filename': filename,
+                        'selected_sheet': _reported_sheet(),
+                    })
+
+                return json.dumps({
+                    'filename': filename,
+                    'selected_sheet': _reported_sheet(),
+                    'search_value': search_value,
+                    'search_operator': search_operator,
+                    'searched_columns': search_result['searched_columns'],
+                    'matched_columns': search_result['matched_columns'],
+                    'return_columns': search_result['return_columns'],
+                    'filter_applied': applied_filters,
+                    'normalize_match': normalize_match_flag,
+                    'total_matches': search_result['total_matches'],
+                    'returned_rows': search_result['returned_rows'],
+                    'data': search_result['data'],
+                }, indent=2, default=str)
+            except Exception as e:
+                log_event(f"[TabularProcessingPlugin] Error searching rows: {e}", level=logging.WARNING)
+                return json.dumps({"error": str(e)})
+
+        return await asyncio.to_thread(_sync_work)
+
     @kernel_function(
         description=(
             "Execute a pandas query expression against a tabular file for advanced analysis. "
@@ -2745,11 +3845,17 @@ def _sync_work():
                 )
                 df = self._try_numeric_conversion(df)
 
-                result_df = df.query(query_expression)
+                result_df, used_reviewer_style_fallback = self._apply_query_expression_with_fallback(
+                    df,
+                    query_expression=query_expression,
+                    normalize_match=False,
+                )
                 limit = int(max_rows)
                 return json.dumps({
                     "filename": filename,
                     "selected_sheet": selected_sheet if workbook_metadata.get('is_workbook') else None,
+                    "query_expression": query_expression,
+                    "query_expression_fallback": used_reviewer_style_fallback,
                     "total_matches": len(result_df),
                     "returned_rows": min(len(result_df), limit),
                     "data": result_df.head(limit).to_dict(orient='records')
diff --git a/application/single_app/static/images/features/agent_action_grid_view.png b/application/single_app/static/images/features/agent_action_grid_view.png
index 011fecaf..eaf3c01b 100644
Binary files a/application/single_app/static/images/features/agent_action_grid_view.png and b/application/single_app/static/images/features/agent_action_grid_view.png differ
diff --git a/application/single_app/static/images/features/background_completion_notifications-01.png b/application/single_app/static/images/features/background_completion_notifications-01.png
index f46bb7b3..7f8a3034 100644
Binary files a/application/single_app/static/images/features/background_completion_notifications-01.png and b/application/single_app/static/images/features/background_completion_notifications-01.png differ
diff --git a/application/single_app/static/images/features/background_completion_notifications-02.png b/application/single_app/static/images/features/background_completion_notifications-02.png
index aeac80d8..e02771b4 100644
Binary files a/application/single_app/static/images/features/background_completion_notifications-02.png and b/application/single_app/static/images/features/background_completion_notifications-02.png differ
diff --git a/application/single_app/static/images/features/guided_tutorials_chat.png b/application/single_app/static/images/features/guided_tutorials_chat.png
index a519385b..b25d89e9 100644
Binary files a/application/single_app/static/images/features/guided_tutorials_chat.png and b/application/single_app/static/images/features/guided_tutorials_chat.png differ
diff --git a/application/single_app/static/images/features/guided_tutorials_workspace.png b/application/single_app/static/images/features/guided_tutorials_workspace.png
index 246d018b..0fccf64c 100644
Binary files a/application/single_app/static/images/features/guided_tutorials_workspace.png and b/application/single_app/static/images/features/guided_tutorials_workspace.png differ
diff --git a/application/single_app/static/images/features/sql_test_connection.png b/application/single_app/static/images/features/sql_test_connection.png
index ad2cd4ac..8b18123a 100644
Binary files a/application/single_app/static/images/features/sql_test_connection.png and b/application/single_app/static/images/features/sql_test_connection.png differ
diff --git a/application/single_app/static/images/features/tabular_analysis_enhanced_citations.png b/application/single_app/static/images/features/tabular_analysis_enhanced_citations.png
index 7247eded..b6474ed9 100644
Binary files a/application/single_app/static/images/features/tabular_analysis_enhanced_citations.png and b/application/single_app/static/images/features/tabular_analysis_enhanced_citations.png differ
diff --git a/application/single_app/static/images/features/thoughts_visibility.png b/application/single_app/static/images/features/thoughts_visibility.png
index 0346bbed..cb987ea6 100644
Binary files a/application/single_app/static/images/features/thoughts_visibility.png and b/application/single_app/static/images/features/thoughts_visibility.png differ
diff --git a/application/single_app/static/js/chat/chat-citations.js b/application/single_app/static/js/chat/chat-citations.js
index 60099398..9d751ffd 100644
--- a/application/single_app/static/js/chat/chat-citations.js
+++ b/application/single_app/static/js/chat/chat-citations.js
@@ -10,6 +10,9 @@ import { showEnhancedCitationModal } from './chat-enhanced-citations.js';
 // ------------------
 
 const chatboxEl = document.getElementById("chatbox");
+const AGENT_CITATION_PREVIEW_ROWS = 3;
+const AGENT_CITATION_EXPANDED_ROWS = 25;
+let activeAgentCitationState = null;
 
 function escapeAttribute(value) {
   return String(value)
@@ -310,8 +313,194 @@ export function showMetadataModal(metadataType, metadataContent, fileName) {
   modal.show();
 }
 
-export function showAgentCitationModal(toolName, toolArgs, toolResult) {
-  // Create or reuse the agent citation modal
+function parseAgentCitationValue(value) {
+  // Normalize a raw citation value: empty input -> null, JSON-looking strings
+  // -> parsed object/array, anything else -> returned unchanged.
+  if (value === null || value === undefined || value === "") {
+    return null;
+  }
+
+  // Non-strings (objects included) are already in their final form.
+  if (typeof value !== "string") {
+    return value;
+  }
+
+  // Only attempt JSON.parse when the text starts like an object or array.
+  const candidate = value.trim();
+  const opener = candidate.charAt(0);
+  if (opener !== "{" && opener !== "[") {
+    return value;
+  }
+  try {
+    return JSON.parse(candidate);
+  } catch (parseError) {
+    return value; // malformed JSON: keep the original string
+  }
+}
+
+function prettyPrintAgentCitationValue(value) {
+  // Render a citation value as display text; strings pass through verbatim.
+  const missing = value === null || value === undefined || value === "";
+  if (missing) {
+    return "No result";
+  }
+  if (typeof value === "string") {
+    return value;
+  }
+  try {
+    return JSON.stringify(value, null, 2);
+  } catch (stringifyError) {
+    return String(value); // JSON.stringify threw: fall back to String()
+  }
+}
+
+function cloneAgentCitationPayload(value) {
+  // JSON round-trip copy; null/undefined and unclonable values come back as-is.
+  if (value == null) {
+    return value;
+  }
+  try {
+    return JSON.parse(JSON.stringify(value));
+  } catch (cloneError) {
+    return value;
+  }
+}
+
+function isTabularAgentCitationResult(resultPayload) {
+  // A tabular result is a non-array object carrying a `data` array plus at
+  // least one of the row-count / file / sheet metadata keys.
+  if (!resultPayload || typeof resultPayload !== "object" || Array.isArray(resultPayload)) {
+    return false;
+  }
+  if (!Array.isArray(resultPayload.data)) {
+    return false;
+  }
+  const markerKeys = ["returned_rows", "total_matches", "filename", "selected_sheet"];
+  return markerKeys.some(
+    (key) => Object.prototype.hasOwnProperty.call(resultPayload, key)
+  );
+}
+
+function getAgentCitationRowLimit(rowMode, totalRowCount) {
+  // Number of rows to display for the given mode, never above the rows held.
+  switch (rowMode) {
+    case "all":
+      return totalRowCount;
+    case "expanded25":
+      return Math.min(totalRowCount, AGENT_CITATION_EXPANDED_ROWS);
+    default:
+      return Math.min(totalRowCount, AGENT_CITATION_PREVIEW_ROWS);
+  }
+}
+
+function buildAgentCitationResultView(resultPayload, rowMode) {
+  // Build what the result pane shows for the current row mode:
+  //   resultText  - pretty-printed result (rows trimmed for tabular payloads)
+  //   summaryText - counts joined with " • ", or "" for non-tabular results
+  //   controls    - [{ mode, label }] entries for switching the row mode
+  if (!isTabularAgentCitationResult(resultPayload)) {
+    // Non-tabular results are shown as-is with no summary or controls.
+    return {
+      resultText: prettyPrintAgentCitationValue(resultPayload),
+      summaryText: "",
+      controls: [],
+    };
+  }
+
+  const rows = Array.isArray(resultPayload.data) ? resultPayload.data : [];
+  const rowTotal = rows.length;
+  const shownCount = getAgentCitationRowLimit(rowMode, rowTotal);
+
+  // Trim a JSON-cloned copy rather than the payload that was passed in.
+  const trimmedPayload = cloneAgentCitationPayload(resultPayload) || {};
+  trimmedPayload.data = rows.slice(0, shownCount);
+  trimmedPayload.displayed_rows = shownCount;
+  trimmedPayload.data_rows_limited = shownCount < rowTotal;
+
+  // The summary lists whichever count fields the payload actually carries.
+  const hasKey = (key) => Object.prototype.hasOwnProperty.call(resultPayload, key);
+  const summaryParts = ["total_matches", "returned_rows"]
+    .filter(hasKey)
+    .map((key) => `${key}: ${resultPayload[key]}`);
+  summaryParts.push(`showing ${shownCount} row${shownCount === 1 ? "" : "s"}`);
+
+  // Offer every mode except the active one, and only when it changes the view.
+  const exceedsPreview = rowTotal > AGENT_CITATION_PREVIEW_ROWS;
+  const exceedsExpanded = rowTotal > AGENT_CITATION_EXPANDED_ROWS;
+  const candidateControls = [
+    { mode: "preview", label: "Show preview", available: exceedsPreview },
+    { mode: "expanded25", label: "Show 25 rows", available: exceedsExpanded },
+    { mode: "all", label: "Show all rows", available: exceedsPreview },
+  ];
+  const controls = candidateControls
+    .filter((candidate) => candidate.available && candidate.mode !== rowMode)
+    .map(({ mode, label }) => ({ mode, label }));
+
+  return {
+    resultText: JSON.stringify(trimmedPayload, null, 2),
+    summaryText: summaryParts.join(" • "),
+    controls,
+  };
+}
+
+function renderAgentCitationResult(toolResultEl, toolResultSummaryEl, toolResultActionsEl) {
+  // Repaint the result pane from activeAgentCitationState (no-op if anything is missing).
+  const elementsReady = toolResultEl && toolResultSummaryEl && toolResultActionsEl;
+  if (!elementsReady || !activeAgentCitationState) {
+    return;
+  }
+
+  const { parsedResult, rowMode } = activeAgentCitationState;
+  const { resultText, summaryText, controls } = buildAgentCitationResultView(parsedResult, rowMode);
+
+  toolResultEl.textContent = resultText || "No result";
+  toolResultSummaryEl.textContent = summaryText || "";
+  toolResultSummaryEl.classList.toggle("d-none", !summaryText);
+  // Rebuild the row-mode buttons from scratch on every render.
+  toolResultActionsEl.innerHTML = "";
+  toolResultActionsEl.classList.toggle("d-none", controls.length === 0);
+  for (const { mode, label } of controls) {
+    const modeButton = document.createElement("button");
+    modeButton.type = "button";
+    modeButton.className = "btn btn-sm btn-outline-secondary";
+    modeButton.textContent = label;
+    modeButton.setAttribute("data-row-mode", mode);
+    modeButton.addEventListener("click", () => {
+      activeAgentCitationState.rowMode = mode;
+      renderAgentCitationResult(toolResultEl, toolResultSummaryEl, toolResultActionsEl);
+    });
+    toolResultActionsEl.appendChild(modeButton);
+  }
+}
+
+async function fetchAgentCitationArtifact(conversationId, artifactId) {
+  // Load one stored agent citation; resolves to null when either id is missing
+  // or the response carries no `citation`, and throws on a non-OK status.
+  if (!(conversationId && artifactId)) {
+    return null;
+  }
+  const conversationSegment = encodeURIComponent(conversationId);
+  const artifactSegment = encodeURIComponent(artifactId);
+  const endpoint = `/api/conversation/${conversationSegment}/agent-citation/${artifactSegment}`;
+  const response = await fetch(endpoint, {
+    method: "GET",
+    headers: { "Content-Type": "application/json" },
+  });
+
+  let payload = null;
+  try {
+    payload = await response.json();
+  } catch (parseError) {
+    payload = null; // body was not valid JSON: treat it as absent
+  }
+  if (!response.ok) {
+    throw new Error(payload?.error || `Server responded with status ${response.status}`);
+  }
+
+  return payload?.citation || null;
+}
+
+export async function showAgentCitationModal(toolName, toolArgs, toolResult, options = {}) {
   let modalContainer = document.getElementById("agent-citation-modal");
   if (!modalContainer) {
     modalContainer = document.createElement("div");
@@ -344,8 +533,12 @@ export function showAgentCitationModal(toolName, toolArgs, toolResult) {
               <pre id="agent-tool-args" class="bg-light p-2 rounded" style="white-space: pre-wrap; word-wrap: break-word;"></pre>
             </div>
             <div class="mb-3">
-              <h6 class="fw-bold">Function Result:</h6>
-              <pre id="agent-tool-result" class="bg-light p-2 rounded" style="white-space: pre-wrap; word-wrap: break-word;"></pre>
+              <div class="d-flex flex-wrap justify-content-between align-items-center gap-2">
+                <h6 class="fw-bold mb-0">Function Result:</h6>
+                <div id="agent-tool-result-summary" class="text-muted small d-none"></div>
+              </div>
+              <div id="agent-tool-result-actions" class="d-none mt-2 d-flex flex-wrap gap-2"></div>
+              <pre id="agent-tool-result" class="bg-light p-2 rounded mt-2" style="white-space: pre-wrap; word-wrap: break-word;"></pre>
             </div>
           </div>
         </div>
@@ -354,109 +547,62 @@ export function showAgentCitationModal(toolName, toolArgs, toolResult) {
     document.body.appendChild(modalContainer);
   }
 
-  // Update the content
   const toolNameEl = document.getElementById("agent-tool-name");
   const toolArgsEl = document.getElementById("agent-tool-args");
   const toolResultEl = document.getElementById("agent-tool-result");
+  const toolResultSummaryEl = document.getElementById("agent-tool-result-summary");
+  const toolResultActionsEl = document.getElementById("agent-tool-result-actions");
   const toolSourceEl = document.getElementById("agent-tool-source");
   const toolUrlEl = document.getElementById("agent-tool-url");
   const toolUrlMetaEl = document.getElementById("agent-tool-url-meta");
 
-  if (toolNameEl) {
-    toolNameEl.textContent = toolName || "Unknown";
-  }
-  
-  let parsedArgs = null;
-  if (toolArgsEl) {
-    // Handle empty or no parameters more gracefully
-    let argsContent = "";
-    
+  const artifactId = options.artifactId || "";
+  const conversationId = options.conversationId
+    || window.chatConversations?.getCurrentConversationId?.()
+    || window.currentConversationId
+    || "";
+  let citationPayload = {
+    tool_name: toolName,
+    function_arguments: toolArgs,
+    function_result: toolResult,
+  };
+
+  if (artifactId && conversationId) {
+    showLoadingIndicator();
     try {
-      if (!toolArgs || toolArgs === "" || toolArgs === "{}") {
-        argsContent = "No parameters required";
-      } else {
-        parsedArgs = JSON.parse(toolArgs);
-        // Check if it's an empty object
-        if (typeof parsedArgs === 'object' && Object.keys(parsedArgs).length === 0) {
-          argsContent = "No parameters required";
-        } else {
-          argsContent = JSON.stringify(parsedArgs, null, 2);
-        }
-      }
-    } catch (e) {
-      // If it's not valid JSON, check if it's an object representation
-      if (toolArgs === "[object Object]" || !toolArgs || toolArgs.trim() === "") {
-        argsContent = "No parameters required";
-      } else {
-        argsContent = toolArgs;
+      const hydratedCitation = await fetchAgentCitationArtifact(conversationId, artifactId);
+      if (hydratedCitation && typeof hydratedCitation === "object") {
+        citationPayload = hydratedCitation;
       }
-    }
-    
-    // Add truncation with expand/collapse if content is long
-    if (argsContent.length > 300 && argsContent !== "No parameters required") {
-      const truncatedContent = argsContent.substring(0, 300);
-      const remainingContent = argsContent.substring(300);
-      
-      toolArgsEl.innerHTML = `
-        <div class="args-content position-relative">
-          <span class="args-truncated">${escapeHtml(truncatedContent)}</span><span class="args-remaining" style="display: none;">${escapeHtml(remainingContent)}</span>
-          <button class="btn btn-link p-0 ms-2 expand-args-btn" 
-                  style="font-size: 0.75rem; text-decoration: none; vertical-align: baseline;" 
-                  onclick="toggleArgsExpansion(this)">
-            <i class="bi bi-chevron-down" style="font-size: 0.7rem;"></i>
-          </button>
-        </div>
-      `;
-    } else {
-      toolArgsEl.textContent = argsContent;
+    } catch (error) {
+      console.warn("Failed to hydrate agent citation artifact, using compact payload.", error);
+    } finally {
+      hideLoadingIndicator();
     }
   }
-  
-  if (toolResultEl) {
-    // Handle result formatting and truncation with expand/collapse
-    let resultContent = "";
-    let parsedResult = null;
-    
-    try {
-      if (!toolResult || toolResult === "" || toolResult === "{}") {
-        resultContent = "No result";
-      } else if (toolResult === "[object Object]") {
-        resultContent = "No result data available";
-      } else {
-        // Try to parse as JSON first
-        try {
-          parsedResult = JSON.parse(toolResult);
-          resultContent = JSON.stringify(parsedResult, null, 2);
-        } catch (parseError) {
-          // If not JSON, treat as string
-          resultContent = toolResult;
-        }
-      }
-    } catch (e) {
-      resultContent = toolResult || "No result";
-    }
 
+  const parsedArgs = parseAgentCitationValue(citationPayload.function_arguments ?? toolArgs);
+  const parsedResult = parseAgentCitationValue(citationPayload.function_result ?? toolResult);
+  activeAgentCitationState = {
+    rowMode: "preview",
+    parsedArgs,
+    parsedResult,
+  };
+
+  if (toolNameEl) {
+    toolNameEl.textContent = citationPayload.tool_name || toolName || "Unknown";
+  }
+
+  if (toolArgsEl) {
+    toolArgsEl.textContent = parsedArgs === null
+      ? "No parameters required"
+      : prettyPrintAgentCitationValue(parsedArgs);
+  }
+
+  if (toolResultEl && toolResultSummaryEl && toolResultActionsEl) {
     const citationDetails = extractAgentCitationDetails(parsedResult || parsedArgs);
     updateAgentCitationSource(toolSourceEl, toolUrlEl, toolUrlMetaEl, citationDetails);
-    
-    // Add truncation with expand/collapse if content is long
-    if (resultContent.length > 300) {
-      const truncatedContent = resultContent.substring(0, 300);
-      const remainingContent = resultContent.substring(300);
-      
-      toolResultEl.innerHTML = `
-        <div class="result-content position-relative">
-          <span class="result-truncated">${escapeHtml(truncatedContent)}</span><span class="result-remaining" style="display: none;">${escapeHtml(remainingContent)}</span>
-          <button class="btn btn-link p-0 ms-2 expand-result-btn" 
-                  style="font-size: 0.75rem; text-decoration: none; vertical-align: baseline;" 
-                  onclick="toggleResultExpansion(this)">
-            <i class="bi bi-chevron-down" style="font-size: 0.7rem;"></i>
-          </button>
-        </div>
-      `;
-    } else {
-      toolResultEl.textContent = resultContent;
-    }
+    renderAgentCitationResult(toolResultEl, toolResultSummaryEl, toolResultActionsEl);
   }
 
   const modal = new bootstrap.Modal(modalContainer);
@@ -681,6 +827,10 @@ if (chatboxEl) {
       const toolName = target.getAttribute("data-tool-name");
       const toolArgs = target.getAttribute("data-tool-args");
       const toolResult = target.getAttribute("data-tool-result");
+      const artifactId = target.getAttribute("data-artifact-id");
+      const conversationId = target.getAttribute("data-conversation-id")
+        || window.chatConversations?.getCurrentConversationId?.()
+        || window.currentConversationId;
       
       if (!toolName) {
         console.warn("Agent citation link clicked but data-tool-name is missing.");
@@ -688,7 +838,10 @@ if (chatboxEl) {
         return;
       }
       
-      showAgentCitationModal(toolName, toolArgs, toolResult);
+      void showAgentCitationModal(toolName, toolArgs, toolResult, {
+        artifactId,
+        conversationId,
+      });
       
     } else if (target && target.matches("a.file-link")) { // Keep existing file link logic
       event.preventDefault();
@@ -719,42 +872,4 @@ function escapeHtml(text) {
   div.textContent = text;
   return div.innerHTML;
 }
-
-// Global function to toggle result expansion (called from inline onclick)
-window.toggleResultExpansion = function(button) {
-  const resultContent = button.closest('.result-content');
-  const remaining = resultContent.querySelector('.result-remaining');
-  const icon = button.querySelector('i');
-  
-  if (remaining.style.display === 'none') {
-    // Expand
-    remaining.style.display = 'inline';
-    icon.className = 'bi bi-chevron-up';
-    button.title = 'Show less';
-  } else {
-    // Collapse
-    remaining.style.display = 'none';
-    icon.className = 'bi bi-chevron-down';
-    button.title = 'Show more';
-  }
-};
-
-// Global function to toggle arguments expansion (called from inline onclick)
-window.toggleArgsExpansion = function(button) {
-  const argsContent = button.closest('.args-content');
-  const remaining = argsContent.querySelector('.args-remaining');
-  const icon = button.querySelector('i');
-  
-  if (remaining.style.display === 'none') {
-    // Expand
-    remaining.style.display = 'inline';
-    icon.className = 'bi bi-chevron-up';
-    button.title = 'Show less';
-  } else {
-    // Collapse
-    remaining.style.display = 'none';
-    icon.className = 'bi bi-chevron-down';
-    button.title = 'Show more';
-  }
-};
 // ---------------------------------------
\ No newline at end of file
diff --git a/application/single_app/static/js/chat/chat-documents.js b/application/single_app/static/js/chat/chat-documents.js
index 82b0f898..dde90dc5 100644
--- a/application/single_app/static/js/chat/chat-documents.js
+++ b/application/single_app/static/js/chat/chat-documents.js
@@ -34,6 +34,7 @@ const scopeSearchInput = document.getElementById("scope-search-input");
 export let personalDocs = [];
 export let groupDocs = [];
 export let publicDocs = [];
+const citationMetadataCache = new Map();
 
 // Items removed from the DOM by tag filtering (stored so they can be re-added)
 // Each entry: { element, nextSibling }
@@ -856,9 +857,46 @@ export function getDocumentMetadata(docId) {
   if (publicMatch) {
     return publicMatch;
   }
+  const cachedMatch = citationMetadataCache.get(docId);
+  if (cachedMatch) {
+    return cachedMatch;
+  }
   return null; // Not found in any list
 }
 
+export async function fetchDocumentMetadata(docId) {
+  // Resolves metadata for docId: getDocumentMetadata first, then the enhanced
+  // citations endpoint. Fetched records are cached under their `id` and
+  // `document_id`. Resolves to null for a falsy docId, non-OK reply, or error.
+  if (!docId) {
+    return null;
+  }
+
+  const known = getDocumentMetadata(docId);
+  if (known) {
+    return known;
+  }
+
+  try {
+    const endpoint = `/api/enhanced_citations/document_metadata?doc_id=${encodeURIComponent(docId)}`;
+    const reply = await fetch(endpoint, { credentials: 'same-origin' });
+    if (!reply.ok) {
+      return null;
+    }
+    const fetched = await reply.json();
+    // Register the record under each identifier it carries.
+    [fetched?.id, fetched?.document_id].forEach((cacheKey) => {
+      if (cacheKey) {
+        citationMetadataCache.set(cacheKey, fetched);
+      }
+    });
+    return fetched;
+  } catch (failure) {
+    console.warn('Error fetching citation document metadata:', failure);
+    return null;
+  }
+}
+
 /* ---------------------------------------------------------------------------
    Loading Documents
 --------------------------------------------------------------------------- */
@@ -1034,6 +1072,7 @@ export async function loadTagsForScope() {
   // Clear existing options in both hidden select and custom dropdown
   chatTagsFilter.innerHTML = '';
   if (tagsDropdownItems) tagsDropdownItems.innerHTML = '';
+  resetTagSelectionState();
 
   try {
     const scopes = getEffectiveScopes();
@@ -1244,6 +1283,24 @@ function hideTagsDropdown() {
   }
 }
 
+function resetTagSelectionState() {
+  // Deselects every tag <option> and unchecks every .tag-checkbox, then calls the
+  // search-filter reset, button-text sync, and tag-based document filter helpers.
+  const tagOptions = chatTagsFilter ? Array.from(chatTagsFilter.options) : [];
+  for (const tagOption of tagOptions) {
+    tagOption.selected = false;
+  }
+
+  const tagCheckboxes = tagsDropdownItems ? tagsDropdownItems.querySelectorAll('.tag-checkbox') : [];
+  for (const tagCheckbox of tagCheckboxes) {
+    tagCheckbox.checked = false;
+  }
+
+  tagsSearchController?.resetFilter();
+  syncTagsDropdownButtonText();
+  filterDocumentsBySelectedTags();
+}
+
 /* ---------------------------------------------------------------------------
    Sync Tags Dropdown Button Text with Selection State
 --------------------------------------------------------------------------- */
diff --git a/application/single_app/static/js/chat/chat-enhanced-citations.js b/application/single_app/static/js/chat/chat-enhanced-citations.js
index 93779da9..561a7831 100644
--- a/application/single_app/static/js/chat/chat-enhanced-citations.js
+++ b/application/single_app/static/js/chat/chat-enhanced-citations.js
@@ -3,7 +3,7 @@
 
 import { showToast } from "./chat-toast.js";
 import { showLoadingIndicator, hideLoadingIndicator } from "./chat-loading-indicator.js";
-import { getDocumentMetadata } from './chat-documents.js';
+import { getDocumentMetadata, fetchDocumentMetadata } from './chat-documents.js';
 
 /**
  * Determine file type from filename extension
@@ -36,9 +36,14 @@ export function getFileType(fileName) {
  * @param {string} citationId - Citation ID for fallback
  * @param {string|null} initialSheetName - Workbook sheet to open initially for tabular files
  */
-export function showEnhancedCitationModal(docId, pageNumberOrTimestamp, citationId, initialSheetName = null) {
-    // Get document metadata to determine file type
-    const docMetadata = getDocumentMetadata(docId);
+export async function showEnhancedCitationModal(docId, pageNumberOrTimestamp, citationId, initialSheetName = null) {
+    // Get document metadata to determine file type. Historical cited revisions
+    // are not in the current workspace list, so fetch on demand when needed.
+    let docMetadata = getDocumentMetadata(docId);
+    if (!docMetadata || !docMetadata.file_name) {
+        docMetadata = await fetchDocumentMetadata(docId);
+    }
+
     if (!docMetadata || !docMetadata.file_name) {
         console.warn('Document metadata not found, falling back to text citation');
         // Import fetchCitedText dynamically to avoid circular imports
diff --git a/application/single_app/static/js/chat/chat-messages.js b/application/single_app/static/js/chat/chat-messages.js
index 0c28e682..d350eb3a 100644
--- a/application/single_app/static/js/chat/chat-messages.js
+++ b/application/single_app/static/js/chat/chat-messages.js
@@ -448,6 +448,8 @@ function createCitationsHtml(
                  data-tool-name="${escapeHtml(cite.tool_name || '')}"
                  data-tool-args="${escapeHtml(toolArgs)}"
                  data-tool-result="${escapeHtml(toolResult)}"
+                 data-artifact-id="${escapeHtml(cite.artifact_id || '')}"
+                 data-conversation-id="${escapeHtml(window.currentConversationId || '')}"
                  title="Agent tool: ${escapeHtml(displayText)} - Click to view details">
                   <i class="bi bi-cpu me-1"></i>${escapeHtml(displayText)}
               </a>`;
@@ -2448,6 +2450,46 @@ function toggleMessageMetadata(messageDiv, messageId) {
  * Load message metadata into the drawer for AI/image/file messages
  */
 function loadMessageMetadataForDisplay(messageId, container) {
+  function renderHistoryContextRefRow(label, refs) {
+    // Renders one labelled row of message refs; shows "none" when refs is empty or not an array.
+    const hasRefs = Array.isArray(refs) && refs.length > 0;
+    const emptyRow = `<div class="mb-2"><span class="text-muted">${label}:</span> <span class="ms-2 text-muted">none</span></div>`;
+
+    return !hasRefs ? emptyRow : `
+      <div class="mb-2">
+        <div><span class="text-muted">${label}:</span></div>
+        <div class="ms-3 mt-1 text-break" style="white-space: pre-wrap; word-break: break-word;">${escapeHtml(refs.join(', '))}</div>
+      </div>
+    `;
+  }
+
+  function renderHistoryContextSection(historyContext) {
+    // Builds the "History Context" section markup; returns '' when historyContext is not an object.
+    if (!historyContext || typeof historyContext !== 'object') { return ''; }
+
+    const asCount = (value) => Number(value || 0);
+    return [
+      '<div class="mb-3">',
+      '<div class="fw-bold mb-2"><i class="bi bi-clock-history me-2"></i>History Context</div>',
+      '<div class="ms-3 small">',
+      `<div class="mb-1"><span class="text-muted">Path:</span> <code class="ms-2">${escapeHtml(String(historyContext.path || 'unknown'))}</code></div>`,
+      `<div class="mb-1"><span class="text-muted">Stored Messages:</span> <span class="ms-2 badge bg-secondary">${asCount(historyContext.stored_total_messages)}</span></div>`,
+      `<div class="mb-1"><span class="text-muted">History Limit:</span> <span class="ms-2 badge bg-secondary">${asCount(historyContext.history_limit)}</span></div>`,
+      `<div class="mb-1"><span class="text-muted">Older Messages:</span> <span class="ms-2 badge bg-secondary">${asCount(historyContext.older_message_count)}</span></div>`,
+      `<div class="mb-1"><span class="text-muted">Recent Selected:</span> <span class="ms-2 badge bg-info">${asCount(historyContext.recent_message_count)}</span></div>`,
+      `<div class="mb-1"><span class="text-muted">Final API Messages:</span> <span class="ms-2 badge bg-primary">${asCount(historyContext.final_api_message_count)}</span></div>`,
+      `<div class="mb-1"><span class="text-muted">Summary Requested:</span> <span class="ms-2 badge ${historyContext.summary_requested ? 'bg-warning text-dark' : 'bg-secondary'}">${historyContext.summary_requested ? 'Yes' : 'No'}</span></div>`,
+      `<div class="mb-1"><span class="text-muted">Summary Used:</span> <span class="ms-2 badge ${historyContext.summary_used ? 'bg-success' : 'bg-secondary'}">${historyContext.summary_used ? 'Yes' : 'No'}</span></div>`,
+      `<div class="mb-2"><span class="text-muted">Default System Prompt:</span> <span class="ms-2 badge ${historyContext.default_system_prompt_inserted ? 'bg-success' : 'bg-secondary'}">${historyContext.default_system_prompt_inserted ? 'Inserted' : 'Not inserted'}</span></div>`,
+      renderHistoryContextRefRow('Recent Refs', historyContext.selected_recent_message_refs),
+      renderHistoryContextRefRow('Summarized Refs', historyContext.summarized_message_refs),
+      renderHistoryContextRefRow('Skipped Inactive', historyContext.skipped_inactive_message_refs),
+      renderHistoryContextRefRow('Skipped Masked', historyContext.skipped_masked_message_refs),
+      renderHistoryContextRefRow('Final API Refs', historyContext.final_api_source_refs),
+      '</div></div>',
+    ].join('');
+  }
+
   fetch(`/api/message/${messageId}/metadata`)
     .then(response => {
       if (!response.ok) {
@@ -2471,6 +2513,7 @@ function loadMessageMetadataForDisplay(messageId, container) {
         active_thread: metadata.active_thread,
         thread_attempt: metadata.thread_attempt
       };
+      const historyContext = metadata.metadata?.history_context || null;
       
       if (threadInfo.thread_id) {
         html += '<div class="mb-3">';
@@ -2533,6 +2576,10 @@ function loadMessageMetadataForDisplay(messageId, container) {
         
         html += '</div></div>';
       }
+
+      if (metadata.role === 'assistant' && historyContext) {
+        html += renderHistoryContextSection(historyContext);
+      }
       
       html += '</div>';
       container.innerHTML = html;
diff --git a/application/single_app/static/js/chat/chat-thoughts.js b/application/single_app/static/js/chat/chat-thoughts.js
index e5ada65f..a405d918 100644
--- a/application/single_app/static/js/chat/chat-thoughts.js
+++ b/application/single_app/static/js/chat/chat-thoughts.js
@@ -14,6 +14,7 @@ let activeStreamingServerMessageId = null;
 // ---------------------------------------------------------------------------
 function getThoughtIcon(stepType) {
     const iconMap = {
+        'history_context': 'bi-diagram-3',
         'search': 'bi-search',
         'tabular_analysis': 'bi-table',
         'web_search': 'bi-globe',
diff --git a/application/single_app/static/js/public/public_workspace.js b/application/single_app/static/js/public/public_workspace.js
index 3b8f54a0..c24dfe2c 100644
--- a/application/single_app/static/js/public/public_workspace.js
+++ b/application/single_app/static/js/public/public_workspace.js
@@ -48,6 +48,178 @@ const publicPromptModal = new bootstrap.Modal(document.getElementById('publicPro
 const publicDocMetadataModal = new bootstrap.Modal(document.getElementById('publicDocMetadataModal'));
 const publicTagManagementModal = new bootstrap.Modal(document.getElementById('publicTagManagementModal'));
 const publicTagSelectionModal = new bootstrap.Modal(document.getElementById('publicTagSelectionModal'));
+const publicDocumentDeleteModalElement = document.getElementById('publicDocumentDeleteModal');
+const publicDocumentDeleteModal = publicDocumentDeleteModalElement ? new bootstrap.Modal(publicDocumentDeleteModalElement) : null;
+const publicDocumentDeleteModalTitle = document.getElementById('publicDocumentDeleteModalLabel');
+const publicDocumentDeleteModalBody = document.getElementById('publicDocumentDeleteModalBody');
+const publicDeleteCurrentBtn = document.getElementById('publicDeleteCurrentBtn');
+const publicDeleteAllBtn = document.getElementById('publicDeleteAllBtn');
+
+function getPublicDeleteModalContent(documentCount) {
+  // Returns the { title, body } pair for the delete dialog. The single-document
+  // wording is used only when documentCount is exactly 1.
+  const isSingleDocument = documentCount === 1;
+  const title = isSingleDocument ? 'Delete Public Document' : 'Delete Selected Public Documents';
+
+  // Leading whitespace inside the templates is part of the returned string.
+  const singleBody = `
+        <p class="mb-2">Choose how to delete this public document revision.</p>
+        <p class="mb-2"><strong>Delete Current Version</strong> removes the visible revision and keeps older revisions for future comparison.</p>
+        <p class="mb-0"><strong>Delete All Versions</strong> permanently removes every stored revision for this document.</p>
+      `;
+
+  const multiBody = `
+      <p class="mb-2">Choose how to delete ${documentCount} selected current public document revision(s).</p>
+      <p class="mb-2"><strong>Delete Current Version</strong> removes only the visible revision for each selected document and keeps older revisions.</p>
+      <p class="mb-0"><strong>Delete All Versions</strong> permanently removes every stored revision for each selected document.</p>
+    `;
+
+  return { title, body: isSingleDocument ? singleBody : multiBody };
+}
+
+function showPublicDocumentDeleteFeedback(message, variant = 'danger') {
+  // Reports a message: via window.showToast when defined, else a Bootstrap toast,
+  // else a dismissible alert, both placed in a fixed top-right container.
+  if (typeof window.showToast === 'function') {
+    window.showToast(message, variant);
+    return;
+  }
+
+  const hostId = 'publicDocumentDeleteFeedbackContainer';
+  let feedbackHost = document.getElementById(hostId);
+  if (!feedbackHost) {
+    feedbackHost = document.createElement('div');
+    feedbackHost.id = hostId;
+    feedbackHost.className = 'toast-container position-fixed top-0 end-0 p-3';
+    document.body.appendChild(feedbackHost);
+  }
+
+  const canUseBootstrapToast = window.bootstrap && typeof window.bootstrap.Toast === 'function';
+  if (!canUseBootstrapToast) {
+    const alertNode = document.createElement('div');
+    alertNode.className = `alert alert-${variant} alert-dismissible fade show mb-2`;
+    alertNode.setAttribute('role', 'alert');
+    const alertText = document.createElement('span');
+    alertText.textContent = message;
+    const alertDismiss = document.createElement('button');
+    alertDismiss.type = 'button';
+    alertDismiss.className = 'btn-close';
+    alertDismiss.setAttribute('data-bs-dismiss', 'alert');
+    alertDismiss.setAttribute('aria-label', 'Close');
+
+    alertNode.appendChild(alertText);
+    alertNode.appendChild(alertDismiss);
+    feedbackHost.appendChild(alertNode);
+    return;
+  }
+
+  const toastNode = document.createElement('div');
+  toastNode.className = `toast align-items-center text-white bg-${variant} border-0`;
+  toastNode.setAttribute('role', 'alert');
+  toastNode.setAttribute('aria-live', 'assertive');
+  toastNode.setAttribute('aria-atomic', 'true');
+
+  const toastRow = document.createElement('div');
+  toastRow.className = 'd-flex';
+  const toastText = document.createElement('div');
+  toastText.className = 'toast-body';
+  toastText.textContent = message;
+
+  const toastDismiss = document.createElement('button');
+  toastDismiss.type = 'button';
+  toastDismiss.className = 'btn-close btn-close-white me-2 m-auto';
+  toastDismiss.setAttribute('data-bs-dismiss', 'toast');
+  toastDismiss.setAttribute('aria-label', 'Close');
+
+  toastRow.appendChild(toastText);
+  toastRow.appendChild(toastDismiss);
+  toastNode.appendChild(toastRow);
+  feedbackHost.appendChild(toastNode);
+  const toastInstance = new window.bootstrap.Toast(toastNode);
+  toastInstance.show();
+  toastNode.addEventListener('hidden.bs.toast', () => {
+    toastNode.remove();
+  });
+}
+
+function isPublicDocumentDeleteModalReady() {
+  // True when the modal instance exists and each required element is present and attached.
+  if (!publicDocumentDeleteModal) {
+    return false;
+  }
+  const requiredElements = [
+    publicDocumentDeleteModalElement,
+    publicDocumentDeleteModalBody,
+    publicDeleteCurrentBtn,
+    publicDeleteAllBtn,
+  ];
+  return requiredElements.every((element) => Boolean(element && element.isConnected));
+}
+
+function promptPublicDeleteMode(documentCount = 1) {
+  // Shows the delete dialog and resolves with 'current_only', 'all_versions',
+  // or null (dialog hidden without a choice, or dialog unavailable).
+  if (!isPublicDocumentDeleteModalReady()) {
+    showPublicDocumentDeleteFeedback('Delete confirmation dialog is unavailable. Refresh the page and try again.');
+    return Promise.resolve(null);
+  }
+
+  const { title, body } = getPublicDeleteModalContent(documentCount);
+  if (publicDocumentDeleteModalTitle) {
+    publicDocumentDeleteModalTitle.textContent = title;
+  }
+  publicDocumentDeleteModalBody.innerHTML = body;
+
+  return new Promise((resolve) => {
+    let pending = true;
+    const bindings = [];
+    // Settles at most once and detaches every listener registered below.
+    const settle = (choice) => {
+      if (!pending) {
+        return;
+      }
+      pending = false;
+      bindings.forEach(([target, eventName, listener]) => {
+        target.removeEventListener(eventName, listener);
+      });
+      resolve(choice);
+    };
+
+    // Settle before hiding: should `hidden.bs.modal` fire while hide() is still
+    // running, the dismissal listener is already detached and cannot resolve null.
+    const chooseMode = (mode) => () => {
+      settle(mode);
+      publicDocumentDeleteModal.hide();
+    };
+    bindings.push(
+      [publicDocumentDeleteModalElement, 'hidden.bs.modal', () => settle(null)],
+      [publicDeleteCurrentBtn, 'click', chooseMode('current_only')],
+      [publicDeleteAllBtn, 'click', chooseMode('all_versions')],
+    );
+    bindings.forEach(([target, eventName, listener]) => {
+      target.addEventListener(eventName, listener);
+    });
+    publicDocumentDeleteModal.show();
+  });
+}
+
+async function requestPublicDocumentDeletion(documentId, deleteMode) {
+  // Sends DELETE for one public document; deleteMode travels as ?delete_mode=...
+  // Resolves with the parsed JSON body; rejects with an object carrying `error`.
+  const query = new URLSearchParams({ delete_mode: deleteMode });
+  // Encode the id so reserved characters cannot alter the request path.
+  const url = `/api/public_documents/${encodeURIComponent(documentId)}?${query.toString()}`;
+  const response = await fetch(url, { method: 'DELETE' });
+
+  // A missing, non-JSON, or falsy (e.g. JSON null) body is treated as an empty payload.
+  const responseData = (await response.json().catch(() => null)) || {};
+
+  if (!response.ok) {
+    throw responseData.error ? responseData : { error: `Server responded with status ${response.status}` };
+  }
+
+  return responseData;
+}
 
 // Editors
 let publicSimplemde = null;
@@ -794,7 +966,32 @@ async function onPublicUploadClick() {
     xhr.send(formData);
   });
 }
-window.deletePublicDocument=async function(id, event){ if(!confirm('Delete?')) return; try{ await fetch(`/api/public_documents/${id}`,{method:'DELETE'}); fetchPublicDocs(); }catch(e){ alert(`Error deleting: ${e.error||e.message}`);} };
+window.deletePublicDocument = async function(id, event) {
+  // Prompts for a delete mode, requests the deletion, then calls fetchPublicDocs(); the clicked trigger shows a spinner meanwhile.
+  const chosenMode = await promptPublicDeleteMode(1);
+  if (!chosenMode) {
+    return;
+  }
+
+  const trigger = event ? event.target.closest('a, button') : null;
+  const savedTriggerHtml = trigger ? trigger.innerHTML : null;
+  if (trigger) {
+    trigger.classList.add('disabled');
+    trigger.setAttribute('aria-disabled', 'true');
+    trigger.innerHTML = '<span class="spinner-border spinner-border-sm" role="status" aria-hidden="true"></span>';
+  }
+  try {
+    await requestPublicDocumentDeletion(id, chosenMode);
+    fetchPublicDocs();
+  } catch (failure) {
+    showPublicWorkspaceToast(`Error deleting: ${failure.error || failure.message}`, 'danger');
+    // Restore the trigger only if it is still part of the page.
+    if (trigger && document.body.contains(trigger)) {
+      trigger.classList.remove('disabled');
+      trigger.removeAttribute('aria-disabled');
+      trigger.innerHTML = savedTriggerHtml;
+    }
+  }
+};
 
 window.searchPublicDocumentInChat = function(docId) {
   window.location.href = `/chats?search_documents=true&doc_scope=public&document_id=${docId}&workspace_id=${activePublicId}`;
@@ -854,34 +1051,45 @@ function clearPublicSelection() {
 
 function deletePublicSelectedDocuments() {
   if (publicSelectedDocuments.size === 0) return;
-  if (!confirm(`Are you sure you want to delete ${publicSelectedDocuments.size} selected document(s)? This action cannot be undone.`)) return;
 
-  const deleteBtn = document.getElementById('public-delete-selected-btn');
-  if (deleteBtn) {
-    deleteBtn.disabled = true;
-    deleteBtn.innerHTML = '<span class="spinner-border spinner-border-sm me-1"></span>Deleting...';
-  }
+  promptPublicDeleteMode(publicSelectedDocuments.size).then((deleteMode) => {
+    if (!deleteMode) {
+      return;
+    }
 
-  const deletePromises = Array.from(publicSelectedDocuments).map(docId =>
-    fetch(`/api/public_documents/${docId}`, { method: 'DELETE' })
-      .then(r => r.ok ? r.json() : Promise.reject(r))
-  );
+    const deleteBtn = document.getElementById('public-delete-selected-btn');
+    if (deleteBtn) {
+      deleteBtn.disabled = true;
+      deleteBtn.innerHTML = '<span class="spinner-border spinner-border-sm me-1"></span>Deleting...';
+    }
 
-  Promise.allSettled(deletePromises)
-    .then(results => {
-      const successful = results.filter(r => r.status === 'fulfilled').length;
-      const failed = results.filter(r => r.status === 'rejected').length;
-      if (failed > 0) alert(`Deleted ${successful} document(s). ${failed} failed to delete.`);
-      publicSelectedDocuments.clear();
-      updatePublicBulkActionButtons();
-      fetchPublicDocs();
-    })
-    .finally(() => {
-      if (deleteBtn) {
-        deleteBtn.disabled = false;
-        deleteBtn.innerHTML = '<i class="bi bi-trash me-1"></i>Delete Selected';
-      }
-    });
+    const deletePromises = Array.from(publicSelectedDocuments).map((docId) => requestPublicDocumentDeletion(docId, deleteMode));
+
+    Promise.allSettled(deletePromises)
+      .then((results) => {
+        const successful = results.filter((result) => result.status === 'fulfilled').length;
+        const failed = results.filter((result) => result.status === 'rejected').length;
+        if (failed > 0) {
+          const toastType = successful === 0 ? 'danger' : 'warning';
+          showPublicWorkspaceToast(`Deleted ${successful} document(s). ${failed} failed to delete.`, toastType);
+        }
+
+        if (publicSelectionMode) {
+          togglePublicSelectionMode();
+        } else {
+          publicSelectedDocuments.clear();
+          updatePublicBulkActionButtons();
+        }
+
+        fetchPublicDocs();
+      })
+      .finally(() => {
+        if (deleteBtn) {
+          deleteBtn.disabled = false;
+          deleteBtn.innerHTML = '<i class="bi bi-trash me-1"></i>Delete Selected';
+        }
+      });
+  });
 }
 
 function chatWithPublicSelected() {
diff --git a/application/single_app/static/js/public/public_workspace_utility.js b/application/single_app/static/js/public/public_workspace_utility.js
index d55959c3..85316737 100644
--- a/application/single_app/static/js/public/public_workspace_utility.js
+++ b/application/single_app/static/js/public/public_workspace_utility.js
@@ -13,6 +13,53 @@ function escapeHtml(unsafe) {
   return div.innerHTML;
 }
 
+/**
+ * Shows a Bootstrap toast for public workspace actions.
+ * Falls back to a manually dismissed element when Bootstrap's Toast plugin is unavailable.
+ * @param {string} message - The message to display (HTML-escaped before insertion)
+ * @param {string} [type='info'] - Bootstrap contextual color; unknown values fall back to 'info'
+ * @param {number} [duration=5000] - Toast delay in milliseconds
+ */
+function showPublicWorkspaceToast(message, type = 'info', duration = 5000) {
+  const allowedTypes = ['primary', 'secondary', 'success', 'danger', 'warning', 'info', 'light', 'dark'];
+  // `type` is interpolated into a class attribute below, so only known color names are accepted.
+  const safeType = allowedTypes.includes(type) ? type : 'info';
+  let toastContainer = document.getElementById('toast-container');
+  if (!toastContainer) {
+    toastContainer = document.createElement('div');
+    toastContainer.id = 'toast-container';
+    toastContainer.className = 'toast-container position-fixed bottom-0 end-0 p-3';
+    toastContainer.style.zIndex = '1100';
+    document.body.appendChild(toastContainer);
+  }
+
+  const toastId = `public-workspace-toast-${Date.now()}-${Math.floor(Math.random() * 1000)}`;
+  toastContainer.insertAdjacentHTML('beforeend', `
+    <div id="${toastId}" class="toast align-items-center text-bg-${safeType} border-0" role="alert" aria-live="assertive" aria-atomic="true">
+      <div class="d-flex">
+        <div class="toast-body">${escapeHtml(message || '')}</div>
+        <button type="button" class="btn-close btn-close-white me-2 m-auto" data-bs-dismiss="toast" aria-label="Close"></button>
+      </div>
+    </div>
+  `);
+  // The toast was appended last, so take it directly instead of looking the generated ID up again.
+  const toastElement = toastContainer.lastElementChild;
+
+  if (!window.bootstrap || !window.bootstrap.Toast) {
+    // Without Bootstrap's JS nothing would ever dismiss the toast, so handle both paths manually.
+    toastElement.classList.add('show');
+    toastElement.querySelector('.btn-close').addEventListener('click', () => toastElement.remove());
+    setTimeout(() => toastElement.remove(), duration);
+    return;
+  }
+
+  // Register cleanup before showing so the element is always removed once it is hidden.
+  toastElement.addEventListener('hidden.bs.toast', () => toastElement.remove());
+  new window.bootstrap.Toast(toastElement, { delay: duration }).show();
+}
+
+window.showPublicWorkspaceToast = showPublicWorkspaceToast;
+
 /**
  * Updates the workspace status alert display based on workspace status
  * @param {Object} options - Configuration options
diff --git a/application/single_app/static/js/workspace/workspace-documents.js b/application/single_app/static/js/workspace/workspace-documents.js
index 481fe310..eefd0237 100644
--- a/application/single_app/static/js/workspace/workspace-documents.js
+++ b/application/single_app/static/js/workspace/workspace-documents.js
@@ -29,6 +29,12 @@ const docMetadataForm = document.getElementById("doc-metadata-form");
 const docsSharedOnlyFilter = document.getElementById("docs-shared-only-filter");
 const deleteSelectedBtn = document.getElementById("delete-selected-btn");
 const clearSelectionBtn = document.getElementById("clear-selection-btn");
+const documentDeleteModalElement = document.getElementById("documentDeleteModal");
+const documentDeleteModal = documentDeleteModalElement ? new bootstrap.Modal(documentDeleteModalElement) : null;
+const documentDeleteModalTitle = document.getElementById("documentDeleteModalLabel");
+const documentDeleteModalBody = document.getElementById("documentDeleteModalBody");
+const documentDeleteCurrentBtn = document.getElementById("documentDeleteCurrentBtn");
+const documentDeleteAllBtn = document.getElementById("documentDeleteAllBtn");
 
 // Selection mode variables
 let selectionModeActive = false;
@@ -84,6 +90,172 @@ function isColorLight(hexColor) {
     return luminance > 0.5;
 }
 
+function getDocumentDeleteModalContent(documentCount) {
+    if (documentCount === 1) {
+        return {
+            title: "Delete Document",
+            body: `
+                <p class="mb-2">Choose how to delete this document revision.</p>
+                <p class="mb-2"><strong>Delete Current Version</strong> removes the visible revision and keeps older revisions for later comparison.</p>
+                <p class="mb-0"><strong>Delete All Versions</strong> permanently removes every stored revision for this document.</p>
+            `,
+        };
+    }
+
+    return {
+        title: "Delete Selected Documents",
+        body: `
+            <p class="mb-2">Choose how to delete ${documentCount} selected current document revision(s).</p>
+            <p class="mb-2"><strong>Delete Current Version</strong> removes only the visible revision for each selected document and keeps older revisions.</p>
+            <p class="mb-0"><strong>Delete All Versions</strong> permanently removes every stored revision for each selected document.</p>
+        `,
+    };
+}
+
+function showDocumentDeleteFeedback(message, variant = "danger") {
+    if (typeof window.showToast === "function") {
+        window.showToast(message, variant);
+        return;
+    }
+
+    let container = document.getElementById("documentDeleteFeedbackContainer");
+    if (!container) {
+        container = document.createElement("div");
+        container.id = "documentDeleteFeedbackContainer";
+        container.className = "toast-container position-fixed top-0 end-0 p-3";
+        document.body.appendChild(container);
+    }
+
+    if (window.bootstrap && typeof window.bootstrap.Toast === "function") {
+        const toastElement = document.createElement("div");
+        toastElement.className = `toast align-items-center text-white bg-${variant} border-0`;
+        toastElement.setAttribute("role", "alert");
+        toastElement.setAttribute("aria-live", "assertive");
+        toastElement.setAttribute("aria-atomic", "true");
+
+        const wrapper = document.createElement("div");
+        wrapper.className = "d-flex";
+
+        const body = document.createElement("div");
+        body.className = "toast-body";
+        body.textContent = message;
+
+        const closeButton = document.createElement("button");
+        closeButton.type = "button";
+        closeButton.className = "btn-close btn-close-white me-2 m-auto";
+        closeButton.setAttribute("data-bs-dismiss", "toast");
+        closeButton.setAttribute("aria-label", "Close");
+
+        wrapper.appendChild(body);
+        wrapper.appendChild(closeButton);
+        toastElement.appendChild(wrapper);
+        container.appendChild(toastElement);
+
+        const toast = new window.bootstrap.Toast(toastElement);
+        toast.show();
+        toastElement.addEventListener("hidden.bs.toast", () => {
+            toastElement.remove();
+        });
+        return;
+    }
+
+    const alertElement = document.createElement("div");
+    alertElement.className = `alert alert-${variant} alert-dismissible fade show mb-2`;
+    alertElement.setAttribute("role", "alert");
+
+    const body = document.createElement("span");
+    body.textContent = message;
+
+    const closeButton = document.createElement("button");
+    closeButton.type = "button";
+    closeButton.className = "btn-close";
+    closeButton.setAttribute("data-bs-dismiss", "alert");
+    closeButton.setAttribute("aria-label", "Close");
+
+    alertElement.appendChild(body);
+    alertElement.appendChild(closeButton);
+    container.appendChild(alertElement);
+}
+
+/** Reports whether the delete modal instance exists and all of its controls are still attached to the DOM. */
+function isDocumentDeleteModalReady() {
+    if (!documentDeleteModal) {
+        return false;
+    }
+    const requiredElements = [
+        documentDeleteModalElement,
+        documentDeleteModalBody,
+        documentDeleteCurrentBtn,
+        documentDeleteAllBtn,
+    ];
+    return requiredElements.every((element) => Boolean(element && element.isConnected));
+}
+
+function promptDocumentDeleteMode(documentCount = 1) {
+    if (!isDocumentDeleteModalReady()) {
+        showDocumentDeleteFeedback("Delete confirmation dialog is unavailable. Refresh the page and try again.");
+        return Promise.resolve(null);
+    }
+
+    const modalContent = getDocumentDeleteModalContent(documentCount);
+    if (documentDeleteModalTitle) {
+        documentDeleteModalTitle.textContent = modalContent.title;
+    }
+    documentDeleteModalBody.innerHTML = modalContent.body;
+
+    return new Promise((resolve) => {
+        let settled = false;
+
+        const cleanup = () => {
+            documentDeleteModalElement.removeEventListener("hidden.bs.modal", handleHidden);
+            documentDeleteCurrentBtn.removeEventListener("click", handleCurrentOnly);
+            documentDeleteAllBtn.removeEventListener("click", handleAllVersions);
+        };
+
+        const finalize = (value) => {
+            if (settled) {
+                return;
+            }
+            settled = true;
+            cleanup();
+            resolve(value);
+        };
+
+        const handleHidden = () => finalize(null);
+        const handleCurrentOnly = () => {
+            documentDeleteModal.hide();
+            finalize("current_only");
+        };
+        const handleAllVersions = () => {
+            documentDeleteModal.hide();
+            finalize("all_versions");
+        };
+
+        documentDeleteModalElement.addEventListener("hidden.bs.modal", handleHidden);
+        documentDeleteCurrentBtn.addEventListener("click", handleCurrentOnly);
+        documentDeleteAllBtn.addEventListener("click", handleAllVersions);
+        documentDeleteModal.show();
+    });
+}
+
+/**
+ * Sends the DELETE request for one document; the ID is URL-encoded into the path.
+ * @param {string} documentId - ID of the document to delete
+ * @param {string} deleteMode - Sent as the `delete_mode` query parameter
+ * @returns {Promise<Object>} Parsed JSON body; {} when it is empty, non-JSON, or falsy
+ * @throws {Object} On a non-OK status: the body if it has `error`, else a synthesized `{ error }`
+ */
+async function requestDocumentDeletion(documentId, deleteMode) {
+    const query = new URLSearchParams({ delete_mode: deleteMode });
+    const url = `/api/documents/${encodeURIComponent(documentId)}?${query.toString()}`;
+    const response = await fetch(url, { method: "DELETE" });
+    const responseData = (await response.json().catch(() => null)) || {};
+    if (!response.ok) {
+        throw responseData.error ? responseData : { error: `Server responded with status ${response.status}` };
+    }
+    return responseData;
+}
+
 // ------------- Event Listeners -------------
 
 // Page Size
@@ -1252,59 +1424,37 @@ window.onExtractMetadata = function (docId, event) {
 };
 
 
-window.deleteDocument = function(documentId, event) {
-    if (!confirm("Are you sure you want to delete this document? This action cannot be undone.")) return;
+window.deleteDocument = async function(documentId, event) {
+    const deleteMode = await promptDocumentDeleteMode(1);
+    if (!deleteMode) {
+        return;
+    }
 
-    const deleteBtn = event ? event.target.closest('button') : null;
-    if (deleteBtn) {
-        deleteBtn.disabled = true;
-        deleteBtn.innerHTML = `<span class="spinner-border spinner-border-sm" role="status" aria-hidden="true"></span>`;
+    const deleteTrigger = event ? event.target.closest('a, button') : null;
+    const originalDeleteTriggerHtml = deleteTrigger ? deleteTrigger.innerHTML : null;
+    if (deleteTrigger) {
+        deleteTrigger.classList.add('disabled');
+        deleteTrigger.setAttribute('aria-disabled', 'true');
+        deleteTrigger.innerHTML = `<span class="spinner-border spinner-border-sm" role="status" aria-hidden="true"></span>`;
     }
 
-    // Stop polling if active for this document
     if (activePolls.has(documentId)) {
-        // Find the interval ID associated with this poll to clear it (more robust approach needed if storing interval IDs)
-        // For now, just remove from the active set; the poll will eventually fail or stop when elements disappear
         activePolls.delete(documentId);
-        // Ideally, you'd store intervalId with the docId in a map to clear it here.
     }
 
-
-    fetch(`/api/documents/${documentId}`, { method: "DELETE" })
-        .then(response => {
-            if (!response.ok) {
-                return response.json().then(data => Promise.reject(data)).catch(() => Promise.reject({ error: `Server responded with status ${response.status}` }));
-            }
-            return response.json();
-        })
-        .then(data => {
-            console.log("Document deleted successfully:", data);
-            const docRow = document.getElementById(`doc-row-${documentId}`);
-            const detailsRow = document.getElementById(`details-row-${documentId}`);
-            const statusRow = document.getElementById(`status-row-${documentId}`);
-            if (docRow) docRow.remove();
-            if (detailsRow) detailsRow.remove();
-            if (statusRow) statusRow.remove();
-
-             // Refresh if the table body becomes empty OR to update pagination total count
-             if (documentsTableBody && documentsTableBody.childElementCount === 0) {
-                 fetchUserDocuments(); // Refresh to show 'No documents' message and correct pagination
-             } else {
-                  // Maybe just decrement total count locally and re-render pagination?
-                  // For simplicity, a full refresh might be acceptable unless dealing with huge lists/slow API
-                  fetchUserDocuments(); // Refresh to update pagination potentially
-             }
-
-        })
-        .catch(error => {
-            console.error("Error deleting document:", error);
-            alert("Error deleting document: " + (error.error || error.message || "Unknown error"));
-            // Re-enable button only if it still exists
-            if (deleteBtn && document.body.contains(deleteBtn)) {
-                 deleteBtn.disabled = false;
-                 deleteBtn.innerHTML = '<i class="bi bi-trash-fill"></i>';
-            }
-        });
+    try {
+        const responseData = await requestDocumentDeletion(documentId, deleteMode);
+        console.log("Document deleted successfully:", responseData);
+        fetchUserDocuments();
+    } catch (error) {
+        console.error("Error deleting document:", error);
+        alert("Error deleting document: " + (error.error || error.message || "Unknown error"));
+        if (deleteTrigger && document.body.contains(deleteTrigger)) {
+            deleteTrigger.classList.remove('disabled');
+            deleteTrigger.removeAttribute('aria-disabled');
+            deleteTrigger.innerHTML = originalDeleteTriggerHtml;
+        }
+    }
 }
 
 window.removeSelfFromDocument = function(documentId, event) {
@@ -1468,64 +1618,43 @@ function updateBulkActionButtons() {
 }
 
 // Delete selected documents
-window.deleteSelectedDocuments = function() {
+window.deleteSelectedDocuments = async function() {
     if (selectedDocuments.size === 0) return;
-    
-    if (!confirm(`Are you sure you want to delete ${selectedDocuments.size} document(s)? This action cannot be undone.`)) {
+
+    const deleteMode = await promptDocumentDeleteMode(selectedDocuments.size);
+    if (!deleteMode) {
         return;
     }
-    
+
     const documentIds = Array.from(selectedDocuments);
-    let completed = 0;
-    let failed = 0;
-    
-    // Process each document deletion sequentially
-    documentIds.forEach(docId => {
-        fetch(`/api/documents/${docId}`, { method: "DELETE" })
-            .then(response => {
-                if (response.ok) {
-                    completed++;
-                    const docRow = document.getElementById(`doc-row-${docId}`);
-                    const detailsRow = document.getElementById(`details-row-${docId}`);
-                    const statusRow = document.getElementById(`status-row-${docId}`);
-                    if (docRow) docRow.remove();
-                    if (detailsRow) detailsRow.remove();
-                    if (statusRow) statusRow.remove();
-                } else {
-                    failed++;
-                }
-                
-                // Update status when all operations complete
-                if (completed + failed === documentIds.length) {
-                    if (failed > 0) {
-                        alert(`Deleted ${completed} document(s), but failed to delete ${failed} document(s).`);
-                    } else {
-                        alert(`Successfully deleted ${completed} document(s).`);
-                    }
-                    
-                    // Refresh the documents list
-                    fetchUserDocuments();
-                    
-                    // Exit selection mode
-                    window.toggleSelectionMode();
-                }
-            })
-            .catch(error => {
-                failed++;
-                console.error("Error deleting document:", error);
-                
-                // Update status when all operations complete
-                if (completed + failed === documentIds.length) {
-                    alert(`Deleted ${completed} document(s), but failed to delete ${failed} document(s).`);
-                    
-                    // Refresh the documents list
-                    fetchUserDocuments();
-                    
-                    // Exit selection mode
-                    window.toggleSelectionMode();
-                }
-            });
-    });
+    if (deleteSelectedBtn) {
+        deleteSelectedBtn.disabled = true;
+        deleteSelectedBtn.innerHTML = `<span class="spinner-border spinner-border-sm me-1" role="status" aria-hidden="true"></span>Deleting...`;
+    }
+
+    documentIds.forEach((docId) => activePolls.delete(docId));
+
+    const results = await Promise.allSettled(documentIds.map((docId) => requestDocumentDeletion(docId, deleteMode)));
+    const completed = results.filter((result) => result.status === 'fulfilled').length;
+    const failed = results.filter((result) => result.status === 'rejected').length;
+
+    if (failed > 0) {
+        alert(`Deleted ${completed} document(s), but failed to delete ${failed} document(s).`);
+    }
+
+    if (selectionModeActive) {
+        window.toggleSelectionMode();
+    } else {
+        selectedDocuments.clear();
+        updateBulkActionButtons();
+    }
+
+    fetchUserDocuments();
+
+    if (deleteSelectedBtn) {
+        deleteSelectedBtn.disabled = false;
+        deleteSelectedBtn.innerHTML = '<i class="bi bi-trash me-1"></i>Delete Selected';
+    }
 };
 
 // Remove self from selected shared documents
diff --git a/application/single_app/templates/group_workspaces.html b/application/single_app/templates/group_workspaces.html
index ea22c764..771649df 100644
--- a/application/single_app/templates/group_workspaces.html
+++ b/application/single_app/templates/group_workspaces.html
@@ -1688,6 +1688,199 @@ <h5 class="modal-title" id="groupTagSelectionModalLabel">Select Tags</h5>
   const groupTagSelectionModal = new bootstrap.Modal(
     document.getElementById("groupTagSelectionModal")
   );
+  const groupDocumentDeleteModalElement = document.getElementById(
+    "groupDocumentDeleteModal"
+  );
+  const groupDocumentDeleteModal = groupDocumentDeleteModalElement
+    ? new bootstrap.Modal(groupDocumentDeleteModalElement)
+    : null;
+  const groupDocumentDeleteModalTitle = document.getElementById(
+    "groupDocumentDeleteModalLabel"
+  );
+  const groupDocumentDeleteModalBody = document.getElementById(
+    "groupDocumentDeleteModalBody"
+  );
+  const groupDeleteCurrentBtn = document.getElementById(
+    "groupDeleteCurrentBtn"
+  );
+  const groupDeleteAllBtn = document.getElementById("groupDeleteAllBtn");
+
+  function getGroupDeleteModalContent(documentCount) {
+    if (documentCount === 1) {
+      return {
+        title: "Delete Group Document",
+        body: `
+          <p class="mb-2">Choose how to delete this group document revision.</p>
+          <p class="mb-2"><strong>Delete Current Version</strong> removes the visible revision and keeps older revisions for later comparison.</p>
+          <p class="mb-0"><strong>Delete All Versions</strong> permanently removes every stored revision for this document.</p>
+        `,
+      };
+    }
+
+    return {
+      title: "Delete Selected Group Documents",
+      body: `
+        <p class="mb-2">Choose how to delete ${documentCount} selected current group document revision(s).</p>
+        <p class="mb-2"><strong>Delete Current Version</strong> removes only the visible revision for each selected document and keeps older revisions.</p>
+        <p class="mb-0"><strong>Delete All Versions</strong> permanently removes every stored revision for each selected document.</p>
+      `,
+    };
+  }
+
+  function showGroupDocumentDeleteFeedback(message, variant = "danger") {
+    if (typeof window.showToast === "function") {
+      window.showToast(message, variant);
+      return;
+    }
+
+    let container = document.getElementById("groupDocumentDeleteFeedbackContainer");
+    if (!container) {
+      container = document.createElement("div");
+      container.id = "groupDocumentDeleteFeedbackContainer";
+      container.className = "toast-container position-fixed top-0 end-0 p-3";
+      document.body.appendChild(container);
+    }
+
+    if (window.bootstrap && typeof window.bootstrap.Toast === "function") {
+      const toastElement = document.createElement("div");
+      toastElement.className = `toast align-items-center text-white bg-${variant} border-0`;
+      toastElement.setAttribute("role", "alert");
+      toastElement.setAttribute("aria-live", "assertive");
+      toastElement.setAttribute("aria-atomic", "true");
+
+      const wrapper = document.createElement("div");
+      wrapper.className = "d-flex";
+
+      const body = document.createElement("div");
+      body.className = "toast-body";
+      body.textContent = message;
+
+      const closeButton = document.createElement("button");
+      closeButton.type = "button";
+      closeButton.className = "btn-close btn-close-white me-2 m-auto";
+      closeButton.setAttribute("data-bs-dismiss", "toast");
+      closeButton.setAttribute("aria-label", "Close");
+
+      wrapper.appendChild(body);
+      wrapper.appendChild(closeButton);
+      toastElement.appendChild(wrapper);
+      container.appendChild(toastElement);
+
+      const toast = new window.bootstrap.Toast(toastElement);
+      toast.show();
+      toastElement.addEventListener("hidden.bs.toast", () => {
+        toastElement.remove();
+      });
+      return;
+    }
+
+    const alertElement = document.createElement("div");
+    alertElement.className = `alert alert-${variant} alert-dismissible fade show mb-2`;
+    alertElement.setAttribute("role", "alert");
+
+    const body = document.createElement("span");
+    body.textContent = message;
+
+    const closeButton = document.createElement("button");
+    closeButton.type = "button";
+    closeButton.className = "btn-close";
+    closeButton.setAttribute("data-bs-dismiss", "alert");
+    closeButton.setAttribute("aria-label", "Close");
+
+    alertElement.appendChild(body);
+    alertElement.appendChild(closeButton);
+    container.appendChild(alertElement);
+  }
+
+  /** Reports whether the group delete modal instance exists and all of its controls are still attached to the DOM. */
+  function isGroupDocumentDeleteModalReady() {
+    if (!groupDocumentDeleteModal) {
+      return false;
+    }
+    const requiredElements = [
+      groupDocumentDeleteModalElement,
+      groupDocumentDeleteModalBody,
+      groupDeleteCurrentBtn,
+      groupDeleteAllBtn,
+    ];
+    return requiredElements.every((element) => Boolean(element && element.isConnected));
+  }
+
+  function promptGroupDeleteMode(documentCount = 1) {
+    if (!isGroupDocumentDeleteModalReady()) {
+      showGroupDocumentDeleteFeedback("Delete confirmation dialog is unavailable. Refresh the page and try again.");
+      return Promise.resolve(null);
+    }
+
+    const modalContent = getGroupDeleteModalContent(documentCount);
+    if (groupDocumentDeleteModalTitle) {
+      groupDocumentDeleteModalTitle.textContent = modalContent.title;
+    }
+    groupDocumentDeleteModalBody.innerHTML = modalContent.body;
+
+    return new Promise((resolve) => {
+      let settled = false;
+
+      const cleanup = () => {
+        groupDocumentDeleteModalElement.removeEventListener(
+          "hidden.bs.modal",
+          handleHidden
+        );
+        groupDeleteCurrentBtn.removeEventListener("click", handleCurrentOnly);
+        groupDeleteAllBtn.removeEventListener("click", handleAllVersions);
+      };
+
+      const finalize = (value) => {
+        if (settled) {
+          return;
+        }
+        settled = true;
+        cleanup();
+        resolve(value);
+      };
+
+      const handleHidden = () => finalize(null);
+      const handleCurrentOnly = () => {
+        groupDocumentDeleteModal.hide();
+        finalize("current_only");
+      };
+      const handleAllVersions = () => {
+        groupDocumentDeleteModal.hide();
+        finalize("all_versions");
+      };
+
+      groupDocumentDeleteModalElement.addEventListener(
+        "hidden.bs.modal",
+        handleHidden
+      );
+      groupDeleteCurrentBtn.addEventListener("click", handleCurrentOnly);
+      groupDeleteAllBtn.addEventListener("click", handleAllVersions);
+      groupDocumentDeleteModal.show();
+    });
+  }
+
+  /**
+   * Sends the DELETE request for one group document.
+   * The ID is URL-encoded so reserved characters cannot alter the request path.
+   * @param {string} documentId - ID of the group document to delete
+   * @param {string} deleteMode - Sent as the `delete_mode` query parameter
+   * @returns {Promise<Object>} Parsed JSON body; {} when the body is empty, non-JSON, or falsy
+   * @throws {Object} On a non-OK status: the body if it has `error`, else a synthesized `{ error }`
+   */
+  async function requestGroupDocumentDeletion(documentId, deleteMode) {
+    const query = new URLSearchParams({ delete_mode: deleteMode });
+    const url = `/api/group_documents/${encodeURIComponent(documentId)}?${query.toString()}`;
+    const response = await fetch(url, { method: "DELETE" });
+
+    // `|| {}` also covers a literal `null` body, which would otherwise break the `.error` read below.
+    const responseData = (await response.json().catch(() => null)) || {};
+    if (!response.ok) {
+      throw responseData.error
+        ? responseData
+        : { error: `Server responded with status ${response.status}` };
+    }
+    return responseData;
+  }
 
   // --- Editors ---
   const groupPromptContentEl = document.getElementById("group-prompt-content");
@@ -2129,7 +2322,7 @@ <h5 class="modal-title" id="groupTagSelectionModalLabel">Select Tags</h5>
       .finally(() => {
         if (deleteBtn) {
           deleteBtn.disabled = false;
-          deleteBtn.innerHTML = `<i class="bi bi-trash"></i> Delete`;
+            deleteBtn.innerHTML = `<i class="bi bi-trash me-1"></i>Delete Selected`;
         }
       });
   }
@@ -2418,6 +2611,27 @@ <h5 class="modal-title" id="groupTagSelectionModalLabel">Select Tags</h5>
               </ul>
             </div>
           </div>
+
+          <div class="modal fade" id="groupDocumentDeleteModal" tabindex="-1" aria-labelledby="groupDocumentDeleteModalLabel" aria-hidden="true" autocomplete="off" data-lpignore="true" data-1p-ignore="true" data-bwignore="true">
+            <div class="modal-dialog">
+              <div class="modal-content">
+                <div class="modal-header">
+                  <h5 class="modal-title" id="groupDocumentDeleteModalLabel">Delete Group Document</h5>
+                  <button type="button" class="btn-close" data-bs-dismiss="modal" aria-label="Close"></button>
+                </div>
+                <div class="modal-body" id="groupDocumentDeleteModalBody">
+                  <p class="mb-0">Choose how you want to delete this group document revision.</p>
+                </div>
+                <div class="modal-footer d-flex flex-wrap justify-content-between gap-2">
+                  <button type="button" class="btn btn-secondary" data-bs-dismiss="modal">Cancel</button>
+                  <div class="d-flex flex-wrap gap-2">
+                    <button type="button" class="btn btn-outline-danger" id="groupDeleteCurrentBtn">Delete Current Version</button>
+                    <button type="button" class="btn btn-danger" id="groupDeleteAllBtn">Delete All Versions</button>
+                  </div>
+                </div>
+              </div>
+            </div>
+          </div>
         `;
       }
     }
@@ -2833,39 +3047,43 @@ <h5 class="modal-title" id="groupTagSelectionModalLabel">Select Tags</h5>
   function fetchGroupDocuments() {
     if (!groupDocumentsTableBody || !activeGroupId) return; // Need table and active group
 
-    const placeholder = document.getElementById(
-      "group-legacy-update-prompt-placeholder"
-    );
-    if (placeholder) {
-      // remove old alert div if present
-      const old = placeholder.querySelector("#group-legacy-update-alert");
-      if (old) old.remove();
-    }
-
-    // Show loading state
-    groupDocumentsTableBody.innerHTML = `<tr class="table-loading-row"><td colspan="4"><div class="spinner-border spinner-border-sm me-2" role="status"></div> Loading group documents...</td></tr>`;
-    if (groupDocsPaginationContainer)
-      groupDocsPaginationContainer.innerHTML = ""; // Clear pagination
+    groupDocumentsTableBody.innerHTML = `
+      <tr class="table-loading-row">
+        <td colspan="4">
+          <div class="spinner-border spinner-border-sm me-2" role="status"><span class="visually-hidden">Loading...</span></div>
+          Loading group documents...
+        </td>
+      </tr>`;
+    if (groupDocsPaginationContainer) groupDocsPaginationContainer.innerHTML = "";
 
-    // Build query parameters for group documents endpoint
     const params = new URLSearchParams({
       page: groupDocsCurrentPage,
       page_size: groupDocsPageSize,
-      // Crucially, the backend /api/group_documents needs to know WHICH group
-      // It gets this from the user's active group setting server-side.
-      // We add filters here:
     });
-    if (groupDocsSearchTerm) params.append("search", groupDocsSearchTerm);
-    if (groupDocsClassificationFilter)
+    if (groupDocsSearchTerm) {
+      params.append("search", groupDocsSearchTerm);
+    }
+    if (groupDocsClassificationFilter) {
       params.append("classification", groupDocsClassificationFilter);
-    if (groupDocsAuthorFilter) params.append("author", groupDocsAuthorFilter);
-    if (groupDocsKeywordsFilter)
+    }
+    if (groupDocsAuthorFilter) {
+      params.append("author", groupDocsAuthorFilter);
+    }
+    if (groupDocsKeywordsFilter) {
       params.append("keywords", groupDocsKeywordsFilter);
-    if (groupDocsAbstractFilter)
+    }
+    if (groupDocsAbstractFilter) {
       params.append("abstract", groupDocsAbstractFilter);
-    if (groupDocsTagsFilter) params.append("tags", groupDocsTagsFilter);
-    if (groupDocsSortBy !== '_ts') params.append("sort_by", groupDocsSortBy);
-    if (groupDocsSortOrder !== 'desc') params.append("sort_order", groupDocsSortOrder);
+    }
+    if (groupDocsTagsFilter) {
+      params.append("tags", groupDocsTagsFilter);
+    }
+    if (groupDocsSortBy !== "_ts") {
+      params.append("sort_by", groupDocsSortBy);
+    }
+    if (groupDocsSortOrder !== "desc") {
+      params.append("sort_order", groupDocsSortOrder);
+    }
 
     console.log("Fetching group documents with params:", params.toString());
 
@@ -3564,7 +3782,7 @@ <h5 class="modal-title" id="groupTagSelectionModalLabel">Select Tags</h5>
   window.onExtractGroupMetadata = onExtractGroupMetadata; // Expose globally
 
   // --- Delete Group Document ---
-  function deleteGroupDocument(documentId, event) {
+  async function deleteGroupDocument(documentId, event) {
     // Renamed function
     // Permission check should happen server-side, but can add UI check too
     if (
@@ -3573,16 +3791,17 @@ <h5 class="modal-title" id="groupTagSelectionModalLabel">Select Tags</h5>
       alert("You do not have permission to delete documents in this group.");
       return;
     }
-    if (
-      !confirm(
-        "Are you sure you want to delete this group document? This action cannot be undone."
-      )
-    )
+
+    const deleteMode = await promptGroupDeleteMode(1);
+    if (!deleteMode) {
       return;
+    }
 
-    const deleteBtn = event ? event.target.closest("button") : null;
+    const deleteBtn = event ? event.target.closest("a, button") : null;
+    const originalDeleteBtnHtml = deleteBtn ? deleteBtn.innerHTML : null;
     if (deleteBtn) {
-      deleteBtn.disabled = true;
+      deleteBtn.classList.add("disabled");
+      deleteBtn.setAttribute("aria-disabled", "true");
       deleteBtn.innerHTML = `<span class="spinner-border spinner-border-sm"></span>`;
     }
 
@@ -3594,32 +3813,17 @@ <h5 class="modal-title" id="groupTagSelectionModalLabel">Select Tags</h5>
     // Use the group DELETE endpoint. Pass group_id as query param IF backend requires it.
     // Assuming backend gets active_group_id from session/context.
     // If needed: `/api/group_documents/${documentId}?group_id=${activeGroupId}`
-    fetch(`/api/group_documents/${documentId}`, { method: "DELETE" })
-      .then((response) =>
-        response.ok
-          ? response.json()
-          : response.json().then((err) => Promise.reject(err))
-      )
+    requestGroupDocumentDeletion(documentId, deleteMode)
       .then((data) => {
         console.log("Group document deleted:", data);
-        const docRow = document.getElementById(`group-doc-row-${documentId}`);
-        const detailsRow = document.getElementById(
-          `group-details-row-${documentId}`
-        );
-        const statusRow = document.getElementById(
-          `group-status-row-${documentId}`
-        );
-        if (docRow) docRow.remove();
-        if (detailsRow) detailsRow.remove();
-        if (statusRow) statusRow.remove();
-        // Refresh to update pagination etc.
         fetchGroupDocuments();
       })
       .catch((error) => {
         alert("Error deleting document: " + (error.error || error.message));
         if (deleteBtn && document.body.contains(deleteBtn)) {
-          deleteBtn.disabled = false;
-          deleteBtn.innerHTML = '<i class="bi bi-trash-fill"></i>';
+          deleteBtn.classList.remove("disabled");
+          deleteBtn.removeAttribute("aria-disabled");
+          deleteBtn.innerHTML = originalDeleteBtnHtml;
         }
       });
   }
diff --git a/application/single_app/templates/public_workspaces.html b/application/single_app/templates/public_workspaces.html
index 2d7b446b..447410ac 100644
--- a/application/single_app/templates/public_workspaces.html
+++ b/application/single_app/templates/public_workspaces.html
@@ -462,6 +462,28 @@ <h5 class="modal-title" id="publicDocMetadataModalLabel">Edit Document Metadata<
   </div>
 </div>
 
+<!-- Public Document Delete Modal -->
+<div class="modal fade" id="publicDocumentDeleteModal" tabindex="-1" aria-labelledby="publicDocumentDeleteModalLabel" aria-hidden="true">
+  <div class="modal-dialog">
+    <div class="modal-content">
+      <div class="modal-header">
+        <h5 class="modal-title" id="publicDocumentDeleteModalLabel">Delete Public Document</h5>
+        <button type="button" class="btn-close" data-bs-dismiss="modal" aria-label="Close"></button>
+      </div>
+      <div class="modal-body" id="publicDocumentDeleteModalBody">
+        <p class="mb-0">Choose how you want to delete this public document revision.</p>
+      </div>
+      <div class="modal-footer d-flex flex-wrap justify-content-between gap-2">
+        <button type="button" class="btn btn-secondary" data-bs-dismiss="modal">Cancel</button>
+        <div class="d-flex flex-wrap gap-2">
+          <button type="button" class="btn btn-outline-danger" id="publicDeleteCurrentBtn">Delete Current Version</button>
+          <button type="button" class="btn btn-danger" id="publicDeleteAllBtn">Delete All Versions</button>
+        </div>
+      </div>
+    </div>
+  </div>
+</div>
+
 <!-- Prompt Modal -->
 <div class="modal fade" id="publicPromptModal" tabindex="-1"><div class="modal-dialog modal-xl"><form id="public-prompt-form"><div class="modal-content"><div class="modal-header"><h5 class="modal-title" id="publicPromptModalLabel">Create Public Prompt</h5><button type="button" class="btn-close" data-bs-dismiss="modal"></button></div><div class="modal-body"><input type="hidden" id="public-prompt-id" /><div class="mb-3"><label for="public-prompt-name" class="form-label">Prompt Name</label><input type="text" class="form-control" id="public-prompt-name" required /></div><div class="mb-3"><label for="public-prompt-content" class="form-label">Prompt Content</label><textarea class="form-control" id="public-prompt-content" rows="10"></textarea></div></div><div class="modal-footer"><button id="public-prompt-save-btn" type="submit" class="btn btn-primary">Save Prompt</button></div></div></form></div></div>
 
diff --git a/application/single_app/templates/workspace.html b/application/single_app/templates/workspace.html
index 5adcf57f..3feee04f 100644
--- a/application/single_app/templates/workspace.html
+++ b/application/single_app/templates/workspace.html
@@ -1521,6 +1521,26 @@ <h6>Currently Shared With:</h6>
       <span class="tutorial-btn-label">Workspace Tutorial</span>
   </button>
 </div>
+<div class="modal fade" id="documentDeleteModal" tabindex="-1" aria-labelledby="documentDeleteModalLabel" aria-hidden="true" autocomplete="off" data-lpignore="true" data-1p-ignore="true" data-bwignore="true">
+  <div class="modal-dialog">
+    <div class="modal-content">
+      <div class="modal-header">
+        <h5 class="modal-title" id="documentDeleteModalLabel">Delete Document</h5>
+        <button type="button" class="btn-close" data-bs-dismiss="modal" aria-label="Close"></button>
+      </div>
+      <div class="modal-body" id="documentDeleteModalBody">
+        <p class="mb-0">Choose how you want to delete this document revision.</p>
+      </div>
+      <div class="modal-footer d-flex flex-wrap justify-content-between gap-2">
+        <button type="button" class="btn btn-secondary" data-bs-dismiss="modal">Cancel</button>
+        <div class="d-flex flex-wrap gap-2">
+          <button type="button" class="btn btn-outline-danger" id="documentDeleteCurrentBtn">Delete Current Version</button>
+          <button type="button" class="btn btn-danger" id="documentDeleteAllBtn">Delete All Versions</button>
+        </div>
+      </div>
+    </div>
+  </div>
+</div>
 <!-- Approve Shared Document Modal -->
 <div class="modal fade" id="approveSharedModal" tabindex="-1" aria-labelledby="approveSharedModalLabel" aria-hidden="true">
   <div class="modal-dialog">
@@ -1626,6 +1646,7 @@ <h5 class="modal-title" id="approveSharedModalLabel">Approve Shared Document</h5
         document.getElementById("workspaceTabContent"),
         document.getElementById("promptModal"),
         document.getElementById("docMetadataModal"),
+        document.getElementById("documentDeleteModal"),
         document.getElementById("bulkTagModal"),
         document.getElementById("tagManagementModal"),
         document.getElementById("tagSelectionModal"),
diff --git a/artifacts/SimpleChat.pdf b/artifacts/SimpleChat.pdf
new file mode 100644
index 00000000..28b4aeac
Binary files /dev/null and b/artifacts/SimpleChat.pdf differ
diff --git a/artifacts/release_timeline.pptx b/artifacts/release_timeline.pptx
index b165caf5..e8a00e6d 100644
Binary files a/artifacts/release_timeline.pptx and b/artifacts/release_timeline.pptx differ
diff --git a/docs/explanation/fixes/AGENT_TOOL_CITATION_FULL_RESULTS_FIX.md b/docs/explanation/fixes/AGENT_TOOL_CITATION_FULL_RESULTS_FIX.md
new file mode 100644
index 00000000..81d6459f
--- /dev/null
+++ b/docs/explanation/fixes/AGENT_TOOL_CITATION_FULL_RESULTS_FIX.md
@@ -0,0 +1,24 @@
+# AGENT TOOL CITATION FULL RESULTS FIX
+
+Fixed/Implemented in version: **0.240.048**
+
+Related config.py update: `VERSION = "0.240.048"`
+
+## Header Information
+
+- Issue description: Agent tool citations in chat showed a compact tabular summary with sample rows and truncated cell values, which made it difficult for users to verify whether the tool actually returned the correct rows.
+- Root cause analysis: The chat message stored a compact agent citation payload for performance, but the normal citation modal only rendered that compact payload and never hydrated the full raw artifact that was already persisted alongside the assistant message.
+- Version implemented: 0.240.048
+
+## Technical Details
+
+- Files modified: `application/single_app/route_frontend_conversations.py`, `application/single_app/static/js/chat/chat-messages.js`, `application/single_app/static/js/chat/chat-citations.js`, `application/single_app/config.py`, `functional_tests/test_agent_citation_full_results_modal.py`, `ui_tests/test_agent_citation_modal_full_results.py`
+- Code changes summary: Added a lazy conversation-scoped endpoint that returns the raw stored agent citation artifact on demand. Updated the chat citation buttons to carry artifact metadata, and changed the agent citation modal to fetch the raw payload when opened.
+- User-facing behavior: Tabular tool results now open with a short preview, can expand to 25 rows, and can then show all returned rows when more than 25 were returned by the tool call.
+- Testing approach: Added source-level regression coverage for the lazy artifact endpoint and row controls, plus a UI test that validates preview, 25-row, and full-row expansion in the browser.
+
+## Validation
+
+- Test results: Focused functional and UI coverage validate the new full-result hydration flow and the row expansion controls.
+- Before/after comparison: Before the fix, the citation modal only exposed the compact sample payload. After the fix, opening the citation loads the raw stored payload and lets the user inspect the entire returned row set.
+- User experience improvements: Users can verify tabular tool outputs directly from the citation modal without losing important rows to sample-only truncation.
\ No newline at end of file
diff --git a/docs/explanation/fixes/CHAT_CITATION_PAGE_SORT_FIX.md b/docs/explanation/fixes/CHAT_CITATION_PAGE_SORT_FIX.md
new file mode 100644
index 00000000..6a0157d5
--- /dev/null
+++ b/docs/explanation/fixes/CHAT_CITATION_PAGE_SORT_FIX.md
@@ -0,0 +1,52 @@
+# Chat Citation Page Sort Fix (v0.240.055)
+
+Fixed/Implemented in version: **0.240.055**
+
+## Header Information
+
+### Issue Description
+
+Streaming chat could fail after hybrid search completed when the citation list included both numeric page numbers and text page labels such as `Metadata` or `AI Vision`.
+
+This surfaced as `TypeError: '<' not supported between instances of 'int' and 'str'` while the backend tried to sort hybrid citations before finishing the response.
+
+### Root Cause Analysis
+
+`application/single_app/route_backend_chats.py` sorted hybrid citations with `page_number` directly as the key.
+
+Search chunk citations typically use numeric page values, but metadata-derived citations and vision citations use text labels. Python cannot compare those mixed types during sort, so the response failed after retrieval succeeded.
+
+### Version Implemented
+
+`0.240.055`
+
+## Technical Details
+
+### Files Modified
+
+- `application/single_app/route_backend_chats.py`
+- `application/single_app/config.py`
+- `functional_tests/test_chat_citation_page_sort_fix.py`
+
+### Code Changes Summary
+
+- Added `_coerce_citation_sort_number` to safely normalize numeric citation page or chunk values.
+- Added `_build_hybrid_citation_sort_key` so hybrid citations sort deterministically when `page_number` mixes integers, numeric strings, and text labels.
+- Updated both standard and streaming chat retrieval paths to use the shared helper instead of sorting directly on raw `page_number` values.
+- Preserved descending ordering for numeric page citations while keeping citations with text page labels in a stable order without raising type errors.
+- Bumped the application version to `0.240.055`.
+
+## Validation
+
+### Testing Approach
+
+- Added `functional_tests/test_chat_citation_page_sort_fix.py`.
+- Verified numeric strings and numeric page values normalize correctly for sorting.
+- Verified mixed numeric and text page labels sort without raising type errors.
+- Verified both standard and streaming chat paths call the shared citation sort helper.
+
+### Impact Analysis
+
+- Streaming chat no longer crashes after successful retrieval when metadata citations are present.
+- Standard chat now uses the same safer citation ordering logic, which removes the same latent mixed-type failure there.
+- Citation ordering remains deterministic across page excerpts, metadata citations, and AI vision citations.
\ No newline at end of file
diff --git a/docs/explanation/fixes/CHAT_HISTORY_GROUNDED_FOLLOW_UP_FIX.md b/docs/explanation/fixes/CHAT_HISTORY_GROUNDED_FOLLOW_UP_FIX.md
new file mode 100644
index 00000000..03173851
--- /dev/null
+++ b/docs/explanation/fixes/CHAT_HISTORY_GROUNDED_FOLLOW_UP_FIX.md
@@ -0,0 +1,57 @@
+# Chat History Grounded Follow-Up Fix (v0.240.055)
+
+Fixed/Implemented in version: **0.240.055**
+
+## Header Information
+
+### Issue Description
+
+Follow-up prompts that referred to previously cited documents could lose grounded retrieval when the user did not re-enable workspace search on the next turn.
+
+The app already replayed prior assistant citation summaries into conversation history, but if that replay was not enough to answer the follow-up, the backend had no exact bounded document set to re-query. That made grounded follow-ups weaker than they should be and risked forcing users to manually reselect the same document context.
+
+### Root Cause Analysis
+
+`application/single_app/route_backend_chats.py` reused prior assistant citation context in history, but it did not persist an exact latest grounded document anchor for later turns.
+
+When workspace search was off, the chat routes could only rely on conversation prose and citation summaries. They could not selectively retry retrieval against the exact previously grounded documents, and they had no explicit no-search grounding instruction to fail closed when prior context was insufficient.
+
+### Version Implemented
+
+`0.240.055`
+
+## Technical Details
+
+### Files Modified
+
+- `application/single_app/route_backend_chats.py`
+- `application/single_app/functions_conversation_metadata.py`
+- `application/single_app/config.py`
+- `functional_tests/test_chat_history_grounded_follow_up_fix.py`
+
+### Code Changes Summary
+
+- Added stable grounded-document persistence in `application/single_app/functions_conversation_metadata.py` via `last_grounded_document_refs`, including stable `document_id`, scope, scope id, filename, and classification.
+- Added helper logic in `application/single_app/route_backend_chats.py` to normalize prior grounded refs, derive bounded search parameters, and build the no-search grounding system instruction.
+- Updated both non-streaming and streaming chat paths to evaluate whether prior conversation history is sufficient before issuing any new retrieval.
+- Added a bounded fallback path that searches only the previously grounded documents when history alone is not enough and workspace search remains disabled.
+- Preserved existing explicit workspace-selection behavior by keeping current workspace search authoritative when the user turns it on.
+- Updated message and conversation metadata so fallback-grounded turns persist the effective document scope, selected documents, and retrieval query for later follow-ups.
+- Bumped the application version to `0.240.055`.
+
+## Validation
+
+### Testing Approach
+
+- Added `functional_tests/test_chat_history_grounded_follow_up_fix.py`.
+- Verified stable grounded refs are built from search-backed document usage across personal, group, and public scopes.
+- Verified prior grounded refs normalize from `last_grounded_document_refs` first and fall back to document tags when needed.
+- Verified bounded fallback search parameters keep retrieval limited to previously grounded documents and preserve scope-specific ids.
+- Verified both standard and streaming chat paths contain the history-only assessment, previously grounded document fallback, and no-search grounding prompt wiring.
+
+### Impact Analysis
+
+- Follow-up turns can now stay grounded even when the user asks a short continuation question without re-enabling workspace search.
+- Retrieval remains bounded to the exact previously grounded documents instead of widening back out to all available workspaces.
+- When history and bounded fallback retrieval are still insufficient, the model is explicitly instructed to ask the user to select a workspace or document instead of improvising.
+- The persisted `last_grounded_document_refs` metadata gives later turns a precise anchor for grounded follow-up behavior.
\ No newline at end of file
diff --git a/docs/explanation/fixes/CHAT_SCOPE_TAG_FILTER_FIX.md b/docs/explanation/fixes/CHAT_SCOPE_TAG_FILTER_FIX.md
new file mode 100644
index 00000000..d3ea2979
--- /dev/null
+++ b/docs/explanation/fixes/CHAT_SCOPE_TAG_FILTER_FIX.md
@@ -0,0 +1,22 @@
+# CHAT SCOPE TAG FILTER FIX
+
+Fixed/Implemented in version: **0.240.029**
+
+## Header Information
+
+- Issue description: Chat retrieval could return chunks from documents outside the selected tag scope when the chat scope was limited to personal, group, or public workspaces.
+- Root cause analysis: `hybrid_search()` only appended the tag OData clause in the `all` scope branch, while the dedicated `personal`, `group`, and `public` branches ignored `tags_filter` entirely.
+- Version implemented: 0.240.029
+
+## Technical Details
+
+- Files modified: `application/single_app/functions_search.py`, `application/single_app/config.py`, `functional_tests/test_chat_scope_tag_filter_fix.py`
+- Code changes summary: Added tag-clause composition to the personal, group, and public `hybrid_search()` branches and aligned their selected Azure AI Search fields to include `document_tags` consistently.
+- Testing approach: Added a focused functional regression test that inspects the scoped `hybrid_search()` branches and verifies the version bump.
+- Impact analysis: Chat requests that rely on tag selection now constrain retrieval consistently across personal, group, public, and all-scope searches.
+
+## Validation
+
+- Test results: Targeted functional regression test verifies the tag filter clause is present in every scoped search branch.
+- Before/after comparison: Before the fix, tag selection only constrained `all`-scope hybrid search; after the fix, every chat document scope applies the same tag enforcement.
+- User experience improvements: Asking for document summaries while a tag is selected now stays within the tagged subset instead of pulling unrelated documents from the same workspace.
\ No newline at end of file
diff --git a/docs/explanation/fixes/CHAT_STREAM_HISTORY_CONTEXT_FIX.md b/docs/explanation/fixes/CHAT_STREAM_HISTORY_CONTEXT_FIX.md
new file mode 100644
index 00000000..4f1c1bc2
--- /dev/null
+++ b/docs/explanation/fixes/CHAT_STREAM_HISTORY_CONTEXT_FIX.md
@@ -0,0 +1,63 @@
+# Chat Stream History Context Fix (v0.240.053)
+
+Fixed/Implemented in version: **0.240.053**
+
+## Header Information
+
+### Issue Description
+
+Follow-up prompts in chat streaming mode could lean too heavily on the latest reply because the streaming route rebuilt model history with a narrower, drifted code path.
+
+When the recent message window was small, older turns were dropped instead of summarized, which made short instructions like "please list the locations out in a single table" lose important context from earlier turns.
+
+### Root Cause Analysis
+
+`application/single_app/route_backend_chats.py` maintained two separate conversation-history builders.
+
+The non-streaming path already supported older-turn summarization, masked-message filtering, inactive-thread filtering, and richer file and image context handling. The streaming path had its own reduced implementation, so the two code paths diverged over time.
+
+### Version Implemented
+
+`0.240.053`
+
+## Technical Details
+
+### Files Modified
+
+- `application/single_app/route_backend_chats.py`
+- `application/single_app/config.py`
+- `functional_tests/test_chat_stream_history_context_fix.py`
+- `application/single_app/static/js/chat/chat-thoughts.js`
+- `application/single_app/static/js/chat/chat-messages.js`
+
+### Code Changes Summary
+
+- Added a shared `build_conversation_history_segments` helper inside `application/single_app/route_backend_chats.py`.
+- Switched both the streaming and non-streaming chat paths to use the same helper for recent-turn selection, older-turn summarization, masked-content removal, inactive-thread filtering, and file or image context conversion.
+- Updated the streaming path to keep the default system prompt insertion summary-aware, matching the non-streaming behavior.
+- Added compact `history_context` diagnostics so the backend records which message refs were treated as older, recent, summarized, skipped, and finally sent to the model.
+- Emitted the history context into thoughts, assistant metadata, and optional debug citations so follow-up context selection is visible during troubleshooting.
+- Kept the thoughts timeline concise by showing only the short history-context summary there, while leaving the detailed refs in message metadata and optional debug citations.
+- Hydrated prior assistant citation artifacts and appended tabular-aware, deduplicated citation results to assistant history turns so follow-up questions can reuse exact prior tool outputs instead of only the assistant prose.
+- Updated the chat message metadata drawer to render the new history-context detail.
+- Bumped the application version to `0.240.053`.
+
+## Validation
+
+### Testing Approach
+
+- Added `functional_tests/test_chat_stream_history_context_fix.py`.
+- Verified the shared history builder summarizes older turns when the recent window is smaller than the full conversation.
+- Verified masked and inactive messages are filtered before the final payload is sent to the model.
+- Verified both streaming and non-streaming routes call the shared helper.
+- Verified assistant history turns include prior citation results for follow-up prompts without dropping later file results behind redundant cross-sheet duplicates.
+- Verified history-context diagnostics stay available in backend thought and metadata plumbing, while the thoughts UI remains summary-only.
+
+### Impact Analysis
+
+- Streaming follow-up prompts now retain older conversational context through the same summary path already used elsewhere.
+- Short follow-up requests are less likely to anchor only on the immediately preceding answer.
+- Each assistant response now carries enough history-selection detail to confirm which message ids and roles actually reached the model.
+- The thoughts timeline stays readable instead of showing the full right-side history debug payload inline.
+- Follow-up questions can now reuse prior citation results, including exact tabular tool outputs that were only visible in the citation drawer before, while preserving distinct values from multiple files.
+- Future history-preparation changes now land in one place instead of drifting between two chat execution paths.
\ No newline at end of file
diff --git a/docs/explanation/fixes/CITATION_REVISION_LOOKUP_FIX.md b/docs/explanation/fixes/CITATION_REVISION_LOOKUP_FIX.md
new file mode 100644
index 00000000..31cdf919
--- /dev/null
+++ b/docs/explanation/fixes/CITATION_REVISION_LOOKUP_FIX.md
@@ -0,0 +1,51 @@
+# Citation Revision Lookup Fix (v0.240.024)
+
+Fixed/Implemented in version: **0.240.024**
+
+## Header Information
+
+### Issue Description
+
+Moving forward, once document revisioning is active, older chat citations must continue to resolve against the exact document revision that was cited when the message was created.
+
+The chat UI already preserves the citation chunk ID and enhanced citations already load documents by exact `doc_id`, but the text citation lookup route was still authorizing against mutable search chunk ownership fields instead of the exact document record behind the chunk.
+
+### Root Cause Analysis
+
+When an older personal revision is archived, chunk visibility updates rewrite the indexed chunk scope fields so the archived revision is no longer part of normal workspace search.
+
+That is correct for search visibility, but it means the chunk record is no longer a reliable source of document ownership for historical citation lookup. The authoritative source is the exact document metadata record identified by `document_id`.
+
+### Version Implemented
+
+`0.240.024`
+
+## Technical Details
+
+### Files Modified
+
+- `application/single_app/route_backend_documents.py`
+- `application/single_app/config.py`
+- `functional_tests/test_citation_revision_lookup_fix.py`
+
+### Code Changes Summary
+
+- Added citation helpers that extract the exact document ID behind the citation chunk.
+- Updated `/api/get_citation` to authorize citation access by resolving the exact document record for personal, group, and public scopes.
+- Kept citation content lookup keyed by the original chunk ID, while moving access checks to the revision-aware document metadata path.
+- Bumped the application version to `0.240.024`.
+
+## Validation
+
+### Testing Approach
+
+- Added `functional_tests/test_citation_revision_lookup_fix.py`.
+- Verified citation document ID extraction prefers chunk metadata and falls back to the chunk ID prefix when needed.
+- Verified citation access lookup uses the exact document ID across personal, group, and public scopes.
+- Verified enhanced citations still resolve blob-backed content from exact document metadata.
+
+### Impact Analysis
+
+- New conversations and citations created after revisioning is enabled resolve to the correct document revision by exact document ID.
+- Historical text citations no longer depend on archived search chunk scope fields to prove ownership.
+- Enhanced citations keep using the exact document record, including its stored blob path metadata, for revision-aware blob retrieval.
\ No newline at end of file
diff --git a/docs/explanation/fixes/DOCUMENT_REVISION_CURRENT_VERSION_FIX.md b/docs/explanation/fixes/DOCUMENT_REVISION_CURRENT_VERSION_FIX.md
new file mode 100644
index 00000000..7f940959
--- /dev/null
+++ b/docs/explanation/fixes/DOCUMENT_REVISION_CURRENT_VERSION_FIX.md
@@ -0,0 +1,81 @@
+# Document Revision Current Version Fix (v0.240.022)
+
+Fixed/Implemented in version: **0.240.022**
+
+## Header Information
+
+### Issue Description
+
+Uploading a document with the same name created a higher revision number, but the new revision started with empty tags and default classification metadata.
+
+Older revisions also remained visible in workspace document lists and continued to participate in chat search, which made the revision model unusable in day-to-day workspace flows.
+
+Deleting the visible revision did not distinguish between removing only the current revision and removing every stored version of that document.
+
+### Root Cause Analysis
+
+The document metadata model tracked a numeric `version`, but it did not maintain a stable revision family identifier or an explicit current-version flag.
+
+Duplicate uploads therefore behaved like unrelated documents for metadata inheritance, list filtering, search visibility, and deletion behavior.
+
+### Version Implemented
+
+`0.240.022`
+
+## Technical Details
+
+### Files Modified
+
+- `application/single_app/functions_documents.py`
+- `application/single_app/functions_search.py`
+- `application/single_app/route_backend_documents.py`
+- `application/single_app/route_backend_group_documents.py`
+- `application/single_app/route_backend_public_documents.py`
+- `application/single_app/route_external_public_documents.py`
+- `application/single_app/route_enhanced_citations.py`
+- `application/single_app/static/js/workspace/workspace-documents.js`
+- `application/single_app/static/js/public/public_workspace.js`
+- `application/single_app/templates/workspace.html`
+- `application/single_app/templates/public_workspaces.html`
+- `application/single_app/templates/group_workspaces.html`
+- `application/single_app/config.py`
+- `functional_tests/test_document_revision_current_version_fix.py`
+- `ui_tests/test_workspace_family_document_revision_delete_modal.py`
+
+### Code Changes Summary
+
+- Added revision-family metadata so duplicate-name uploads now share a stable `revision_family_id` and explicitly mark which revision is current.
+- Carried forward editable metadata such as title, abstract, keywords, publication date, authors, classification, tags, and sharing metadata when a new revision is created.
+- Archived older revisions from search visibility while keeping them stored for future comparison work.
+- Kept the active blob path at the existing alias shape `user-id/filename`, `group-id/filename`, or `public-workspace-id/filename` so current citations and workspace downloads keep their established path structure.
+- Added hierarchical archived revision blob paths at `user-id/revision-family-id/revision-document-id/filename`, `group-id/revision-family-id/revision-document-id/filename`, and `public-workspace-id/revision-family-id/revision-document-id/filename` so prior current blobs are preserved before overwrite.
+- Stored `blob_container`, `blob_path`, `archived_blob_path`, and `blob_path_mode` on document metadata and taught enhanced citations to prefer those values with legacy fallback.
+- Updated personal, group, public, and external public list routes so only current revisions are returned to workspace views.
+- Added revision-aware deletion so users can choose **Delete Current Version** or **Delete All Versions** from the workspace UI.
+- Bumped the application version to `0.240.022`.
+
+### Testing Approach
+
+- Added a functional regression test that validates revision-family metadata markers, hybrid alias-plus-archive blob paths, current-only route filtering, revision-aware delete mode handling, and version/documentation alignment.
+- Added a Playwright UI regression test that verifies the personal, group, and public workspace pages use Bootstrap revision delete modals instead of native browser confirms.
+
+### Impact Analysis
+
+- Duplicate uploads now behave like real document revisions instead of disconnected records.
+- Workspace lists and chat search now focus on the current revision while older revisions remain retained in storage.
+- Current document download and citation flows keep the established alias path, while older revisions now get their own preserved blob location before a new upload overwrites the alias.
+- Users can remove only the visible revision without automatically deleting older revisions, or choose to remove the full revision history when needed.
+
+## Validation
+
+### Before/After Comparison
+
+Before: same-name uploads reset tags and classification, older revisions stayed visible and searchable, deletion acted like a single hard delete with no revision choice, and blob storage overwrote prior binary content at the shared workspace alias path.
+
+After: same-name uploads inherit metadata into a new current revision, older revisions are retained but hidden from workspace/search flows, deletion offers **Delete Current Version** and **Delete All Versions**, and the previous current blob is archived at `scope-id/revision-family-id/revision-document-id/filename` before the alias path is overwritten.
+
+### Test Results
+
+- Functional regression coverage added in `functional_tests/test_document_revision_current_version_fix.py`.
+- UI regression coverage added in `ui_tests/test_workspace_family_document_revision_delete_modal.py`.
+- Current enhanced citation lookups now prefer stored blob metadata and fall back to legacy alias paths for older documents that have not been revised since the hybrid scheme was introduced.
\ No newline at end of file
diff --git a/docs/explanation/fixes/FACT_MEMORY_STREAMING_CONTEXT_FIX.md b/docs/explanation/fixes/FACT_MEMORY_STREAMING_CONTEXT_FIX.md
new file mode 100644
index 00000000..959062a0
--- /dev/null
+++ b/docs/explanation/fixes/FACT_MEMORY_STREAMING_CONTEXT_FIX.md
@@ -0,0 +1,48 @@
+# FACT MEMORY STREAMING CONTEXT FIX
+
+Fixed/Implemented in version: **0.240.051**
+
+Related config.py update: `VERSION = "0.240.051"`
+
+## Issue Description
+
+Saved fact-memory entries were present in the `agent_facts` Cosmos DB container, but normal chat usage still behaved as if fact memory was empty.
+
+## Root Cause Analysis
+
+- The standard `/api/chat` path prepended fact memory into the model context before agent execution.
+- The main `/api/chat/stream` path did not prepend the same fact-memory system message, so streaming conversations skipped saved facts entirely.
+- The fact lookup helper also overwrote the caller-provided agent id with the default configured agent id, which could break per-agent fact scoping.
+
+## Technical Details
+
+### Files Modified
+
+- `application/single_app/route_backend_chats.py`
+- `application/single_app/config.py`
+- `functional_tests/test_fact_memory_streaming_context_fix.py`
+
+### Code Changes Summary
+
+- Removed the fallback-to-default-agent overwrite inside the fact lookup helper so it now respects the selected agent id supplied by the current chat path.
+- Added a shared `inject_fact_memory_context(...)` helper that prepends both fact memory and conversation metadata to the model history.
+- Moved the fact-memory helpers into the shared `register_route_backend_chats(...)` scope so both `/api/chat` and `/api/chat/stream` can resolve them at runtime.
+- Wired that helper into both the standard chat path and the streaming chat path so agent conversations use the same fact-memory context assembly.
+- Bumped the application version to `0.240.051`.
+
+### Testing Approach
+
+- Functional regression: `functional_tests/test_fact_memory_streaming_context_fix.py`
+
+## Validation
+
+### Before
+
+- Facts could be stored successfully in Cosmos DB, but streaming chat requests still reached the model without a `<Fact Memory>` system message.
+- Fact lookup could silently use the default agent id instead of the selected agent id.
+
+### After
+
+- Both chat execution paths prepend the same fact-memory and conversation-metadata context before agent invocation.
+- Fact lookup preserves the selected agent id passed by the caller.
+- Saved facts in `agent_facts` now reach the streaming chat path instead of only the non-streaming route.
\ No newline at end of file
diff --git a/docs/explanation/fixes/HISTORICAL_ENHANCED_CITATION_REVISION_RENDERING_FIX.md b/docs/explanation/fixes/HISTORICAL_ENHANCED_CITATION_REVISION_RENDERING_FIX.md
new file mode 100644
index 00000000..513692e8
--- /dev/null
+++ b/docs/explanation/fixes/HISTORICAL_ENHANCED_CITATION_REVISION_RENDERING_FIX.md
@@ -0,0 +1,52 @@
+# Historical Enhanced Citation Revision Rendering Fix (v0.240.025)
+
+Fixed/Implemented in version: **0.240.025**
+
+## Header Information
+
+### Issue Description
+
+Once document revisioning is enabled, users can open a newer revision in a new chat while still expecting older chat citations to render the exact archived PDF or tabular file that was originally cited.
+
+The archived file content still exists in blob storage under the revision-aware path, but older chat citations were falling back to standard text/schema citations instead of opening the enhanced viewer.
+
+### Root Cause Analysis
+
+The chat page only keeps the current workspace document list in memory.
+
+Older chat citations reference exact historical `doc_id` values that are no longer part of that current-only list. `showEnhancedCitationModal(...)` required in-memory metadata to determine the file type, so it treated older cited revisions as unknown documents and immediately fell back to standard citation rendering before the archived blob could ever be requested.
+
+### Version Implemented
+
+`0.240.025`
+
+## Technical Details
+
+### Files Modified
+
+- `application/single_app/route_enhanced_citations.py`
+- `application/single_app/static/js/chat/chat-documents.js`
+- `application/single_app/static/js/chat/chat-enhanced-citations.js`
+- `application/single_app/config.py`
+- `functional_tests/test_historical_enhanced_citation_revision_rendering_fix.py`
+
+### Code Changes Summary
+
+- Added an enhanced citation metadata endpoint that resolves an exact `doc_id` across personal, group, and public workspaces.
+- Added client-side caching and on-demand metadata fetch for cited revisions that are not present in the current workspace document list.
+- Updated the enhanced citation modal flow so older chat citations can still render archived PDF and tabular content instead of falling back to standard text or schema citations.
+- Bumped the application version to `0.240.025`.
+
+## Validation
+
+### Testing Approach
+
+- Added `functional_tests/test_historical_enhanced_citation_revision_rendering_fix.py`.
+- Verified the chat client now fetches exact document metadata on demand for historical cited revisions.
+- Verified the enhanced citation backend exposes a metadata lookup route keyed by exact `doc_id`.
+- Verified version and fix documentation alignment for `0.240.025`.
+
+### Impact Analysis
+
+- Older chat citations now keep rendering archived PDF and tabular content after a newer document revision becomes current.
+- Current-only workspace document loading remains intact while historical citation rendering gains a revision-aware metadata lookup path.
\ No newline at end of file
diff --git a/docs/explanation/fixes/MULTI_FILE_TABULAR_DISTINCT_URL_ANALYSIS_FIX.md b/docs/explanation/fixes/MULTI_FILE_TABULAR_DISTINCT_URL_ANALYSIS_FIX.md
new file mode 100644
index 00000000..e786e903
--- /dev/null
+++ b/docs/explanation/fixes/MULTI_FILE_TABULAR_DISTINCT_URL_ANALYSIS_FIX.md
@@ -0,0 +1,40 @@
+# Multi-File Tabular Distinct URL Analysis Fix
+
+Issue description: Workspace chat could call tabular tools against multiple selected workbooks, but the final answer still depended on LLM planning and synthesis. In multi-file distinct SharePoint/site questions, the route could underuse successful tool results from later files and answer from only one workbook.
+
+Version implemented: 0.240.052
+
+Fixed in version: 0.240.052
+
+Root cause analysis: The existing tabular flow used one-file analytical tools correctly, but multi-file coverage across selected workbooks was still heuristic. The route delegated repeated per-file execution to the SK planner and reviewer recovery path, which could enrich one workbook more than another and hand the outer model separate tool summaries instead of one deterministic combined result.
+
+Technical details
+
+Files modified:
+- application/single_app/route_backend_chats.py
+- application/single_app/config.py
+- functional_tests/test_tabular_multi_file_distinct_url_union.py
+
+Code changes summary:
+- Added a narrow deterministic multi-file route branch for distinct URL/site questions.
+- Added schema-based sheet and column selection for URL/location-style workbook columns.
+- Added route-side union and exact de-duplication of per-file distinct URL results before final prompt handoff.
+- Rewired all existing workspace and chat tabular analysis call sites to go through the new multi-file-aware wrapper before falling back to the existing SK planner.
+
+Testing approach:
+- Added a functional test that validates multi-file mode detection, sheet and column selection, combined exact distinct-value union behavior, and route wiring.
+
+Impact analysis:
+- Single-file tabular behavior still falls through to the existing SK planner.
+- The new deterministic path only applies to a narrow multi-file distinct URL/site question shape, which limits risk to the rest of tabular analysis.
+
+Validation
+
+Before:
+- Multi-file distinct SharePoint/site questions could produce correct per-file tool executions but still answer from only one workbook.
+
+After:
+- Multi-file distinct SharePoint/site questions can union per-file results in the route before the final model response.
+
+Related functional tests:
+- functional_tests/test_tabular_multi_file_distinct_url_union.py
\ No newline at end of file
diff --git a/docs/explanation/fixes/PUBLIC_WORKSPACE_DELETE_TOAST_FIX.md b/docs/explanation/fixes/PUBLIC_WORKSPACE_DELETE_TOAST_FIX.md
new file mode 100644
index 00000000..95c88577
--- /dev/null
+++ b/docs/explanation/fixes/PUBLIC_WORKSPACE_DELETE_TOAST_FIX.md
@@ -0,0 +1,45 @@
+# PUBLIC_WORKSPACE_DELETE_TOAST_FIX
+
+Fixed/Implemented in version: **0.240.056**
+
+## Issue Description
+
+Public workspace document delete failures used blocking browser `alert(...)` dialogs instead of the app's Bootstrap toast pattern.
+
+## Root Cause Analysis
+
+The public workspace page did not have a shared notification helper for document delete failures, so the single-delete and bulk-delete error paths surfaced native alerts directly from `public_workspace.js`.
+
+## Technical Details
+
+Files modified:
+
+- `application/single_app/static/js/public/public_workspace_utility.js`
+- `application/single_app/static/js/public/public_workspace.js`
+- `application/single_app/config.py`
+- `functional_tests/test_public_workspace_delete_toast_fix.py`
+- `ui_tests/test_public_workspace_delete_error_toast.py`
+
+Code changes summary:
+
+- Added `showPublicWorkspaceToast()` to the shared public workspace utility script.
+- Routed single-document delete failures through the shared toast helper with a danger variant.
+- Routed bulk delete partial-failure messaging through the same toast helper with warning or danger variants.
+- Added source-level and UI regression coverage for the non-blocking delete failure experience.
+
+Testing approach:
+
+- Added a functional regression test that verifies the shared toast helper exists and the delete flows call it instead of `alert(...)`.
+- Added a Playwright UI regression test that intercepts a failing public document delete request and confirms the page shows a toast without raising a browser dialog.
+
+## Validation
+
+Before:
+
+- Failed public document deletes showed blocking browser alerts.
+- Bulk delete partial failures also used alerts, interrupting the workflow.
+
+After:
+
+- Public workspace delete failures surface in the shared Bootstrap toast container.
+- Delete failure messaging is non-blocking and consistent with the rest of the application's notification patterns.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_ALL_SCOPE_GROUP_SOURCE_CONTEXT_FIX.md b/docs/explanation/fixes/TABULAR_ALL_SCOPE_GROUP_SOURCE_CONTEXT_FIX.md
new file mode 100644
index 00000000..7504fb34
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_ALL_SCOPE_GROUP_SOURCE_CONTEXT_FIX.md
@@ -0,0 +1,40 @@
+# Tabular All-Scope Group Source Context Fix
+
+Fixed/Implemented in version: **0.240.032**
+
+Related config.py update: `VERSION = "0.240.032"`
+
+## Issue Description
+
+Tabular analysis could fail on group or public workbook files when chat document scope was set to `all`, even though the documents were present in search results and visible in blob storage.
+
+The failure showed up as `BlobNotFound` during workbook schema preload for files that were actually stored under group or public blob prefixes.
+
+## Root Cause Analysis
+
+- Hybrid search results already carried per-document `group_id` and `public_workspace_id`, but `collect_workspace_tabular_filenames()` reduced those results to a bare filename set.
+- The tabular analysis runner then applied one batch-wide `source_hint`, which resolves to `workspace` whenever `document_scope='all'`.
+- As a result, group and public workbook hits discovered in all-scope search were preloaded from the personal workspace container instead of their real blob locations.
+
+## Files Modified
+
+- `application/single_app/route_backend_chats.py`
+- `application/single_app/config.py`
+- `functional_tests/test_tabular_all_scope_group_source_context.py`
+
+## Code Changes Summary
+
+- Added per-file tabular source-context helpers so search hits and selected documents keep their original `group_id` or `public_workspace_id` metadata.
+- Updated both chat and streaming tabular-analysis paths to pass per-file source contexts into `run_tabular_sk_analysis()` instead of relying on one shared `source_hint` for the whole batch.
+- Updated schema-preload prompt context so each workbook advertises its own `source_context` metadata to later tool calls.
+- Preserved `public_workspace_id` alongside `group_id` on combined search documents so mixed-scope tabular analysis has the metadata it needs.
+
+## Testing Approach
+
+- Functional regression: `functional_tests/test_tabular_all_scope_group_source_context.py`
+
+## Validation
+
+- All-scope tabular search results now preserve group/public source metadata per file.
+- Group and public workbook hits found during `document_scope='all'` analysis preload against the correct blob container instead of defaulting to personal workspace storage.
+- Explicit selected tabular documents in `all` scope can now resolve from group and public Cosmos containers as well.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_AUTHOR_METADATA_NORMALIZATION_FIX.md b/docs/explanation/fixes/TABULAR_AUTHOR_METADATA_NORMALIZATION_FIX.md
new file mode 100644
index 00000000..16656c94
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_AUTHOR_METADATA_NORMALIZATION_FIX.md
@@ -0,0 +1,22 @@
+# TABULAR AUTHOR METADATA NORMALIZATION FIX
+
+Fixed/Implemented in version: **0.240.028**
+
+## Header Information
+
+- Issue description: Tabular uploads could fail during Azure AI Search indexing when the chunk `author` field contained `null` or blank list members.
+- Root cause analysis: Document metadata carried `authors` values forward without sanitization, and chunk indexing paths trusted those values when building the search payload.
+- Version implemented: 0.240.028
+
+## Technical Details
+
+- Files modified: `application/single_app/functions_documents.py`, `application/single_app/config.py`, `functional_tests/test_tabular_author_metadata_normalization_fix.py`
+- Code changes summary: Hardened `ensure_list()` to remove null and blank items, normalized carried-forward `authors` metadata, normalized chunk author values before single-chunk upload and chunk metadata sync, and defaulted new document `authors` values to an empty list.
+- Testing approach: Added a focused functional regression test that validates the helper behavior and checks the tabular indexing integration points in source.
+- Impact analysis: Prevents enhanced-citation tabular uploads from failing on invalid `author` metadata while preserving existing author lists that contain valid string values.
+
+## Validation
+
+- Test results: Targeted functional test validates author normalization behavior and version bump expectations.
+- Before/after comparison: Before the fix, `author` could reach Azure AI Search as `null` or contain null members; after the fix, it is always emitted as a list of non-empty strings.
+- User experience improvements: XLSX/CSV uploads that previously failed during schema-summary indexing now complete without the invalid-author payload error.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_CONTEXTUAL_CELL_SEARCH_FIX.md b/docs/explanation/fixes/TABULAR_CONTEXTUAL_CELL_SEARCH_FIX.md
new file mode 100644
index 00000000..106e0099
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_CONTEXTUAL_CELL_SEARCH_FIX.md
@@ -0,0 +1,24 @@
+# TABULAR CONTEXTUAL CELL SEARCH FIX
+
+Fixed/Implemented in version: **0.240.039**
+
+Related config.py update: `VERSION = "0.240.039"`
+
+## Header Information
+
+- Issue description: Workbook questions about embedded SharePoint links could still miss valid results in cases where a URL's inclusion depended on the surrounding text in the original cell rather than on the URL text itself.
+- Root cause analysis: The planner understood URL extraction, but it still treated `get_distinct_values(extract_mode='url')` as sufficient even when the relevant category signal lived in the full cell text. The raw fallback handoff also sampled only a handful of matching rows, so modest search cohorts could lose the context the outer model needed.
+- Version implemented: 0.240.039
+
+## Technical Details
+
+- Files modified: `application/single_app/route_backend_chats.py`, `application/single_app/semantic_kernel_plugins/tabular_processing_plugin.py`, `application/single_app/config.py`, `functional_tests/test_tabular_raw_tool_fallback.py`, `functional_tests/test_tabular_relational_analysis_helpers.py`, `functional_tests/test_tabular_llm_reviewer_recovery.py`, `functional_tests/test_tabular_multisheet_tool_start_guidance.py`, `functional_tests/test_tabular_all_scope_group_source_context.py`
+- Code changes summary: Clarified that `filter_rows` is the text-search tool for context-sensitive cell matching, updated reviewer and main analysis prompts to search/filter the original text column before classifying embedded URLs, and preserved complete small filter/query row sets in the raw fallback handoff when they fit the prompt budget.
+- Testing approach: Added regression coverage for full row-context preservation in fallback summaries and updated prompt/version checks for the new contextual search guidance.
+- Impact analysis: Context-dependent workbook questions can now preserve the original matching cell text instead of forcing the outer model to infer category membership from extracted URLs alone.
+
+## Validation
+
+- Test results: Focused tabular regressions verify prompt guidance, reviewer recovery wiring, full small-row fallback preservation, and the updated version checks.
+- Before/after comparison: Before the fix, reviewer recovery could jump straight to URL extraction and the fallback handoff sampled only a few matching rows. After the fix, the planner is told to search/filter the original text column first when context matters, and modest row cohorts can survive the handoff intact.
+- User experience improvements: Questions like counting SharePoint sites from mixed `Location` cells can retain the cell context needed to include URLs whose host/path text does not itself contain the qualifying keyword.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_DISTINCT_VALUE_HANDOFF_FIX.md b/docs/explanation/fixes/TABULAR_DISTINCT_VALUE_HANDOFF_FIX.md
new file mode 100644
index 00000000..ead6fc23
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_DISTINCT_VALUE_HANDOFF_FIX.md
@@ -0,0 +1,24 @@
+# TABULAR DISTINCT VALUE HANDOFF FIX
+
+Fixed/Implemented in version: **0.240.036**
+
+Related config.py update: `VERSION = "0.240.036"`
+
+## Header Information
+
+- Issue description: Successful `get_distinct_values` reviewer-recovery runs could still produce weak final answers because the outer-model handoff compacted the value list too aggressively.
+- Root cause analysis: The reviewer recovery stage executed the right analytical tool, but the raw fallback formatter treated distinct-value lists like generic payloads and reduced them to a tiny preview. The outer GPT then saw a truncated list and answered conservatively instead of using the tool-backed values.
+- Version implemented: 0.240.036
+
+## Technical Details
+
+- Files modified: `application/single_app/route_backend_chats.py`, `application/single_app/config.py`, `functional_tests/test_tabular_raw_tool_fallback.py`, `functional_tests/test_tabular_llm_reviewer_recovery.py`, `functional_tests/test_tabular_multisheet_tool_start_guidance.py`, `functional_tests/test_tabular_all_scope_group_source_context.py`
+- Code changes summary: Added a list-aware fallback path for `get_distinct_values` so full scalar value lists are preserved when they fit the prompt budget, updated the reviewer prompt to favor filtered distinct-value calls for subset questions, and clarified that full scalar lists can be enumerated directly by the outer model.
+- Testing approach: Added regression coverage for preserved distinct-value lists, reviewer prompt guidance, and the version bump across the related tabular tests.
+- Impact analysis: List-style workbook questions can now survive the inner-to-outer handoff without losing the tool-backed values the outer GPT needs to answer directly.
+
+## Validation
+
+- Test results: Focused regressions verify distinct-value fallback preservation, reviewer guidance, and the preserved tabular orchestration/version checks.
+- Before/after comparison: Before the fix, reviewer recovery could succeed but the final answer still claimed truncation because only a preview of the distinct list survived. After the fix, full scalar lists are handed to the outer model whenever they fit the prompt budget.
+- User experience improvements: Questions like listing SharePoint sites from a workbook column now have a better chance of producing the full list instead of a conservative fallback response.
diff --git a/docs/explanation/fixes/TABULAR_EMBEDDED_VALUE_EXTRACTION_FIX.md b/docs/explanation/fixes/TABULAR_EMBEDDED_VALUE_EXTRACTION_FIX.md
new file mode 100644
index 00000000..bb102c89
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_EMBEDDED_VALUE_EXTRACTION_FIX.md
@@ -0,0 +1,24 @@
+# TABULAR EMBEDDED VALUE EXTRACTION FIX
+
+Fixed/Implemented in version: **0.240.038**
+
+Related config.py update: `VERSION = "0.240.038"`
+
+## Header Information
+
+- Issue description: Workbook questions about SharePoint sites, links, or other identifiers embedded inside composite text cells could return inflated or misleading distinct counts because the plugin counted whole-cell strings instead of extracted matches.
+- Root cause analysis: `get_distinct_values` only deduplicated the full rendered cell value. When a cell contained descriptive prefixes plus a URL or other embedded identifier, the tool returned distinct cell strings instead of distinct extracted matches.
+- Version implemented: 0.240.038
+
+## Technical Details
+
+- Files modified: `application/single_app/semantic_kernel_plugins/tabular_processing_plugin.py`, `application/single_app/semantic_kernel_plugins/plugin_invocation_logger.py`, `application/single_app/route_backend_chats.py`, `application/single_app/config.py`, `functional_tests/test_tabular_relational_analysis_helpers.py`, `functional_tests/test_tabular_raw_tool_fallback.py`, `functional_tests/test_tabular_llm_reviewer_recovery.py`, `functional_tests/test_tabular_multisheet_tool_start_guidance.py`, `functional_tests/test_tabular_all_scope_group_source_context.py`
+- Code changes summary: Extended `get_distinct_values` with generic embedded extraction support for URLs and regex matches, added optional `url_path_segments` normalization for higher-level URL roots, updated planner guidance to prefer extraction over whole-cell distinct counts for embedded identifiers, and improved plugin invocation logs with compact structured summaries.
+- Testing approach: Added focused regressions for embedded URL extraction, regex extraction, raw fallback metadata preservation, and the updated prompt/version checks.
+- Impact analysis: Questions like counting SharePoint sites in filtered workbook rows can now extract and deduplicate canonical URLs instead of miscounting composite cell text.
+
+## Validation
+
+- Test results: Focused tabular regressions verify embedded URL extraction, regex extraction, raw fallback metadata preservation, and the updated route/version checks.
+- Before/after comparison: Before the fix, a tool call such as `get_distinct_values(column='Location')` could report many distinct composite cell strings without isolating the embedded SharePoint URLs. After the fix, the same filtered cohort can extract normalized URL roots or regex matches and return deterministic distinct counts.
+- User experience improvements: Embedded identifiers inside descriptive text cells are now analyzable with a reusable plugin capability rather than ad hoc heuristics.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_ENHANCED_CITATIONS_SCHEMA_SUMMARY_FIX.md b/docs/explanation/fixes/TABULAR_ENHANCED_CITATIONS_SCHEMA_SUMMARY_FIX.md
new file mode 100644
index 00000000..d9077be3
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_ENHANCED_CITATIONS_SCHEMA_SUMMARY_FIX.md
@@ -0,0 +1,52 @@
+# Tabular Enhanced Citations Schema Summary Fix (v0.240.023)
+
+Fixed/Implemented in version: **0.240.023**
+
+## Overview
+
+Enhanced-citation tabular uploads are supposed to store the original file in blob storage and index a single compact schema-summary chunk for discovery. A regression path in `process_tabular()` still allowed any schema-summary error to silently fall back to legacy row-by-row chunking, which made large CSV and workbook uploads look like standard citations again.
+
+## Root Cause
+
+The enhanced-citation branch built a schema summary inside a broad `try/except`. If any part of that summary generation or indexing path failed, the code logged a warning and continued into the standard row-chunking branch.
+
+For large or wide tabular files this meant:
+
+- the upload created thousands of indexed chunks instead of a single schema summary
+- `number_of_pages` reflected legacy chunk counts again
+- the workspace experience no longer matched the intended enhanced-citation tabular workflow
+
+## Technical Details
+
+### Files Modified
+
+| File | Change |
+| --- | --- |
+| `application/single_app/functions_documents.py` | Added bounded schema-summary helpers for tabular files, compact fallback summary generation, and a guard that prevents enhanced-citation uploads from silently reverting to row chunking |
+| `application/single_app/config.py` | Bumped version from `0.240.022` to `0.240.023` |
+| `functional_tests/test_tabular_enhanced_citations_schema_summary_fix.py` | Added regression coverage for bounded schema summaries, the no-row-fallback guard, and the version bump |
+
+### Code Changes Summary
+
+- Added compact tabular schema-summary helpers that limit sheet count, column count, preview rows, and individual cell length.
+- Added a minimal summary fallback that still preserves blob-backed tabular analysis when a richer schema summary cannot be built.
+- Changed `process_tabular()` so row-by-row chunking only runs when enhanced citations is disabled.
+- Replaced the previous silent fallback behavior with explicit enhanced-citation summary retry/error handling.
+
+## Testing and Validation
+
+- Added `functional_tests/test_tabular_enhanced_citations_schema_summary_fix.py`.
+- Verified the helper-generated CSV schema summary stays compact for wide tabular data.
+- Verified the tabular processor source now guards row chunking with `not enable_enhanced_citations`.
+- Verified the config version was updated to `0.240.023`.
+
+## Impact
+
+- Large enhanced-citation tabular uploads remain in schema-summary mode instead of reverting to legacy chunk indexing.
+- Workspace page/chunk counts now stay aligned with the intended enhanced-citation tabular flow.
+- Blob-backed tabular analysis remains available even when the richer schema summary needs to be reduced to a compact fallback.
+
+## Related References
+
+- Related config version update: `application/single_app/config.py`
+- Related functional test: `functional_tests/test_tabular_enhanced_citations_schema_summary_fix.py`
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_EXHAUSTIVE_RESULT_LIMIT_ESCALATION_FIX.md b/docs/explanation/fixes/TABULAR_EXHAUSTIVE_RESULT_LIMIT_ESCALATION_FIX.md
new file mode 100644
index 00000000..0ce86c2c
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_EXHAUSTIVE_RESULT_LIMIT_ESCALATION_FIX.md
@@ -0,0 +1,24 @@
+# TABULAR EXHAUSTIVE RESULT LIMIT ESCALATION FIX
+
+Fixed/Implemented in version: **0.240.049**
+
+Related config.py update: `VERSION = "0.240.049"`
+
+## Header Information
+
+- Issue description: Reviewer recovery could stop at a limited `search_rows` or `get_distinct_values` result even when the user explicitly asked for the full list of rows, URLs, sites, or other distinct values.
+- Root cause analysis: The controller already derived follow-up calls for row context and URL extraction, but it treated the first limited slice as sufficient. That left full-list questions stuck at the original `max_rows` or `max_values` cap and, in some cases, reused the row cap as the final distinct-value cap.
+- Version implemented: 0.240.049
+
+## Technical Details
+
+- Files modified: `application/single_app/route_backend_chats.py`, `application/single_app/config.py`, `functional_tests/test_tabular_llm_reviewer_recovery.py`, `functional_tests/test_tabular_multisheet_tool_start_guidance.py`, `functional_tests/test_tabular_all_scope_group_source_context.py`
+- Code changes summary: Added controller helpers that detect explicit exhaustive-result questions, parse returned row/value counts, and rerun `search_rows`, `filter_rows`, `query_tabular_data`, or `get_distinct_values` with higher limits when the current result is only a partial slice. The planner and reviewer guidance now also tells the route to escalate `max_rows` or `max_values` before answering when `total_matches > returned_rows` or `distinct_count > returned_values`.
+- Testing approach: Extended the reviewer-recovery regression suite with partial-row and partial-distinct-value rerun cases, and updated the prompt-guidance/version coverage in the related tabular route tests.
+- Impact analysis: Full-list workbook questions can now continue past an initial preview-sized slice and gather the complete modest cohort needed for a confident answer, instead of stopping at the first 25-result boundary.
+
+## Validation
+
+- Test results: Focused tabular reviewer-recovery, prompt-guidance, and all-scope source-context regressions cover the new limit-escalation path and the `0.240.049` version bump.
+- Before/after comparison: Before the fix, reviewer recovery could find the right sheet and even the right pattern, but still answer from a capped subset. After the fix, the controller can detect that the current result is incomplete for a full-list question and rerun with a larger limit before the final answer is composed.
+- User experience improvements: Users asking for complete site lists, URL inventories, or other exhaustive workbook results are less likely to receive answers that silently reflect only the first capped slice of tool output.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_GENERAL_COHORT_DISCOVERY_FIX.md b/docs/explanation/fixes/TABULAR_GENERAL_COHORT_DISCOVERY_FIX.md
new file mode 100644
index 00000000..cca3b24d
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_GENERAL_COHORT_DISCOVERY_FIX.md
@@ -0,0 +1,25 @@
+# TABULAR GENERAL COHORT DISCOVERY FIX
+
+Fixed/Implemented in version: **0.240.043**
+
+Related config.py update: `VERSION = "0.240.043"`
+
+## Header Information
+
+- Issue description: A workbook question could work on one file and fail on another with the same structure when the recovery planner guessed the wrong cohort column, such as interpreting "CCO locations" as `Location contains CCO` instead of discovering that `CCO` appears in another column.
+- Root cause analysis: Reviewer recovery reused speculative filters from the first analytical call. When that call returned zero matches, the controller repeated the same assumption instead of broadening to collect row context and letting the data reveal which column actually expressed the cohort.
+- Version implemented: 0.240.043
+
+## Technical Details
+
+- Files modified: `application/single_app/route_backend_chats.py`, `application/single_app/semantic_kernel_plugins/tabular_processing_plugin.py`, `application/single_app/config.py`, `functional_tests/test_tabular_llm_reviewer_recovery.py`, `functional_tests/test_tabular_multisheet_tool_start_guidance.py`, `functional_tests/test_tabular_all_scope_group_source_context.py`, `functional_tests/test_tabular_raw_tool_fallback.py`, `functional_tests/test_tabular_relational_analysis_helpers.py`
+- Code changes summary: Generalized reviewer follow-up planning so zero-match same-column filters trigger a broader `search_rows` discovery step without the speculative filter. The controller can then inspect returned rows, infer a better cohort column, and run a second deterministic `get_distinct_values` extraction step. It also now iterates follow-up planning across multiple rounds instead of stopping after one automatic call.
+- Additional robustness: Added plugin-side fallback handling for reviewer-style null literals such as `Location != null` and `Location == null`.
+- Testing approach: Added route-helper regression coverage for broad discovery and cohort-column inference, plus plugin regression coverage for reviewer-style null literals.
+- Impact analysis: Questions about distinct URLs, sites, and other embedded identifiers are less dependent on workbook-specific wording or lucky column guesses. The controller now uses returned evidence to refine the next analytical call.
+
+## Validation
+
+- Test results: Focused reviewer-recovery, multisheet guidance, source-context, raw fallback, and relational-helper suites validate the new broad-search and refinement behavior.
+- Before/after comparison: Before the fix, the controller could repeat `Location contains CCO` and conclude there were no SharePoint sites. After the fix, it can broaden the search, inspect the matching rows, infer the actual cohort column, and then extract the canonical site list from the correct subset.
+- User experience improvements: The same question shape can now work across multiple workbooks with similar schemas even when the cohort term is represented in a different column than the value being counted or listed.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_GENERIC_SEARCH_FIX.md b/docs/explanation/fixes/TABULAR_GENERIC_SEARCH_FIX.md
new file mode 100644
index 00000000..db3d85b8
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_GENERIC_SEARCH_FIX.md
@@ -0,0 +1,24 @@
+# TABULAR GENERIC SEARCH FIX
+
+Fixed/Implemented in version: **0.240.040**
+
+Related config.py update: `VERSION = "0.240.040"`
+
+## Header Information
+
+- Issue description: Tabular analysis could filter known columns or extract embedded values, but it still lacked a generic search capability for questions that ask where a topic, phrase, code, path, or other value appears anywhere in a worksheet or workbook.
+- Root cause analysis: The plugin exposed `filter_rows` for one known column and `query_tabular_data` for hand-authored DataFrame expressions, but it did not provide a first-class search tool for unknown-column or whole-document matching with row context preserved.
+- Version implemented: 0.240.040
+
+## Technical Details
+
+- Files modified: `application/single_app/semantic_kernel_plugins/tabular_processing_plugin.py`, `application/single_app/semantic_kernel_plugins/plugin_invocation_logger.py`, `application/single_app/route_backend_chats.py`, `application/single_app/config.py`, `functional_tests/test_tabular_relational_analysis_helpers.py`, `functional_tests/test_tabular_raw_tool_fallback.py`, `functional_tests/test_tabular_llm_reviewer_recovery.py`, `functional_tests/test_tabular_multisheet_tool_start_guidance.py`, `functional_tests/test_tabular_all_scope_group_source_context.py`
+- Code changes summary: Added a new `search_rows` tabular analysis function that can search specified columns or all columns across a sheet or workbook, return matched-column metadata, optionally project only selected `return_columns`, and preserve small full result cohorts in fallback handoffs. Updated the planner and reviewer prompts to use `search_rows` when the relevant column is unclear.
+- Testing approach: Added plugin-level regressions for cross-column generic search, fallback regressions for preserved small search cohorts, and updated route/reviewer/version checks.
+- Impact analysis: Workbook questions can now start from a true search primitive instead of forcing the model to guess the relevant column or build a brittle query expression before it has enough context.
+
+## Validation
+
+- Test results: Focused tabular regressions verify generic search behavior, preserved small search cohorts in fallback summaries, and the updated reviewer/prompt/version wiring.
+- Before/after comparison: Before the fix, whole-document search depended on guessing a column for `filter_rows` or writing a manual `query_expression`. After the fix, the model can call `search_rows` to search all columns or a chosen subset, then use the returned row context or selected columns to judge relevance.
+- User experience improvements: Users can ask broader workbook questions about arbitrary topics or values without needing to know which column contains the answer signal.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_GROUP_BLOB_CONTEXT_AND_SHEET_WHITESPACE_FIX.md b/docs/explanation/fixes/TABULAR_GROUP_BLOB_CONTEXT_AND_SHEET_WHITESPACE_FIX.md
new file mode 100644
index 00000000..b968ef9e
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_GROUP_BLOB_CONTEXT_AND_SHEET_WHITESPACE_FIX.md
@@ -0,0 +1,44 @@
+# Tabular Group Blob Context and Sheet Whitespace Fix
+
+Fixed/Implemented in version: **0.240.031**
+
+Related config.py update: `VERSION = "0.240.031"`
+
+## Issue Description
+
+Some group-scoped tabular analyses could fail on otherwise simple workbook questions.
+
+Two specific failure modes were identified:
+
+- Workbook schema preload could fail when an Excel sheet name contained trailing whitespace, such as `CUI `, but the runtime attempted to resolve it as `CUI`.
+- After schema preload successfully resolved a group workbook blob, later analytical tool calls could still fail with `BlobNotFound` if the model omitted `group_id` and the plugin retried against personal workspace or chat paths instead of the already known group blob path.
+
+## Root Cause Analysis
+
+- `_resolve_sheet_selection()` normalized requested worksheet names with `.strip()`, but matched them only against untrimmed workbook sheet names. A real worksheet named `CUI ` therefore failed to resolve even when the workbook metadata had already returned the exact tab.
+- `run_tabular_sk_analysis()` pre-resolved the correct blob path during schema preload, but the plugin did not retain that resolved location for later tool calls. When an analytical tool call arrived with `source='group'` and no `group_id`, `_resolve_blob_location_with_fallback()` could not retry the group path and fell back to incorrect workspace/chat candidates.
+
+## Files Modified
+
+- `application/single_app/semantic_kernel_plugins/tabular_processing_plugin.py`
+- `application/single_app/route_backend_chats.py`
+- `application/single_app/config.py`
+- `functional_tests/test_tabular_group_blob_context_and_sheet_whitespace.py`
+
+## Code Changes Summary
+
+- Added per-analysis resolved blob location overrides so once tabular analysis discovers the correct blob path for a workbook, later analytical tool calls can reuse that location without depending on the model to resend `group_id` or `public_workspace_id`.
+- Updated workbook sheet matching so explicit sheet requests tolerate trailing whitespace and case drift while still preserving the exact stored worksheet name.
+- Updated tabular schema preload to register the resolved blob location with the plugin before any later analysis calls occur.
+- Added regression coverage for both trailing-space sheet names and the group blob context reuse path.
+
+## Testing Approach
+
+- Functional regression: `functional_tests/test_tabular_group_blob_context_and_sheet_whitespace.py`
+- Re-ran existing multi-sheet workbook regression coverage to ensure no regression in analytical workbook orchestration.
+
+## Validation
+
+- Workbook-level schema preload now succeeds for sheet inventories that include tabs such as `CUI `.
+- Trimmed worksheet requests such as `CUI` now resolve to the actual workbook tab `CUI `.
+- Group-scoped analytical tool calls can reuse the correct pre-resolved blob path even when later tool invocations omit `group_id`.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_MULTISHEET_LLM_REVIEWER_RECOVERY_FIX.md b/docs/explanation/fixes/TABULAR_MULTISHEET_LLM_REVIEWER_RECOVERY_FIX.md
new file mode 100644
index 00000000..327c24ac
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_MULTISHEET_LLM_REVIEWER_RECOVERY_FIX.md
@@ -0,0 +1,24 @@
+# TABULAR MULTISHEET LLM REVIEWER RECOVERY FIX
+
+Fixed/Implemented in version: **0.240.035**
+
+Related config.py update: `VERSION = "0.240.035"`
+
+## Header Information
+
+- Issue description: Some multi-sheet workbook questions got very close to the answer but still stalled after schema discovery, returning schema-only narration instead of committing to the next analytical tool call.
+- Root cause analysis: The main tabular SK loop could preload workbook structure and even perform discovery, but if the same model still failed to choose an analytical function, the route had no final reasoning pass to convert the discovered workbook context into an explicit executable plan.
+- Version implemented: 0.240.035
+
+## Technical Details
+
+- Files modified: `application/single_app/route_backend_chats.py`, `application/single_app/config.py`, `functional_tests/test_tabular_multisheet_tool_start_guidance.py`, `functional_tests/test_tabular_llm_reviewer_recovery.py`, `functional_tests/test_tabular_all_scope_group_source_context.py`
+- Code changes summary: Added a last-resort LLM reviewer path for multi-sheet analytical runs. When the main SK loop still fails to produce computed analytical results, the route now asks the model for a JSON-only analytical tool plan, injects the correct file source context, executes those analytical plugin calls directly, and returns compact computed results back to the normal answer pipeline.
+- Testing approach: Added focused functional regression coverage for reviewer JSON extraction, function-name normalization, source-context injection, reviewer recovery wiring, and the new version bump.
+- Impact analysis: Multi-sheet workbook questions can now recover from near-miss discovery-only runs without hardcoded content or column heuristics because the LLM makes the final tool-selection decision from workbook schema and prior discovery output.
+
+## Validation
+
+- Test results: Focused regressions verify reviewer plan parsing, argument normalization, route wiring, and the preserved all-scope source-context behavior under the new version.
+- Before/after comparison: Before the fix, near-miss workbook questions could stop after `describe_tabular_file` and fall back to schema narration; after the fix, the route gets one more LLM-driven analytical planning chance and can directly execute the chosen tool calls.
+- User experience improvements: Users get fewer “close but not computed” workbook answers because near-miss runs can recover into actual tabular tool execution instead of giving up after discovery.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_MULTISHEET_TOOL_START_GUIDANCE_FIX.md b/docs/explanation/fixes/TABULAR_MULTISHEET_TOOL_START_GUIDANCE_FIX.md
new file mode 100644
index 00000000..7090f2b8
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_MULTISHEET_TOOL_START_GUIDANCE_FIX.md
@@ -0,0 +1,24 @@
+# TABULAR MULTISHEET TOOL START GUIDANCE FIX
+
+Fixed/Implemented in version: **0.240.034**
+
+Related config.py update: `VERSION = "0.240.034"`
+
+## Header Information
+
+- Issue description: Multi-sheet workbook questions could preload schemas successfully but still return a narrative answer without making any tabular tool calls.
+- Root cause analysis: The analysis path relied too much on preloaded schema plus route-side hints, while the model had no generic discovery loop to inspect workbook structure and then continue into analytical tools when the right worksheet was still unclear.
+- Version implemented: 0.240.034
+
+## Technical Details
+
+- Files modified: `application/single_app/route_backend_chats.py`, `application/single_app/config.py`, `functional_tests/test_tabular_multisheet_tool_start_guidance.py`
+- Code changes summary: Replaced content-targeted guidance with a generic multi-sheet discovery iteration model. Analysis mode now allows `describe_tabular_file` as an exploration step for multi-sheet workbooks, carries compact workbook-discovery summaries into retries, forces tool use on the first multi-sheet analytical pass, and still rejects discovery-only runs as incomplete until analytical tool calls succeed.
+- Testing approach: Added and updated functional regressions to verify generic entity-lookup routing, compact discovery summaries, multi-sheet discovery iteration guidance, and the preserved rule that discovery alone is not a completed analytical answer.
+- Impact analysis: Multi-sheet workbook prompts now have a more general tool-iteration path that lets the model inspect workbook structure and continue into analytical tools without hardcoded content or column targeting.
+
+## Validation
+
+- Test results: Targeted regressions verify the new multi-sheet discovery iteration guidance, workbook-discovery retry summaries, and the version bump.
+- Before/after comparison: Before the fix, some multi-sheet workbook prompts stalled with schema-only narration; after the fix, the route explicitly supports discovery-first iteration while still requiring analytical tool results before completion.
+- User experience improvements: Multi-sheet workbook analysis is less brittle because it relies on a generic workbook exploration loop instead of route-side content targeting.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_MULTI_CONDITION_FILTER_FIX.md b/docs/explanation/fixes/TABULAR_MULTI_CONDITION_FILTER_FIX.md
new file mode 100644
index 00000000..5861323e
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_MULTI_CONDITION_FILTER_FIX.md
@@ -0,0 +1,24 @@
+# TABULAR MULTI-CONDITION FILTER FIX
+
+Fixed/Implemented in version: **0.240.037**
+
+Related config.py update: `VERSION = "0.240.037"`
+
+## Header Information
+
+- Issue description: Workbook questions that depended on two literal column conditions could still miss the right analytical call, even after reviewer recovery and distinct-value handoff improvements.
+- Root cause analysis: The deterministic tabular plugin exposed only one structured filter for `get_distinct_values`, `count_rows`, and `filter_rows`, which pushed the model toward broad `query_tabular_data` expressions or under-filtered counts.
+- Version implemented: 0.240.037
+
+## Technical Details
+
+- Files modified: `application/single_app/semantic_kernel_plugins/tabular_processing_plugin.py`, `application/single_app/route_backend_chats.py`, `application/single_app/config.py`, `functional_tests/test_tabular_relational_analysis_helpers.py`, `functional_tests/test_tabular_llm_reviewer_recovery.py`, `functional_tests/test_tabular_multisheet_tool_start_guidance.py`, `functional_tests/test_tabular_all_scope_group_source_context.py`
+- Code changes summary: Extended the shared tabular filter helper and the main analytical plugin functions to accept an optional second structured filter, wired that support through cross-sheet execution, and updated route-side planner guidance so reviewer recovery and the main prompt prefer multi-condition filtered analytical calls over broad query fallbacks.
+- Testing approach: Added focused plugin-level regressions for cross-sheet distinct/count/filter calls that combine `Business Unit contains CCO` with `Location contains sharepoint`, then updated the related route/version regression checks.
+- Impact analysis: Questions like “how many discrete SharePoint sites appear in CCO locations?” can now be expressed as deterministic tool arguments instead of fragile query heuristics.
+
+## Validation
+
+- Test results: Focused tabular regressions verify the second-filter path on distinct counts, row counts, and row retrieval, plus the updated prompt/version checks.
+- Before/after comparison: Before the fix, the model often fell back to a broad query or a partially filtered count because the plugin only accepted one structured filter. After the fix, the same cohort can be represented directly with two explicit filter clauses.
+- User experience improvements: Workbook questions that depend on multi-column text matching are more likely to produce exact, tool-backed answers without adding route-specific heuristics.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_PREVIEW_JSON_SANITIZATION_FIX.md b/docs/explanation/fixes/TABULAR_PREVIEW_JSON_SANITIZATION_FIX.md
new file mode 100644
index 00000000..ef13fa95
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_PREVIEW_JSON_SANITIZATION_FIX.md
@@ -0,0 +1,22 @@
+# TABULAR PREVIEW JSON SANITIZATION FIX
+
+Fixed/Implemented in version: **0.240.030**
+
+## Header Information
+
+- Issue description: Some tabular enhanced-citation previews failed to open because the preview API returned raw `NaN` values that the browser rejected as invalid JSON.
+- Root cause analysis: `get_enhanced_citation_tabular_preview()` returned `preview.values.tolist()` directly from pandas, allowing null-like workbook values and blank headers to serialize as bare `NaN` tokens.
+- Version implemented: 0.240.030
+
+## Technical Details
+
+- Files modified: `application/single_app/route_enhanced_citations.py`, `application/single_app/config.py`, `functional_tests/test_tabular_preview_json_sanitization_fix.py`
+- Code changes summary: Added preview sanitization helpers that convert tabular headers and cells into JSON-safe display strings before calling `jsonify()`.
+- Testing approach: Added a focused functional regression test that executes the sanitizer helpers against `NaN`, `NaT`, blank headers, and timestamp values and verifies the preview route uses the sanitized payload.
+- Impact analysis: Workbook citations with sparse cells or blank column headers now render in the tabular preview modal instead of falling back to the download-only error state.
+
+## Validation
+
+- Test results: Targeted functional regression test validates both value sanitization behavior and preview route integration.
+- Before/after comparison: Before the fix, preview responses could contain invalid `NaN` JSON tokens; after the fix, the endpoint emits only JSON-safe strings for preview rows and headers.
+- User experience improvements: Users can open affected CSV/XLSX citation previews reliably, even when the sheet contains missing values.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_REVIEWER_AUTO_FOLLOW_UP_FIX.md b/docs/explanation/fixes/TABULAR_REVIEWER_AUTO_FOLLOW_UP_FIX.md
new file mode 100644
index 00000000..58f62610
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_REVIEWER_AUTO_FOLLOW_UP_FIX.md
@@ -0,0 +1,24 @@
+# TABULAR REVIEWER AUTO FOLLOW-UP FIX
+
+Fixed/Implemented in version: **0.240.042**
+
+Related config.py update: `VERSION = "0.240.042"`
+
+## Header Information
+
+- Issue description: Multi-sheet workbook analysis could stop after an intermediate analytical result, such as whole-cell distinct `Location` values, even when the user asked for a search-first answer with matching rows and canonical SharePoint site counts.
+- Root cause analysis: Reviewer recovery executed only the calls proposed by the LLM and then immediately handed those results to the outer model. If the first successful call returned partial evidence instead of the final reasoning inputs, the outer model still lacked the row context or extracted site list needed to answer confidently.
+- Version implemented: 0.240.042
+
+## Technical Details
+
+- Files modified: `application/single_app/route_backend_chats.py`, `application/single_app/config.py`, `functional_tests/test_tabular_llm_reviewer_recovery.py`, `functional_tests/test_tabular_multisheet_tool_start_guidance.py`, `functional_tests/test_tabular_all_scope_group_source_context.py`, `functional_tests/test_tabular_raw_tool_fallback.py`, `functional_tests/test_tabular_relational_analysis_helpers.py`
+- Code changes summary: Added controller-side follow-up planning for reviewer recovery. After the first successful analytical call, the route now inspects the returned payload and can automatically schedule a second-step `search_rows` call for literal topic context plus a `get_distinct_values` extraction call for embedded URLs or sites when the question still needs canonical identifiers.
+- Testing approach: Added regression coverage for derived reviewer follow-up calls and updated the related version assertions in the focused tabular recovery suites.
+- Impact analysis: The route can now iterate over collected tabular evidence without introducing extra plugins. This keeps the tabular plugin surface stable while letting the controller gather search hits and extracted identifiers before the final model reasons across the results.
+
+## Validation
+
+- Test results: Focused reviewer-recovery and tabular fallback suites validate the new follow-up derivation path alongside the updated version checks.
+- Before/after comparison: Before the fix, reviewer recovery could stop at whole-cell distinct values and the outer model would answer that the exact count was not available. After the fix, reviewer recovery can add row-context search results and canonical URL extraction results before building the computed handoff.
+- User experience improvements: Questions such as counting SharePoint sites are now more likely to return concrete counts and the matching evidence rows instead of a cautious schema-only or partial-data answer.
\ No newline at end of file
diff --git a/docs/explanation/fixes/TABULAR_REVIEWER_PSEUDO_QUERY_REWRITE_FIX.md b/docs/explanation/fixes/TABULAR_REVIEWER_PSEUDO_QUERY_REWRITE_FIX.md
new file mode 100644
index 00000000..f3e623b8
--- /dev/null
+++ b/docs/explanation/fixes/TABULAR_REVIEWER_PSEUDO_QUERY_REWRITE_FIX.md
@@ -0,0 +1,24 @@
+# TABULAR REVIEWER PSEUDO QUERY REWRITE FIX
+
+Fixed/Implemented in version: **0.240.041**
+
+Related config.py update: `VERSION = "0.240.041"`
+
+## Header Information
+
+- Issue description: Reviewer recovery could regress into schema-only answers when it generated reviewer-style pseudo-pandas expressions such as `.astype(str).str.contains(...)` inside `query_expression`, because those expressions are not valid `DataFrame.query()` syntax.
+- Root cause analysis: The route prompt warned the model to avoid method calls in `query_expression`, but the plugin still executed reviewer output literally. When the reviewer emitted pseudo-query syntax, analytical functions such as `get_distinct_values` failed with errors like `name 'str' is not defined`.
+- Version implemented: 0.240.041
+
+## Technical Details
+
+- Files modified: `application/single_app/semantic_kernel_plugins/tabular_processing_plugin.py`, `application/single_app/config.py`, `functional_tests/test_tabular_relational_analysis_helpers.py`, `functional_tests/test_tabular_llm_reviewer_recovery.py`, `functional_tests/test_tabular_multisheet_tool_start_guidance.py`, `functional_tests/test_tabular_all_scope_group_source_context.py`, `functional_tests/test_tabular_raw_tool_fallback.py`
+- Code changes summary: Added a safe fallback parser for common reviewer-style pseudo queries such as `.notnull()`, `.isnull()`, `.str.contains()`, `.str.startswith()`, `.str.endswith()`, and simple `==` or `!=` string comparisons. Analytical helpers now rewrite those limited patterns into safe filter behavior instead of failing.
+- Testing approach: Added regression coverage for reviewer-style pseudo queries flowing through `count_rows` and `get_distinct_values`, then updated the related version checks.
+- Impact analysis: Reviewer recovery and other analytical calls are more resilient to model-generated pseudo-pandas syntax and are less likely to fall back to schema-only answers after successful workbook discovery.
+
+## Validation
+
+- Test results: Focused tabular regressions verify pseudo-query rewrite behavior and the updated version checks.
+- Before/after comparison: Before the fix, a reviewer plan with `Location.astype(str).str.contains(...)` failed inside `get_distinct_values`. After the fix, the same limited expression is rewritten into safe filter behavior and the analytical call can complete.
+- User experience improvements: Workbook questions are less likely to regress from computed analysis back to schema-only fallback because of minor model syntax drift in `query_expression`.
\ No newline at end of file
diff --git a/docs/explanation/release_notes.md b/docs/explanation/release_notes.md
index a1a8018f..1da18c6c 100644
--- a/docs/explanation/release_notes.md
+++ b/docs/explanation/release_notes.md
@@ -4,7 +4,7 @@ This page tracks notable Simple Chat releases and organizes the detailed change
 
 For feature-focused and fix-focused drill-downs by version, see [Features by Version](/explanation/features/) and [Fixes by Version](/explanation/fixes/).
 
-### **(v0.240.016)**
+### **(v0.240.053)**
 
 #### New Features
 
@@ -229,6 +229,19 @@ For feature-focused and fix-focused drill-downs by version, see [Features by Ver
     
 #### Bug Fixes
 
+*   **Chat History Citation Replay Improvements**
+    *   Fixed follow-up prompts so prior assistant turns can reuse stored citation results, including tabular tool outputs, instead of relying only on the visible assistant message text.
+    *   Assistant history replay now hydrates stored citation artifacts and deduplicates repeated cross-sheet tabular calls so later file results, such as Licensing workbook values, remain available to the next turn.
+    *   History-context diagnostics remain available in message metadata and optional debug citations, while the thoughts timeline stays compact.
+    *   (Ref: `route_backend_chats.py`, `functions_message_artifacts.py`, `chat-thoughts.js`, `chat-messages.js`, `test_chat_stream_history_context_fix.py`, `CHAT_STREAM_HISTORY_CONTEXT_FIX.md`)
+
+*   **Document Revision Visibility and Storage Preservation**
+    *   Fixed same-name document uploads so new revisions now inherit the previous document's editable metadata, including classification, tags, title, abstract, keywords, publication date, authors, and sharing state.
+    *   Workspace lists and chat search now only use the current revision, while older revisions remain retained for future comparison work instead of staying active in normal workspace flows.
+    *   Document deletion now offers a choice between deleting only the current revision or deleting all stored revisions for that document family.
+    *   Blob storage now preserves older source files by keeping the active document at the existing alias path and archiving prior current revisions into a revision-family hierarchy before the alias path is overwritten.
+    *   (Ref: document revision families, current-only workspace visibility, hybrid blob alias plus archived revision storage, `functions_documents.py`, `functions_search.py`, `route_enhanced_citations.py`, workspace/group/public document flows)
+    
 *   **Python Runtime Dependency Refresh and Supply-Chain Hardening**
     *   Continued the requirements hardening work from `v0.240.014` by tightening the main application runtime to exact package pins, reducing dependency drift across local development, CI, and Azure deployments to help mitigate supply-chain exposure.
     *   Upgraded the Flask runtime stack to `Flask==3.1.3` and `Werkzeug==3.1.6`, and updated the shared `Markup` import path to `markupsafe` so the app starts correctly with Flask 3's package boundary changes.
diff --git a/docs/images/release-timeline.png b/docs/images/release-timeline.png
index f4a6c973..8ee49d9d 100644
Binary files a/docs/images/release-timeline.png and b/docs/images/release-timeline.png differ
diff --git a/functional_tests/test_agent_citation_full_results_modal.py b/functional_tests/test_agent_citation_full_results_modal.py
new file mode 100644
index 00000000..4acb0d9b
--- /dev/null
+++ b/functional_tests/test_agent_citation_full_results_modal.py
@@ -0,0 +1,106 @@
+#!/usr/bin/env python3
+# test_agent_citation_full_results_modal.py
+"""
+Functional test for full agent citation result hydration.
+Version: 0.240.048
+Implemented in: 0.240.048
+
+This test ensures the chat UI can lazy-load raw agent citation artifacts and
+render tabular tool results with preview, 25-row, and full-row controls.
+"""
+
+import os
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+ROUTE_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'route_frontend_conversations.py')
+MESSAGES_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'static', 'js', 'chat', 'chat-messages.js')
+CITATIONS_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'static', 'js', 'chat', 'chat-citations.js')
+CONFIG_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'config.py')
+
+
+def read_file_text(path):
+    with open(path, 'r', encoding='utf-8') as file_handle:
+        return file_handle.read()
+
+
+def read_config_version():
+    with open(CONFIG_FILE, 'r', encoding='utf-8') as file_handle:
+        for line in file_handle:
+            if line.startswith('VERSION = '):
+                return line.split('=', 1)[1].strip().strip('"')
+    raise AssertionError('VERSION assignment not found in config.py')
+
+
+def test_route_exposes_agent_citation_artifact_endpoint():
+    print('🔍 Testing agent citation artifact endpoint wiring...')
+
+    route_source = read_file_text(ROUTE_FILE)
+    required_snippets = [
+        "@app.route('/api/conversation/<conversation_id>/agent-citation/<artifact_id>', methods=['GET'])",
+        'build_message_artifact_payload_map',
+        "artifact_payload_map.get(str(artifact_id or ''))",
+        "return jsonify({'citation': citation})",
+    ]
+
+    missing = [snippet for snippet in required_snippets if snippet not in route_source]
+    assert not missing, f'Missing route snippets: {missing}'
+
+    print('✅ Agent citation artifact endpoint wiring passed')
+    return True
+
+
+def test_chat_ui_uses_lazy_hydration_and_row_controls():
+    print('🔍 Testing agent citation modal source and row controls...')
+
+    messages_source = read_file_text(MESSAGES_FILE)
+    citations_source = read_file_text(CITATIONS_FILE)
+
+    required_message_snippets = [
+        'data-artifact-id',
+        'data-conversation-id',
+    ]
+    required_citation_snippets = [
+        'AGENT_CITATION_EXPANDED_ROWS = 25',
+        'fetchAgentCitationArtifact',
+        'renderAgentCitationResult(',
+        'Show 25 rows',
+        'Show all rows',
+        'displayed_rows',
+        'data_rows_limited',
+        '/api/conversation/${encodeURIComponent(conversationId)}/agent-citation/${encodeURIComponent(artifactId)}',
+    ]
+
+    missing_messages = [snippet for snippet in required_message_snippets if snippet not in messages_source]
+    missing_citations = [snippet for snippet in required_citation_snippets if snippet not in citations_source]
+    assert not missing_messages, f'Missing message snippets: {missing_messages}'
+    assert not missing_citations, f'Missing citation snippets: {missing_citations}'
+
+    print('✅ Agent citation modal source and row controls passed')
+    return True
+
+
+def test_version_bump_alignment():
+    print('🔍 Testing version bump alignment...')
+
+    assert read_config_version() == '0.240.048'
+
+    print('✅ Version bump alignment passed')
+    return True
+
+
+if __name__ == '__main__':
+    tests = [
+        test_route_exposes_agent_citation_artifact_endpoint,
+        test_chat_ui_uses_lazy_hydration_and_row_controls,
+        test_version_bump_alignment,
+    ]
+
+    results = []
+    for test in tests:
+        print(f'\n🧪 Running {test.__name__}...')
+        results.append(test())
+
+    success = all(results)
+    print(f'\n📊 Results: {sum(results)}/{len(results)} tests passed')
+    raise SystemExit(0 if success else 1)
\ No newline at end of file
diff --git a/functional_tests/test_chat_citation_page_sort_fix.py b/functional_tests/test_chat_citation_page_sort_fix.py
new file mode 100644
index 00000000..87be8ed7
--- /dev/null
+++ b/functional_tests/test_chat_citation_page_sort_fix.py
@@ -0,0 +1,157 @@
+# test_chat_citation_page_sort_fix.py
+"""
+Functional test for mixed citation page sorting.
+Version: 0.240.055
+Implemented in: 0.240.055
+
+This test ensures hybrid citations with numeric pages and text labels such as
+Metadata or AI Vision sort deterministically in both standard and streaming
+chat paths without raising mixed-type comparison errors.
+"""
+
+import ast
+import os
+import sys
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+ROUTE_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'route_backend_chats.py')
+CONFIG_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'config.py')
+FIX_DOC = os.path.join(
+    ROOT_DIR,
+    'docs',
+    'explanation',
+    'fixes',
+    'CHAT_CITATION_PAGE_SORT_FIX.md',
+)
+TARGET_FUNCTIONS = {
+    '_coerce_citation_sort_number',
+    '_build_hybrid_citation_sort_key',
+}
+
+
+def read_file_text(file_path):
+    with open(file_path, encoding='utf-8') as stream:  # default text-read mode, decoded as UTF-8
+        return stream.read()  # whole file content as one string
+
+
+def read_config_version():
+    version_rows = [row for row in read_file_text(CONFIG_FILE).splitlines() if row.startswith('VERSION = ')]
+    if not version_rows:  # config.py has no unindented ``VERSION = `` line
+        raise AssertionError('VERSION assignment not found in config.py')
+    return version_rows[0].partition('=')[2].strip().strip('"')  # first match: text after '=', unquoted
+
+
+def load_sort_helpers():
+    """Compile only the TARGET_FUNCTIONS definitions from the route file; return (namespace, source)."""
+    source = read_file_text(ROUTE_FILE)
+    # Keep top-level function definitions whose names are listed in TARGET_FUNCTIONS.
+    helper_defs = []
+    for top_level in ast.parse(source, filename=ROUTE_FILE).body:
+        if isinstance(top_level, ast.FunctionDef) and top_level.name in TARGET_FUNCTIONS:
+            helper_defs.append(top_level)
+    found_names = [helper.name for helper in helper_defs]
+    assert len(helper_defs) == len(TARGET_FUNCTIONS), (
+        f'Expected helpers {sorted(TARGET_FUNCTIONS)}, found {found_names}'
+    )
+    # Only the selected nodes are executed; the rest of the route file is never run.
+    namespace = {}
+    exec(compile(ast.Module(body=helper_defs, type_ignores=[]), ROUTE_FILE, 'exec'), namespace)
+    return namespace, source
+
+
+def test_citation_sort_number_parsing():
+    """Check that numeric-looking inputs coerce to floats and everything else to None."""
+    print('🔍 Testing citation sort number parsing...')
+
+    helpers, _route_source = load_sort_helpers()
+    to_sort_number = helpers['_coerce_citation_sort_number']
+
+    # Ints, digit strings, and padded decimal strings all compare equal to floats.
+    for raw_value, expected in ((12, 12.0), ('7', 7.0), (' 3.5 ', 3.5)):
+        assert to_sort_number(raw_value) == expected
+
+    # Text labels, the empty string, and None have no numeric sort value.
+    for raw_value in ('Metadata', 'AI Vision', '', None):
+        assert to_sort_number(raw_value) is None
+
+    print('✅ Citation sort number parsing passed')
+    return True
+
+
+def test_mixed_page_and_metadata_citations_sort_stably():
+    """Sort a mix of numeric, numeric-string, label, and missing pages with the shared key."""
+    print('🔍 Testing mixed citation sort order...')
+
+    helpers, _route_source = load_sort_helpers()
+    sort_key = helpers['_build_hybrid_citation_sort_key']
+
+    # One citation per page flavour: ints, a digit string, text labels, and None.
+    policy_citations = [
+        {'file_name': 'Policy.pdf', 'page_number': 2, 'chunk_sequence': 2},
+        {'file_name': 'Policy.pdf', 'page_number': 'Metadata', 'chunk_sequence': 9999, 'metadata_type': 'keywords'},
+        {'file_name': 'Policy.pdf', 'page_number': 'AI Vision', 'chunk_sequence': 9997, 'metadata_type': 'vision'},
+        {'file_name': 'Policy.pdf', 'page_number': '12', 'chunk_sequence': 12},
+        {'file_name': 'Policy.pdf', 'page_number': 7, 'chunk_sequence': 7},
+        {'file_name': 'Policy.pdf', 'page_number': None, 'chunk_sequence': None},
+    ]
+    expected_page_order = [
+        '12', 7, 2, 'Metadata', 'AI Vision', None,
+    ]
+
+    # reverse=True matches the sort call this file asserts the route source contains.
+    ordered = sorted(policy_citations, key=sort_key, reverse=True)
+    observed_page_order = [entry.get('page_number') for entry in ordered]
+
+    # Incomparable key values would make sorted() raise TypeError before this assert runs.
+    assert observed_page_order == expected_page_order, ordered
+
+    print('✅ Mixed citation sort order passed')
+    return True
+
+
+def test_route_uses_shared_sort_helper_for_standard_and_streaming_paths():
+    """Check that the route source sorts hybrid citations via the shared key exactly twice."""
+    print('🔍 Testing shared citation sort helper wiring...')
+    route_source = load_sort_helpers()[1]
+    shared_sort_call = 'hybrid_citations_list.sort(key=_build_hybrid_citation_sort_key, reverse=True)'
+    # Two occurrences are expected: one per chat path named in this test.
+    assert route_source.count(shared_sort_call) == 2
+    # The lambda keyed on page_number with a 0 default must not appear anywhere.
+    assert "lambda x: x.get('page_number', 0)" not in route_source
+    assert 'def _build_hybrid_citation_sort_key(citation):' in route_source
+    print('✅ Shared citation sort helper wiring passed')
+    return True
+
+
+def test_version_and_fix_documentation_alignment():
+    """Verify config.py is at or past 0.240.055 and the fix doc records that fix version."""
+    print('🔍 Testing version and fix documentation alignment...')
+    fix_doc_content = read_file_text(FIX_DOC)
+    # Compare numerically: later releases keep bumping VERSION past the fix version.
+    current_version = tuple(int(part) for part in read_config_version().split('.'))
+    assert current_version >= (0, 240, 55), f'config.py version {current_version} predates 0.240.055'
+    assert 'Fixed/Implemented in version: **0.240.055**' in fix_doc_content
+    assert 'mixed numeric and text page labels' in fix_doc_content.lower()
+    assert 'application/single_app/route_backend_chats.py' in fix_doc_content
+
+    print('✅ Version and fix documentation alignment passed')
+    return True
+
+
+if __name__ == '__main__':
+    # Run each check in declaration order and collect its return value.
+    outcomes = []
+    for check in (
+        test_citation_sort_number_parsing,
+        test_mixed_page_and_metadata_citations_sort_stably,
+        test_route_uses_shared_sort_helper_for_standard_and_streaming_paths,
+        test_version_and_fix_documentation_alignment,
+    ):
+        print(f'\n🧪 Running {check.__name__}...')
+        outcomes.append(check())
+
+    passed = sum(outcomes)
+    print(f'\n📊 Results: {passed}/{len(outcomes)} tests passed')
+    # Exit status is 0 only when every check returned a truthy value.
+    sys.exit(0 if all(outcomes) else 1)
\ No newline at end of file
diff --git a/functional_tests/test_chat_history_grounded_follow_up_fix.py b/functional_tests/test_chat_history_grounded_follow_up_fix.py
new file mode 100644
index 00000000..dc5b09a2
--- /dev/null
+++ b/functional_tests/test_chat_history_grounded_follow_up_fix.py
@@ -0,0 +1,349 @@
+# test_chat_history_grounded_follow_up_fix.py
+"""
+Functional test for grounded follow-up chat fallback.
+Version: 0.240.055
+Implemented in: 0.240.054; Updated in: 0.240.055
+
+This test ensures follow-up turns with workspace search disabled can reuse
+prior grounded document refs, derive bounded fallback search parameters, and
+preserve the no-search grounding contract in both chat execution paths.
+"""
+
+import ast
+import os
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+ROUTE_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'route_backend_chats.py')
+METADATA_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'functions_conversation_metadata.py')
+CONFIG_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'config.py')
+FIX_DOC = os.path.join(
+    ROOT_DIR,
+    'docs',
+    'explanation',
+    'fixes',
+    'CHAT_HISTORY_GROUNDED_FOLLOW_UP_FIX.md',
+)
+ROUTE_TARGET_FUNCTIONS = {
+    '_normalize_prior_grounded_document_refs',
+    'build_prior_grounded_document_search_parameters',
+    'build_history_only_assessment_messages',
+    'build_history_grounding_system_message',
+}
+METADATA_TARGET_FUNCTIONS = {
+    '_extract_document_id_from_search_result',
+    '_build_last_grounded_document_refs',
+}
+
+
+def read_file_text(file_path):
+    with open(file_path, encoding='utf-8') as stream:  # default text-read mode, decoded as UTF-8
+        return stream.read()  # whole file content as one string
+
+
+def read_config_version():
+    version_rows = [row for row in read_file_text(CONFIG_FILE).splitlines() if row.startswith('VERSION = ')]
+    if not version_rows:  # config.py has no unindented ``VERSION = `` line
+        raise AssertionError('VERSION assignment not found in config.py')
+    return version_rows[0].partition('=')[2].strip().strip('"')  # first match: text after '=', unquoted
+
+
+def load_route_helpers():
+    """Compile only the ROUTE_TARGET_FUNCTIONS definitions from the route file; return (namespace, source)."""
+    source = read_file_text(ROUTE_FILE)
+    # Keep top-level function definitions whose names are listed in ROUTE_TARGET_FUNCTIONS.
+    helper_defs = []
+    for top_level in ast.parse(source, filename=ROUTE_FILE).body:
+        if isinstance(top_level, ast.FunctionDef) and top_level.name in ROUTE_TARGET_FUNCTIONS:
+            helper_defs.append(top_level)
+    found_names = [helper.name for helper in helper_defs]
+    assert len(helper_defs) == len(ROUTE_TARGET_FUNCTIONS), (
+        f'Expected route helpers {sorted(ROUTE_TARGET_FUNCTIONS)}, found {found_names}'
+    )
+    # Only the selected nodes are executed; the rest of the route file is never run.
+    namespace = {}
+    exec(compile(ast.Module(body=helper_defs, type_ignores=[]), ROUTE_FILE, 'exec'), namespace)
+    return namespace, source
+
+
+def load_metadata_helpers():
+    """Compile only the METADATA_TARGET_FUNCTIONS definitions from the metadata file; return (namespace, source)."""
+    source = read_file_text(METADATA_FILE)
+    # Keep top-level function definitions whose names are listed in METADATA_TARGET_FUNCTIONS.
+    helper_defs = []
+    for top_level in ast.parse(source, filename=METADATA_FILE).body:
+        if isinstance(top_level, ast.FunctionDef) and top_level.name in METADATA_TARGET_FUNCTIONS:
+            helper_defs.append(top_level)
+    found_names = [helper.name for helper in helper_defs]
+    assert len(helper_defs) == len(METADATA_TARGET_FUNCTIONS), (
+        f'Expected metadata helpers {sorted(METADATA_TARGET_FUNCTIONS)}, found {found_names}'
+    )
+    # Only the selected nodes are executed; the rest of the metadata file is never run.
+    namespace = {}
+    exec(compile(ast.Module(body=helper_defs, type_ignores=[]), METADATA_FILE, 'exec'), namespace)
+    return namespace, source
+
+
+def test_grounded_document_refs_capture_stable_document_ids():
+    """Verify document-id extraction from search results and grounded-ref building for each scope type."""
+    print('🔍 Testing grounded document ref capture...')
+
+    namespace, _ = load_metadata_helpers()
+    extract_document_id = namespace['_extract_document_id_from_search_result']
+    build_grounded_refs = namespace['_build_last_grounded_document_refs']
+
+    assert extract_document_id({'document_id': 'doc-123', 'id': 'doc-123_0001'}) == 'doc-123'  # explicit document_id wins
+    assert extract_document_id({'id': 'group_doc_0007'}) == 'group_doc'  # last '_' segment of the chunk id is dropped
+    assert extract_document_id({'id': 'standalone-doc'}) == 'standalone-doc'  # no '_' means the id is used as-is
+
+    grounded_refs = build_grounded_refs({  # one document per scope type; expected order follows insertion order
+        'personal-doc': {
+            'scope': {'scope': 'personal', 'id': 'user-1'},
+            'classification': 'internal',
+            'file_name': 'Personal Notes.pdf',
+        },
+        'group-doc': {
+            'scope': {'scope': 'group', 'id': 'group-22'},
+            'classification': 'confidential',
+            'file_name': 'Group Plan.docx',
+        },
+        'public-doc': {
+            'scope': {'scope': 'public', 'id': 'workspace-33'},
+            'classification': 'public',
+            'file_name': 'FAQ.md',
+        },
+    })
+
+    assert grounded_refs == [
+        {
+            'document_id': 'personal-doc',
+            'scope': 'personal',
+            'scope_id': 'user-1',
+            'file_name': 'Personal Notes.pdf',
+            'classification': 'internal',
+            'user_id': 'user-1',  # personal scope repeats scope_id under user_id
+        },
+        {
+            'document_id': 'group-doc',
+            'scope': 'group',
+            'scope_id': 'group-22',
+            'file_name': 'Group Plan.docx',
+            'classification': 'confidential',
+            'group_id': 'group-22',  # group scope repeats scope_id under group_id
+        },
+        {
+            'document_id': 'public-doc',
+            'scope': 'public',
+            'scope_id': 'workspace-33',
+            'file_name': 'FAQ.md',
+            'classification': 'public',
+            'public_workspace_id': 'workspace-33',  # public scope repeats scope_id under public_workspace_id
+        },
+    ], grounded_refs
+
+    print('✅ Grounded document ref capture passed')
+    return True
+
+
+def test_prior_grounded_refs_normalize_from_saved_refs_and_tags():
+    """Verify refs normalize from saved grounded refs, and from document tags when only tags are given."""
+    print('🔍 Testing grounded ref normalization...')
+
+    namespace, _ = load_route_helpers()
+    normalize_refs = namespace['_normalize_prior_grounded_document_refs']
+
+    normalized_refs = normalize_refs({
+        'last_grounded_document_refs': [
+            {
+                'document_id': 'doc-1',
+                'scope': 'group',
+                'scope_id': 'group-1',
+                'file_name': 'Plan A.docx',
+                'classification': 'internal',
+            },
+            {  # doc-1 again, identified via group_id instead of scope_id; expected to collapse into the entry above
+                'document_id': 'doc-1',
+                'scope': 'group',
+                'group_id': 'group-1',
+                'file_name': 'Plan A.docx',
+            },
+            {  # no scope_id and no classification supplied
+                'document_id': 'doc-2',
+                'scope': 'personal',
+                'user_id': 'user-1',
+                'file_name': 'Notes.txt',
+            },
+        ]
+    })
+
+    assert normalized_refs == [
+        {
+            'document_id': 'doc-1',
+            'scope': 'group',
+            'scope_id': 'group-1',
+            'file_name': 'Plan A.docx',
+            'classification': 'internal',
+            'group_id': 'group-1',
+        },
+        {
+            'document_id': 'doc-2',
+            'scope': 'personal',
+            'scope_id': 'user-1',  # filled in from user_id
+            'file_name': 'Notes.txt',
+            'classification': None,  # missing classification is reported as None
+            'user_id': 'user-1',
+        },
+    ], normalized_refs
+
+    tag_fallback_refs = normalize_refs({  # no 'last_grounded_document_refs' key at all
+        'tags': [
+            {
+                'category': 'document',
+                'document_id': 'doc-3',
+                'title': 'Workspace FAQ.md',
+                'classification': 'public',
+                'scope': {'type': 'public', 'id': 'workspace-7'},
+            },
+        ]
+    })
+
+    assert tag_fallback_refs == [
+        {
+            'document_id': 'doc-3',
+            'scope': 'public',
+            'scope_id': 'workspace-7',
+            'file_name': 'Workspace FAQ.md',  # taken from the tag's title
+            'classification': 'public',
+            'public_workspace_id': 'workspace-7',
+        },
+    ], tag_fallback_refs
+
+    print('✅ Grounded ref normalization passed')
+    return True
+
+
+def test_prior_grounded_search_parameters_stay_bounded():
+    """Verify search parameters derived from grounded refs list only those documents and their scopes."""
+    print('🔍 Testing grounded fallback search parameter derivation...')
+
+    namespace, _ = load_route_helpers()
+    build_search_parameters = namespace['build_prior_grounded_document_search_parameters']
+
+    mixed_scope_parameters = build_search_parameters([
+        {'document_id': 'doc-1', 'scope': 'group', 'group_id': 'group-1'},
+        {'document_id': 'doc-2', 'scope': 'public', 'public_workspace_id': 'workspace-1'},
+        {'document_id': 'doc-3', 'scope': 'personal', 'user_id': 'user-1'},
+        {'document_id': 'doc-2', 'scope': 'public', 'public_workspace_id': 'workspace-1'},  # duplicate of doc-2
+    ])
+
+    assert mixed_scope_parameters == {
+        'document_ids': ['doc-1', 'doc-2', 'doc-3'],  # duplicate removed, first-seen order kept
+        'doc_scope': 'all',  # refs span more than one scope type
+        'active_group_ids': ['group-1'],
+        'active_group_id': 'group-1',
+        'active_public_workspace_ids': ['workspace-1'],
+        'active_public_workspace_id': 'workspace-1',
+        'scope_types': ['group', 'personal', 'public'],  # alphabetical here, not input order
+    }, mixed_scope_parameters
+
+    group_only_parameters = build_search_parameters([
+        {'document_id': 'group-doc-1', 'scope': 'group', 'group_id': 'group-9'},
+        {'document_id': 'group-doc-2', 'scope': 'group', 'group_id': 'group-9'},
+    ])
+
+    assert group_only_parameters['doc_scope'] == 'group'  # single scope type keeps its own name
+    assert group_only_parameters['active_group_ids'] == ['group-9']  # shared group id listed once
+    assert group_only_parameters['document_ids'] == ['group-doc-1', 'group-doc-2']
+
+    print('✅ Grounded fallback search parameter derivation passed')
+    return True
+
+
+def test_history_only_prompt_contract_is_explicit():
+    """Verify the history-only assessment message layout and the wording of the no-search system message."""
+    print('🔍 Testing history-only prompt contract...')
+
+    namespace, _ = load_route_helpers()
+    build_assessment_messages = namespace['build_history_only_assessment_messages']
+    build_grounding_message = namespace['build_history_grounding_system_message']
+
+    assessment_messages = build_assessment_messages(
+        {
+            'summary_of_older': 'Older answer summary',
+            'history_messages': [
+                {'role': 'assistant', 'content': 'The cited policy says approvals take two days.'},
+                {'role': 'user', 'content': 'What about exceptions?'},
+            ],
+        },
+        'Use concise answers.',
+    )
+
+    assert assessment_messages[0]['role'] == 'system'  # summary of older turns comes first
+    assert '<Summary of previous conversation context>' in assessment_messages[0]['content']
+    assert assessment_messages[1] == {'role': 'system', 'content': 'Use concise answers.'}  # second argument, verbatim
+    assert assessment_messages[2]['role'] == 'assistant'  # history messages follow in their original order
+    assert assessment_messages[3]['content'] == 'What about exceptions?'
+
+    grounding_message = build_grounding_message()
+    assert grounding_message['role'] == 'system'
+    assert 'Workspace search is disabled for this turn.' in grounding_message['content']
+    assert 'ask the user to select a workspace or document' in grounding_message['content']
+
+    print('✅ History-only prompt contract passed')
+    return True
+
+
+def test_route_and_metadata_wiring_cover_both_chat_paths():
+    """Verify the metadata source saves grounded refs and each fallback marker occurs twice in the route source."""
+    print('🔍 Testing grounded follow-up wiring...')
+
+    _, route_source = load_route_helpers()  # only the raw source text is needed here
+    _, metadata_source = load_metadata_helpers()
+
+    assert "conversation_item['last_grounded_document_refs'] = _build_last_grounded_document_refs(document_map)" in metadata_source
+    assert route_source.count('history_grounded_search_used = True') == 2  # == 2: one occurrence per chat path
+    assert route_source.count('Checking whether prior conversation context already answers the question') == 2
+    assert route_source.count('Conversation context alone was insufficient; searching previously grounded documents') == 2
+    assert route_source.count('No prior grounded documents were available; using conversation history only') == 2
+    assert route_source.count("'history_grounded_fallback'") == 2
+    assert route_source.count('history_grounding_message = build_history_grounding_system_message()') == 2
+
+    print('✅ Grounded follow-up wiring passed')
+    return True
+
+
+def test_version_and_fix_documentation_alignment():
+    """Verify config.py is at or past 0.240.055 and the fix doc records that fix version."""
+    print('🔍 Testing version and fix documentation alignment...')
+    fix_doc_content = read_file_text(FIX_DOC)
+    # Compare numerically: later releases keep bumping VERSION past the fix version.
+    current_version = tuple(int(part) for part in read_config_version().split('.'))
+    assert current_version >= (0, 240, 55), f'config.py version {current_version} predates 0.240.055'
+    assert 'Fixed/Implemented in version: **0.240.055**' in fix_doc_content
+    assert 'last_grounded_document_refs' in fix_doc_content
+    assert 'previously grounded documents' in fix_doc_content.lower()
+    assert 'application/single_app/route_backend_chats.py' in fix_doc_content
+    assert 'application/single_app/functions_conversation_metadata.py' in fix_doc_content
+
+    print('✅ Version and fix documentation alignment passed')
+    return True
+
+
+if __name__ == '__main__':
+    # Run each check in declaration order and collect its return value.
+    outcomes = []
+    for check in (
+        test_grounded_document_refs_capture_stable_document_ids,
+        test_prior_grounded_refs_normalize_from_saved_refs_and_tags,
+        test_prior_grounded_search_parameters_stay_bounded,
+        test_history_only_prompt_contract_is_explicit,
+        test_route_and_metadata_wiring_cover_both_chat_paths,
+        test_version_and_fix_documentation_alignment,
+    ):
+        print(f'\n🧪 Running {check.__name__}...')
+        outcomes.append(check())
+
+    passed = sum(outcomes)
+    print(f'\n📊 Results: {passed}/{len(outcomes)} tests passed')
+    # Exit status is 0 only when every check returned a truthy value.
+    raise SystemExit(0 if all(outcomes) else 1)
\ No newline at end of file
diff --git a/functional_tests/test_chat_new_conversation_tag_reset.py b/functional_tests/test_chat_new_conversation_tag_reset.py
new file mode 100644
index 00000000..e3bb5a2c
--- /dev/null
+++ b/functional_tests/test_chat_new_conversation_tag_reset.py
@@ -0,0 +1,97 @@
+# test_chat_new_conversation_tag_reset.py
+"""
+Functional test for chat tag reset on new conversation.
+Version: 0.240.026
+Implemented in: 0.240.026
+
+This test ensures that rebuilding the chat tag list clears stale tag
+selection UI state so starting a new conversation resets the tag selector
+label and document filtering back to the default state.
+"""
+
+import os
+import sys
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+
+CHAT_DOCUMENTS_FILE = os.path.join(
+    ROOT_DIR,
+    'application',
+    'single_app',
+    'static',
+    'js',
+    'chat',
+    'chat-documents.js',
+)
+CONFIG_FILE = os.path.join(
+    ROOT_DIR,
+    'application',
+    'single_app',
+    'config.py',
+)
+
+
+def read_file(path):
+    with open(path, encoding='utf-8') as stream:  # default text-read mode, decoded as UTF-8
+        return stream.read()  # whole file content as one string
+
+
+def test_load_tags_for_scope_resets_tag_selection_state_before_rebuild():
+    """Verify chat-documents.js contains the tag reset helper and calls it at the top of loadTagsForScope."""
+    print('🔍 Testing chat tag reset before tag reload...')
+
+    content = read_file(CHAT_DOCUMENTS_FILE)
+
+    required_snippets = [  # each must appear somewhere in the file; position is not checked here
+        'function resetTagSelectionState() {',
+        'tagsSearchController?.resetFilter();',
+        'syncTagsDropdownButtonText();',
+        'filterDocumentsBySelectedTags();',
+        "chatTagsFilter.innerHTML = '';",
+        "if (tagsDropdownItems) tagsDropdownItems.innerHTML = '';",
+        'resetTagSelectionState();',
+    ]
+
+    missing = [snippet for snippet in required_snippets if snippet not in content]
+    assert not missing, f'Missing tag reset snippets: {missing}'
+
+    load_tags_block = """export async function loadTagsForScope() {
+  if (!chatTagsFilter) return;
+
+  // Clear existing options in both hidden select and custom dropdown
+  chatTagsFilter.innerHTML = '';
+  if (tagsDropdownItems) tagsDropdownItems.innerHTML = '';
+  resetTagSelectionState();
+"""
+    assert load_tags_block in content, 'Expected loadTagsForScope to reset tag UI state immediately after clearing options.'  # exact text match, whitespace included
+
+    print('✅ chat tag reset before reload passed')
+    return True
+
+
+def test_config_version_is_bumped_for_chat_tag_reset_fix():
+    """Verify config.py declares 0.240.026 or later; a literal match would break on the next bump."""
+    print('🔍 Testing config version bump...')
+    version_rows = [row for row in read_file(CONFIG_FILE).splitlines() if row.startswith('VERSION = ')]
+    assert version_rows, 'VERSION assignment not found in config.py'
+    current_version = tuple(int(part) for part in version_rows[0].split('=', 1)[1].strip().strip('"').split('.'))
+    assert current_version >= (0, 240, 26), 'Expected config.py version 0.240.026 or later'
+    print('✅ Config version bump passed')
+    return True
+
+
+if __name__ == '__main__':
+    # Run each check in declaration order and collect its return value.
+    outcomes = []
+    for check in (
+        test_load_tags_for_scope_resets_tag_selection_state_before_rebuild,
+        test_config_version_is_bumped_for_chat_tag_reset_fix,
+    ):
+        print(f"\n🧪 Running {check.__name__}...")
+        outcomes.append(check())
+
+    passed = sum(outcomes)
+    print(f"\n📊 Results: {passed}/{len(outcomes)} tests passed")
+    # Exit status is 0 only when every check returned a truthy value.
+    sys.exit(0 if all(outcomes) else 1)
diff --git a/functional_tests/test_chat_scope_tag_filter_fix.py b/functional_tests/test_chat_scope_tag_filter_fix.py
new file mode 100644
index 00000000..266c60b4
--- /dev/null
+++ b/functional_tests/test_chat_scope_tag_filter_fix.py
@@ -0,0 +1,121 @@
+# test_chat_scope_tag_filter_fix.py
+"""
+Functional test for chat scoped tag filter enforcement.
+Version: 0.240.029
+Implemented in: 0.240.029
+
+This test ensures that hybrid chat search applies the selected tag filter
+consistently for personal, group, and public scopes so chat answers stay
+inside the selected document tag scope.
+"""
+
+import os
+import sys
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+FUNCTIONS_SEARCH_FILE = os.path.join(
+    ROOT_DIR,
+    "application",
+    "single_app",
+    "functions_search.py",
+)
+CONFIG_FILE = os.path.join(
+    ROOT_DIR,
+    "application",
+    "single_app",
+    "config.py",
+)
+
+
+def read_file(path):
+    with open(path, encoding="utf-8") as stream:  # default text-read mode, decoded as UTF-8
+        return stream.read()  # whole file content as one string
+
+
+def get_scoped_block(content, start_marker, end_marker):
+    """Return content from start_marker up to, but not including, the next end_marker."""
+    block_start = content.index(start_marker)
+    return content[block_start:content.index(end_marker, block_start)]
+
+
+def test_hybrid_search_applies_tag_filters_to_personal_group_and_public_scopes():
+    """Verify each doc_scope branch of functions_search.py contains its tag-filter snippets."""
+    print("🔍 Testing scoped hybrid search tag filters...")
+
+    content = read_file(FUNCTIONS_SEARCH_FILE)
+
+    personal_block = get_scoped_block(  # text of one branch: from its elif line up to the next marker
+        content,
+        '    elif doc_scope == "personal":',
+        '    elif doc_scope == "group":',
+    )
+    group_block = get_scoped_block(
+        content,
+        '    elif doc_scope == "group":',
+        '    elif doc_scope == "public":',
+    )
+    public_block = get_scoped_block(
+        content,
+        '    elif doc_scope == "public":',
+        '    # Log pre-sort statistics',
+    )
+
+    required_scope_snippets = {
+        "personal": [
+            'user_filter = f"{user_base_filter} and {tags_filter_clause}" if tags_filter_clause else user_base_filter',
+            'user_filter = f"{user_base_filter} and {tags_filter_clause}" if tags_filter_clause else user_base_filter.strip()',  # stricter: contains the snippet above as a prefix
+            'filter=user_filter,',
+            '"document_tags",',
+        ],
+        "group": [
+            'group_filter = f"{group_base_filter} and {tags_filter_clause}" if tags_filter_clause else group_base_filter',
+            'filter=group_filter,',
+            '"document_tags",',
+        ],
+        "public": [
+            'public_filter = f"{public_base_filter} and {tags_filter_clause}" if tags_filter_clause else public_base_filter',
+            'filter=public_filter,',
+            '"document_tags",',
+        ],
+    }
+
+    scoped_blocks = {
+        "personal": personal_block,
+        "group": group_block,
+        "public": public_block,
+    }
+
+    for scope_name, snippets in required_scope_snippets.items():  # substring checks confined to that scope's block
+        missing = [snippet for snippet in snippets if snippet not in scoped_blocks[scope_name]]
+        assert not missing, f"Missing {scope_name} scoped tag filter snippets: {missing}"
+
+    print("✅ Scoped hybrid search tag filters passed")
+    return True
+
+
+def test_config_version_is_bumped_for_chat_scope_tag_filter_fix():
+    """Verify config.py declares 0.240.029 or later; a literal match would break on the next bump."""
+    print("🔍 Testing config version bump...")
+    version_rows = [row for row in read_file(CONFIG_FILE).splitlines() if row.startswith("VERSION = ")]
+    assert version_rows, "VERSION assignment not found in config.py"
+    current_version = tuple(int(part) for part in version_rows[0].split("=", 1)[1].strip().strip('"').split("."))
+    assert current_version >= (0, 240, 29), "Expected config.py version 0.240.029 or later"
+    print("✅ Config version bump passed")
+    return True
+
+
+if __name__ == "__main__":
+    # Run each check in declaration order and collect its return value.
+    outcomes = []
+    for check in (
+        test_hybrid_search_applies_tag_filters_to_personal_group_and_public_scopes,
+        test_config_version_is_bumped_for_chat_scope_tag_filter_fix,
+    ):
+        print(f"\n🧪 Running {check.__name__}...")
+        outcomes.append(check())
+
+    passed = sum(outcomes)
+    print(f"\n📊 Results: {passed}/{len(outcomes)} tests passed")
+    # Exit status is 0 only when every check returned a truthy value.
+    sys.exit(0 if all(outcomes) else 1)
\ No newline at end of file
diff --git a/functional_tests/test_chat_stream_history_context_fix.py b/functional_tests/test_chat_stream_history_context_fix.py
new file mode 100644
index 00000000..a1c71b78
--- /dev/null
+++ b/functional_tests/test_chat_stream_history_context_fix.py
@@ -0,0 +1,397 @@
+# test_chat_stream_history_context_fix.py
+#!/usr/bin/env python3
+"""
+Functional test for shared chat history context fix.
+Version: 0.240.053
+Implemented in: 0.240.053
+
+This test ensures streaming and non-streaming chat paths share the same
+history builder so older turns can be summarized instead of being dropped
+when the recent message window is small, and that the selected history
+context remains available for debugging without overloading the thoughts UI.
+"""
+
+import ast
+import json
+import os
+import sys
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+ROUTE_FILE = os.path.join(ROOT_DIR, "application", "single_app", "route_backend_chats.py")
+CONFIG_FILE = os.path.join(ROOT_DIR, "application", "single_app", "config.py")
+THOUGHTS_JS = os.path.join(ROOT_DIR, "application", "single_app", "static", "js", "chat", "chat-thoughts.js")
+MESSAGES_JS = os.path.join(ROOT_DIR, "application", "single_app", "static", "js", "chat", "chat-messages.js")
+FIX_DOC = os.path.join(
+    ROOT_DIR,
+    "docs",
+    "explanation",
+    "fixes",
+    "CHAT_STREAM_HISTORY_CONTEXT_FIX.md",
+)
+TARGET_FUNCTIONS = {
+    "remove_masked_content",
+    "_format_history_message_ref",
+    "_capture_history_refs",
+    "_truncate_history_citation_text",
+    "_serialize_history_citation_value",
+    "_build_agent_citation_history_lines",
+    "_build_document_citation_history_lines",
+    "_build_web_citation_history_lines",
+    "build_assistant_history_content_with_citations",
+    "build_conversation_history_segments",
+}
+
+
+def read_file_text(file_path):  # Return the entire contents of file_path decoded as UTF-8 text.
+    with open(file_path, "r", encoding="utf-8") as file_handle:
+        return file_handle.read()
+
+
+def read_config_version():  # Return the string assigned to VERSION in config.py; raises AssertionError if absent.
+    for line in read_file_text(CONFIG_FILE).splitlines():
+        if line.startswith("VERSION = "):  # only an unindented assignment at the start of a line matches
+            return line.split("=", 1)[1].strip().strip('"')  # right-hand side without whitespace or double quotes
+    raise AssertionError("VERSION assignment not found in config.py")
+
+
+def load_history_helpers():  # Returns (namespace, source): the TARGET_FUNCTIONS defs executed in isolation, plus the route file text.
+    source = read_file_text(ROUTE_FILE)
+    parsed = ast.parse(source, filename=ROUTE_FILE)
+    selected_nodes = [  # only top-level (module-body) plain function definitions are considered
+        node for node in parsed.body
+        if isinstance(node, ast.FunctionDef) and node.name in TARGET_FUNCTIONS
+    ]
+    # Compile just the selected defs so the rest of the route module is never executed.
+    module = ast.Module(body=selected_nodes, type_ignores=[])
+    namespace = {  # globals for the extracted defs: the real json module plus pass-through / no-op stubs
+        "json": json,
+        "filter_assistant_artifact_items": lambda messages: list(messages),
+        "build_message_artifact_payload_map": lambda messages: {},
+        "hydrate_agent_citations_from_artifacts": lambda messages, artifact_payload_map: list(messages),
+        "sort_messages_by_thread": lambda messages: list(messages),
+        "debug_print": lambda *args, **kwargs: None,
+    }
+    exec(compile(module, ROUTE_FILE, "exec"), namespace)
+    return namespace, source
+
+
+class FakeSummaryMessage:  # Minimal message object exposing only the .content attribute.
+    def __init__(self, content):
+        self.content = content
+
+
+class FakeSummaryChoice:  # Minimal choice object; the text is reachable as .message.content.
+    def __init__(self, content):
+        self.message = FakeSummaryMessage(content)
+
+
+class FakeSummaryResponse:  # Minimal response object holding exactly one FakeSummaryChoice in .choices.
+    def __init__(self, content):
+        self.choices = [FakeSummaryChoice(content)]
+
+
+class FakeChatCompletions:  # Test double for a completions endpoint: records calls and returns a canned summary.
+    def __init__(self, summary_content):
+        self.summary_content = summary_content
+        self.calls = []  # keyword arguments of every create() call, in call order
+
+    def create(self, **kwargs):
+        self.calls.append(kwargs)
+        return FakeSummaryResponse(self.summary_content)
+
+
+class FakeGPTClient:  # Fake client exposing .chat.completions.create(...) backed by FakeChatCompletions.
+    def __init__(self, summary_content):
+        self.chat = type("ChatNamespace", (), {})()  # empty ad-hoc object used only as an attribute holder
+        self.chat.completions = FakeChatCompletions(summary_content)
+
+
+def test_history_builder_summarizes_older_turns_when_recent_window_is_small():
+    """With a history limit of 2, the two newest messages stay verbatim and older turns go to a single summary call."""
+    print("🔍 Testing shared history builder older-turn summarization...")
+    namespace, _ = load_history_helpers()
+    build_segments = namespace["build_conversation_history_segments"]
+    fake_client = FakeGPTClient("Older context summary")
+
+    all_messages = [
+        {"id": "u1", "role": "user", "content": "How many discrete SharePoint sites appear in CCO locations?", "timestamp": "2026-04-03T10:00:00", "metadata": {}},
+        {"id": "a1", "role": "assistant", "content": "There are 10 discrete SharePoint sites.", "timestamp": "2026-04-03T10:00:01", "metadata": {}},
+        {"id": "u2", "role": "user", "content": "How many discrete SharePoint sites appear in CCO locations? please list them out", "timestamp": "2026-04-03T10:00:02", "metadata": {}},
+        {"id": "a2", "role": "assistant", "content": "There are 2 discrete site locations from the Licensing sheet.", "timestamp": "2026-04-03T10:00:03", "metadata": {}},
+        {"id": "u3", "role": "user", "content": "please list the locations out in a single table", "timestamp": "2026-04-03T10:00:04", "metadata": {}},
+    ]
+
+    result = build_segments(
+        all_messages=all_messages,
+        conversation_history_limit=2,
+        enable_summarize_older_messages=True,
+        gpt_client=fake_client,
+        gpt_model="gpt-4o",
+        user_message_id="u3",
+        fallback_user_message="please list the locations out in a single table",
+    )
+    # Expect the canned summary, a2 and u3 kept verbatim, and exactly one call on the fake client.
+    assert result["summary_of_older"] == "Older context summary"
+    assert [msg["role"] for msg in result["history_messages"]] == ["assistant", "user"]
+    assert result["history_messages"][0]["content"] == "There are 2 discrete site locations from the Licensing sheet."
+    assert result["history_messages"][1]["content"] == "please list the locations out in a single table"
+    assert len(fake_client.chat.completions.calls) == 1
+    # The summary prompt must contain the older a1 text but not the current user message.
+    summary_prompt = fake_client.chat.completions.calls[0]["messages"][0]["content"]
+    assert "There are 10 discrete SharePoint sites." in summary_prompt
+    assert "please list the locations out in a single table" not in summary_prompt
+
+    print("✅ Shared history builder older-turn summarization passed")
+    return True
+
+
+def test_history_builder_filters_inactive_and_masked_messages():
+    """Inactive-thread messages are dropped and masked character ranges are removed from history content."""
+    print("🔍 Testing shared history builder filtering rules...")
+    namespace, _ = load_history_helpers()
+    build_segments = namespace["build_conversation_history_segments"]
+
+    all_messages = [
+        {
+            "id": "a-inactive",
+            "role": "assistant",
+            "content": "inactive answer should not be reused",
+            "timestamp": "2026-04-03T11:00:00",
+            "metadata": {"thread_info": {"active_thread": False}},
+        },
+        {
+            "id": "u-masked",
+            "role": "user",
+            "content": "AlphaSecretOmega",
+            "timestamp": "2026-04-03T11:00:01",
+            "metadata": {"masked_ranges": [{"start": 5, "end": 11}]},
+        },
+        {
+            "id": "u-latest",
+            "role": "user",
+            "content": "latest follow-up",
+            "timestamp": "2026-04-03T11:00:02",
+            "metadata": {},
+        },
+    ]
+
+    result = build_segments(
+        all_messages=all_messages,
+        conversation_history_limit=3,
+        enable_summarize_older_messages=False,
+        gpt_client=None,
+        gpt_model=None,
+        user_message_id="u-latest",
+        fallback_user_message="latest follow-up",
+    )
+    # Characters 5-11 ("Secret") of the masked message must be gone, leaving "AlphaOmega".
+    contents = [message["content"] for message in result["history_messages"]]
+    assert "inactive answer should not be reused" not in contents
+    assert "AlphaOmega" in contents
+    assert "AlphaSecretOmega" not in contents
+    assert contents[-1] == "latest follow-up"
+
+    print("✅ Shared history builder filtering rules passed")
+    return True
+
+
+def test_streaming_and_non_streaming_paths_share_history_builder():
+    """The route source must call build_conversation_history_segments at exactly two call sites (substring checks)."""
+    print("🔍 Testing shared history builder wiring...")
+    _, route_source = load_history_helpers()
+    assert route_source.count("history_segments = build_conversation_history_segments(") == 2
+    assert "enable_summarize_content_history_beyond_conversation_history_limit = settings.get(" in route_source
+    assert "msg.get('content', '').startswith('<Summary of previous conversation context>')" in route_source
+
+    print("✅ Shared history builder wiring passed")
+    return True
+
+
+def test_history_builder_includes_prior_citation_results_for_follow_ups():
+    """Assistant history turns must carry their agent citation results so a follow-up question can reuse them."""
+    print("🔍 Testing citation results are included in assistant history turns...")
+    namespace, _ = load_history_helpers()
+    build_segments = namespace["build_conversation_history_segments"]
+
+    all_messages = [
+        {
+            "id": "u1",
+            "role": "user",
+            "content": "How many discrete SharePoint sites appear in CCO locations?",
+            "timestamp": "2026-04-03T12:00:00",
+            "metadata": {},
+        },
+        {
+            "id": "a1",
+            "role": "assistant",
+            "content": "A total of 9 discrete SharePoint sites appear in CCO locations.",
+            "timestamp": "2026-04-03T12:00:01",
+            "metadata": {},
+            "agent_citations": [
+                {
+                    "tool_name": "TabularProcessingPlugin.get_distinct_values [Legal]",
+                    "function_arguments": {
+                        "filename": "CCO-Legal File Plan 2025_Final Approved.xlsx",
+                        "sheet_name": "Legal",
+                        "column": "Location",
+                    },
+                    "function_result": {
+                        "distinct_count": 8,
+                        "values": [
+                            "http://occtreasgovprod.sharepoint.com/sites/CCO/lawnotated",
+                            "http://occtreasgovprod.sharepoint.com/sites/LCFrmwrk/Compliance%20Framework/Forms/Allltems.aspx",
+                            "http://occtreasgovprod.sharepoint.com/sites/WDLD/Site",
+                        ],
+                    },
+                    "success": True,
+                },
+                {
+                    "tool_name": "TabularProcessingPlugin.get_distinct_values",
+                    "function_arguments": {
+                        "filename": "CCO-Legal File Plan 2025_Final Approved.xlsx",
+                        "column": "Location",
+                    },
+                    "function_result": {
+                        "filename": "CCO-Legal File Plan 2025_Final Approved.xlsx",
+                        "selected_sheet": "ALL (cross-sheet search)",
+                        "column": "Location",
+                        "distinct_count": 3,
+                        "returned_values": 3,
+                        "values": [
+                            "http://occtreasgovprod.sharepoint.com/sites/CCO/lawnotated",
+                            "http://occtreasgovprod.sharepoint.com/sites/LCFrmwrk/Compliance%20Framework/Forms/Allltems.aspx",
+                            "http://occtreasgovprod.sharepoint.com/sites/WDLD/Site",
+                        ],
+                    },
+                    "success": True,
+                },
+                {
+                    "tool_name": "TabularProcessingPlugin.get_distinct_values [Licensing]",
+                    "function_arguments": {
+                        "filename": "CCO-Licensing File Plan 2025_Final Approved.xlsx",
+                        "sheet_name": "Licensing",
+                        "column": "Location",
+                    },
+                    "function_result": {
+                        "distinct_count": 2,
+                        "values": [
+                            "http://share/sites/CC/LICA/default.aspx",
+                            "https://occtreasgovprod.sharepoint.com/sites/LIC",
+                        ],
+                    },
+                    "success": True,
+                },
+                {
+                    "tool_name": "TabularProcessingPlugin.get_distinct_values",
+                    "function_arguments": {
+                        "filename": "CCO-Licensing File Plan 2025_Final Approved.xlsx",
+                        "column": "Location",
+                    },
+                    "function_result": {
+                        "filename": "CCO-Licensing File Plan 2025_Final Approved.xlsx",
+                        "selected_sheet": "ALL (cross-sheet search)",
+                        "column": "Location",
+                        "distinct_count": 2,
+                        "returned_values": 2,
+                        "values": [
+                            "http://share/sites/CC/LICA/default.aspx",
+                            "https://occtreasgovprod.sharepoint.com/sites/LIC",
+                        ],
+                    },
+                    "success": True,
+                },
+            ],
+        },
+        {
+            "id": "u2",
+            "role": "user",
+            "content": "please list them out",
+            "timestamp": "2026-04-03T12:00:02",
+            "metadata": {},
+        },
+    ]
+
+    result = build_segments(
+        all_messages=all_messages,
+        conversation_history_limit=3,
+        enable_summarize_older_messages=False,
+        gpt_client=None,
+        gpt_model=None,
+        user_message_id="u2",
+        fallback_user_message="please list them out",
+    )
+    # Index 1 is expected to be the a1 assistant turn (u1, a1, u2 with a limit of 3).
+    assistant_turn = result["history_messages"][1]["content"]
+    assert "Supporting citation context from this assistant turn" in assistant_turn
+    assert "TabularProcessingPlugin.get_distinct_values [Legal]" in assistant_turn
+    assert "http://share/sites/CC/LICA/default.aspx" in assistant_turn
+    assert "https://occtreasgovprod.sharepoint.com/sites/LIC" in assistant_turn
+    assert assistant_turn.count("ALL (cross-sheet search)") == 0  # cross-sheet results must not be echoed
+    assert assistant_turn.count("CCO-Licensing File Plan 2025_Final Approved.xlsx") == 1  # filename appears once only
+
+    print("✅ Citation results are included in assistant history turns")
+    return True
+
+
+def test_history_context_diagnostics_are_exposed_in_backend_and_ui():
+    """History-context diagnostics must be wired into the chat route and the chat UI sources (substring checks)."""
+    print("🔍 Testing history context diagnostics visibility...")
+    route_source = read_file_text(ROUTE_FILE)
+    thoughts_source = read_file_text(THOUGHTS_JS)
+    messages_source = read_file_text(MESSAGES_JS)
+    # Backend route: thought builders, at least three 'history_context' payload entries, both debug citations.
+    assert "build_history_context_thought_content(history_debug_info)" in route_source
+    assert "build_history_context_thought_detail(history_debug_info)" in route_source
+    assert route_source.count("'history_context': history_debug_info") >= 3
+    assert "build_history_context_debug_citation(history_debug_info, 'streaming')" in route_source
+    assert "build_history_context_debug_citation(history_debug_info, 'standard')" in route_source
+    # chat-thoughts.js: the icon mapping is present and no thought-detail rendering remains.
+    assert "'history_context': 'bi-diagram-3'" in thoughts_source
+    assert "t.detail != null && String(t.detail).trim()" not in thoughts_source
+    assert "thought-detail" not in thoughts_source
+    # chat-messages.js: the History Context section and the ref fields it reads are present.
+    assert "History Context" in messages_source
+    assert "selected_recent_message_refs" in messages_source
+    assert "final_api_source_refs" in messages_source
+    assert "renderHistoryContextSection" in messages_source
+
+    print("✅ History context diagnostics visibility passed")
+    return True
+
+
+def test_version_and_fix_documentation_alignment():
+    """Check config.py is at or past 0.240.053 and the fix doc records that version and the key identifiers."""
+    print("🔍 Testing version and fix documentation alignment...")
+    version = read_config_version()
+    fix_doc_content = read_file_text(FIX_DOC)
+    # Numeric >= comparison: an exact pin fails as soon as config.py is bumped for a later change.
+    assert tuple(int(part) for part in version.split(".")) >= (0, 240, 53), version
+    assert "Fixed/Implemented in version: **0.240.053**" in fix_doc_content
+    assert "build_conversation_history_segments" in fix_doc_content
+    assert "history_context" in fix_doc_content
+    assert "citation results" in fix_doc_content.lower()
+    assert "application/single_app/route_backend_chats.py" in fix_doc_content
+
+    print("✅ Version and fix documentation alignment passed")
+    return True
+
+
+if __name__ == "__main__":
+    tests = [
+        test_history_builder_summarizes_older_turns_when_recent_window_is_small,
+        test_history_builder_filters_inactive_and_masked_messages,
+        test_streaming_and_non_streaming_paths_share_history_builder,
+        test_history_builder_includes_prior_citation_results_for_follow_ups,
+        test_history_context_diagnostics_are_exposed_in_backend_and_ui,
+        test_version_and_fix_documentation_alignment,
+    ]
+    # Run the tests in order; each returns True on success, and a failed assert raises and aborts the run.
+    results = []
+    for test in tests:
+        print(f"\n🧪 Running {test.__name__}...")
+        results.append(test())
+    # Exit status 0 only when every collected result is truthy.
+    success = all(results)
+    print(f"\n📊 Results: {sum(results)}/{len(results)} tests passed")
+    sys.exit(0 if success else 1)
\ No newline at end of file
diff --git a/functional_tests/test_citation_revision_lookup_fix.py b/functional_tests/test_citation_revision_lookup_fix.py
new file mode 100644
index 00000000..8a3cda90
--- /dev/null
+++ b/functional_tests/test_citation_revision_lookup_fix.py
@@ -0,0 +1,182 @@
+# test_citation_revision_lookup_fix.py
+#!/usr/bin/env python3
+"""
+Functional test for citation revision lookup fix.
+Version: 0.240.025
+Implemented in: 0.240.024
+
+This test ensures citation lookup resolves access by the exact document ID
+behind a chunk so new revisions continue to point at the correct document
+record as revision-aware blob paths are introduced.
+"""
+
+import ast
+import os
+import sys
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+sys.path.append(ROOT_DIR)
+
+ROUTE_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'route_backend_documents.py')
+ENHANCED_ROUTE_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'route_enhanced_citations.py')
+CONFIG_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'config.py')
+FIX_DOC = os.path.join(ROOT_DIR, 'docs', 'explanation', 'fixes', 'CITATION_REVISION_LOOKUP_FIX.md')
+TARGET_FUNCTIONS = {
+    '_extract_citation_document_id',
+    '_try_get_document_json',
+    '_find_accessible_citation_document',
+}
+
+
+class FakeResponse:  # Stand-in for a response object; get_json() returns the payload given at construction.
+    def __init__(self, payload):
+        self.payload = payload
+
+    def get_json(self):
+        return self.payload
+
+
+def load_citation_helpers():  # Returns (namespace, source): the TARGET_FUNCTIONS defs executed in isolation, plus the route file text.
+    with open(ROUTE_FILE, 'r', encoding='utf-8') as file_handle:
+        source = file_handle.read()
+
+    parsed = ast.parse(source, filename=ROUTE_FILE)
+    selected_nodes = [  # only top-level (module-body) plain function definitions are considered
+        node for node in parsed.body
+        if isinstance(node, ast.FunctionDef) and node.name in TARGET_FUNCTIONS
+    ]
+    # Compile just the selected defs; the namespace starts empty, so callers inject any globals the helpers need.
+    module = ast.Module(body=selected_nodes, type_ignores=[])
+    namespace = {}
+    exec(compile(module, ROUTE_FILE, 'exec'), namespace)
+    return namespace, source
+
+
+def read_file_text(file_path):  # Return the entire contents of file_path decoded as UTF-8 text.
+    with open(file_path, 'r', encoding='utf-8') as file_handle:
+        return file_handle.read()
+
+
+def read_config_version():  # Return the string assigned to VERSION in config.py; raises AssertionError if absent.
+    for line in read_file_text(CONFIG_FILE).splitlines():
+        if line.startswith('VERSION = '):  # only an unindented assignment at the start of a line matches
+            return line.split('=', 1)[1].strip().strip('"')  # right-hand side without whitespace or double quotes
+    raise AssertionError('VERSION assignment not found in config.py')
+
+
+def test_extract_citation_document_id_prefers_chunk_metadata():
+    """The chunk's own document_id wins over the ID derived from the citation ID."""
+    print('🔍 Testing citation document ID extraction...')
+    namespace, _ = load_citation_helpers()
+    extract_document_id = namespace['_extract_citation_document_id']
+    # Cases: metadata present; no metadata, so the trailing "_4" is stripped; ID without an underscore is returned unchanged.
+    assert extract_document_id({'document_id': 'doc-revision-2'}, 'doc-revision-1_4') == 'doc-revision-2'
+    assert extract_document_id({}, 'doc-revision-1_4') == 'doc-revision-1'
+    assert extract_document_id({}, 'raw-citation-id') == 'raw-citation-id'
+
+    print('✅ Citation document ID extraction passed')
+    return True
+
+
+def test_find_accessible_citation_document_uses_exact_document_id():
+    """Personal, group and public lookups must each query get_document with the exact document ID passed in."""
+    print('🔍 Testing exact document lookup across citation scopes...')
+    namespace, _ = load_citation_helpers()
+    find_accessible_document = namespace['_find_accessible_citation_document']
+    calls = []  # one dict per fake_get_document invocation, in call order
+
+    def fake_get_settings():
+        return {
+            'enable_user_workspace': True,
+            'enable_group_workspaces': True,
+            'enable_public_workspaces': True,
+        }
+
+    def fake_get_document(user_id, document_id, group_id=None, public_workspace_id=None):
+        calls.append({
+            'user_id': user_id,
+            'document_id': document_id,
+            'group_id': group_id,
+            'public_workspace_id': public_workspace_id,
+        })
+
+        if document_id != 'doc-revision-2':
+            return {'error': 'not found'}, 404
+
+        if group_id == 'group-1':
+            return FakeResponse({'id': document_id, 'group_id': group_id}), 200
+
+        if public_workspace_id == 'ws-1':
+            return FakeResponse({'id': document_id, 'public_workspace_id': public_workspace_id}), 200
+
+        if group_id is None and public_workspace_id is None:
+            return FakeResponse({'id': document_id, 'user_id': user_id}), 200
+
+        return {'error': 'not found'}, 404
+    # Inject the fakes as globals of the extracted helpers (namespace is the dict they were exec'd in).
+    namespace['get_settings'] = fake_get_settings
+    namespace['get_document'] = fake_get_document
+    namespace['get_user_groups'] = lambda user_id: [{'id': 'group-1'}, {'id': 'group-2'}]
+    namespace['get_user_visible_public_workspace_ids_from_settings'] = lambda user_id: ['ws-1']
+
+    personal_doc = find_accessible_document('user-1', 'doc-revision-2', 'personal')
+    group_doc = find_accessible_document('user-1', 'doc-revision-2', 'group')
+    public_doc = find_accessible_document('user-1', 'doc-revision-2', 'public')
+
+    assert personal_doc['id'] == 'doc-revision-2'
+    assert group_doc['group_id'] == 'group-1'
+    assert public_doc['public_workspace_id'] == 'ws-1'
+    assert all(call['document_id'] == 'doc-revision-2' for call in calls), calls
+
+    print('✅ Exact document lookup across citation scopes passed')
+    return True
+
+
+def test_revision_lookup_is_wired_into_text_and_enhanced_citations():
+    """Both citation route sources must contain the lines that wire in the revision-aware lookup (substring checks)."""
+    print('🔍 Testing citation route wiring...')
+    _, route_source = load_citation_helpers()
+    enhanced_route_source = read_file_text(ENHANCED_ROUTE_FILE)
+
+    assert "document_id = _extract_citation_document_id(chunk, citation_id)" in route_source
+    assert "accessible_document = _find_accessible_citation_document(user_id, document_id, scope_name)" in route_source
+    assert 'Unauthorized access to citation' in route_source
+    assert 'backend_get_document(user_id, doc_id)' in enhanced_route_source
+    assert 'get_document_blob_storage_info(raw_doc)' in enhanced_route_source
+
+    print('✅ Citation route wiring passed')
+    return True
+
+
+def test_version_and_fix_documentation_alignment():
+    """Check config.py is at or past 0.240.025 and the fix doc records version 0.240.024 and the key identifiers."""
+    print('🔍 Testing version and fix documentation alignment...')
+    version = read_config_version()
+    fix_doc_content = read_file_text(FIX_DOC)
+    # Numeric >= comparison: an exact pin fails as soon as config.py is bumped for a later change.
+    assert tuple(int(part) for part in version.split('.')) >= (0, 240, 25), version
+    assert 'Fixed/Implemented in version: **0.240.024**' in fix_doc_content
+    assert 'exact document ID behind the citation chunk' in fix_doc_content
+    assert 'application/single_app/route_backend_documents.py' in fix_doc_content
+
+    print('✅ Version and fix documentation alignment passed')
+    return True
+
+
+if __name__ == '__main__':
+    tests = [
+        test_extract_citation_document_id_prefers_chunk_metadata,
+        test_find_accessible_citation_document_uses_exact_document_id,
+        test_revision_lookup_is_wired_into_text_and_enhanced_citations,
+        test_version_and_fix_documentation_alignment,
+    ]
+    # Run the tests in order; each returns True on success, and a failed assert raises and aborts the run.
+    results = []
+    for test in tests:
+        print(f'\n🧪 Running {test.__name__}...')
+        results.append(test())
+    # Exit status 0 only when every collected result is truthy.
+    success = all(results)
+    print(f'\n📊 Results: {sum(results)}/{len(results)} tests passed')
+    sys.exit(0 if success else 1)
\ No newline at end of file
diff --git a/functional_tests/test_document_revision_current_version_fix.py b/functional_tests/test_document_revision_current_version_fix.py
new file mode 100644
index 00000000..14497f00
--- /dev/null
+++ b/functional_tests/test_document_revision_current_version_fix.py
@@ -0,0 +1,197 @@
+# test_document_revision_current_version_fix.py
+"""
+Functional test for document revision current-version behavior.
+Version: 0.240.022
+Implemented in: 0.240.022
+
+This test ensures duplicate-name uploads preserve revision metadata, only the
+latest revision stays visible/searchable, and workspace delete flows expose a
+current-only versus all-versions choice.
+"""
+
+import os
+
+
+REPO_ROOT = os.path.abspath(os.path.join(os.path.dirname(__file__), '..'))
+CONFIG_FILE = os.path.join(REPO_ROOT, 'application', 'single_app', 'config.py')
+FUNCTIONS_DOCUMENTS = os.path.join(REPO_ROOT, 'application', 'single_app', 'functions_documents.py')
+FUNCTIONS_SEARCH = os.path.join(REPO_ROOT, 'application', 'single_app', 'functions_search.py')
+PERSONAL_ROUTE = os.path.join(REPO_ROOT, 'application', 'single_app', 'route_backend_documents.py')
+GROUP_ROUTE = os.path.join(REPO_ROOT, 'application', 'single_app', 'route_backend_group_documents.py')
+PUBLIC_ROUTE = os.path.join(REPO_ROOT, 'application', 'single_app', 'route_backend_public_documents.py')
+EXTERNAL_PUBLIC_ROUTE = os.path.join(REPO_ROOT, 'application', 'single_app', 'route_external_public_documents.py')
+ENHANCED_CITATIONS_ROUTE = os.path.join(REPO_ROOT, 'application', 'single_app', 'route_enhanced_citations.py')
+WORKSPACE_TEMPLATE = os.path.join(REPO_ROOT, 'application', 'single_app', 'templates', 'workspace.html')
+PUBLIC_TEMPLATE = os.path.join(REPO_ROOT, 'application', 'single_app', 'templates', 'public_workspaces.html')
+GROUP_TEMPLATE = os.path.join(REPO_ROOT, 'application', 'single_app', 'templates', 'group_workspaces.html')
+WORKSPACE_JS = os.path.join(REPO_ROOT, 'application', 'single_app', 'static', 'js', 'workspace', 'workspace-documents.js')
+PUBLIC_JS = os.path.join(REPO_ROOT, 'application', 'single_app', 'static', 'js', 'public', 'public_workspace.js')
+FIX_DOC = os.path.join(REPO_ROOT, 'docs', 'explanation', 'fixes', 'DOCUMENT_REVISION_CURRENT_VERSION_FIX.md')
+
+
+def read_file_text(file_path):  # Return the entire contents of file_path decoded as UTF-8 text.
+    with open(file_path, 'r', encoding='utf-8') as file_handle:
+        return file_handle.read()
+
+
+def test_revision_metadata_helpers_exist():
+    """Ensure document metadata now models revision families and current visibility."""
+    print('🔍 Validating revision metadata helpers...')
+
+    documents_content = read_file_text(FUNCTIONS_DOCUMENTS)
+    search_content = read_file_text(FUNCTIONS_SEARCH)
+    enhanced_citations_content = read_file_text(ENHANCED_CITATIONS_ROUTE)
+    # Every marker below must appear verbatim (exact substring) in functions_documents.py.
+    for marker in [
+        'revision_family_id',
+        'is_current_version',
+        'search_visibility_state',
+        'select_current_documents',
+        'normalize_document_revision_families',
+        'set_document_chunk_visibility',
+        'def delete_document_revision(',
+        'carried_forward = _build_carried_forward_metadata(',
+        'CURRENT_ALIAS_BLOB_PATH_MODE = "current_alias"',
+        'ARCHIVED_REVISION_BLOB_PATH_MODE = "archived_revision"',
+        'def build_current_blob_path(',
+        'def build_archived_blob_path(',
+        'def get_document_blob_storage_info(',
+        'def get_document_blob_delete_targets(',
+        'def _archive_previous_document_blob(',
+        'def _promote_document_blob_to_current_alias(',
+        '"search_visibility_state": "active"',
+        "existing_document['search_visibility_state'] = 'archived'",
+        "promoted_document['is_current_version'] = True",
+        'blob_container',
+        'archived_blob_path',
+        'blob_path_mode',
+    ]:
+        assert marker in documents_content, f'Missing revision metadata marker: {marker}'
+
+    assert 'normalize_document_revision_families(' in search_content, (
+        'Hybrid search should normalize duplicate revision families before searching.'
+    )
+    assert 'get_document_blob_storage_info' in enhanced_citations_content, (
+        'Enhanced citations should resolve stored blob metadata before falling back to legacy paths.'
+    )
+
+    print('✅ Revision metadata helpers are present')
+
+
+def test_blob_revision_paths_preserve_current_alias_and_archive_history():
+    """Ensure the blob storage model keeps the current alias and archives prior revisions hierarchically."""
+    print('🔍 Validating blob revision path hierarchy...')
+
+    documents_content = read_file_text(FUNCTIONS_DOCUMENTS)
+    # Each check is an exact substring match against the functions_documents.py source text.
+    assert 'return f"{scope_id}/{blob_filename}"' in documents_content, (
+        'Current revisions should keep the existing workspace alias path.'
+    )
+    assert 'return f"{scope_id}/{revision_family_id}/{document_id}/{file_name}"' in documents_content, (
+        'Archived revisions should be grouped under revision_family_id/document_id/filename.'
+    )
+    assert 'previous_document["blob_path"] = archived_blob_path' in documents_content, (
+        'Previous current revisions should move to the archived blob path.'
+    )
+    assert 'promoted_document["blob_path"] = current_blob_path' in documents_content, (
+        'Promoted revisions should return to the current alias blob path.'
+    )
+
+    print('✅ Blob revision path hierarchy is present')
+
+
+def test_workspace_routes_only_return_current_revisions_and_accept_delete_modes():
+    """Ensure every workspace route collapses to current revisions and supports delete_mode."""
+    print('🔍 Validating workspace route revision filtering and delete modes...')
+
+    route_expectations = [
+        PERSONAL_ROUTE,
+        GROUP_ROUTE,
+        PUBLIC_ROUTE,
+        EXTERNAL_PUBLIC_ROUTE,
+    ]
+    # All four route modules must contain the same four revision-aware markers (exact substrings).
+    for route_path in route_expectations:
+        route_content = read_file_text(route_path)
+        assert 'select_current_documents' in route_content, (
+            f'{os.path.basename(route_path)} should collapse results to current revisions.'
+        )
+        assert 'sort_documents' in route_content, (
+            f'{os.path.basename(route_path)} should sort collapsed current revisions.'
+        )
+        assert "delete_mode = request.args.get('delete_mode', 'all_versions')" in route_content, (
+            f'{os.path.basename(route_path)} should accept delete_mode.'
+        )
+        assert 'delete_document_revision(' in route_content, (
+            f'{os.path.basename(route_path)} should use revision-aware deletion.'
+        )
+
+    print('✅ Workspace routes enforce current revision visibility and delete modes')
+
+
+def test_delete_ui_uses_revision_choice_modals():
+    """Ensure personal, public, and group workspaces expose Bootstrap revision delete choices."""
+    print('🔍 Validating delete choice UI wiring...')
+
+    workspace_template = read_file_text(WORKSPACE_TEMPLATE)
+    public_template = read_file_text(PUBLIC_TEMPLATE)
+    group_template = read_file_text(GROUP_TEMPLATE)
+    workspace_js = read_file_text(WORKSPACE_JS)
+    public_js = read_file_text(PUBLIC_JS)
+
+    assert 'documentDeleteModal' in workspace_template, 'Workspace template should include the delete choice modal.'
+    assert 'publicDocumentDeleteModal' in public_template, 'Public workspace template should include the delete choice modal.'
+    assert 'groupDocumentDeleteModal' in group_template, 'Group workspace template should include the delete choice modal.'
+    # The group template is checked again here; this test reads no separate group JS file.
+    for content, label in [
+        (workspace_js, 'workspace JS'),
+        (public_js, 'public workspace JS'),
+        (group_template, 'group workspace template JS'),
+    ]:
+        assert 'Delete Current Version' in content, f'{label} should offer current-version deletion.'
+        assert 'Delete All Versions' in content, f'{label} should offer all-version deletion.'
+        assert 'delete_mode' in content, f'{label} should send delete_mode to the backend.'
+
+    print('✅ Delete choice UI wiring is present across workspace pages')
+
+
+def test_document_revision_fix_documentation_and_version_alignment():
+    """Ensure config is at or past 0.240.022 (>=, so later bumps pass) and the fix doc captures the revision behavior."""
+    print('🔍 Validating version bump and fix documentation...')
+    version_lines = [line for line in read_file_text(CONFIG_FILE).splitlines() if line.startswith('VERSION = ')]
+    assert version_lines, 'VERSION assignment not found in config.py'
+    version = version_lines[0].split('=', 1)[1].strip().strip('"')
+    fix_doc_content = read_file_text(FIX_DOC)
+    assert tuple(int(part) for part in version.split('.')) >= (0, 240, 22), f'Expected config.py version >= 0.240.022, got {version}'
+    assert 'Fixed/Implemented in version: **0.240.022**' in fix_doc_content, (
+        'Fix documentation should reference version 0.240.022.'
+    )
+    assert 'Delete Current Version' in fix_doc_content, (
+        'Fix documentation should describe the current-version delete option.'
+    )
+    assert 'Delete All Versions' in fix_doc_content, (
+        'Fix documentation should describe the all-versions delete option.'
+    )
+    assert 'user-id/revision-family-id/revision-document-id/filename' in fix_doc_content, (
+        'Fix documentation should describe the archived revision blob path hierarchy.'
+    )
+    assert 'user-id/filename' in fix_doc_content, (
+        'Fix documentation should describe the retained current alias blob path.'
+    )
+    assert 'older revisions' in fix_doc_content.lower(), (
+        'Fix documentation should explain older revision retention.'
+    )
+
+    print('✅ Version bump and fix documentation are aligned')
+
+
+if __name__ == '__main__':  # Plain sequential run: the first failing assert raises and stops the script.
+    test_revision_metadata_helpers_exist()
+    print()
+    test_blob_revision_paths_preserve_current_alias_and_archive_history()
+    print()
+    test_workspace_routes_only_return_current_revisions_and_accept_delete_modes()
+    print()
+    test_delete_ui_uses_revision_choice_modals()
+    print()
+    test_document_revision_fix_documentation_and_version_alignment()
\ No newline at end of file
diff --git a/functional_tests/test_fact_memory_streaming_context_fix.py b/functional_tests/test_fact_memory_streaming_context_fix.py
new file mode 100644
index 00000000..2337fe0f
--- /dev/null
+++ b/functional_tests/test_fact_memory_streaming_context_fix.py
@@ -0,0 +1,198 @@
+# test_fact_memory_streaming_context_fix.py
+"""
+Functional test for fact memory chat-context parity.
+Version: 0.240.051
+Implemented in: 0.240.050; 0.240.051
+
+This test ensures both standard and streaming agent chat paths inject saved fact
+memory into model context, and that fact lookup preserves the selected agent id
+instead of silently falling back to the default configured agent.
+"""
+
+import ast
+import copy
+import os
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))  # parent of this file's directory
+ROUTE_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'route_backend_chats.py')
+CONFIG_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'config.py')
+FIX_DOC = os.path.join(
+    ROOT_DIR,
+    'docs',
+    'explanation',
+    'fixes',
+    'FACT_MEMORY_STREAMING_CONTEXT_FIX.md',
+)
+TARGET_FUNCTIONS = {  # helper names that load_fact_memory_helpers() extracts from ROUTE_FILE
+    'get_facts_for_context',
+    'inject_fact_memory_context',
+}
+
+
+def read_file_text(file_path):  # Return the whole file at file_path as UTF-8 decoded text.
+    with open(file_path, 'r', encoding='utf-8') as file_handle:
+        return file_handle.read()
+
+
+def read_config_version():  # Return the VERSION value assigned in config.py as a string.
+    for line in read_file_text(CONFIG_FILE).splitlines():
+        if line.startswith('VERSION = '):  # only an unindented assignment at line start matches
+            return line.split('=', 1)[1].strip().strip('"')  # drop whitespace, then double quotes
+    raise AssertionError('VERSION assignment not found in config.py')
+
+
+def load_fact_memory_helpers():
+    """Exec the route's fact-memory helpers against a fake store; return (namespace, route source, fake class)."""
+    route_source = read_file_text(ROUTE_FILE)
+    parsed = ast.parse(route_source, filename=ROUTE_FILE)
+    selected_nodes = []
+
+    class NestedFunctionCollector(ast.NodeVisitor):
+        def visit_FunctionDef(self, node):
+            if node.name in TARGET_FUNCTIONS:
+                selected_nodes.append(copy.deepcopy(node))
+            self.generic_visit(node)  # keep descending so helpers nested in other functions are found
+
+    NestedFunctionCollector().visit(parsed)
+    assert len(selected_nodes) == len(TARGET_FUNCTIONS), (
+        f'Expected to find helpers {sorted(TARGET_FUNCTIONS)}, '
+        f'found {[node.name for node in selected_nodes]}'
+    )
+
+    class FakeFactMemoryStore:
+        created_instances = []  # every instance constructed, in creation order
+        next_facts = []  # facts that get_facts() returns; set on the class by each test
+
+        def __init__(self):
+            self.calls = []  # keyword arguments of each get_facts() call on this instance
+            self.__class__.created_instances.append(self)
+
+        def get_facts(self, **kwargs):
+            self.calls.append(kwargs)
+            return list(self.__class__.next_facts)
+
+    module = ast.Module(body=selected_nodes, type_ignores=[])
+    ast.fix_missing_locations(module)
+    namespace = {  # only FactMemoryStore is injected; no other route-module names are available
+        'FactMemoryStore': FakeFactMemoryStore,
+    }
+    exec(compile(module, ROUTE_FILE, 'exec'), namespace)
+    return namespace, route_source, FakeFactMemoryStore
+
+
+def test_get_facts_for_context_preserves_selected_agent_id():
+    """Check that get_facts_for_context passes the caller's agent id through to the store lookup."""
+    print('🔍 Testing fact lookup preserves selected agent id...')
+
+    helpers, _, store_cls = load_fact_memory_helpers()
+    store_cls.created_instances = []
+    store_cls.next_facts = [{'value': 'The user prefers hyphens instead of em dashes.'}]
+    lookup_kwargs = {
+        'scope_id': 'user-123',
+        'scope_type': 'user',
+        'conversation_id': 'conversation-456',
+        'agent_id': 'agent-789',
+    }
+
+    facts = helpers['get_facts_for_context'](**lookup_kwargs)
+
+    assert '- The user prefers hyphens instead of em dashes.' in facts, facts
+    assert '- agent_id: agent-789' in facts, facts
+    assert store_cls.created_instances, 'Expected FactMemoryStore to be instantiated.'
+    recorded_calls = store_cls.created_instances[-1].calls
+    assert recorded_calls == [{
+        'scope_type': 'user',
+        'scope_id': 'user-123',
+        'agent_id': 'agent-789',
+        'conversation_id': 'conversation-456',
+    }], recorded_calls
+
+    print('✅ Fact lookup preserves selected agent id')
+    return True
+
+
+def test_inject_fact_memory_context_adds_metadata_and_facts():
+    """Check that injection puts a metadata message, then a fact message, ahead of the user turn."""
+    print('🔍 Testing fact memory context injection...')
+
+    helpers, _, store_cls = load_fact_memory_helpers()
+    store_cls.created_instances = []
+    store_cls.next_facts = [{'value': 'The user prefers hyphens instead of em dashes.'}]
+    history = [{'role': 'user', 'content': 'Please draft the response.'}]
+
+    # The list is checked in place afterwards; the helper's return value is not used.
+    helpers['inject_fact_memory_context'](
+        conversation_history=history,
+        scope_id='user-123',
+        scope_type='user',
+        conversation_id='conversation-456',
+        agent_id='agent-789',
+    )
+
+    metadata_message = history[0]
+    assert metadata_message['role'] == 'system', history
+    assert '<Conversation Metadata>' in metadata_message['content'], metadata_message
+    assert '<Agent ID: agent-789>' in metadata_message['content'], metadata_message
+
+    fact_message = history[1]
+    assert fact_message['role'] == 'system', history
+    assert '<Fact Memory>' in fact_message['content'], fact_message
+    assert 'The user prefers hyphens instead of em dashes.' in fact_message['content'], fact_message
+    assert history[-1]['role'] == 'user', history
+
+    print('✅ Fact memory context injection passed')
+    return True
+
+
+def test_route_wires_fact_memory_injection_for_standard_and_streaming_paths():
+    """Verify the route source defines the shared fact-memory injector once and calls it twice."""
+    print('🔍 Testing route wiring for standard and streaming fact injection...')
+
+    _, route_source, _ = load_fact_memory_helpers()  # only the raw route source text is used here
+
+    assert route_source.count('inject_fact_memory_context(') == 3, (  # 1 definition + 2 call sites
+        'Expected one helper definition and two call sites for fact-memory injection.'
+    )
+    assert "agent_id=getattr(selected_agent, 'id', None)" in route_source, (
+        'Expected streaming injection to use the selected agent id.'
+    )
+    assert '<Fact Memory>' in route_source, 'Expected fact memory system message markup.'
+    assert '<Conversation Metadata>' in route_source, 'Expected conversation metadata system message markup.'
+
+    print('✅ Route wiring for standard and streaming fact injection passed')
+    return True
+
+
+def test_version_and_fix_documentation_alignment():
+    """Verify config.py is at or past 0.240.051 and the fix documentation describes this fix."""
+    print('🔍 Testing version and fix documentation alignment...')
+
+    fix_doc_content = read_file_text(FIX_DOC)
+    # VERSION keeps moving with later releases, so require a minimum instead of an exact match.
+    assert tuple(int(part) for part in read_config_version().split('.')) >= (0, 240, 51)
+    assert 'Fixed/Implemented in version: **0.240.051**' in fix_doc_content
+    assert 'streaming chat path' in fix_doc_content.lower()
+    assert 'selected agent id' in fix_doc_content.lower()
+    assert 'application/single_app/route_backend_chats.py' in fix_doc_content
+
+    print('✅ Version and fix documentation alignment passed')
+    return True
+
+
+if __name__ == '__main__':
+    # Run the checks in order; a failing assertion aborts the run with a traceback.
+    test_cases = (
+        test_get_facts_for_context_preserves_selected_agent_id,
+        test_inject_fact_memory_context_adds_metadata_and_facts,
+        test_route_wires_fact_memory_injection_for_standard_and_streaming_paths,
+        test_version_and_fix_documentation_alignment,
+    )
+    outcomes = []
+    for test_case in test_cases:
+        print(f'\n🧪 Running {test_case.__name__}...')
+        outcomes.append(test_case())
+
+    passed_count = sum(outcomes)
+    print(f'\n📊 Results: {passed_count}/{len(outcomes)} tests passed')
+    raise SystemExit(0 if all(outcomes) else 1)
\ No newline at end of file
diff --git a/functional_tests/test_group_workspace_initial_documents_fetch_fix.py b/functional_tests/test_group_workspace_initial_documents_fetch_fix.py
new file mode 100644
index 00000000..12c6dafa
--- /dev/null
+++ b/functional_tests/test_group_workspace_initial_documents_fetch_fix.py
@@ -0,0 +1,106 @@
+# test_group_workspace_initial_documents_fetch_fix.py
+"""
+Functional test for group workspace initial document fetch fix.
+Version: 0.240.027
+Implemented in: 0.240.027
+
+This test ensures that the group workspace document loader rebuilds its query
+parameters before the first fetch and does not trigger bulk-delete confirmation
+logic while the page is still initializing.
+"""
+
+import os
+import re
+import sys
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))  # parent of this file's directory
+GROUP_WORKSPACE_TEMPLATE = os.path.join(  # template searched for the fetchGroupDocuments() function
+    ROOT_DIR,
+    "application",
+    "single_app",
+    "templates",
+    "group_workspaces.html",
+)
+CONFIG_FILE = os.path.join(
+    ROOT_DIR,
+    "application",
+    "single_app",
+    "config.py",
+)
+
+
+def read_file(path):  # Return the whole file at path as UTF-8 decoded text.
+    with open(path, "r", encoding="utf-8") as file_handle:
+        return file_handle.read()
+
+
+def extract_fetch_group_documents_block(content):
+    """Return the text of fetchGroupDocuments(), from its header through its closing brace."""
+    # Lazy body match that ends at the closing brace directly before the next section comment.
+    pattern = r"function fetchGroupDocuments\(\) \{(?P<body>.*?)\n  \}\n\n  // --- Render Group Document Row ---"
+    found = re.search(pattern, content, re.DOTALL)
+    assert found, "Could not locate fetchGroupDocuments block in group_workspaces.html"
+    function_body = found.group('body')
+    return f"function fetchGroupDocuments() {{{function_body}\n  }}"
+
+
+def test_group_workspace_initial_fetch_builds_params_without_delete_prompt():
+    """Verify fetchGroupDocuments() builds its query params and contains no delete-flow calls."""
+    print("🔍 Testing group workspace initial document fetch path...")
+
+    content = read_file(GROUP_WORKSPACE_TEMPLATE)
+    fetch_block = extract_fetch_group_documents_block(content)
+
+    required_snippets = [  # exact substrings: whitespace and quote style in the template must match
+        "const params = new URLSearchParams({",
+        "page: groupDocsCurrentPage,",
+        "page_size: groupDocsPageSize,",
+        "params.append(\"search\", groupDocsSearchTerm);",
+        "params.append(\"classification\", groupDocsClassificationFilter);",
+        "params.append(\"author\", groupDocsAuthorFilter);",
+        "params.append(\"keywords\", groupDocsKeywordsFilter);",
+        "params.append(\"abstract\", groupDocsAbstractFilter);",
+        "params.append(\"tags\", groupDocsTagsFilter);",
+        "fetch(`/api/group_documents?${params.toString()}`)",
+    ]
+    missing = [snippet for snippet in required_snippets if snippet not in fetch_block]
+    assert not missing, f"Missing required fetchGroupDocuments snippets: {missing}"
+
+    forbidden_snippets = [  # delete-flow calls that must not appear inside the fetch function
+        "promptGroupDeleteMode(",
+        "requestGroupDocumentDeletion(",
+        "Promise.allSettled(deletePromises)",
+    ]
+    present = [snippet for snippet in forbidden_snippets if snippet in fetch_block]
+    assert not present, f"Unexpected delete flow found in fetchGroupDocuments: {present}"
+
+    print("✅ Group workspace initial fetch path passed")
+    return True
+
+
+def test_config_version_is_bumped_for_group_workspace_fetch_fix():
+    """Verify config.py is at or past 0.240.027, the version of the group workspace fetch fix."""
+    print("🔍 Testing config version bump...")
+    # VERSION keeps moving with later releases, so require a minimum instead of an exact match.
+    version_match = re.search(r'^VERSION = "(\d+)\.(\d+)\.(\d+)"', read_file(CONFIG_FILE), re.MULTILINE)
+    assert version_match and tuple(map(int, version_match.groups())) >= (0, 240, 27), "Expected config.py version 0.240.027 or later"
+
+    print("✅ Config version bump passed")
+    return True
+
+
+if __name__ == "__main__":
+    # Run the checks in order; a failing assertion aborts the run with a traceback.
+    test_cases = (
+        test_group_workspace_initial_fetch_builds_params_without_delete_prompt,
+        test_config_version_is_bumped_for_group_workspace_fetch_fix,
+    )
+    outcomes = []
+    for test_case in test_cases:
+        print(f"\n🧪 Running {test_case.__name__}...")
+        outcomes.append(test_case())
+
+    passed_count = sum(outcomes)
+    print(f"\n📊 Results: {passed_count}/{len(outcomes)} tests passed")
+    sys.exit(0 if all(outcomes) else 1)
\ No newline at end of file
diff --git a/functional_tests/test_historical_enhanced_citation_revision_rendering_fix.py b/functional_tests/test_historical_enhanced_citation_revision_rendering_fix.py
new file mode 100644
index 00000000..5c4ac794
--- /dev/null
+++ b/functional_tests/test_historical_enhanced_citation_revision_rendering_fix.py
@@ -0,0 +1,97 @@
+#!/usr/bin/env python3
+"""
+Functional test for historical enhanced citation revision rendering fix.
+Version: 0.240.025
+Implemented in: 0.240.025
+
+This test ensures older chat citations can fetch exact document metadata on
+demand and continue rendering archived PDF and tabular content after a newer
+revision becomes the current workspace document.
+"""
+
+import os
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))  # parent of this file's directory
+CONFIG_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'config.py')
+CHAT_DOCUMENTS_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'static', 'js', 'chat', 'chat-documents.js')
+CHAT_ENHANCED_CITATIONS_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'static', 'js', 'chat', 'chat-enhanced-citations.js')
+ROUTE_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'route_enhanced_citations.py')
+FIX_DOC = os.path.join(ROOT_DIR, 'docs', 'explanation', 'fixes', 'HISTORICAL_ENHANCED_CITATION_REVISION_RENDERING_FIX.md')  # fix write-up checked for version and wording
+
+
+def read_text(file_path):  # Return the whole file at file_path as UTF-8 decoded text.
+    with open(file_path, 'r', encoding='utf-8') as file_handle:
+        return file_handle.read()
+
+
+def read_config_version():  # Return the VERSION value assigned in config.py as a string.
+    for line in read_text(CONFIG_FILE).splitlines():
+        if line.startswith('VERSION = '):  # only an unindented assignment at line start matches
+            return line.split('=', 1)[1].strip().strip('"')  # drop whitespace, then double quotes
+    raise AssertionError('VERSION assignment not found in config.py')
+
+
+def test_chat_can_fetch_metadata_for_historical_cited_revisions():
+    """Verify the chat scripts contain the snippets for fetching citation document metadata on demand."""
+    print('🔍 Testing on-demand metadata fetch for historical cited revisions...')
+    chat_documents = read_text(CHAT_DOCUMENTS_FILE)
+    chat_enhanced_citations = read_text(CHAT_ENHANCED_CITATIONS_FILE)
+
+    assert 'const citationMetadataCache = new Map();' in chat_documents
+    assert 'export async function fetchDocumentMetadata(docId)' in chat_documents
+    assert '/api/enhanced_citations/document_metadata?doc_id=' in chat_documents
+    assert 'let docMetadata = getDocumentMetadata(docId);' in chat_enhanced_citations
+    assert 'docMetadata = await fetchDocumentMetadata(docId);' in chat_enhanced_citations
+    assert 'Historical cited revisions' in chat_enhanced_citations
+    assert 'fetch on demand when needed' in chat_enhanced_citations
+
+    print('✅ On-demand metadata fetch for historical cited revisions passed')
+    return True
+
+
+def test_enhanced_citations_route_exposes_exact_document_metadata_lookup():
+    """Verify the route source contains the document_metadata endpoint and its lookup snippets."""
+    print('🔍 Testing enhanced citation metadata route...')
+    route_source = read_text(ROUTE_FILE)
+
+    assert '@app.route("/api/enhanced_citations/document_metadata", methods=["GET"])' in route_source
+    assert 'doc_response, status_code = get_document(user_id, doc_id)' in route_source
+    assert 'get_document_blob_storage_info(raw_doc)' in route_source
+    assert '"file_name": raw_doc.get("file_name")' in route_source
+    assert '"enhanced_citations": bool(blob_path)' in route_source
+
+    print('✅ Enhanced citation metadata route passed')
+    return True
+
+
+def test_version_and_fix_documentation_alignment():
+    """Verify config.py is at or past 0.240.025 and the fix documentation describes this fix."""
+    print('🔍 Testing version and fix documentation alignment...')
+    version = read_config_version()
+    fix_doc_content = read_text(FIX_DOC)
+    # VERSION keeps moving with later releases, so require a minimum instead of an exact match.
+    assert tuple(int(part) for part in version.split('.')) >= (0, 240, 25), version
+    assert 'Fixed/Implemented in version: **0.240.025**' in fix_doc_content
+    assert 'older chat citations' in fix_doc_content.lower()
+    assert 'archived PDF and tabular content' in fix_doc_content
+
+    print('✅ Version and fix documentation alignment passed')
+    return True
+
+
+if __name__ == '__main__':
+    # Run the checks in order; a failing assertion aborts the run with a traceback.
+    test_cases = (
+        test_chat_can_fetch_metadata_for_historical_cited_revisions,
+        test_enhanced_citations_route_exposes_exact_document_metadata_lookup,
+        test_version_and_fix_documentation_alignment,
+    )
+    outcomes = []
+    for test_case in test_cases:
+        print(f'\n🧪 Running {test_case.__name__}...')
+        outcomes.append(test_case())
+
+    passed_count = sum(outcomes)
+    print(f'\n📊 Results: {passed_count}/{len(outcomes)} tests passed')
+    raise SystemExit(0 if all(outcomes) else 1)
\ No newline at end of file
diff --git a/functional_tests/test_public_workspace_delete_toast_fix.py b/functional_tests/test_public_workspace_delete_toast_fix.py
new file mode 100644
index 00000000..3408936c
--- /dev/null
+++ b/functional_tests/test_public_workspace_delete_toast_fix.py
@@ -0,0 +1,53 @@
+# test_public_workspace_delete_toast_fix.py
+"""
+Functional test for public workspace delete toast fix.
+Version: 0.240.056
+Implemented in: 0.240.056
+
+This test ensures public workspace document delete failures use the shared
+Bootstrap toast helper instead of a blocking browser alert.
+"""
+
+from pathlib import Path
+import sys
+
+
+REPO_ROOT = Path(__file__).resolve().parents[1]  # parent of this file's directory
+PUBLIC_WORKSPACE_JS = REPO_ROOT / 'application' / 'single_app' / 'static' / 'js' / 'public' / 'public_workspace.js'
+PUBLIC_WORKSPACE_UTILITY_JS = REPO_ROOT / 'application' / 'single_app' / 'static' / 'js' / 'public' / 'public_workspace_utility.js'
+
+
+def read_text(path):  # path must offer read_text(); callers here pass pathlib.Path objects
+    return path.read_text(encoding='utf-8')
+
+
+def test_public_workspace_delete_failures_use_toast_helper():
+    """Validate that public workspace delete failures call the toast helper rather than alert()."""
+    workspace_content = read_text(PUBLIC_WORKSPACE_JS)
+    utility_content = read_text(PUBLIC_WORKSPACE_UTILITY_JS)
+    # All checks below are exact substring matches against the JavaScript sources.
+    assert 'function showPublicWorkspaceToast(message, type = \'info\', duration = 5000)' in utility_content, (
+        'Expected a shared public workspace toast helper in the utility script.'
+    )
+    assert "document.getElementById('toast-container')" in utility_content, (
+        'Expected the public workspace toast helper to use the shared toast container.'
+    )
+    assert "showPublicWorkspaceToast(`Error deleting: ${e.error || e.message}`, 'danger');" in workspace_content, (
+        'Expected single-document delete failures to use the shared toast helper.'
+    )
+    assert 'alert(`Error deleting: ${e.error || e.message}`);' not in workspace_content, (
+        'Did not expect single-document delete failures to use browser alerts.'
+    )
+    assert 'showPublicWorkspaceToast(`Deleted ${successful} document(s). ${failed} failed to delete.`, toastType);' in workspace_content, (
+        'Expected bulk delete partial failures to use the shared toast helper.'
+    )
+    assert 'alert(`Deleted ${successful} document(s). ${failed} failed to delete.`);' not in workspace_content, (
+        'Did not expect bulk delete partial failures to use browser alerts.'
+    )
+
+    print('✅ Public workspace delete failure toast helper verified.')
+
+
+if __name__ == '__main__':
+    test_public_workspace_delete_failures_use_toast_helper()  # a failed assertion raises before the exit below
+    sys.exit(0)
\ No newline at end of file
diff --git a/functional_tests/test_tabular_all_scope_group_source_context.py b/functional_tests/test_tabular_all_scope_group_source_context.py
new file mode 100644
index 00000000..f966e9c0
--- /dev/null
+++ b/functional_tests/test_tabular_all_scope_group_source_context.py
@@ -0,0 +1,228 @@
+#!/usr/bin/env python3
+# test_tabular_all_scope_group_source_context.py
+"""
+Functional test for all-scope tabular group source context handling.
+Version: 0.240.049
+Implemented in: 0.240.032; 0.240.041; 0.240.042; 0.240.043; 0.240.048; 0.240.049
+
+This test ensures mixed-scope workspace search keeps per-file group/public
+source metadata so tabular analysis can open group and public workbooks even
+when chat document scope is set to all.
+"""
+
+import ast
+import os
+import sys
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))  # parent of this file's directory
+ROUTE_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'route_backend_chats.py')
+CONFIG_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'config.py')
+TARGET_FUNCTIONS = {  # top-level route helpers that load_helpers() compiles into the test namespace
+    'is_tabular_filename',
+    'get_document_containers_for_scope',
+    'build_tabular_file_context',
+    'dedupe_tabular_file_contexts',
+    'infer_tabular_source_context_from_document',
+    'get_selected_workspace_tabular_file_contexts',
+    'collect_workspace_tabular_file_contexts',
+    'build_tabular_analysis_source_context',
+}
+
+
+class MockContainer:
+    """Stand-in container whose query_items returns canned rows keyed by the '@doc_id' parameter."""
+
+    def __init__(self, rows_by_doc_id=None):
+        self.rows_by_doc_id = rows_by_doc_id if rows_by_doc_id else {}
+
+    def query_items(self, query, parameters, enable_cross_partition_query):
+        """Return a new list of the rows stored for the first '@doc_id' parameter value."""
+        # The query text and cross-partition flag are accepted for signature parity but unused.
+        requested_id = next(
+            (entry.get('value') for entry in parameters if entry.get('name') == '@doc_id'),
+            None,
+        )
+        return list(self.rows_by_doc_id.get(requested_id, []))
+
+
+def load_helpers():
+    """Compile the targeted tabular helpers from the route source; return (namespace, source)."""
+    with open(ROUTE_FILE, 'r', encoding='utf-8') as route_file:
+        source = route_file.read()
+
+    # Only top-level plain `def` statements are kept; nested or async definitions are not collected.
+    helper_nodes = [
+        node for node in ast.parse(source, filename=ROUTE_FILE).body
+        if isinstance(node, ast.FunctionDef) and node.name in TARGET_FUNCTIONS
+    ]
+
+    namespace = {
+        'os': os,
+        'Mapping': __import__('typing').Mapping,
+        'TABULAR_EXTENSIONS': {'csv', 'tsv', 'xls', 'xlsx', 'xlsm'},
+        'log_event': lambda *args, **kwargs: None,
+        'logging': __import__('logging'),
+        'cosmos_user_documents_container': MockContainer(),
+        'cosmos_group_documents_container': MockContainer(),
+        'cosmos_public_documents_container': MockContainer(),
+    }
+    helper_module = ast.Module(body=helper_nodes, type_ignores=[])
+    exec(compile(helper_module, ROUTE_FILE, 'exec'), namespace)
+    return namespace, source
+
+
+def read_config_version():
+    """Return the value of the unindented VERSION assignment in config.py, without double quotes."""
+    with open(CONFIG_FILE, 'r', encoding='utf-8') as config_file:
+        first_match = next((text for text in config_file if text.startswith('VERSION = ')), None)
+    if first_match is not None:
+        return first_match.partition('=')[2].strip().strip('"')
+    raise AssertionError('VERSION assignment not found in config.py')
+
+
+def test_collect_workspace_tabular_file_contexts_preserves_group_and_public_sources_in_all_scope():
+    """Verify all-scope results keep each workbook's own group/public source metadata."""
+    print('🔍 Testing all-scope tabular file context preservation...')
+
+    helpers, _ = load_helpers()
+    collect_contexts = helpers['collect_workspace_tabular_file_contexts']
+
+    contexts = collect_contexts(
+        combined_documents=[
+            {
+                'file_name': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+                'group_id': '93aa364a-99ee-4cfd-8e4d-f37d175f00f5',
+            },
+            {
+                'file_name': 'Public Metrics.xlsx',
+                'public_workspace_id': 'public-456',
+            },
+            {
+                'file_name': 'notes.pdf',  # absent from the expected result below
+                'group_id': 'ignored-group',
+            },
+        ],
+        document_scope='all',
+        active_group_id='different-active-group',  # differs from the documents' own group_id
+        active_public_workspace_id='different-public-workspace',  # differs from the document's own id
+    )
+
+    assert contexts == [
+        {
+            'file_name': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+            'source_hint': 'group',
+            'group_id': '93aa364a-99ee-4cfd-8e4d-f37d175f00f5',
+        },
+        {
+            'file_name': 'Public Metrics.xlsx',
+            'source_hint': 'public',
+            'public_workspace_id': 'public-456',
+        },
+    ], contexts
+
+    print('✅ All-scope tabular file context preservation passed')
+    return True
+
+
+def test_selected_tabular_document_lookup_checks_all_scope_containers():
+    """Verify selected document ids in all scope resolve to contexts from the group/public stubs."""
+    print('🔍 Testing all-scope selected tabular document lookup...')
+
+    helpers, _ = load_helpers()  # helpers is the exec namespace, i.e. the loaded functions' globals
+    helpers['cosmos_group_documents_container'] = MockContainer({  # replaces the empty default stub
+        'group-doc-123': [{
+            'file_name': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+            'group_id': '93aa364a-99ee-4cfd-8e4d-f37d175f00f5',
+        }],
+    })
+    helpers['cosmos_public_documents_container'] = MockContainer({  # replaces the empty default stub
+        'public-doc-456': [{
+            'file_name': 'Public Metrics.xlsx',
+            'public_workspace_id': 'public-456',
+        }],
+    })
+
+    selected_contexts = helpers['get_selected_workspace_tabular_file_contexts'](
+        selected_document_ids=['group-doc-123', 'public-doc-456'],
+        document_scope='all',
+    )
+
+    assert selected_contexts == [
+        {
+            'file_name': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+            'source_hint': 'group',
+            'group_id': '93aa364a-99ee-4cfd-8e4d-f37d175f00f5',
+        },
+        {
+            'file_name': 'Public Metrics.xlsx',
+            'source_hint': 'public',
+            'public_workspace_id': 'public-456',
+        },
+    ], selected_contexts
+
+    print('✅ All-scope selected tabular document lookup passed')
+    return True
+
+
+def test_build_tabular_analysis_source_context_mentions_per_file_scope_metadata():
+    """Verify the prompt helper output names each workbook with its own source and workspace id."""
+    print('🔍 Testing tabular analysis source-context prompt...')
+
+    helpers, _ = load_helpers()
+    source_context = helpers['build_tabular_analysis_source_context']([
+        {
+            'file_name': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+            'source_hint': 'group',
+            'group_id': '93aa364a-99ee-4cfd-8e4d-f37d175f00f5',
+        },
+        {
+            'file_name': 'Public Metrics.xlsx',
+            'source_hint': 'public',
+            'public_workspace_id': 'public-456',
+        },
+    ])
+    # Exact fragments expected in the returned text, one per workbook.
+    assert "CCO-Legal File Plan 2025_Final Approved.xlsx: source='group', group_id='93aa364a-99ee-4cfd-8e4d-f37d175f00f5'" in source_context, source_context
+    assert "Public Metrics.xlsx: source='public', public_workspace_id='public-456'" in source_context, source_context
+
+    print('✅ Tabular analysis source-context prompt passed')
+    return True
+
+
+def test_route_uses_context_aware_tabular_analysis_and_version_bump():
+    """Verify the route passes per-file contexts to tabular analysis and config.py is at or past 0.240.049."""
+    print('🔍 Testing route integration and version bump...')
+
+    _, source = load_helpers()
+
+    required_snippets = [
+        'workspace_tabular_file_contexts = collect_workspace_tabular_file_contexts(',
+        'tabular_file_contexts=workspace_tabular_file_contexts,',
+        'doc_public_workspace_id = doc.get(\'public_workspace_id\', None)',
+        '"public_workspace_id": doc_public_workspace_id,',
+    ]
+    missing = [snippet for snippet in required_snippets if snippet not in source]
+    assert not missing, f'Missing route integration snippets: {missing}'
+    assert tuple(int(part) for part in read_config_version().split('.')) >= (0, 240, 49)  # minimum, not exact: VERSION keeps moving
+
+    print('✅ Route integration and version bump passed')
+    return True
+
+
+if __name__ == '__main__':
+    # Run the checks in order; a failing assertion aborts the run with a traceback.
+    test_cases = (
+        test_collect_workspace_tabular_file_contexts_preserves_group_and_public_sources_in_all_scope,
+        test_selected_tabular_document_lookup_checks_all_scope_containers,
+        test_build_tabular_analysis_source_context_mentions_per_file_scope_metadata,
+        test_route_uses_context_aware_tabular_analysis_and_version_bump,
+    )
+    outcomes = []
+    for test_case in test_cases:
+        print(f'\n🧪 Running {test_case.__name__}...')
+        outcomes.append(test_case())
+
+    passed_count = sum(outcomes)
+    print(f'\n📊 Results: {passed_count}/{len(outcomes)} tests passed')
+    sys.exit(0 if all(outcomes) else 1)
\ No newline at end of file
diff --git a/functional_tests/test_tabular_analysis_rejects_discovery_only.py b/functional_tests/test_tabular_analysis_rejects_discovery_only.py
index ea6fcd49..7e173785 100644
--- a/functional_tests/test_tabular_analysis_rejects_discovery_only.py
+++ b/functional_tests/test_tabular_analysis_rejects_discovery_only.py
@@ -6,8 +6,9 @@
 Implemented in: 0.239.111
 
 This test ensures that discovery-only tabular tool calls are not accepted as
-completed analysis for analytical questions, and that the tabular SK pass is
-restricted to analytical tools on retry attempts.
+completed analysis for analytical questions, and that multi-sheet workbook
+analysis may use discovery as an intermediate step while still requiring
+analytical tools before completion.
 """
 
 import ast
@@ -58,7 +59,8 @@ def test_discovery_only_calls_trigger_retry_guardrails():
         _, route_content = load_tabular_route_helpers()
 
         checks = {
-            'prompt disables discovery tools in analysis pass': 'Discovery functions are not available in this analysis run because schema context is already pre-loaded.' in route_content,
+            'prompt allows workbook discovery for multi-sheet analysis': 'Workbook discovery is available through describe_tabular_file.' in route_content,
+            'prompt rejects discovery-only completion': 'Discovery-only results do NOT complete the analysis.' in route_content,
             'analysis run filters callable functions': 'included_functions' in route_content,
             'retry path requires analytical tools': 'FunctionChoiceBehavior.Required(' in route_content,
             'retry logging mentions discovery tools': 'used only discovery tool(s)' in route_content,
diff --git a/functional_tests/test_tabular_author_metadata_normalization_fix.py b/functional_tests/test_tabular_author_metadata_normalization_fix.py
new file mode 100644
index 00000000..37ef6866
--- /dev/null
+++ b/functional_tests/test_tabular_author_metadata_normalization_fix.py
@@ -0,0 +1,138 @@
+# test_tabular_author_metadata_normalization_fix.py
+"""
+Functional test for tabular author metadata normalization.
+Version: 0.240.028
+Implemented in: 0.240.028
+
+This test ensures tabular schema-summary indexing normalizes author metadata
+before Azure AI Search upload so null or blank author entries do not break
+enhanced citation processing.
+"""
+
+import ast
+import os
+import sys
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+FUNCTIONS_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'functions_documents.py')
+CONFIG_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'config.py')
+TARGET_FUNCTIONS = {
+    'ensure_list',
+}
+
+
+def load_helpers():
+    """Compile only the TARGET_FUNCTIONS definitions found in functions_documents.py.
+
+    Returns a ``(namespace, source)`` pair: the executed helpers and the raw file text.
+    """
+    with open(FUNCTIONS_FILE, 'r', encoding='utf-8') as source_handle:
+        source_text = source_handle.read()
+
+    wanted_defs = [
+        stmt
+        for stmt in ast.parse(source_text, filename=FUNCTIONS_FILE).body
+        if isinstance(stmt, ast.FunctionDef) and stmt.name in TARGET_FUNCTIONS
+    ]
+    helper_namespace = {'re': __import__('re')}
+    helper_module = ast.Module(body=wanted_defs, type_ignores=[])
+    exec(compile(helper_module, FUNCTIONS_FILE, 'exec'), helper_namespace)
+    return helper_namespace, source_text
+
+
+def read_config_version():
+    """Return the VERSION string assigned in config.py, without its double quotes."""
+    with open(CONFIG_FILE, 'r', encoding='utf-8') as config_handle:
+        version_rows = (row for row in config_handle if row.startswith('VERSION = '))
+        for row in version_rows:
+            return row.partition('=')[2].strip().strip('"')
+    raise AssertionError('VERSION assignment not found in config.py')
+
+
+def test_ensure_list_filters_null_and_blank_author_values():
+    """Check ensure_list trims names and drops None/blank entries for list and string input."""
+    print('🔍 Testing author list normalization...')
+
+    try:
+        ensure_list = load_helpers()[0]['ensure_list']
+        expected_authors = ['Alice', 'Bob']
+
+        from_list = ensure_list([None, '  Alice  ', '', 'Bob', '   '])
+        assert from_list == expected_authors, from_list
+        # The scalar form mixes ';' and ',' separators around blank segments.
+        from_scalar = ensure_list('Alice; ; Bob,  ')
+        assert from_scalar == expected_authors, from_scalar
+
+        print('✅ Author list normalization passed')
+        return True
+
+    except Exception as failure:
+        print(f'❌ Test failed: {failure}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_tabular_chunk_indexing_uses_normalized_authors_everywhere():
+    """Check functions_documents.py still contains each expected author-normalization snippet."""
+    print('🔍 Testing tabular author normalization integration points...')
+
+    try:
+        source_text = load_helpers()[1]
+
+        expected_snippets = (
+            '"authors": ensure_list(document_item.get("authors"))',
+            "'authors': []",
+            '"authors": ensure_list(carried_forward.get("authors"))',
+            "author = ensure_list(metadata.get('authors')) if metadata else []",
+            "chunk_updates['author'] = ensure_list(existing_document.get('authors'))",
+            "chunk_item[field] = ensure_list(kwargs[field])",
+        )
+
+        absent = [snippet for snippet in expected_snippets if snippet not in source_text]
+        assert not absent, f'Missing normalization snippets: {absent}'
+
+        print('✅ Tabular author normalization integration passed')
+        return True
+
+    except Exception as failure:
+        print(f'❌ Test failed: {failure}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_version_bump_applied():
+    """Verify config.py is at or beyond 0.240.028, the release that introduced this fix."""
+    print('🔍 Testing config version bump...')
+
+    try:
+        version = read_config_version()
+        # Later releases keep bumping VERSION, so compare numerically instead of pinning it.
+        assert tuple(int(part) for part in version.split('.')) >= (0, 240, 28), version
+        print('✅ Config version bump passed')
+        return True
+
+    except Exception as exc:
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+if __name__ == '__main__':
+    # Run every check in order; each one returns True on success and False on failure.
+    suite = (
+        test_ensure_list_filters_null_and_blank_author_values,
+        test_tabular_chunk_indexing_uses_normalized_authors_everywhere,
+        test_version_bump_applied,
+    )
+
+    outcomes = []
+    for check in suite:
+        print(f'\n🧪 Running {check.__name__}...')
+        outcomes.append(check())
+
+    print(f'\n📊 Results: {sum(outcomes)}/{len(outcomes)} tests passed')
+    sys.exit(0 if all(outcomes) else 1)
\ No newline at end of file
diff --git a/functional_tests/test_tabular_enhanced_citations_schema_summary_fix.py b/functional_tests/test_tabular_enhanced_citations_schema_summary_fix.py
new file mode 100644
index 00000000..06cd9a83
--- /dev/null
+++ b/functional_tests/test_tabular_enhanced_citations_schema_summary_fix.py
@@ -0,0 +1,166 @@
+#!/usr/bin/env python3
+"""
+Functional test for enhanced-citation tabular schema summary fallback fix.
+Version: 0.240.023
+Implemented in: 0.240.023
+
+This test ensures enhanced-citation tabular uploads stay in schema-summary mode,
+use bounded summaries, and do not silently fall back to legacy row chunking.
+"""
+
+import ast
+import os
+import sys
+import tempfile
+
+import pandas
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+sys.path.append(ROOT_DIR)
+sys.path.append(os.path.join(ROOT_DIR, 'application', 'single_app'))
+
+FUNCTIONS_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'functions_documents.py')
+CONFIG_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'config.py')
+TARGET_FUNCTIONS = {
+    '_compact_tabular_schema_value',
+    '_compact_tabular_columns',
+    '_build_compact_tabular_preview',
+    '_build_minimal_tabular_summary',
+    '_build_tabular_schema_summary',
+}
+TARGET_ASSIGNMENTS = {
+    'TABULAR_SCHEMA_SUMMARY_MAX_SHEETS',
+    'TABULAR_SCHEMA_SUMMARY_MAX_COLUMNS',
+    'TABULAR_SCHEMA_SUMMARY_MAX_PREVIEW_ROWS',
+    'TABULAR_SCHEMA_SUMMARY_MAX_CELL_CHARS',
+}
+
+
+def load_tabular_schema_helpers():
+    """Compile the targeted schema-summary constants and helpers from functions_documents.py.
+
+    Returns ``(namespace, source)`` so callers can run the helpers or inspect the raw text.
+    """
+    def is_wanted(stmt):
+        # Keep targeted module-level assignments and targeted function definitions only.
+        if isinstance(stmt, ast.Assign):
+            return any(
+                isinstance(name_node, ast.Name) and name_node.id in TARGET_ASSIGNMENTS
+                for name_node in stmt.targets
+            )
+        return isinstance(stmt, ast.FunctionDef) and stmt.name in TARGET_FUNCTIONS
+
+    with open(FUNCTIONS_FILE, 'r', encoding='utf-8') as source_handle:
+        source_text = source_handle.read()
+
+    syntax_tree = ast.parse(source_text, filename=FUNCTIONS_FILE)
+    wanted_nodes = [stmt for stmt in syntax_tree.body if is_wanted(stmt)]
+
+    helper_namespace = {'os': os, 'pandas': pandas}
+    helper_module = ast.Module(body=wanted_nodes, type_ignores=[])
+    exec(compile(helper_module, FUNCTIONS_FILE, 'exec'), helper_namespace)
+    return helper_namespace, source_text
+
+
+def read_config_version():
+    """Read config.py and return the text assigned to VERSION, stripped of double quotes."""
+    with open(CONFIG_FILE, 'r', encoding='utf-8') as config_handle:
+        version_line = next((row for row in config_handle if row.startswith('VERSION = ')), None)
+    if version_line is None:
+        raise AssertionError('VERSION assignment not found in config.py')
+    return version_line.partition('=')[2].strip().strip('"')
+
+
+def test_bounded_csv_schema_summary():
+    """Summarize a 30-column CSV with long cell values and check the output stays bounded."""
+    print('🔍 Testing bounded CSV schema summary generation...')
+
+    try:
+        build_schema_summary = load_tabular_schema_helpers()[0]['_build_tabular_schema_summary']
+
+        # 30 columns x 3 rows; every cell carries a 180-character run of 'x'.
+        cell_padding = 'x' * 180
+        wide_frame = pandas.DataFrame({
+            f'column_{col}': [f'value_{col}_' + cell_padding] * 3
+            for col in range(30)
+        })
+
+        # delete=False only reserves a path; the CSV is written and removed explicitly below.
+        with tempfile.NamedTemporaryFile(delete=False, suffix='.csv') as csv_handle:
+            csv_path = csv_handle.name
+        try:
+            wide_frame.to_csv(csv_path, index=False)
+            summary = build_schema_summary(csv_path, 'wide-tabular.csv', '.csv')
+        finally:
+            if os.path.exists(csv_path):
+                os.remove(csv_path)
+
+        assert 'Tabular data file: wide-tabular.csv' in summary, summary
+        assert 'This file is available for detailed analysis via the Tabular Processing plugin.' in summary, summary
+        assert '... +' in summary and 'more columns' in summary, summary
+        assert len(summary) < 6000, len(summary)
+
+        print('✅ Bounded CSV schema summary generation passed')
+        return True
+
+    except Exception as failure:
+        print(f'❌ Test failed: {failure}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_enhanced_citations_tabular_no_longer_falls_back_to_row_chunking():
+    """Verify functions_documents.py gates row chunking on enhanced citations being disabled."""
+    print('🔍 Testing enhanced citations tabular fallback guard...')
+
+    try:
+        _, source = load_tabular_schema_helpers()
+        # Keep failure messages short: echoing the whole source file would bury the real cause.
+        assert 'if total_chunks_saved == 0 and not enable_enhanced_citations:' in source, 'Row-chunking fallback is not gated on enable_enhanced_citations'
+        assert 'falling back to row-by-row' not in source, 'Legacy row-by-row fallback message is still present'
+        assert 'Failed indexing enhanced tabular summary' in source, 'Enhanced tabular summary failure message is missing'
+
+        print('✅ Enhanced citations tabular fallback guard passed')
+        return True
+
+    except Exception as exc:
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_version_bump_applied():
+    """Verify config.py is at or beyond 0.240.023, the release that introduced this fix."""
+    print('🔍 Testing config version bump...')
+
+    try:
+        version = read_config_version()
+        # Later releases keep bumping VERSION, so compare numerically instead of pinning it.
+        assert tuple(int(part) for part in version.split('.')) >= (0, 240, 23), version
+        print('✅ Config version bump passed')
+        return True
+
+    except Exception as exc:
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+if __name__ == '__main__':
+    # Run every check in order; each one returns True on success and False on failure.
+    suite = (
+        test_bounded_csv_schema_summary,
+        test_enhanced_citations_tabular_no_longer_falls_back_to_row_chunking,
+        test_version_bump_applied,
+    )
+
+    outcomes = []
+    for check in suite:
+        print(f'\n🧪 Running {check.__name__}...')
+        outcomes.append(check())
+
+    print(f'\n📊 Results: {sum(outcomes)}/{len(outcomes)} tests passed')
+    sys.exit(0 if all(outcomes) else 1)
\ No newline at end of file
diff --git a/functional_tests/test_tabular_group_blob_context_and_sheet_whitespace.py b/functional_tests/test_tabular_group_blob_context_and_sheet_whitespace.py
new file mode 100644
index 00000000..321ce9ca
--- /dev/null
+++ b/functional_tests/test_tabular_group_blob_context_and_sheet_whitespace.py
@@ -0,0 +1,204 @@
+#!/usr/bin/env python3
+# test_tabular_group_blob_context_and_sheet_whitespace.py
+"""
+Functional test for tabular group blob context and sheet whitespace handling.
+Version: 0.240.031
+Implemented in: 0.240.031
+
+This test ensures workbook tabs with trailing whitespace still resolve
+correctly and that tabular analysis can reuse pre-resolved group blob
+locations even when later tool calls omit group_id.
+"""
+
+import asyncio
+import importlib.util
+import os
+import sys
+
+import pandas as pd
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+sys.path.append(ROOT_DIR)
+sys.path.append(os.path.join(ROOT_DIR, 'application', 'single_app'))
+
+PLUGIN_FILE = os.path.join(
+    ROOT_DIR,
+    'application',
+    'single_app',
+    'semantic_kernel_plugins',
+    'tabular_processing_plugin.py',
+)
+ROUTE_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'route_backend_chats.py')
+
+PLUGIN_SPEC = importlib.util.spec_from_file_location('tabular_processing_plugin', PLUGIN_FILE)
+PLUGIN_MODULE = importlib.util.module_from_spec(PLUGIN_SPEC)
+PLUGIN_SPEC.loader.exec_module(PLUGIN_MODULE)
+TabularProcessingPlugin = PLUGIN_MODULE.TabularProcessingPlugin
+
+
+def build_mock_whitespace_workbook_plugin():
+    """Return (plugin, container, blob) for a plugin stubbed with an in-memory workbook whose 'CUI ' tab ends in a space."""
+    plugin = TabularProcessingPlugin()
+    container_name = 'mock-group-container'
+    blob_name = 'group-123/CCO-Legal File Plan 2025_Final Approved.xlsx'
+    frames_by_sheet = {
+        'Legal': pd.DataFrame({
+            'Records Schedule Item': ['GRS 5.1, item 010', 'GRS 2.3, item 050'],
+            'File Type (Description)': ['Travel', 'Administrative Inquiries'],
+        }),
+        'CUI ': pd.DataFrame({
+            'Records Schedule Item': ['CUI 1.0'],
+            'File Type (Description)': ['Controlled Unclassified Information'],
+        }),
+        'GRS': pd.DataFrame({
+            'Schedule': ['GRS 5.1', 'GRS 2.3'],
+            'Title': ['Administrative Records', 'Transitory Records'],
+        }),
+    }
+    sheet_order = list(frames_by_sheet)
+    metadata_template = {
+        'is_workbook': True,
+        'sheet_names': sheet_order,
+        'sheet_count': len(sheet_order),
+        'default_sheet': sheet_order[0],
+    }
+
+    def fake_read_dataframe(container, blob, sheet_name=None, sheet_index=None, require_explicit_sheet=False):
+        resolved_sheet, _ = plugin._resolve_sheet_selection(
+            container,
+            blob,
+            sheet_name=sheet_name,
+            sheet_index=sheet_index,
+            require_explicit_sheet=require_explicit_sheet,
+        )
+        return frames_by_sheet[resolved_sheet].copy()
+
+    plugin._resolve_blob_location_with_fallback = lambda *args, **kwargs: (container_name, blob_name)
+    plugin._get_workbook_metadata = lambda *args, **kwargs: metadata_template.copy()
+    plugin._read_tabular_blob_to_dataframe = fake_read_dataframe
+    return plugin, container_name, blob_name
+
+
+def test_workbook_schema_summary_handles_trailing_space_sheet_names():
+    """Check the workbook schema summary keeps the 'CUI ' tab name intact and reports its single row."""
+    print('Testing workbook schema summary with trailing-space sheet names...')
+
+    try:
+        plugin, container_name, blob_name = build_mock_whitespace_workbook_plugin()
+        schema_summary = plugin._build_workbook_schema_summary(
+            container_name,
+            blob_name,
+            'CCO-Legal File Plan 2025_Final Approved.xlsx',
+            preview_rows=2,
+        )
+
+        assert schema_summary['sheet_names'] == ['Legal', 'CUI ', 'GRS'], schema_summary
+        per_sheet = schema_summary['per_sheet_schemas']
+        assert 'CUI ' in per_sheet, schema_summary
+        assert per_sheet['CUI ']['row_count'] == 1, schema_summary
+        print('PASS workbook schema summary with trailing-space sheets')
+        return True
+    except Exception as failure:
+        print(f'FAIL test: {failure}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_sheet_selection_matches_trimmed_sheet_request():
+    """Check that requesting sheet 'CUI' (no trailing space) resolves to the 'CUI ' tab."""
+    print('Testing trimmed sheet selection against trailing-space tab names...')
+
+    try:
+        plugin = build_mock_whitespace_workbook_plugin()[0]
+        distinct_call = plugin.get_distinct_values(
+            user_id='test-user',
+            conversation_id='test-conversation',
+            filename='CCO-Legal File Plan 2025_Final Approved.xlsx',
+            sheet_name='CUI',
+            column='Records Schedule Item',
+            source='group',
+            max_values='10',
+        )
+        payload = asyncio.run(distinct_call)
+        assert '"selected_sheet": "CUI "' in payload, payload
+        assert '"values": [' in payload, payload
+        assert 'CUI 1.0' in payload, payload
+
+        print('PASS trimmed sheet selection against trailing-space tab names')
+        return True
+    except Exception as failure:
+        print(f'FAIL test: {failure}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_resolved_group_blob_override_survives_missing_group_id():
+    """Check a remembered group blob location is returned when resolution runs without group_id."""
+    print('Testing resolved group blob location override...')
+
+    try:
+        workbook_name = 'CCO-Legal File Plan 2025_Final Approved.xlsx'
+        expected_container = 'group-documents'
+        expected_blob = 'group-123/CCO-Legal File Plan 2025_Final Approved.xlsx'
+        plugin = TabularProcessingPlugin()
+        plugin.remember_resolved_blob_location('group', workbook_name, expected_container, expected_blob)
+
+        # No group_id is passed below; the remembered location is expected back instead.
+        resolved = plugin._resolve_blob_location_with_fallback(
+            'test-user',
+            'test-conversation',
+            workbook_name,
+            'group',
+        )
+        resolved_container, resolved_blob = resolved
+
+        assert resolved_container == expected_container, (resolved_container, resolved_blob)
+        assert resolved_blob == expected_blob, (resolved_container, resolved_blob)
+
+        print('PASS resolved group blob location override')
+        return True
+    except Exception as failure:
+        print(f'FAIL test: {failure}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_route_registers_resolved_blob_locations_for_tabular_analysis():
+    """Verify route_backend_chats.py calls tabular_plugin.remember_resolved_blob_location."""
+    print('Testing route registration of resolved blob locations...')
+
+    try:
+        with open(ROUTE_FILE, 'r', encoding='utf-8') as file_handle:
+            route_content = file_handle.read()
+        # Keep the failure message short: echoing the whole route file would bury the cause.
+        assert 'tabular_plugin.remember_resolved_blob_location(' in route_content, 'route_backend_chats.py does not call tabular_plugin.remember_resolved_blob_location'
+
+        print('PASS route registration of resolved blob locations')
+        return True
+    except Exception as exc:
+        print(f'FAIL test: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+if __name__ == '__main__':
+    # Run every check in order; each one returns True on success and False on failure.
+    suite = (
+        test_workbook_schema_summary_handles_trailing_space_sheet_names,
+        test_sheet_selection_matches_trimmed_sheet_request,
+        test_resolved_group_blob_override_survives_missing_group_id,
+        test_route_registers_resolved_blob_locations_for_tabular_analysis,
+    )
+    outcomes = []
+
+    for check in suite:
+        print(f'\nRunning {check.__name__}...')
+        outcomes.append(check())
+
+    print(f'\nResults: {sum(outcomes)}/{len(outcomes)} tests passed')
+    sys.exit(0 if all(outcomes) else 1)
\ No newline at end of file
diff --git a/functional_tests/test_tabular_llm_reviewer_recovery.py b/functional_tests/test_tabular_llm_reviewer_recovery.py
new file mode 100644
index 00000000..84854efa
--- /dev/null
+++ b/functional_tests/test_tabular_llm_reviewer_recovery.py
@@ -0,0 +1,435 @@
+#!/usr/bin/env python3
+# test_tabular_llm_reviewer_recovery.py
+"""
+Functional test for multi-sheet tabular LLM reviewer recovery.
+Version: 0.240.049
+Implemented in: 0.240.035; 0.240.036; 0.240.037; 0.240.038; 0.240.039; 0.240.040; 0.240.041; 0.240.042; 0.240.043; 0.240.048; 0.240.049
+
+This test ensures that stalled multi-sheet analytical runs can parse a reviewer
+JSON plan, normalize the selected function, and inject the correct source
+context before directly executing analytical plugin calls.
+"""
+
+import ast
+import os
+import sys
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+ROUTE_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'route_backend_chats.py')
+CONFIG_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'config.py')
+TARGET_FUNCTIONS = {
+    'build_tabular_follow_up_call_signature',
+    'determine_tabular_follow_up_limit',
+    'derive_tabular_follow_up_calls_from_invocations',
+    'extract_json_object_from_text',
+    'extract_tabular_high_signal_search_terms',
+    'extract_tabular_secondary_filter_terms',
+    'get_tabular_invocation_error_message',
+    'get_tabular_invocation_data_rows',
+    'get_tabular_invocation_result_payload',
+    'get_tabular_invocation_selected_sheet',
+    'infer_tabular_url_path_segments',
+    'infer_tabular_url_value_column_from_rows',
+    'infer_tabular_secondary_filter_from_rows',
+    'is_tabular_distinct_url_question',
+    'normalize_tabular_reviewer_function_name',
+    'normalize_tabular_row_text',
+    'parse_tabular_result_count',
+    'parse_tabular_column_candidates',
+    'parse_tabular_reviewer_plan',
+    'question_requests_tabular_exhaustive_results',
+    'question_requests_tabular_row_context',
+    'resolve_tabular_reviewer_call_arguments',
+    'tabular_value_looks_url_like',
+    'tabular_result_payload_contains_url_like_content',
+}
+
+
+class FakeInvocation:
+    """Plain attribute holder standing in for a plugin invocation in follow-up derivation tests."""
+
+    def __init__(self, function_name, parameters, result, error_message=None):
+        # Store the call description and its outcome verbatim; nothing is validated.
+        self.function_name, self.parameters = function_name, parameters
+        self.result = result
+        self.error_message = error_message
+
+
+def load_route_helpers():
+    """Compile the TARGET_FUNCTIONS definitions from route_backend_chats.py in isolation.
+
+    Returns ``(namespace, source)``; the namespace is pre-seeded with ``json`` and ``re`` only.
+    """
+    with open(ROUTE_FILE, 'r', encoding='utf-8') as route_handle:
+        route_source = route_handle.read()
+
+    route_tree = ast.parse(route_source, filename=ROUTE_FILE)
+    helper_defs = [
+        stmt for stmt in route_tree.body
+        if isinstance(stmt, ast.FunctionDef) and stmt.name in TARGET_FUNCTIONS
+    ]
+
+    helper_namespace = {'json': __import__('json'), 're': __import__('re')}
+    helper_module = ast.Module(body=helper_defs, type_ignores=[])
+    exec(compile(helper_module, ROUTE_FILE, 'exec'), helper_namespace)
+    return helper_namespace, route_source
+
+
+def read_config_version():
+    """Find the ``VERSION = `` line in config.py and return its value without double quotes."""
+    with open(CONFIG_FILE, 'r', encoding='utf-8') as config_handle:
+        for config_line in config_handle:
+            if config_line.startswith('VERSION = '):
+                return config_line.partition('=')[2].strip().strip('"')
+    raise AssertionError('VERSION assignment not found in config.py')
+
+
+def test_reviewer_json_extraction_handles_markdown_wrapping():
+    """Check the JSON plan is recovered from a reply that wraps it in prose and a json code fence."""
+    print('🔍 Testing reviewer JSON extraction...')
+
+    extract_json = load_route_helpers()[0]['extract_json_object_from_text']
+    wrapped_reply = (
+        'Plan follows:\n```json\n{"calls":[{"function":"TabularProcessingPlugin.get_distinct_values","arguments":{"column":"Location"}}]}\n```'
+    )
+    plan = extract_json(wrapped_reply)
+    assert plan['calls'][0]['function'] == 'TabularProcessingPlugin.get_distinct_values', plan
+
+    print('✅ Reviewer JSON extraction passed')
+    return True
+
+
+def test_reviewer_plan_normalizes_prefixed_function_names():
+    """Check a 'tabular_processing-' prefixed function is parsed to its bare name with arguments kept."""
+    print('🔍 Testing reviewer plan normalization...')
+
+    parse_plan = load_route_helpers()[0]['parse_tabular_reviewer_plan']
+    calls = parse_plan(
+        '{"calls":[{"function":"tabular_processing-get_distinct_values","arguments":{"filename":"CCO-Legal File Plan 2025_Final Approved.xlsx","column":"Location","filter_column":"Location","filter_operator":"contains","filter_value":"SharePoint"}}]}'
+    )
+    expected_call = {
+        'function_name': 'get_distinct_values',
+        'arguments': {
+            'filename': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+            'column': 'Location',
+            'filter_column': 'Location',
+            'filter_operator': 'contains',
+            'filter_value': 'SharePoint',
+        },
+    }
+    assert calls == [expected_call], calls
+
+    print('✅ Reviewer plan normalization passed')
+    return True
+
+
+def test_reviewer_call_argument_resolution_injects_group_context():
+    """Check a plan lacking filename/source gains filename, source, and group_id from the file context."""
+    print('🔍 Testing reviewer call argument resolution...')
+
+    resolve_arguments = load_route_helpers()[0]['resolve_tabular_reviewer_call_arguments']
+    group_id = '93aa364a-99ee-4cfd-8e4d-f37d175f00f5'
+    file_name = 'CCO-Legal File Plan 2025_Final Approved.xlsx'
+    planned_arguments = {
+        'column': 'Location',
+        'filter_column': 'Location',
+        'filter_operator': 'contains',
+        'filter_value': 'SharePoint',
+    }
+    file_contexts = [{
+        'file_name': file_name,
+        'source_hint': 'group',
+        'group_id': group_id,
+    }]
+    resolved_arguments, error_message = resolve_arguments(
+        planned_arguments,
+        file_contexts,
+        fallback_source_hint='group',
+    )
+
+    assert error_message is None, error_message
+    assert resolved_arguments['filename'] == file_name, resolved_arguments
+    assert resolved_arguments['source'] == 'group', resolved_arguments
+    assert resolved_arguments['group_id'] == group_id, resolved_arguments
+
+    print('✅ Reviewer call argument resolution passed')
+    return True
+
+
+def test_reviewer_follow_up_derivation_adds_row_context_and_url_extraction():
+    """Verify a URL-bearing distinct-values result yields search_rows then a URL-mode get_distinct_values."""
+    print('🔍 Testing reviewer follow-up derivation...')
+
+    helpers, _ = load_route_helpers()
+    derive_follow_ups = helpers['derive_tabular_follow_up_calls_from_invocations']
+
+    initial_invocation = FakeInvocation(
+        'get_distinct_values',
+        {
+            'filename': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+            'sheet_name': 'Legal',
+            'column': 'Location',
+            'filter_column': 'Location',
+            'filter_operator': 'contains',
+            'filter_value': 'CCO',
+            'normalize_match': 'false',
+            'source': 'group',
+            'group_id': '93aa364a-99ee-4cfd-8e4d-f37d175f00f5',
+        },
+        '{"filename": "CCO-Legal File Plan 2025_Final Approved.xlsx", "selected_sheet": "Legal", "column": "Location", "distinct_count": 25, "returned_values": 25, "values": ["AIL: SharePoint - https://contoso.sharepoint.com/sites/Alpha/SitePages/Home.aspx", "BA: SharePoint - https://contoso.sharepoint.com/sites/Beta/Forms/AllItems.aspx", "Network Drive"]}',
+    )
+
+    follow_up_calls = derive_follow_ups(
+        'How many discrete SharePoint sites appear in CCO locations?',
+        [initial_invocation],
+    )
+
+    assert [call['function_name'] for call in follow_up_calls] == ['search_rows', 'get_distinct_values'], follow_up_calls
+    # First follow-up: a search_rows call that keeps the original sheet and filter.
+    row_context_arguments = follow_up_calls[0]['arguments']
+    assert row_context_arguments['filename'] == 'CCO-Legal File Plan 2025_Final Approved.xlsx', row_context_arguments
+    assert row_context_arguments['sheet_name'] == 'Legal', row_context_arguments
+    assert row_context_arguments['search_value'] == 'SharePoint', row_context_arguments
+    assert row_context_arguments['search_columns'] == 'Location', row_context_arguments
+    assert row_context_arguments['filter_column'] == 'Location', row_context_arguments
+    assert row_context_arguments['filter_value'] == 'CCO', row_context_arguments
+    assert row_context_arguments['max_rows'] == '25', row_context_arguments
+    # Second follow-up: the same column queried again with extract_mode set to 'url'.
+    extraction_arguments = follow_up_calls[1]['arguments']
+    assert extraction_arguments['filename'] == 'CCO-Legal File Plan 2025_Final Approved.xlsx', extraction_arguments
+    assert extraction_arguments['sheet_name'] == 'Legal', extraction_arguments
+    assert extraction_arguments['column'] == 'Location', extraction_arguments
+    assert extraction_arguments['filter_column'] == 'Location', extraction_arguments
+    assert extraction_arguments['filter_value'] == 'CCO', extraction_arguments
+    assert extraction_arguments['extract_mode'] == 'url', extraction_arguments
+    assert extraction_arguments['url_path_segments'] == '2', extraction_arguments
+
+    print('✅ Reviewer follow-up derivation passed')
+    return True
+
+
+def test_reviewer_follow_up_derivation_broadens_zero_match_same_column_filter():
+    """Verify a zero-result distinct-values call filtered on its own column yields one unfiltered search_rows call."""
+    print('🔍 Testing reviewer broad discovery follow-up derivation...')
+
+    helpers, _ = load_route_helpers()
+    derive_follow_ups = helpers['derive_tabular_follow_up_calls_from_invocations']
+
+    initial_invocation = FakeInvocation(
+        'get_distinct_values',
+        {
+            'filename': 'CCO-Licensing File Plan 2025_Final Approved.xlsx',
+            'sheet_name': 'Licensing',
+            'column': 'Location',
+            'filter_column': 'Location',
+            'filter_operator': 'contains',
+            'filter_value': 'CCO',
+            'normalize_match': 'false',
+            'source': 'group',
+            'group_id': '93aa364a-99ee-4cfd-8e4d-f37d175f00f5',
+        },
+        '{"filename": "CCO-Licensing File Plan 2025_Final Approved.xlsx", "selected_sheet": "Licensing", "column": "Location", "distinct_count": 0, "returned_values": 0, "values": []}',
+    )
+
+    follow_up_calls = derive_follow_ups(
+        'How many discrete SharePoint sites appear in CCO locations? please list them out',
+        [initial_invocation],
+    )
+    # Exactly one follow-up is expected, and it must carry no filter or column projection.
+    assert len(follow_up_calls) == 1, follow_up_calls
+    assert follow_up_calls[0]['function_name'] == 'search_rows', follow_up_calls
+    search_arguments = follow_up_calls[0]['arguments']
+    assert search_arguments['filename'] == 'CCO-Licensing File Plan 2025_Final Approved.xlsx', search_arguments
+    assert search_arguments['sheet_name'] == 'Licensing', search_arguments
+    assert search_arguments['search_value'] == 'SharePoint', search_arguments
+    assert search_arguments['search_columns'] == 'Location', search_arguments
+    assert search_arguments['max_rows'] == '50', search_arguments
+    assert 'filter_column' not in search_arguments, search_arguments
+    assert 'return_columns' not in search_arguments, search_arguments
+
+    print('✅ Reviewer broad discovery follow-up derivation passed')
+    return True
+
+
+def test_reviewer_follow_up_derivation_infers_cohort_column_from_row_context():
+    """Verify a search_rows result with row data yields one URL-mode get_distinct_values filtered on 'Business Unit'."""
+    print('🔍 Testing reviewer row-context cohort inference...')
+
+    helpers, _ = load_route_helpers()
+    derive_follow_ups = helpers['derive_tabular_follow_up_calls_from_invocations']
+
+    row_context_invocation = FakeInvocation(
+        'search_rows',
+        {
+            'filename': 'CCO-Licensing File Plan 2025_Final Approved.xlsx',
+            'sheet_name': 'Licensing',
+            'search_value': 'SharePoint',
+            'search_columns': 'Location',
+            'normalize_match': 'false',
+            'source': 'group',
+            'group_id': '93aa364a-99ee-4cfd-8e4d-f37d175f00f5',
+            'max_rows': '50',
+        },
+        '{"filename": "CCO-Licensing File Plan 2025_Final Approved.xlsx", "selected_sheet": "Licensing", "search_value": "SharePoint", "searched_columns": ["Location"], "total_matches": 3, "returned_rows": 3, "data": [{"Business Unit": "CCO Licensing", "Location": "Licensing SharePoint - https://contoso.sharepoint.com/sites/Alpha/SitePages/Home.aspx", "Site": "Alpha"}, {"Business Unit": "CCO Licensing", "Location": "Licensing SharePoint - https://contoso.sharepoint.com/sites/Beta/Forms/AllItems.aspx", "Site": "Beta"}, {"Business Unit": "Finance", "Location": "Finance docs - https://contoso.sharepoint.com/sites/Gamma/SitePages/Home.aspx", "Site": "Gamma"}]}',
+    )
+
+    follow_up_calls = derive_follow_ups(
+        'How many discrete SharePoint sites appear in CCO locations? please list them out',
+        [row_context_invocation],
+    )
+    # 'CCO' occurs only in the 'Business Unit' values of the fixture rows above.
+    assert len(follow_up_calls) == 1, follow_up_calls
+    assert follow_up_calls[0]['function_name'] == 'get_distinct_values', follow_up_calls
+    extraction_arguments = follow_up_calls[0]['arguments']
+    assert extraction_arguments['filename'] == 'CCO-Licensing File Plan 2025_Final Approved.xlsx', extraction_arguments
+    assert extraction_arguments['sheet_name'] == 'Licensing', extraction_arguments
+    assert extraction_arguments['column'] == 'Location', extraction_arguments
+    assert extraction_arguments['filter_column'] == 'Business Unit', extraction_arguments
+    assert extraction_arguments['filter_operator'] == 'contains', extraction_arguments
+    assert extraction_arguments['filter_value'] == 'CCO', extraction_arguments
+    assert extraction_arguments['extract_mode'] == 'url', extraction_arguments
+    assert extraction_arguments['url_path_segments'] == '2', extraction_arguments
+
+    print('✅ Reviewer row-context cohort inference passed')
+    return True
+
+
+def test_reviewer_follow_up_derivation_expands_limited_search_rows_and_extraction_values():
+    """Check that a truncated search_rows slice is rerun with max_rows raised and followed by a URL extraction call."""
+    print('🔍 Testing reviewer exhaustive row/value expansion...')
+
+    route_helpers, _ = load_route_helpers()
+    derive_calls = route_helpers['derive_tabular_follow_up_calls_from_invocations']
+
+    truncated_search = FakeInvocation(
+        'search_rows',
+        {
+            'filename': 'CCO-Licensing File Plan 2025_Final Approved.xlsx',
+            'sheet_name': 'Licensing',
+            'search_value': 'SharePoint',
+            'search_columns': 'Location',
+            'normalize_match': 'false',
+            'source': 'group',
+            'group_id': '93aa364a-99ee-4cfd-8e4d-f37d175f00f5',
+            'max_rows': '25',
+        },
+        '{"filename": "CCO-Licensing File Plan 2025_Final Approved.xlsx", "selected_sheet": "Licensing", "search_value": "SharePoint", "searched_columns": ["Location"], "total_matches": 40, "returned_rows": 25, "data": [{"Business Unit": "CCO Licensing", "Location": "Licensing SharePoint - https://contoso.sharepoint.com/sites/Alpha/SitePages/Home.aspx", "Site": "Alpha"}, {"Business Unit": "CCO Licensing", "Location": "Licensing SharePoint - https://contoso.sharepoint.com/sites/Beta/Forms/AllItems.aspx", "Site": "Beta"}]}'
+    )
+
+    derived_calls = derive_calls(
+        'How many discrete SharePoint sites appear in CCO locations? please list them all out',
+        [truncated_search],
+    )
+
+    assert [derived['function_name'] for derived in derived_calls] == ['search_rows', 'get_distinct_values'], derived_calls
+
+    rerun_arguments = derived_calls[0]['arguments']
+    assert rerun_arguments['max_rows'] == '40', rerun_arguments
+    assert rerun_arguments['search_value'] == 'SharePoint', rerun_arguments
+
+    distinct_arguments = derived_calls[1]['arguments']
+    assert distinct_arguments['filter_column'] == 'Business Unit', distinct_arguments
+    assert distinct_arguments['filter_value'] == 'CCO', distinct_arguments
+    assert distinct_arguments['max_values'] == '40', distinct_arguments
+    assert distinct_arguments['extract_mode'] == 'url', distinct_arguments
+
+    print('✅ Reviewer exhaustive row/value expansion passed')
+    return True
+
+
+def test_reviewer_follow_up_derivation_expands_limited_distinct_value_lists():
+    """Check that a values_limited get_distinct_values result is rerun with max_values raised to the distinct count."""
+    print('🔍 Testing reviewer exhaustive distinct-value expansion...')
+
+    route_helpers, _ = load_route_helpers()
+    derive_calls = route_helpers['derive_tabular_follow_up_calls_from_invocations']
+
+    truncated_distinct = FakeInvocation(
+        'get_distinct_values',
+        {
+            'filename': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+            'sheet_name': 'Legal',
+            'column': 'Location',
+            'filter_column': 'Location',
+            'filter_operator': 'contains',
+            'filter_value': 'SharePoint',
+            'normalize_match': 'false',
+            'max_values': '25',
+            'source': 'group',
+            'group_id': '93aa364a-99ee-4cfd-8e4d-f37d175f00f5',
+        },
+        '{"filename": "CCO-Legal File Plan 2025_Final Approved.xlsx", "selected_sheet": "Legal", "column": "Location", "distinct_count": 40, "returned_values": 25, "values_limited": true, "values": ["https://contoso.sharepoint.com/sites/Site01", "https://contoso.sharepoint.com/sites/Site02"]}'
+    )
+
+    derived_calls = derive_calls(
+        'List all SharePoint sites in the Legal worksheet',
+        [truncated_distinct],
+    )
+
+    assert len(derived_calls) == 1, derived_calls
+    assert derived_calls[0]['function_name'] == 'get_distinct_values', derived_calls
+    rerun_arguments = derived_calls[0]['arguments']
+    assert rerun_arguments['max_values'] == '40', rerun_arguments
+    assert rerun_arguments['sheet_name'] == 'Legal', rerun_arguments
+    assert rerun_arguments['column'] == 'Location', rerun_arguments
+
+    print('✅ Reviewer exhaustive distinct-value expansion passed')
+    return True
+
+
+def test_route_contains_llm_reviewer_recovery_and_version_bump():
+    """Verify the route wires in reviewer recovery and config VERSION is at least 0.240.049 (later bumps must not fail)."""
+    print('🔍 Testing reviewer recovery route wiring...')
+
+    _, source = load_route_helpers()
+
+    required_snippets = [
+        'You are a tabular recovery planner.',
+        'Return JSON only with this schema:',
+        'maybe_recover_tabular_analysis_with_llm_reviewer(',
+        'Reviewer recovery produced computed analytical tool results',
+        'For deterministic how-many, discrete, unique, or canonical-list questions, prefer count_rows or get_distinct_values',
+        'When the user is asking where a topic, phrase, code, path, identifier, or other value appears and the relevant column is unclear, prefer search_rows.',
+        'When the user wants values from a subset or pattern within one column, prefer get_distinct_values with filter_column/filter_operator/filter_value',
+        'When the answer depends on two literal column conditions, prefer count_rows, get_distinct_values, or filter_rows with filter_column/filter_operator/filter_value plus additional_filter_column/additional_filter_operator/additional_filter_value',
+        "When the user is asking for URLs, sites, links, or regex-like identifiers embedded inside a text cell, prefer get_distinct_values with extract_mode='url' or extract_mode='regex'",
+        'If whether an embedded URL or identifier counts depends on surrounding text in the original cell rather than the extracted value itself, search/filter the original text column first.',
+        'If a prior tool result is limited and the user explicitly asked for the full list, rerun with a higher max_rows or max_values instead of stopping at the preview slice.',
+        'Do not classify extracted URLs solely by whether the URL text itself contains the keyword when the original cell text already defines the category.',
+        'For URLs, links, paths, and literal identifiers, set normalize_match=false unless normalization is clearly necessary.',
+        'If a prior result reports total_matches > returned_rows or distinct_count > returned_values for a full-list question, rerun with a higher max_rows or max_values before answering.',
+        'derive_tabular_follow_up_calls_from_invocations(',
+        'infer_tabular_secondary_filter_from_rows(',
+        'Reviewer recovery executed automatic analytical follow-up calls',
+        'follow_up_round',
+    ]
+    missing = [snippet for snippet in required_snippets if snippet not in source]
+    assert not missing, f'Missing reviewer recovery snippets: {missing}'
+    assert tuple(map(int, read_config_version().split('.'))) >= (0, 240, 49), read_config_version()
+
+    print('✅ Reviewer recovery route wiring passed')
+    return True
+
+
+if __name__ == '__main__':
+    test_cases = (
+        test_reviewer_json_extraction_handles_markdown_wrapping,
+        test_reviewer_plan_normalizes_prefixed_function_names,
+        test_reviewer_call_argument_resolution_injects_group_context,
+        test_reviewer_follow_up_derivation_adds_row_context_and_url_extraction,
+        test_reviewer_follow_up_derivation_broadens_zero_match_same_column_filter,
+        test_reviewer_follow_up_derivation_infers_cohort_column_from_row_context,
+        test_reviewer_follow_up_derivation_expands_limited_search_rows_and_extraction_values,
+        test_reviewer_follow_up_derivation_expands_limited_distinct_value_lists,
+        test_route_contains_llm_reviewer_recovery_and_version_bump,
+    )
+
+    outcomes = []
+    for test_case in test_cases:
+        print(f'\n🧪 Running {test_case.__name__}...')
+        outcomes.append(test_case())
+
+    all_passed = all(outcomes)
+    print(f'\n📊 Results: {sum(outcomes)}/{len(outcomes)} tests passed')
+    sys.exit(0 if all_passed else 1)
\ No newline at end of file
diff --git a/functional_tests/test_tabular_multi_file_distinct_url_union.py b/functional_tests/test_tabular_multi_file_distinct_url_union.py
new file mode 100644
index 00000000..6c3fa0ec
--- /dev/null
+++ b/functional_tests/test_tabular_multi_file_distinct_url_union.py
@@ -0,0 +1,219 @@
+#!/usr/bin/env python3
+# test_tabular_multi_file_distinct_url_union.py
+"""
+Functional test for deterministic multi-file tabular distinct URL unions.
+Version: 0.240.052
+Implemented in: 0.240.052
+
+This test ensures multi-file SharePoint/site questions can bypass the LLM
+planner, pick a URL/location-style column per workbook, and union exact
+distinct values across multiple tabular files before the final model response.
+"""
+
+import ast
+import json
+import os
+import re
+import sys
+from typing import Mapping
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+ROUTE_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'route_backend_chats.py')
+CONFIG_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'config.py')
+TARGET_FUNCTIONS = {
+    'build_multi_file_tabular_distinct_value_analysis',
+    'dedupe_tabular_file_contexts',
+    'get_multi_file_tabular_analysis_mode',
+    'is_tabular_distinct_url_question',
+    'normalize_multi_file_tabular_distinct_value',
+    'parse_tabular_result_count',
+    'score_tabular_distinct_url_column',
+    'select_tabular_distinct_url_column',
+    'select_tabular_distinct_url_sheet_and_column',
+}
+
+
+def load_helpers():
+    """Compile only the TARGET_FUNCTIONS definitions from the route file and return (namespace, full source)."""
+    with open(ROUTE_FILE, 'r', encoding='utf-8') as route_handle:
+        route_source = route_handle.read()
+
+    wanted_defs = [
+        node
+        for node in ast.parse(route_source, filename=ROUTE_FILE).body
+        if isinstance(node, ast.FunctionDef) and node.name in TARGET_FUNCTIONS
+    ]
+
+    helper_module = ast.Module(body=wanted_defs, type_ignores=[])
+    exec_globals = {'json': json, 'Mapping': Mapping, 're': re}
+    # Only the selected top-level function definitions are executed, so the
+    # rest of the application module is never imported or run.
+    code_object = compile(helper_module, ROUTE_FILE, 'exec')
+    exec(code_object, exec_globals)
+
+    return exec_globals, route_source
+
+
+def read_config_version():
+    """Return the string assigned to VERSION in config.py, without its double quotes."""
+    with open(CONFIG_FILE, 'r', encoding='utf-8') as config_handle:
+        for config_line in config_handle:
+            if config_line.startswith('VERSION = '):
+                return config_line.partition('=')[2].strip().strip('"')
+    raise AssertionError('VERSION assignment not found in config.py')
+
+
+def test_multi_file_mode_only_applies_to_multi_file_analysis_questions():
+    """Check that the distinct-URL union mode is reported only for analysis runs spanning two files."""
+    print('🔍 Testing multi-file mode detection...')
+
+    detect_mode = load_helpers()[0]['get_multi_file_tabular_analysis_mode']
+    question = 'How many discrete SharePoint sites appear in CCO locations?'
+
+    mode_for_one_file = detect_mode(
+        question,
+        execution_mode='analysis',
+        analysis_file_contexts=[{'file_name': 'one.xlsx', 'source_hint': 'group'}],
+    )
+    mode_for_schema_summary = detect_mode(
+        question,
+        execution_mode='schema_summary',
+        analysis_file_contexts=[
+            {'file_name': 'one.xlsx', 'source_hint': 'group'},
+            {'file_name': 'two.xlsx', 'source_hint': 'group'},
+        ],
+    )
+    mode_for_two_files = detect_mode(
+        question,
+        execution_mode='analysis',
+        analysis_file_contexts=[
+            {'file_name': 'one.xlsx', 'source_hint': 'group'},
+            {'file_name': 'two.xlsx', 'source_hint': 'group'},
+        ],
+    )
+
+    assert mode_for_one_file is None, mode_for_one_file
+    assert mode_for_schema_summary is None, mode_for_schema_summary
+    assert mode_for_two_files == 'distinct_url_union', mode_for_two_files
+
+    print('✅ Multi-file mode detection passed')
+    return True
+
+
+def test_sheet_and_column_selection_prefers_location_like_columns():
+    """Check that the Licensing sheet and its Location column are chosen over a sheet without such a column."""
+    print('🔍 Testing deterministic sheet/column selection...')
+
+    module_helpers, _ = load_helpers()
+    pick_sheet_and_column = module_helpers['select_tabular_distinct_url_sheet_and_column']
+
+    workbook_schema = {
+        'is_workbook': True,
+        'sheet_names': ['Overview', 'Licensing'],
+        'per_sheet_schemas': {
+            'Overview': {
+                'row_count': 42,
+                'columns': ['Category', 'Owner', 'Status'],
+            },
+            'Licensing': {
+                'row_count': 13,
+                'columns': ['Business Unit', 'Location', 'Disposition'],
+            },
+        },
+    }
+
+    picked_sheet, picked_column = pick_sheet_and_column(workbook_schema)
+
+    assert picked_sheet == 'Licensing', (picked_sheet, picked_column)
+    assert picked_column == 'Location', (picked_sheet, picked_column)
+
+    print('✅ Deterministic sheet/column selection passed')
+    return True
+
+
+def test_multi_file_distinct_value_analysis_unions_and_dedupes_values():
+    """Check that two per-file results sharing one URL merge into a sorted three-value union."""
+    print('🔍 Testing multi-file distinct value union...')
+
+    build_union = load_helpers()[0]['build_multi_file_tabular_distinct_value_analysis']
+
+    per_file_results = [
+        {
+            'filename': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+            'selected_sheet': 'Legal',
+            'column': 'Location',
+            'distinct_count': 2,
+            'returned_values': 2,
+            'values': [
+                'http://share/sites/CCO/default.aspx',
+                'https://occtreasgovprod.sharepoint.com/sites/LIC',
+            ],
+        },
+        {
+            'filename': 'CCO-Licensing File Plan 2025_Final Approved.xlsx',
+            'selected_sheet': 'Licensing',
+            'column': 'Location',
+            'distinct_count': 2,
+            'returned_values': 2,
+            'values': [
+                'https://occtreasgovprod.sharepoint.com/sites/LIC',
+                'http://share/sites/CC/LICA/default.aspx',
+            ],
+        },
+    ]
+    union = json.loads(build_union(per_file_results))
+
+    assert union['analysis_type'] == 'multi_file_distinct_url_union', union
+    assert union['files_requested'] == 2, union
+    assert union['files_analyzed'] == 2, union
+    assert union['distinct_count'] == 3, union
+    assert union['returned_values'] == 3, union
+    assert union['values'] == [
+        'http://share/sites/CC/LICA/default.aspx',
+        'http://share/sites/CCO/default.aspx',
+        'https://occtreasgovprod.sharepoint.com/sites/LIC',
+    ], union
+
+    print('✅ Multi-file distinct value union passed')
+    return True
+
+
+def test_route_uses_multi_file_tabular_wrapper_and_version_bump():
+    """Verify the route calls the multi-file wrapper and config VERSION is at least 0.240.052 (later bumps must not fail)."""
+    print('🔍 Testing multi-file wrapper route wiring...')
+
+    _, source = load_helpers()
+
+    required_snippets = [
+        'MULTI_FILE_TABULAR_DISTINCT_URL_EXTRACT_PATTERN',
+        'def get_multi_file_tabular_analysis_mode(',
+        'def run_multi_file_tabular_distinct_url_analysis(',
+        'def run_tabular_analysis_with_multi_file_support(',
+        'workspace_tabular_file_contexts = collect_workspace_tabular_file_contexts(',
+    ]
+    missing = [snippet for snippet in required_snippets if snippet not in source]
+    assert not missing, f'Missing multi-file tabular snippets: {missing}'
+    assert source.count('asyncio.run(run_tabular_analysis_with_multi_file_support(') == 4, 'expected exactly 4 multi-file wrapper call sites'
+    assert tuple(map(int, read_config_version().split('.'))) >= (0, 240, 52), read_config_version()
+
+    print('✅ Multi-file wrapper route wiring passed')
+    return True
+
+
+if __name__ == '__main__':
+    test_cases = (
+        test_multi_file_mode_only_applies_to_multi_file_analysis_questions,
+        test_sheet_and_column_selection_prefers_location_like_columns,
+        test_multi_file_distinct_value_analysis_unions_and_dedupes_values,
+        test_route_uses_multi_file_tabular_wrapper_and_version_bump,
+    )
+
+    outcomes = []
+    for test_case in test_cases:
+        print(f'\n🧪 Running {test_case.__name__}...')
+        outcomes.append(test_case())
+
+    all_passed = all(outcomes)
+    print(f'\n📊 Results: {sum(outcomes)}/{len(outcomes)} tests passed')
+    sys.exit(0 if all_passed else 1)
\ No newline at end of file
diff --git a/functional_tests/test_tabular_multisheet_tool_start_guidance.py b/functional_tests/test_tabular_multisheet_tool_start_guidance.py
new file mode 100644
index 00000000..73036770
--- /dev/null
+++ b/functional_tests/test_tabular_multisheet_tool_start_guidance.py
@@ -0,0 +1,144 @@
+#!/usr/bin/env python3
+# test_tabular_multisheet_tool_start_guidance.py
+"""
+Functional test for multi-sheet tabular discovery iteration.
+Version: 0.240.049
+Implemented in: 0.240.035; 0.240.036; 0.240.039; 0.240.040; 0.240.041; 0.240.042; 0.240.043; 0.240.048; 0.240.049
+
+This test ensures multi-sheet workbook analysis can start with generic workbook
+discovery, carry discovery summaries into retries, and still require
+analytical tool calls before the analysis is considered complete.
+"""
+
+import ast
+import os
+import sys
+from types import SimpleNamespace
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+ROUTE_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'route_backend_chats.py')
+CONFIG_FILE = os.path.join(ROOT_DIR, 'application', 'single_app', 'config.py')
+TARGET_FUNCTIONS = {
+    'is_tabular_schema_summary_question',
+    'is_tabular_entity_lookup_question',
+    'get_tabular_execution_mode',
+    'get_tabular_invocation_result_payload',
+    'get_tabular_invocation_error_message',
+    'summarize_tabular_discovery_invocations',
+}
+
+
+def load_route_helpers():
+    """Compile only the TARGET_FUNCTIONS definitions from the chat route file and return (namespace, full source)."""
+    with open(ROUTE_FILE, 'r', encoding='utf-8') as route_handle:
+        route_source = route_handle.read()
+
+    wanted_defs = [
+        node
+        for node in ast.parse(route_source, filename=ROUTE_FILE).body
+        if isinstance(node, ast.FunctionDef) and node.name in TARGET_FUNCTIONS
+    ]
+
+    helper_module = ast.Module(body=wanted_defs, type_ignores=[])
+    exec_globals = {'json': __import__('json'), 're': __import__('re')}
+    # Only the selected top-level function definitions are executed here.
+    code_object = compile(helper_module, ROUTE_FILE, 'exec')
+    exec(code_object, exec_globals)
+
+    return exec_globals, route_source
+
+
+def read_config_version():
+    """Return the string assigned to VERSION in config.py, without its double quotes."""
+    with open(CONFIG_FILE, 'r', encoding='utf-8') as config_handle:
+        for config_line in config_handle:
+            if config_line.startswith('VERSION = '):
+                return config_line.partition('=')[2].strip().strip('"')
+    raise AssertionError('VERSION assignment not found in config.py')
+
+
+def test_identifier_led_return_question_routes_to_entity_lookup_mode():
+    """Check that a question led by a return identifier is classified and routed as an entity lookup."""
+    print('🔍 Testing generic identifier-led entity lookup routing...')
+
+    route_helpers = load_route_helpers()[0]
+    prompt = 'For return RET000123, explain why the refund amount changed after withholding and estimated payments were applied.'
+
+    assert route_helpers['is_tabular_entity_lookup_question'](prompt), prompt
+    assert route_helpers['get_tabular_execution_mode'](prompt) == 'entity_lookup', prompt
+
+    print('✅ Generic identifier-led entity lookup routing passed')
+    return True
+
+
+def test_discovery_summaries_are_compact_and_generic():
+    """Check that a describe_tabular_file result is condensed into one workbook-level summary string."""
+    print('🔍 Testing compact discovery summaries...')
+
+    route_helpers, _ = load_route_helpers()
+    build_summaries = route_helpers['summarize_tabular_discovery_invocations']
+
+    discovery_call = SimpleNamespace(
+        function_name='describe_tabular_file',
+        error_message=None,
+        result='''{
+  "filename": "irs_treasury_multi_tab_workbook.xlsx",
+  "is_workbook": true,
+  "sheet_count": 11,
+  "sheet_names": ["Taxpayers", "TaxReturns", "W2Forms", "Form1099Income"],
+  "relationship_hints": [{"from_sheet": "Taxpayers", "to_sheet": "TaxReturns"}]
+}''',
+    )
+
+    compact_summaries = build_summaries([discovery_call])
+
+    assert compact_summaries == [
+        'irs_treasury_multi_tab_workbook.xlsx; sheet_count=11; sheets=Taxpayers, TaxReturns, W2Forms, Form1099Income; relationship_hints=1'
+    ], compact_summaries
+
+    print('✅ Compact discovery summaries passed')
+    return True
+
+
+def test_route_uses_generic_multisheet_discovery_iteration_and_version_bump():
+    """Verify the route has the multi-sheet discovery guidance and config VERSION is at least 0.240.049 (later bumps must not fail)."""
+    print('🔍 Testing generic multi-sheet discovery iteration guidance...')
+
+    _, source = load_route_helpers()
+
+    required_snippets = [
+        'Workbook discovery is available through describe_tabular_file.',
+        'Discovery-only results do NOT complete the analysis.',
+        'call describe_tabular_file without sheet_name as an exploration step',
+        'previous_discovery_feedback_messages = []',
+        'Previous attempt explored workbook structure but did not execute analytical functions. Continue with analytical tool calls now.',
+        'analysis_requires_immediate_tool_choice = has_multi_sheet_workbook and not schema_summary_mode',
+        'You are a tabular recovery planner.',
+        'Choose the next 1-3 analytical tabular calls that should be executed directly.',
+        'If a prior result reports total_matches > returned_rows or distinct_count > returned_values for a full-list question, rerun with a higher max_rows or max_values before answering.',
+        'maybe_recover_tabular_analysis_with_llm_reviewer(',
+    ]
+    missing = [snippet for snippet in required_snippets if snippet not in source]
+    assert not missing, f'Missing route discovery-iteration snippets: {missing}'
+    assert tuple(map(int, read_config_version().split('.'))) >= (0, 240, 49), read_config_version()
+
+    print('✅ Generic multi-sheet discovery iteration guidance passed')
+    return True
+
+
+if __name__ == '__main__':
+    test_cases = (
+        test_identifier_led_return_question_routes_to_entity_lookup_mode,
+        test_discovery_summaries_are_compact_and_generic,
+        test_route_uses_generic_multisheet_discovery_iteration_and_version_bump,
+    )
+
+    outcomes = []
+    for test_case in test_cases:
+        print(f'\n🧪 Running {test_case.__name__}...')
+        outcomes.append(test_case())
+
+    all_passed = all(outcomes)
+    print(f'\n📊 Results: {sum(outcomes)}/{len(outcomes)} tests passed')
+    sys.exit(0 if all_passed else 1)
\ No newline at end of file
diff --git a/functional_tests/test_tabular_multisheet_workbook_support.py b/functional_tests/test_tabular_multisheet_workbook_support.py
index 75b389e6..43530a02 100644
--- a/functional_tests/test_tabular_multisheet_workbook_support.py
+++ b/functional_tests/test_tabular_multisheet_workbook_support.py
@@ -224,8 +224,9 @@ def test_route_uses_analytical_filters_and_lookup_guidance():
         _, route_content = load_tabular_route_helpers()
 
         checks = {
-            'lookup_value is advertised first': 'AVAILABLE FUNCTIONS: lookup_value' in route_content,
-            'discovery tools are disabled for analysis': 'Discovery functions are not available in this analysis run because schema context is already pre-loaded.' in route_content,
+            'lookup_value remains advertised for analysis': 'lookup_value' in route_content,
+            'discovery iteration is allowed for multi-sheet analysis': 'Workbook discovery is available through describe_tabular_file.' in route_content,
+            'discovery-only analysis is rejected': 'Discovery-only results do NOT complete the analysis.' in route_content,
             'prompt includes likely worksheet hints': 'LIKELY WORKSHEET HINTS:' in route_content,
             'analysis function filters are configured': 'included_functions' in route_content,
             'retry attempts require analytical function use': 'FunctionChoiceBehavior.Required(' in route_content,
diff --git a/functional_tests/test_tabular_preview_json_sanitization_fix.py b/functional_tests/test_tabular_preview_json_sanitization_fix.py
new file mode 100644
index 00000000..e61e7b3f
--- /dev/null
+++ b/functional_tests/test_tabular_preview_json_sanitization_fix.py
@@ -0,0 +1,166 @@
+#!/usr/bin/env python3
+# test_tabular_preview_json_sanitization_fix.py
+"""
+Functional test for tabular preview JSON sanitization.
+Version: 0.240.030
+Implemented in: 0.240.030
+
+This test ensures the enhanced citation tabular preview converts pandas null-like
+values into JSON-safe strings so browser preview loading does not fail on NaN.
+"""
+
+import ast
+import math
+import os
+import sys
+
+import pandas as pd
+
+
+ROOT_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+ROUTE_FILE = os.path.join(
+    ROOT_DIR,
+    'application',
+    'single_app',
+    'route_enhanced_citations.py',
+)
+CONFIG_FILE = os.path.join(
+    ROOT_DIR,
+    'application',
+    'single_app',
+    'config.py',
+)
+TARGET_FUNCTIONS = {
+    '_sanitize_tabular_preview_value',
+    '_serialize_tabular_preview_table',
+}
+
+
+def load_preview_helpers():
+    """Compile only the TARGET_FUNCTIONS definitions from the citations route file and return (namespace, full source)."""
+    with open(ROUTE_FILE, 'r', encoding='utf-8') as route_handle:
+        route_source = route_handle.read()
+
+    wanted_defs = [
+        node
+        for node in ast.parse(route_source, filename=ROUTE_FILE).body
+        if isinstance(node, ast.FunctionDef) and node.name in TARGET_FUNCTIONS
+    ]
+
+    helper_module = ast.Module(body=wanted_defs, type_ignores=[])
+    exec_globals = {'pandas': pd}
+    # The extracted helpers see pandas only under the name `pandas`.
+    exec(compile(helper_module, ROUTE_FILE, 'exec'), exec_globals)
+
+    return exec_globals, route_source
+
+
+def read_config_version():
+    """Return the string assigned to VERSION in config.py, without its double quotes."""
+    with open(CONFIG_FILE, 'r', encoding='utf-8') as config_handle:
+        for config_line in config_handle:
+            if config_line.startswith('VERSION = '):
+                return config_line.partition('=')[2].strip().strip('"')
+    raise AssertionError('VERSION assignment not found in config.py')
+
+
+def test_preview_value_sanitizer_returns_json_safe_strings():
+    """Check that NaN/NA/NaT become empty strings and that timestamps and ints become display strings."""
+    print('🔍 Testing tabular preview value sanitizer...')
+
+    try:
+        preview_helpers, _ = load_preview_helpers()
+        to_safe_text = preview_helpers['_sanitize_tabular_preview_value']
+
+        assert to_safe_text(float('nan')) == ''
+        assert to_safe_text(pd.NA) == ''
+        assert to_safe_text(pd.NaT) == ''
+        assert to_safe_text(pd.Timestamp('2025-01-02 03:04:05')) == '2025-01-02T03:04:05'
+        assert to_safe_text(42) == '42'
+
+        print('✅ Tabular preview value sanitizer passed')
+        return True
+
+    except Exception as failure:
+        print(f'❌ Test failed: {failure}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_preview_table_serializer_replaces_blank_headers_and_nan_cells():
+    """Check that a NaN header and NaN cell serialize to empty strings and other cells to strings."""
+    print('🔍 Testing tabular preview table serializer...')
+
+    try:
+        preview_helpers, _ = load_preview_helpers()
+        to_table = preview_helpers['_serialize_tabular_preview_table']
+
+        sample_frame = pd.DataFrame(
+            [
+                ['Status', float('nan')],
+                [pd.Timestamp('2024-02-03 04:05:06'), 5],
+            ],
+            columns=['Column A', math.nan],
+        )
+
+        header_cells, body_rows = to_table(sample_frame)
+
+        assert header_cells == ['Column A', ''], header_cells
+        assert body_rows == [
+            ['Status', ''],
+            ['2024-02-03T04:05:06', '5.0'],
+        ], body_rows
+
+        print('✅ Tabular preview table serializer passed')
+        return True
+
+    except Exception as failure:
+        print(f'❌ Test failed: {failure}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_route_uses_serialized_preview_output_and_version_bump():
+    """Verify the preview endpoint uses the sanitizer helpers and config VERSION is at least 0.240.030 (later bumps must not fail)."""
+    print('🔍 Testing route integration and version bump...')
+
+    try:
+        _, source = load_preview_helpers()
+
+        required_snippets = [
+            'columns, rows = _serialize_tabular_preview_table(preview)',
+            '"columns": columns,',
+            '"rows": rows,',
+        ]
+        missing = [snippet for snippet in required_snippets if snippet not in source]
+        assert not missing, f'Missing route integration snippets: {missing}'
+
+        assert tuple(map(int, read_config_version().split('.'))) >= (0, 240, 30), read_config_version()
+
+        print('✅ Route integration and version bump passed')
+        return True
+
+    except Exception as exc:
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+if __name__ == '__main__':
+    test_cases = (
+        test_preview_value_sanitizer_returns_json_safe_strings,
+        test_preview_table_serializer_replaces_blank_headers_and_nan_cells,
+        test_route_uses_serialized_preview_output_and_version_bump,
+    )
+
+    outcomes = []
+    for test_case in test_cases:
+        print(f'\n🧪 Running {test_case.__name__}...')
+        outcomes.append(test_case())
+
+    all_passed = all(outcomes)
+    print(f'\n📊 Results: {sum(outcomes)}/{len(outcomes)} tests passed')
+    sys.exit(0 if all_passed else 1)
\ No newline at end of file
diff --git a/functional_tests/test_tabular_raw_tool_fallback.py b/functional_tests/test_tabular_raw_tool_fallback.py
index ea405155..76f9e66a 100644
--- a/functional_tests/test_tabular_raw_tool_fallback.py
+++ b/functional_tests/test_tabular_raw_tool_fallback.py
@@ -2,8 +2,8 @@
 # test_tabular_raw_tool_fallback.py
 """
 Functional test for tabular raw tool fallback summaries.
-Version: 0.240.013
-Implemented in: 0.239.125; 0.240.013 (prompt-budgeted fallback handoff)
+Version: 0.240.048
+Implemented in: 0.239.125; 0.240.013; 0.240.036; 0.240.038; 0.240.039; 0.240.040; 0.240.041; 0.240.042; 0.240.043; 0.240.048 (prompt-budgeted fallback handoff)
 
 This test ensures successful tabular tool calls are not discarded when the
 inner tabular synthesis step fails, and that the analysis prompt now prefers
@@ -345,6 +345,283 @@ def test_raw_fallback_stays_within_prompt_budget_for_large_rows():
         return False
 
 
+def test_raw_fallback_preserves_distinct_value_lists_when_budget_allows():
+    """Verify a four-value get_distinct_values result reaches the raw fallback with every value and a full_values_included flag."""
+    print('🔍 Testing raw fallback distinct-value preservation...')
+
+    try:
+        helpers, _ = load_fallback_helpers()
+        build_fallback = helpers['build_tabular_analysis_fallback_from_invocations']
+
+        distinct_values_payload = {
+            'filename': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+            'selected_sheet': 'Legal',
+            'column': 'Location',
+            'filter_applied': [
+                {
+                    'column': 'Location',
+                    'operator': 'contains',
+                    'value': 'SharePoint',
+                }
+            ],
+            'normalize_match': False,
+            'distinct_count': 4,  # matches the four entries in 'values' below
+            'returned_values': 4,
+            'values_limited': False,
+            'values': [
+                'http://occtreasgovprod.sharepoint.com/sites/CCO',
+                'http://occtreasgovprod.sharepoint.com/sites/LCFrmwrk',
+                'http://occtreasgovprod.sharepoint.com/sites/PolicyOps',
+                'http://occtreasgovprod.sharepoint.com/sites/RecordsMgmt',
+            ],
+        }
+
+        invocations = [
+            FakeInvocation(
+                'get_distinct_values',
+                {
+                    'filename': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+                    'sheet_name': 'Legal',
+                    'column': 'Location',
+                    'filter_column': 'Location',
+                    'filter_operator': 'contains',
+                    'filter_value': 'SharePoint',
+                    'normalize_match': 'false',
+                },
+                json.dumps(distinct_values_payload),  # presumably the serialized tool result; FakeInvocation is defined outside this hunk
+            ),
+        ]
+
+        fallback_summary = build_fallback(invocations)
+
+        assert fallback_summary is not None, 'Expected raw fallback summary'
+        assert '"distinct_count": 4' in fallback_summary, fallback_summary
+        assert '"full_values_included": true' in fallback_summary.lower(), fallback_summary  # lower() makes the flag match case-insensitive (true/True)
+        for expected_value in distinct_values_payload['values']:
+            assert expected_value in fallback_summary, fallback_summary  # every payload value must appear verbatim in the summary
+
+        print('✅ Raw fallback distinct-value preservation passed')
+        return True
+
+    except Exception as exc:  # any failure, including AssertionError, is reported and turned into a False return
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_raw_fallback_preserves_embedded_extraction_metadata():
+    """Verify extract_mode, url_path_segments, and both match counts from a tool result appear in the raw fallback summary."""
+    print('🔍 Testing raw fallback embedded extraction metadata...')
+
+    try:
+        helpers, _ = load_fallback_helpers()
+        build_fallback = helpers['build_tabular_analysis_fallback_from_invocations']
+
+        distinct_values_payload = {
+            'filename': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+            'selected_sheet': 'Legal',
+            'column': 'Location',
+            'filter_applied': [
+                'Business Unit contains CCO',
+                'Location contains sharepoint',
+            ],
+            'extract_mode': 'url',
+            'url_path_segments': 2,  # integer here; the tool argument below carries the string '2'
+            'matched_cell_count': 4,
+            'extracted_match_count': 4,
+            'normalize_match': False,
+            'distinct_count': 3,  # matches the three entries in 'values' below
+            'returned_values': 3,
+            'values_limited': False,
+            'values': [
+                'https://contoso.sharepoint.com/sites/Alpha',
+                'https://contoso.sharepoint.com/sites/Beta',
+                'https://contoso.sharepoint.com/sites/Delta',
+            ],
+        }
+
+        invocations = [
+            FakeInvocation(
+                'get_distinct_values',
+                {
+                    'filename': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+                    'sheet_name': 'Legal',
+                    'column': 'Location',
+                    'filter_column': 'Business Unit',
+                    'filter_operator': 'contains',
+                    'filter_value': 'CCO',
+                    'additional_filter_column': 'Location',
+                    'additional_filter_operator': 'contains',
+                    'additional_filter_value': 'sharepoint',
+                    'extract_mode': 'url',
+                    'url_path_segments': '2',
+                    'normalize_match': 'false',
+                },
+                json.dumps(distinct_values_payload),  # presumably the serialized tool result; FakeInvocation is defined outside this hunk
+            ),
+        ]
+
+        fallback_summary = build_fallback(invocations)
+
+        assert fallback_summary is not None, 'Expected raw fallback summary'
+        assert '"extract_mode": "url"' in fallback_summary, fallback_summary
+        assert '"url_path_segments": 2' in fallback_summary, fallback_summary  # unquoted 2: the payload's integer, not the '2' string argument
+        assert '"matched_cell_count": 4' in fallback_summary, fallback_summary
+        assert '"extracted_match_count": 4' in fallback_summary, fallback_summary
+
+        print('✅ Raw fallback embedded extraction metadata passed')
+        return True
+
+    except Exception as exc:  # any failure, including AssertionError, is reported and turned into a False return
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_raw_fallback_preserves_complete_small_row_sets_when_budget_allows():
+    """Verify an eight-row filter_rows result keeps its first and last rows and a full_rows_included flag in the fallback summary."""
+    print('🔍 Testing raw fallback full row-context preservation...')
+
+    try:
+        helpers, _ = load_fallback_helpers()
+        build_fallback = helpers['build_tabular_analysis_fallback_from_invocations']
+
+        matching_rows_payload = {
+            'filename': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+            'selected_sheet': 'Legal',
+            'filter_applied': [
+                'Business Unit contains CCO',
+                'Location contains sharepoint',
+            ],
+            'total_matches': 8,
+            'returned_rows': 8,
+            'data': [
+                {
+                    'Business Unit': 'CCO Legal',
+                    'Location': f'CCO Wide: DAP SharePoint site - http://share/sites/CSPA/BorderTracking/SitePages/Home.aspx; row {index}',
+                    'Site': f'Site {index}',
+                }
+                for index in range(8)  # eight generated rows, matching total_matches/returned_rows above
+            ],
+        }
+
+        invocations = [
+            FakeInvocation(
+                'filter_rows',
+                {
+                    'filename': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+                    'sheet_name': 'Legal',
+                    'column': 'Location',
+                    'operator': 'contains',
+                    'value': 'sharepoint',
+                    'additional_filter_column': 'Business Unit',
+                    'additional_filter_operator': 'contains',
+                    'additional_filter_value': 'CCO',
+                    'normalize_match': 'false',
+                    'max_rows': '50',
+                },
+                json.dumps(matching_rows_payload),  # presumably the serialized tool result; FakeInvocation is defined outside this hunk
+            ),
+        ]
+
+        fallback_summary = build_fallback(invocations)
+
+        assert fallback_summary is not None, 'Expected raw fallback summary'
+        assert 'http://share/sites/CSPA/BorderTracking/SitePages/Home.aspx; row 0' in fallback_summary, fallback_summary  # first generated row
+        assert 'http://share/sites/CSPA/BorderTracking/SitePages/Home.aspx; row 7' in fallback_summary, fallback_summary  # last generated row (range(8) ends at 7)
+        assert '"full_rows_included": true' in fallback_summary.lower(), fallback_summary  # lower() makes the flag match case-insensitive (true/True)
+
+        print('✅ Raw fallback full row-context preservation passed')
+        return True
+
+    except Exception as exc:  # any failure, including AssertionError, is reported and turned into a False return
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_raw_fallback_preserves_complete_small_search_row_sets_when_budget_allows():
+    """Verify a three-row search_rows result keeps its search_value, all three Site rows, and a full_rows_included flag in the fallback summary."""
+    print('🔍 Testing raw fallback full search-row preservation...')
+
+    try:
+        helpers, _ = load_fallback_helpers()
+        build_fallback = helpers['build_tabular_analysis_fallback_from_invocations']
+
+        matching_rows_payload = {
+            'filename': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+            'selected_sheet': 'ALL (cross-sheet search)',
+            'search_value': 'GRS 6.1',
+            'search_operator': 'contains',
+            'searched_columns': ['Business Unit', 'Location', 'Site', 'Schedule Notes'],
+            'matched_columns': ['Schedule Notes'],
+            'return_columns': ['Business Unit', 'Location', 'Site'],
+            'total_matches': 3,  # matches the three rows in 'data' below
+            'returned_rows': 3,
+            'data': [
+                {
+                    'Business Unit': 'CCO - Supervision',
+                    'Location': 'AIL: SharePoint - https://contoso.sharepoint.com/sites/Alpha/SitePages/Home.aspx',
+                    'Site': 'Alpha',
+                    '_matched_columns': ['Schedule Notes'],
+                    '_matched_values': {'Schedule Notes': 'Primary schedules: GRS 6.1; GRS 2.4'},
+                    '_sheet': 'File Plan Q1',
+                },
+                {
+                    'Business Unit': 'CCO Legal',
+                    'Location': 'DCCO: SharePoint - https://contoso.sharepoint.com/sites/Delta/Shared%20Documents/Forms/AllItems.aspx',
+                    'Site': 'Delta',
+                    '_matched_columns': ['Schedule Notes'],
+                    '_matched_values': {'Schedule Notes': 'Legal schedules: GRS 6.1'},
+                    '_sheet': 'File Plan Q2',
+                },
+                {
+                    'Business Unit': 'CCO Legal',
+                    'Location': 'WEDO: SharePoint - https://contoso.sharepoint.com/sites/Beta/SitePages/Home.aspx',
+                    'Site': 'Beta',
+                    '_matched_columns': ['Schedule Notes'],
+                    '_matched_values': {'Schedule Notes': 'Duplicates: GRS 2.4; GRS 6.1'},
+                    '_sheet': 'File Plan Q2',
+                },
+            ],
+        }
+
+        invocations = [
+            FakeInvocation(
+                'search_rows',
+                {
+                    'filename': 'CCO-Legal File Plan 2025_Final Approved.xlsx',
+                    'search_value': 'GRS 6.1',
+                    'search_operator': 'contains',
+                    'return_columns': 'Business Unit,Location,Site',  # comma-separated string; the payload lists the same columns as a list
+                    'max_rows': '10',
+                },
+                json.dumps(matching_rows_payload),  # presumably the serialized tool result; FakeInvocation is defined outside this hunk
+            ),
+        ]
+
+        fallback_summary = build_fallback(invocations)
+
+        assert fallback_summary is not None, 'Expected raw fallback summary'
+        assert '"search_value": "GRS 6.1"' in fallback_summary, fallback_summary
+        assert '"full_rows_included": true' in fallback_summary.lower(), fallback_summary  # lower() makes the flag match case-insensitive (true/True)
+        assert '"Site": "Alpha"' in fallback_summary, fallback_summary  # one assertion per payload row: Alpha, Beta, Delta
+        assert '"Site": "Beta"' in fallback_summary, fallback_summary
+        assert '"Site": "Delta"' in fallback_summary, fallback_summary
+
+        print('✅ Raw fallback full search-row preservation passed')
+        return True
+
+    except Exception as exc:  # any failure, including AssertionError, is reported and turned into a False return
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
 def test_computed_results_system_message_truncates_large_handoffs():
     """Verify computed-results handoffs are capped before the outer model call."""
     print('🔍 Testing computed-results handoff truncation...')
@@ -374,6 +651,10 @@ def test_computed_results_system_message_truncates_large_handoffs():
         test_raw_fallback_preserves_aggregate_and_group_summaries,
         test_route_prompt_prefers_combined_queries_and_raw_fallback_helper,
         test_raw_fallback_stays_within_prompt_budget_for_large_rows,
+        test_raw_fallback_preserves_distinct_value_lists_when_budget_allows,
+        test_raw_fallback_preserves_embedded_extraction_metadata,
+        test_raw_fallback_preserves_complete_small_row_sets_when_budget_allows,
+        test_raw_fallback_preserves_complete_small_search_row_sets_when_budget_allows,
         test_computed_results_system_message_truncates_large_handoffs,
     ]
 
diff --git a/functional_tests/test_tabular_relational_analysis_helpers.py b/functional_tests/test_tabular_relational_analysis_helpers.py
index 70aaa80f..c72aa5a0 100644
--- a/functional_tests/test_tabular_relational_analysis_helpers.py
+++ b/functional_tests/test_tabular_relational_analysis_helpers.py
@@ -2,8 +2,8 @@
 # test_tabular_relational_analysis_helpers.py
 """
 Functional test for tabular relational analysis helpers.
-Version: 0.240.018
-Implemented in: 0.240.018
+Version: 0.240.048
+Implemented in: 0.240.018; 0.240.037; 0.240.038; 0.240.039; 0.240.040; 0.240.041; 0.240.042; 0.240.043; 0.240.048
 
 This test ensures the tabular processing plugin can infer workbook relationship
 metadata, return deterministic distinct values and row counts, and perform
@@ -99,6 +99,87 @@ def read_dataframe(container, blob, sheet_name=None, sheet_index=None, require_e
     return plugin
 
 
+def build_multi_filter_workbook_plugin():
+    """Create a TabularProcessingPlugin whose blob lookup, workbook metadata, and sheet reads are stubbed with three in-memory sheets."""
+    plugin = TabularProcessingPlugin()
+    container_name = 'mock-container'
+    blob_name = 'cco_sharepoint_sites.xlsx'
+
+    workbook_frames = {
+        'File Plan Q1': pd.DataFrame([
+            {
+                'Business Unit': 'CCO - Supervision',
+                'Location': 'AIL: SharePoint - https://contoso.sharepoint.com/sites/Alpha/SitePages/Home.aspx',
+                'Site': 'Alpha',
+                'Schedule Notes': 'Primary schedules: GRS 6.1; GRS 2.4',
+            },
+            {
+                'Business Unit': 'CCO - Supervision',
+                'Location': 'BA: SharePoint - https://contoso.sharepoint.com/sites/Beta/Forms/AllItems.aspx',
+                'Site': 'Beta',
+                'Schedule Notes': 'Secondary schedules: GRS 2.4',
+            },
+            {
+                'Business Unit': 'Finance',  # non-CCO row whose Location still holds a sharepoint.com URL
+                'Location': 'Finance docs - https://contoso.sharepoint.com/sites/Gamma/SitePages/Home.aspx',
+                'Site': 'Gamma',
+                'Schedule Notes': 'Finance schedules: GRS 8.3',
+            },
+            {
+                'Business Unit': 'CCO - Supervision',
+                'Location': 'Network Drive',  # CCO row without any SharePoint text in Location
+                'Site': 'Legacy',
+                'Schedule Notes': 'Legacy schedules: GRS 1.1',
+            },
+        ]),
+        'File Plan Q2': pd.DataFrame([
+            {
+                'Business Unit': 'CCO Legal',
+                'Location': 'DCCO: SharePoint - https://contoso.sharepoint.com/sites/Delta/Shared%20Documents/Forms/AllItems.aspx',
+                'Site': 'Delta',
+                'Schedule Notes': 'Legal schedules: GRS 6.1',
+            },
+            {
+                'Business Unit': 'CCO Legal',
+                'Location': 'WEDO: SharePoint - https://contoso.sharepoint.com/sites/Beta/SitePages/Home.aspx',
+                'Site': 'Beta',  # second 'Beta' site; the first is on File Plan Q1
+                'Schedule Notes': 'Duplicates: GRS 2.4; GRS 6.1',
+            },
+            {
+                'Business Unit': 'Treasury',  # non-CCO row whose Location still holds a sharepoint.com URL
+                'Location': 'Treasury docs - https://contoso.sharepoint.com/sites/Zeta/SitePages/Home.aspx',
+                'Site': 'Zeta',
+                'Schedule Notes': 'Treasury schedules: GRS 9.1',
+            },
+        ]),
+        'Notes': pd.DataFrame([  # sheet with only a Comment column, i.e. none of the columns the tests filter on
+            {'Comment': 'Ignore this sheet for site searches'},
+        ]),
+    }
+    workbook_metadata = {
+        'is_workbook': True,
+        'sheet_names': ['File Plan Q1', 'File Plan Q2', 'Notes'],  # same keys as workbook_frames
+        'sheet_count': 3,
+        'default_sheet': 'File Plan Q1',
+    }
+
+    plugin._resolve_blob_location_with_fallback = lambda *args, **kwargs: (container_name, blob_name)  # stub: always resolve to the mock container/blob
+    plugin._get_workbook_metadata = lambda *args, **kwargs: workbook_metadata.copy()  # stub: hand out a shallow copy of the metadata on every call
+
+    def read_dataframe(container, blob, sheet_name=None, sheet_index=None, require_explicit_sheet=False):  # replacement reader backed by workbook_frames
+        selected_sheet, _ = plugin._resolve_sheet_selection(
+            container,
+            blob,
+            sheet_name=sheet_name,
+            sheet_index=sheet_index,
+            require_explicit_sheet=require_explicit_sheet,
+        )
+        return workbook_frames[selected_sheet].copy()  # return a copy so the fixture frame itself is never handed out
+
+    plugin._read_tabular_blob_to_dataframe = read_dataframe
+    return plugin
+
+
 def test_describe_tabular_file_infers_relationship_hints():
     """Verify workbook schema summaries include role and relationship hints."""
     print('🔍 Testing workbook relationship metadata...')
@@ -193,6 +274,290 @@ def test_count_rows_returns_deterministic_row_count():
         return False
 
 
+def test_multi_filter_helpers_support_cross_sheet_contains_queries():
+    """Verify get_distinct_values and count_rows combine a primary and an additional 'contains' filter across workbook sheets."""
+    print('🔍 Testing cross-sheet multi-filter helpers...')
+
+    try:
+        plugin = build_multi_filter_workbook_plugin()
+        distinct_payload = json.loads(asyncio.run(plugin.get_distinct_values(
+            user_id='test-user',
+            conversation_id='test-conversation',
+            filename='cco_sharepoint_sites.xlsx',
+            column='Site',
+            filter_column='Business Unit',
+            filter_operator='contains',
+            filter_value='CCO',
+            additional_filter_column='Location',
+            additional_filter_operator='contains',
+            additional_filter_value='sharepoint',
+            normalize_match='false',
+            source='workspace',
+        )))
+        count_payload = json.loads(asyncio.run(plugin.count_rows(
+            user_id='test-user',
+            conversation_id='test-conversation',
+            filename='cco_sharepoint_sites.xlsx',
+            filter_column='Business Unit',
+            filter_operator='contains',
+            filter_value='CCO',
+            additional_filter_column='Location',
+            additional_filter_operator='contains',
+            additional_filter_value='sharepoint',
+            normalize_match='false',
+            source='workspace',
+        )))
+
+        assert distinct_payload['selected_sheet'] == 'ALL (cross-sheet search)', distinct_payload  # no sheet_name was passed in the call
+        assert distinct_payload['distinct_count'] == 3, distinct_payload  # Alpha, Beta, Delta: the fixture has a Beta row on both File Plan sheets
+        assert distinct_payload['values'] == ['Alpha', 'Beta', 'Delta'], distinct_payload
+        assert len(distinct_payload['filter_applied']) == 2, distinct_payload  # one entry per filter (primary + additional)
+        assert count_payload['selected_sheet'] == 'ALL (cross-sheet search)', count_payload
+        assert count_payload['row_count'] == 4, count_payload  # four fixture rows have a CCO unit and 'SharePoint' in Location (lowercase filter value is expected to match)
+        assert len(count_payload['filter_applied']) == 2, count_payload
+
+        print('✅ Cross-sheet multi-filter helpers passed')
+        return True
+    except Exception as exc:  # any failure, including AssertionError, is reported and turned into a False return
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_filter_rows_supports_additional_column_filter():
+    """Verify filter_rows applies an additional literal column filter alongside the primary one, with no query expression passed."""
+    print('🔍 Testing additional filter support in filter_rows...')
+
+    try:
+        plugin = build_multi_filter_workbook_plugin()
+        payload = json.loads(asyncio.run(plugin.filter_rows(
+            user_id='test-user',
+            conversation_id='test-conversation',
+            filename='cco_sharepoint_sites.xlsx',
+            column='Business Unit',
+            operator='contains',
+            value='CCO',
+            additional_filter_column='Location',
+            additional_filter_operator='contains',
+            additional_filter_value='sharepoint',
+            normalize_match='false',
+            source='workspace',
+            max_rows='10',
+        )))
+
+        assert payload['selected_sheet'] == 'ALL (cross-sheet search)', payload  # no sheet_name was passed in the call
+        assert payload['total_matches'] == 4, payload  # four fixture rows have a CCO unit and 'SharePoint' in Location
+        assert payload['returned_rows'] == 4, payload  # all matches fit under max_rows='10'
+        assert len(payload['filter_applied']) == 2, payload  # one entry per filter (primary + additional)
+        assert {row['_sheet'] for row in payload['data']} == {'File Plan Q1', 'File Plan Q2'}, payload  # matches come from both File Plan sheets, none from Notes
+
+        print('✅ Additional filter support in filter_rows passed')
+        return True
+    except Exception as exc:  # any failure, including AssertionError, is reported and turned into a False return
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_get_distinct_values_extracts_embedded_url_roots_from_filtered_cells():
+    """Verify extract_mode='url' with url_path_segments='2' reduces filtered Location cells to distinct /sites/<name> root URLs."""
+    print('🔍 Testing embedded URL extraction in distinct values...')
+
+    try:
+        plugin = build_multi_filter_workbook_plugin()
+        payload = json.loads(asyncio.run(plugin.get_distinct_values(
+            user_id='test-user',
+            conversation_id='test-conversation',
+            filename='cco_sharepoint_sites.xlsx',
+            column='Location',
+            filter_column='Business Unit',
+            filter_operator='contains',
+            filter_value='CCO',
+            additional_filter_column='Location',
+            additional_filter_operator='contains',
+            additional_filter_value='sharepoint',
+            extract_mode='url',
+            url_path_segments='2',
+            normalize_match='false',
+            source='workspace',
+        )))
+
+        assert payload['selected_sheet'] == 'ALL (cross-sheet search)', payload  # no sheet_name was passed in the call
+        assert payload['extract_mode'] == 'url', payload
+        assert payload['url_path_segments'] == 2, payload  # expected back as an int although passed as the string '2'
+        assert payload['matched_cell_count'] == 4, payload  # four fixture rows have a CCO unit and 'SharePoint' in Location
+        assert payload['extracted_match_count'] == 4, payload  # each of those Location cells contains exactly one URL
+        assert payload['distinct_count'] == 3, payload  # both Beta rows reduce to the same /sites/Beta root
+        assert payload['values'] == [
+            'https://contoso.sharepoint.com/sites/Alpha',
+            'https://contoso.sharepoint.com/sites/Beta',
+            'https://contoso.sharepoint.com/sites/Delta',
+        ], payload
+
+        print('✅ Embedded URL extraction in distinct values passed')
+        return True
+    except Exception as exc:  # any failure, including AssertionError, is reported and turned into a False return
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_get_distinct_values_supports_regex_extraction_from_text_cells():
+    """Verify extract_mode='regex' returns the distinct 'GRS n.n' codes found in the Schedule Notes cells of CCO rows."""
+    print('🔍 Testing regex extraction in distinct values...')
+
+    try:
+        plugin = build_multi_filter_workbook_plugin()
+        payload = json.loads(asyncio.run(plugin.get_distinct_values(
+            user_id='test-user',
+            conversation_id='test-conversation',
+            filename='cco_sharepoint_sites.xlsx',
+            column='Schedule Notes',
+            filter_column='Business Unit',
+            filter_operator='contains',
+            filter_value='CCO',
+            extract_mode='regex',
+            extract_pattern=r'(GRS\s+\d+\.\d+)',  # 'GRS', whitespace, then digits.digits
+            normalize_match='false',
+            source='workspace',
+        )))
+
+        assert payload['extract_mode'] == 'regex', payload
+        assert payload['matched_cell_count'] == 5, payload  # five fixture rows have a Business Unit containing 'CCO'
+        assert payload['extracted_match_count'] == 7, payload  # two of those five cells list two GRS codes each
+        assert payload['distinct_count'] == 3, payload
+        assert payload['values'] == ['GRS 1.1', 'GRS 2.4', 'GRS 6.1'], payload
+
+        print('✅ Regex extraction in distinct values passed')
+        return True
+    except Exception as exc:  # any failure, including AssertionError, is reported and turned into a False return
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_search_rows_can_search_all_columns_and_return_target_values():
+    """Verify search_rows, given no column restriction, finds 'GRS 6.1' in Schedule Notes and returns only the requested return_columns."""
+    print('🔍 Testing generic row search across all columns...')
+
+    try:
+        plugin = build_multi_filter_workbook_plugin()
+        payload = json.loads(asyncio.run(plugin.search_rows(
+            user_id='test-user',
+            conversation_id='test-conversation',
+            filename='cco_sharepoint_sites.xlsx',
+            search_value='GRS 6.1',
+            return_columns='Business Unit,Location,Site',
+            normalize_match='false',
+            source='workspace',
+            max_rows='10',
+        )))
+
+        assert payload['selected_sheet'] == 'ALL (cross-sheet search)', payload  # no sheet_name was passed in the call
+        assert payload['search_value'] == 'GRS 6.1', payload
+        assert payload['total_matches'] == 3, payload  # 'GRS 6.1' appears in three Schedule Notes cells of the fixture
+        assert payload['returned_rows'] == 3, payload  # all matches fit under max_rows='10'
+        assert payload['matched_columns'] == ['Schedule Notes'], payload
+        assert payload['return_columns'] == ['Business Unit', 'Location', 'Site'], payload  # comma-separated argument is expected back as a list
+        assert payload['data'][0]['_matched_columns'] == ['Schedule Notes'], payload
+        assert 'Schedule Notes' not in payload['data'][0], payload  # matched column is not in return_columns, so it must be absent from the row
+        assert payload['data'][0]['Business Unit'], payload  # truthiness checks only: each requested column must be present and non-empty
+        assert payload['data'][0]['Location'], payload
+        assert payload['data'][0]['Site'], payload
+
+        print('✅ Generic row search across all columns passed')
+        return True
+    except Exception as exc:  # any failure, including AssertionError, is reported and turned into a False return
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_reviewer_style_text_query_expression_rewrites_for_count_and_distinct_calls():
+    """Verify a pandas-style str.contains pseudo query passed as query_expression yields results from count_rows and get_distinct_values."""
+    print('🔍 Testing reviewer-style pseudo query rewrite...')
+
+    try:
+        plugin = build_multi_filter_workbook_plugin()
+        pseudo_query = "`Business Unit`.astype(str).str.contains('CCO', case=False, na=False) and Location.astype(str).str.contains('sharepoint', case=False, na=False)"  # pandas-method syntax joined with 'and'
+
+        count_payload = json.loads(asyncio.run(plugin.count_rows(
+            user_id='test-user',
+            conversation_id='test-conversation',
+            filename='cco_sharepoint_sites.xlsx',
+            query_expression=pseudo_query,
+            normalize_match='false',
+            source='workspace',
+        )))
+        distinct_payload = json.loads(asyncio.run(plugin.get_distinct_values(
+            user_id='test-user',
+            conversation_id='test-conversation',
+            filename='cco_sharepoint_sites.xlsx',
+            column='Location',
+            query_expression=pseudo_query,
+            extract_mode='url',
+            url_path_segments='2',
+            normalize_match='false',
+            source='workspace',
+        )))
+
+        assert count_payload['selected_sheet'] == 'ALL (cross-sheet search)', count_payload  # no sheet_name was passed in the call
+        assert count_payload['row_count'] == 4, count_payload  # four fixture rows have a CCO unit and 'SharePoint' in Location
+        assert count_payload['filter_applied'][0].endswith('[reviewer-style fallback]'), count_payload  # suffix expected on the first applied-filter description
+        assert distinct_payload['selected_sheet'] == 'ALL (cross-sheet search)', distinct_payload
+        assert distinct_payload['distinct_count'] == 3, distinct_payload  # both Beta rows reduce to the same /sites/Beta root
+        assert distinct_payload['filter_applied'][0].endswith('[reviewer-style fallback]'), distinct_payload
+        assert distinct_payload['values'] == [
+            'https://contoso.sharepoint.com/sites/Alpha',
+            'https://contoso.sharepoint.com/sites/Beta',
+            'https://contoso.sharepoint.com/sites/Delta',
+        ], distinct_payload
+
+        print('✅ Reviewer-style pseudo query rewrite passed')
+        return True
+    except Exception as exc:  # any failure, including AssertionError, is reported and turned into a False return
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+def test_reviewer_style_null_literal_query_expression_rewrites_for_count_calls():
+    """Verify count_rows returns a count for the query_expression 'Location != null' combined with a Business Unit filter."""
+    print('🔍 Testing reviewer-style null literal query rewrite...')
+
+    try:
+        plugin = build_multi_filter_workbook_plugin()
+        count_payload = json.loads(asyncio.run(plugin.count_rows(
+            user_id='test-user',
+            conversation_id='test-conversation',
+            filename='cco_sharepoint_sites.xlsx',
+            query_expression='Location != null',  # 'null' literal written as a bare word in the expression
+            filter_column='Business Unit',
+            filter_operator='contains',
+            filter_value='CCO',
+            normalize_match='false',
+            source='workspace',
+        )))
+
+        assert count_payload['selected_sheet'] == 'ALL (cross-sheet search)', count_payload  # no sheet_name was passed in the call
+        assert count_payload['row_count'] == 5, count_payload  # all five CCO fixture rows have a Location value
+        assert count_payload['filter_applied'][0].endswith('[reviewer-style fallback]'), count_payload  # suffix expected on the first applied-filter description
+
+        print('✅ Reviewer-style null literal query rewrite passed')
+        return True
+    except Exception as exc:  # any failure, including AssertionError, is reported and turned into a False return
+        print(f'❌ Test failed: {exc}')
+        import traceback
+        traceback.print_exc()
+        return False
+
+
 def test_related_value_helpers_return_explainable_outputs():
     """Verify semi-join helpers return deterministic counts and explainable metadata."""
     print('🔍 Testing related-value semi-join helpers...')
@@ -280,6 +645,15 @@ def test_route_prompt_mentions_deterministic_relational_helpers():
             'cohort guidance exists': 'For cohort, membership, ownership-share, or percentage questions where one sheet defines the group and another sheet contains the fact rows' in route_content,
             'named member share guidance exists': "When the question asks for one named member's share within that cohort" in route_content,
             'deterministic count guidance exists': 'For deterministic how-many questions, use count_rows instead of estimating counts from partial returned rows.' in route_content,
+            'generic search tool advertised': 'search_rows' in route_content,
+            'whole-doc search guidance exists': 'If the question includes an exact identifier or asks where a topic, phrase, path, code, or other value appears and the correct starting worksheet or column is unclear, begin with search_rows' in route_content,
+            'return columns guidance exists': 'use return_columns to surface the columns most relevant to the question' in route_content.casefold(),
+            'multi-condition guidance exists': 'When the cohort is defined by two literal conditions on different columns' in route_content,
+            'additional filter args advertised': 'additional_filter_column' in route_content,
+            'embedded extraction guidance exists': "extract_mode='url' or extract_mode='regex'" in route_content,
+            'url root guidance exists': 'url_path_segments' in route_content,
+            'contextual text-search guidance exists': 'If whether an embedded URL, site, link, or identifier counts depends on surrounding text in the original cell rather than the extracted value itself' in route_content,
+            'full row context guidance exists': 'Prefer filter_rows when the matching row context matters, and return the full matching rows when the cohort is modest enough to fit comfortably.' in route_content,
             'relationship hints exposed in schema preload': "'relationship_hints': schema_info.get('relationship_hints', [])[:5]" in route_content,
         }
 
@@ -300,6 +674,13 @@ def test_route_prompt_mentions_deterministic_relational_helpers():
         test_describe_tabular_file_infers_relationship_hints,
         test_get_distinct_values_returns_canonical_cohort,
         test_count_rows_returns_deterministic_row_count,
+        test_multi_filter_helpers_support_cross_sheet_contains_queries,
+        test_filter_rows_supports_additional_column_filter,
+        test_get_distinct_values_extracts_embedded_url_roots_from_filtered_cells,
+        test_get_distinct_values_supports_regex_extraction_from_text_cells,
+        test_search_rows_can_search_all_columns_and_return_target_values,
+        test_reviewer_style_text_query_expression_rewrites_for_count_and_distinct_calls,
+        test_reviewer_style_null_literal_query_expression_rewrites_for_count_calls,
         test_related_value_helpers_return_explainable_outputs,
         test_route_prompt_mentions_deterministic_relational_helpers,
     ]
diff --git a/ui_tests/test_agent_citation_modal_full_results.py b/ui_tests/test_agent_citation_modal_full_results.py
new file mode 100644
index 00000000..e278cefe
--- /dev/null
+++ b/ui_tests/test_agent_citation_modal_full_results.py
@@ -0,0 +1,181 @@
+# test_agent_citation_modal_full_results.py
+"""
+UI test for agent citation full-result modal rendering.
+
+Version: 0.240.048
+Implemented in: 0.240.048
+
+This test ensures that opening an agent tool citation lazy-loads the raw
+artifact payload, starts with a short preview, expands to 25 rows, and can
+show all returned rows for tabular results.
+"""
+
+import json
+import os
+from pathlib import Path
+
+import pytest
+from playwright.sync_api import expect
+
+
+BASE_URL = os.getenv("SIMPLECHAT_UI_BASE_URL", "").rstrip("/")
+STORAGE_STATE = os.getenv("SIMPLECHAT_UI_STORAGE_STATE", "")
+
+
+def _fulfill_json(route, payload, status=200):
+    """Fulfill an intercepted route with ``payload`` serialized as a JSON response body."""
+    serialized_payload = json.dumps(payload)
+    route.fulfill(
+        status=status, content_type="application/json", body=serialized_payload
+    )
+
+
+def _build_raw_citation_payload():
+    """Return the raw search_rows citation payload (30 rows) that the mocked artifact endpoint serves."""
+    matched_rows = []
+    for row_number in range(1, 31):
+        matched_rows.append(
+            {
+                "Location": f"Row {row_number:02d} - https://contoso.sharepoint.com/sites/Site{row_number:02d}",
+                "Site": f"Site {row_number:02d}",
+            }
+        )
+    tool_arguments = {
+        "filename": "CCO-Legal File Plan 2025_Final Approved.xlsx",
+        "sheet_name": "Legal",
+        "search_value": "SharePoint",
+        "search_columns": "Location",
+        "max_rows": "25",
+    }
+    tool_result = {
+        "filename": "CCO-Legal File Plan 2025_Final Approved.xlsx",
+        "selected_sheet": "Legal",
+        "search_value": "SharePoint",
+        "searched_columns": ["Location"],
+        "total_matches": 30,
+        "returned_rows": 30,
+        "data": matched_rows,
+    }
+    return {
+        "tool_name": "TabularProcessingPlugin.search_rows [Legal]",
+        "function_name": "search_rows",
+        "plugin_name": "TabularProcessingPlugin",
+        "function_arguments": json.dumps(tool_arguments),
+        "function_result": json.dumps(tool_result),
+        "artifact_id": "assistant-msg-1_artifact_1",
+    }
+
+
+@pytest.mark.ui
+def test_agent_citation_modal_can_expand_from_preview_to_all_rows(playwright):
+    """Check the agent citation modal steps from a 3-row preview to 25 rows and then all 30 rows."""
+    if not BASE_URL:
+        pytest.skip("Set SIMPLECHAT_UI_BASE_URL to run this UI test.")
+    if not (STORAGE_STATE and Path(STORAGE_STATE).exists()):
+        pytest.skip("Set SIMPLECHAT_UI_STORAGE_STATE to a valid authenticated Playwright storage state file.")
+
+    # Compact citation attached to the chat message; the raw payload is served from artifact_route.
+    artifact_route = "**/api/conversation/test-convo/agent-citation/assistant-msg-1_artifact_1"
+    externalized_citation = {
+        "tool_name": "TabularProcessingPlugin.search_rows [Legal]",
+        "function_arguments": {
+            "filename": "CCO-Legal File Plan 2025_Final Approved.xlsx",
+            "sheet_name": "Legal",
+            "search_value": "SharePoint",
+            "search_columns": "Location",
+            "max_rows": "25",
+        },
+        "function_result": {
+            "filename": "CCO-Legal File Plan 2025_Final Approved.xlsx",
+            "selected_sheet": "Legal",
+            "total_matches": 30,
+            "returned_rows": 30,
+            "sample_rows": [
+                {"Location": "Row 01 - https://contoso.sharepoint.com/sites/Site01 ... [truncated 120 chars]"},
+            ],
+            "sample_rows_limited": True,
+        },
+        "artifact_id": "assistant-msg-1_artifact_1",
+        "raw_payload_externalized": True,
+    }
+
+    chromium = playwright.chromium.launch()
+    context = chromium.new_context(
+        storage_state=STORAGE_STATE,
+        viewport={"width": 1440, "height": 900},
+    )
+    page = context.new_page()
+    summary = page.locator("#agent-tool-result-summary")
+    result_panel = page.locator("#agent-tool-result")
+
+    # Answer the endpoints this test stubs with canned JSON.
+    page.route(
+        "**/api/user/settings",
+        lambda route: _fulfill_json(route, {"selected_agent": None, "settings": {"enable_agents": False}}),
+    )
+    page.route("**/api/get_conversations", lambda route: _fulfill_json(route, {"conversations": []}))
+    page.route(artifact_route, lambda route: _fulfill_json(route, {"citation": _build_raw_citation_payload()}))
+
+    try:
+        page.goto(f"{BASE_URL}/chats", wait_until="domcontentloaded")
+        page.wait_for_selector("#chatbox")
+
+        # Append an assistant message that carries the compact citation.
+        page.evaluate(
+            """
+            async (payload) => {
+                currentConversationId = 'test-convo';
+                window.currentConversationId = 'test-convo';
+                const messagesModule = await import('/static/js/chat/chat-messages.js');
+                messagesModule.appendMessage(
+                    'AI',
+                    'Citation answer',
+                    null,
+                    'assistant-msg-1',
+                    false,
+                    [],
+                    [],
+                    [payload],
+                    null,
+                    null,
+                    {
+                        id: 'assistant-msg-1',
+                        role: 'assistant',
+                        content: 'Citation answer',
+                        agent_citations: [payload],
+                    },
+                    true
+                );
+            }
+            """,
+            externalized_citation,
+        )
+
+        citation_link = page.locator("a.agent-citation-link").first
+        expect(citation_link).to_be_visible()
+
+        with page.expect_response(artifact_route):
+            citation_link.click()
+
+        expect(page.locator("#agent-citation-modal")).to_be_visible()
+        for fragment in ("total_matches: 30", "returned_rows: 30", "showing 3 rows"):
+            expect(summary).to_contain_text(fragment)
+        expect(result_panel).to_contain_text("Row 01")
+        expect(result_panel).to_contain_text("Row 03")
+        expect(result_panel).not_to_contain_text("Row 04")
+
+        page.get_by_role("button", name="Show 25 rows").click()
+        expect(summary).to_contain_text("showing 25 rows")
+        expect(result_panel).to_contain_text("Row 25")
+        expect(result_panel).not_to_contain_text("Row 26")
+
+        page.get_by_role("button", name="Show all rows").click()
+        expect(summary).to_contain_text("showing 30 rows")
+        expect(result_panel).to_contain_text("Row 30")
+
+        page.get_by_role("button", name="Show preview").click()
+        expect(summary).to_contain_text("showing 3 rows")
+        expect(result_panel).not_to_contain_text("Row 04")
+    finally:
+        context.close()
+        chromium.close()
\ No newline at end of file
diff --git a/ui_tests/test_chat_new_conversation_tag_reset.py b/ui_tests/test_chat_new_conversation_tag_reset.py
new file mode 100644
index 00000000..d1da95af
--- /dev/null
+++ b/ui_tests/test_chat_new_conversation_tag_reset.py
@@ -0,0 +1,129 @@
+# test_chat_new_conversation_tag_reset.py
+"""
+UI test for chat tag reset on new conversation.
+Version: 0.240.026
+Implemented in: 0.240.026
+
+This test ensures that selecting a chat tag updates the visible selector
+state and that starting a brand new conversation clears the tag label and
+checkbox state back to the default "All Tags" view.
+"""
+
+import json
+import os
+from pathlib import Path
+
+import pytest
+from playwright.sync_api import expect
+
+
+BASE_URL = os.getenv("SIMPLECHAT_UI_BASE_URL", "").rstrip("/")
+STORAGE_STATE = os.getenv("SIMPLECHAT_UI_STORAGE_STATE", "")
+
+
+def _fulfill_json(route, payload, status=200):
+    """Fulfill an intercepted route with ``payload`` serialized as a JSON response body."""
+    serialized_payload = json.dumps(payload)
+    route.fulfill(
+        status=status, content_type="application/json", body=serialized_payload
+    )
+
+
+@pytest.mark.ui
+def test_new_conversation_clears_selected_chat_tags(playwright):
+    """Check that starting a new conversation resets the tag selector to All Tags with nothing checked."""
+    if not BASE_URL:
+        pytest.skip("Set SIMPLECHAT_UI_BASE_URL to run this UI test.")
+    if not (STORAGE_STATE and Path(STORAGE_STATE).exists()):
+        pytest.skip("Set SIMPLECHAT_UI_STORAGE_STATE to a valid authenticated Playwright storage state file.")
+
+    def respond_with(payload):
+        # Build a route handler that always answers with the given JSON payload.
+        return lambda route: _fulfill_json(route, payload)
+
+    user_settings_payload = {
+        "selected_agent": None,
+        "settings": {
+            "enable_agents": False,
+        },
+    }
+
+    def handle_user_settings(route):
+        # GET returns the settings, POST is acknowledged, anything else continues unmodified.
+        method = route.request.method
+        if method == "GET":
+            _fulfill_json(route, user_settings_payload)
+        elif method == "POST":
+            _fulfill_json(route, {"success": True})
+        else:
+            route.continue_()
+
+    alpha_document = {
+        "id": "personal-doc-1",
+        "title": "Alpha Brief",
+        "file_name": "alpha-brief.md",
+        "tags": ["alpha"],
+        "document_classification": "",
+    }
+    no_documents = {"documents": []}
+    no_tags = {"tags": []}
+
+    chromium = playwright.chromium.launch()
+    context = chromium.new_context(
+        storage_state=STORAGE_STATE,
+        viewport={"width": 1440, "height": 900},
+    )
+    page = context.new_page()
+    tags_label = page.locator("#tags-dropdown-button .selected-tags-text")
+
+    # Stub the settings, conversation, document, and tag endpoints with canned JSON.
+    page.route("**/api/user/settings", handle_user_settings)
+    page.route("**/api/get_conversations", respond_with({"conversations": []}))
+    page.route(
+        "**/api/create_conversation",
+        respond_with({"conversation_id": "new-conversation-1", "title": "New Conversation"}),
+    )
+    page.route("**/api/documents?page_size=1000", respond_with({"documents": [alpha_document]}))
+    page.route("**/api/group_documents?*", respond_with(no_documents))
+    page.route("**/api/public_workspace_documents?page_size=1000", respond_with(no_documents))
+    page.route("**/api/documents/tags", respond_with({"tags": [{"name": "alpha", "count": 1}]}))
+    page.route("**/api/group_documents/tags?*", respond_with(no_tags))
+    page.route("**/api/public_workspace_documents/tags?*", respond_with(no_tags))
+
+    try:
+        page.goto(f"{BASE_URL}/chats", wait_until="networkidle")
+
+        # Toggle document search, then wait until the tags dropdown is displayed.
+        page.locator("#search-documents-btn").click()
+        page.wait_for_function(
+            """
+            () => {
+                const tagsDropdown = document.getElementById('tags-dropdown');
+                return tagsDropdown && window.getComputedStyle(tagsDropdown).display !== 'none';
+            }
+            """
+        )
+
+        # Select the alpha tag and confirm the selector label reflects it.
+        page.locator("#tags-dropdown-button").click()
+        page.locator('#tags-dropdown-items [data-tag-value="alpha"]').click()
+        expect(tags_label).to_have_text("alpha")
+
+        page.locator("#new-conversation-btn").click()
+
+        # Wait for the label and the checkboxes to return to their default state.
+        page.wait_for_function(
+            """
+            () => {
+                const text = document.querySelector('#tags-dropdown-button .selected-tags-text');
+                return text && text.textContent.trim() === 'All Tags'
+                    && document.querySelectorAll('#tags-dropdown-items .tag-checkbox:checked').length === 0;
+            }
+            """
+        )
+
+        expect(tags_label).to_have_text("All Tags")
+        assert page.locator("#tags-dropdown-items .tag-checkbox:checked").count() == 0
+    finally:
+        context.close()
+        chromium.close()
diff --git a/ui_tests/test_group_workspace_initial_documents_fetch.py b/ui_tests/test_group_workspace_initial_documents_fetch.py
new file mode 100644
index 00000000..b4465d51
--- /dev/null
+++ b/ui_tests/test_group_workspace_initial_documents_fetch.py
@@ -0,0 +1,120 @@
+# test_group_workspace_initial_documents_fetch.py
+"""
+UI test for group workspace initial document fetch.
+Version: 0.240.027
+Implemented in: 0.240.027
+
+This test ensures that the first visit to the group workspace loads the active
+group document table without raising the old params ReferenceError or showing a
+bulk-delete confirmation dialog.
+"""
+
+import json
+import os
+from pathlib import Path
+
+import pytest
+from playwright.sync_api import expect
+
+
+BASE_URL = os.getenv("SIMPLECHAT_UI_BASE_URL", "").rstrip("/")
+STORAGE_STATE = os.getenv("SIMPLECHAT_UI_STORAGE_STATE", "")
+
+
+def _fulfill_json(route, payload, status=200):
+    """Fulfill an intercepted route with ``payload`` serialized as a JSON response body."""
+    serialized_payload = json.dumps(payload)
+    route.fulfill(
+        status=status, content_type="application/json", body=serialized_payload
+    )
+
+
+@pytest.mark.ui
+def test_group_workspace_first_visit_loads_documents_without_load_time_errors(playwright):
+    """Check the first /group_workspaces load shows the empty table with no params error or delete dialog."""
+    if not BASE_URL:
+        pytest.skip("Set SIMPLECHAT_UI_BASE_URL to run this UI test.")
+    if not STORAGE_STATE or not Path(STORAGE_STATE).exists():
+        pytest.skip("Set SIMPLECHAT_UI_STORAGE_STATE to a valid authenticated Playwright storage state file.")
+
+    browser = playwright.chromium.launch()
+    context = browser.new_context(
+        storage_state=STORAGE_STATE,
+        viewport={"width": 1440, "height": 900},
+    )
+    page = context.new_page()
+
+    page_errors = []
+    dialog_messages = []
+
+    # Capture uncaught page errors and browser dialogs raised while the page loads.
+    page.on("pageerror", lambda error: page_errors.append(str(error)))
+
+    def handle_dialog(dialog):
+        dialog_messages.append(dialog.message)
+        dialog.dismiss()
+
+    page.on("dialog", handle_dialog)
+
+    # Stub the group list, group document list, and group tag endpoints with canned JSON.
+    page.route(
+        "**/api/groups?page_size=1000",
+        lambda route: _fulfill_json(
+            route,
+            {
+                "groups": [
+                    {
+                        "id": "group-alpha",
+                        "name": "Alpha Team",
+                        "isActive": True,
+                        "userRole": "Owner",
+                        "status": "active",
+                    }
+                ]
+            },
+        ),
+    )
+    page.route(
+        "**/api/group_documents?*",
+        lambda route: _fulfill_json(
+            route,
+            {
+                "documents": [],
+                "page": 1,
+                "page_size": 10,
+                "total_count": 0,
+            },
+        ),
+    )
+    page.route("**/api/group_documents/tags?*", lambda route: _fulfill_json(route, {"tags": []}))
+
+    try:
+        response = page.goto(f"{BASE_URL}/group_workspaces", wait_until="networkidle")
+
+        assert response is not None, "Expected a navigation response when loading /group_workspaces."
+        assert response.ok, f"Expected /group_workspaces to load successfully, got HTTP {response.status}."
+
+        page.wait_for_function(
+            """
+            () => {
+                const tbody = document.querySelector('#group-documents-table tbody');
+                return tbody && tbody.textContent.includes('No documents found in this group.');
+            }
+            """
+        )
+
+        expect(page.locator("#group-documents-table tbody")).to_contain_text(
+            "No documents found in this group."
+        )
+
+        # Only the two known regressions are asserted: the params ReferenceError and the bulk-delete dialog.
+        params_errors = [error for error in page_errors if "params is not defined" in error]
+        delete_dialogs = [
+            message for message in dialog_messages if "delete 0 selected document(s)" in message.lower()
+        ]
+
+        assert not params_errors, f"Unexpected page errors: {params_errors}"
+        assert not delete_dialogs, f"Unexpected delete confirmation dialogs: {delete_dialogs}"
+    finally:
+        context.close()
+        browser.close()
\ No newline at end of file
diff --git a/ui_tests/test_public_workspace_delete_error_toast.py b/ui_tests/test_public_workspace_delete_error_toast.py
new file mode 100644
index 00000000..4a0c8dd4
--- /dev/null
+++ b/ui_tests/test_public_workspace_delete_error_toast.py
@@ -0,0 +1,154 @@
+# test_public_workspace_delete_error_toast.py
+"""
+UI test for public workspace delete error toast.
+Version: 0.240.056
+Implemented in: 0.240.056
+
+This test ensures a failed public document delete shows a Bootstrap toast
+instead of a blocking browser alert dialog.
+"""
+
+import json
+import os
+from pathlib import Path
+from urllib.parse import urlparse
+
+import pytest
+from playwright.sync_api import expect
+
+
+BASE_URL = os.getenv('SIMPLECHAT_UI_BASE_URL', '').rstrip('/')
+STORAGE_STATE = os.getenv('SIMPLECHAT_UI_STORAGE_STATE', '')
+SKIP_RESPONSE_CODES = {401, 403, 404}
+
+
+def _fulfill_json(route, payload, status=200):
+    """Fulfill an intercepted route with ``payload`` serialized as a JSON response body."""
+    serialized_payload = json.dumps(payload)
+    route.fulfill(
+        status=status, content_type='application/json', body=serialized_payload
+    )
+
+
+def _handle_public_workspace_api(route):
+    """Answer the mocked public-workspace API calls with canned JSON.
+
+    Covers the workspace list, the 'public-1' workspace detail, the document
+    list (GET), a failing DELETE of 'doc-1' (HTTP 500), and the tags endpoint.
+    Any other request is passed through with route.continue_().
+
+    Args:
+        route: Playwright route for the intercepted request.
+    """
+    request = route.request
+    method = request.method
+    parsed_url = urlparse(request.url)
+    path = parsed_url.path
+
+    if path == '/api/public_workspaces':
+        # Workspace listing with a single active workspace.
+        workspace = {
+            'id': 'public-1',
+            'name': 'Toast Regression Workspace',
+            'isActive': True,
+            'userRole': 'Owner',
+        }
+        _fulfill_json(route, {'workspaces': [workspace]})
+    elif path == '/api/public_workspaces/public-1':
+        # Detail record for that workspace.
+        workspace_detail = {
+            'id': 'public-1',
+            'name': 'Toast Regression Workspace',
+            'status': 'active',
+            'userRole': 'Owner',
+        }
+        _fulfill_json(route, workspace_detail)
+    elif path == '/api/public_documents' and method == 'GET':
+        # First page of the document list: a single completed document
+        # ('doc-1'), the same id the DELETE branch below responds to.
+        document = {
+            'id': 'doc-1',
+            'file_name': 'Toast Regression Doc.pdf',
+            'title': 'Toast Regression Doc',
+            'status': 'Complete',
+            'percentage_complete': 100,
+            'authors': 'Regression Tester',
+            'version': '1',
+            'number_of_pages': '1',
+            'enhanced_citations': False,
+            'publication_date': '2026-04-03',
+            'keywords': 'toast, delete',
+            'abstract': 'Regression coverage for delete errors.',
+            'tags': [],
+            'document_classification': 'Public',
+        }
+        _fulfill_json(
+            route,
+            {
+                'documents': [document],
+                'page': 1,
+                'page_size': 10,
+                'total_count': 1,
+            },
+        )
+    elif path == '/api/public_documents/doc-1' and method == 'DELETE':
+        # Simulated server-side failure for the delete request, answered
+        # with HTTP 500 and an explicit error message.
+        _fulfill_json(route, {'error': 'Delete failed for regression test.'}, status=500)
+    elif path == '/api/public_workspace_documents/tags':
+        # No tags are defined for the workspace.
+        _fulfill_json(route, {'tags': []})
+    else:
+        # Not one of the mocked endpoints: let the request proceed unmodified.
+        route.continue_()
+
+
+@pytest.mark.ui
+def test_public_workspace_delete_failure_uses_toast(playwright):
+    """Validate that a failed public document delete (mocked HTTP 500) shows a toast, not a browser alert."""
+    if not BASE_URL:
+        pytest.skip('Set SIMPLECHAT_UI_BASE_URL to run this UI test.')
+    if not STORAGE_STATE or not Path(STORAGE_STATE).exists():
+        pytest.skip('Set SIMPLECHAT_UI_STORAGE_STATE to a valid authenticated Playwright storage state file.')
+
+    browser = playwright.chromium.launch()
+    context = browser.new_context(
+        storage_state=STORAGE_STATE,
+        viewport={'width': 1440, 'height': 900},
+    )
+    page = context.new_page()
+    dialogs = []
+
+    def on_dialog(dialog):
+        dialogs.append(dialog.message)
+        dialog.dismiss()
+
+    page.on('dialog', on_dialog)
+    # A single '*' in a Playwright glob stops at '/', so end each pattern with '**' to also
+    # intercept sub-paths such as /api/public_documents/doc-1 (the mocked failing DELETE).
+    page.route('**/api/public_workspaces**', _handle_public_workspace_api)
+    page.route('**/api/public_documents**', _handle_public_workspace_api)
+    page.route('**/api/public_workspace_documents**', _handle_public_workspace_api)
+
+    try:
+        response = page.goto(f'{BASE_URL}/public_workspaces', wait_until='networkidle')
+        assert response is not None, 'Expected a navigation response when loading /public_workspaces.'
+        if response.status in SKIP_RESPONSE_CODES:
+            pytest.skip(f'/public_workspaces returned HTTP {response.status} in this environment.')
+
+        assert response.ok, f'Expected /public_workspaces to load successfully, got HTTP {response.status}.'
+        expect(page.locator('#publicWorkspaceTabContent')).to_be_visible()
+        expect(page.locator('#public-documents-table tbody')).to_contain_text('Toast Regression Doc')
+
+        page.evaluate("() => { window.deletePublicDocument('doc-1'); }")
+        delete_modal = page.locator('#publicDocumentDeleteModal')
+        expect(delete_modal).to_be_visible()
+        delete_modal.get_by_role('button', name='Delete All Versions').click()
+
+        toast = page.locator('#toast-container .toast').last
+        expect(toast).to_be_visible()
+        expect(toast).to_contain_text('Error deleting: Delete failed for regression test.')
+        assert dialogs == [], f'Expected delete failures to avoid browser alerts. Saw: {dialogs}'
+    finally:
+        context.close()
+        browser.close()
\ No newline at end of file
diff --git a/ui_tests/test_workspace_family_document_revision_delete_modal.py b/ui_tests/test_workspace_family_document_revision_delete_modal.py
new file mode 100644
index 00000000..73c6644c
--- /dev/null
+++ b/ui_tests/test_workspace_family_document_revision_delete_modal.py
@@ -0,0 +1,193 @@
+# test_workspace_family_document_revision_delete_modal.py
+"""
+UI test for workspace-family document revision delete modals.
+Version: 0.240.056
+Implemented in: 0.240.056
+
+This test ensures the personal, group, and public workspace pages use a
+Bootstrap revision delete modal instead of a native browser confirm dialog,
+and fail closed with user-visible feedback if the modal wiring is unavailable.
+"""
+
+import os
+from pathlib import Path
+
+import pytest
+from playwright.sync_api import expect
+
+
+BASE_URL = os.getenv("SIMPLECHAT_UI_BASE_URL", "").rstrip("/")
+STORAGE_STATE = os.getenv("SIMPLECHAT_UI_STORAGE_STATE", "")
+SKIP_RESPONSE_CODES = {401, 403, 404}
+DELETE_MODAL_UNAVAILABLE_MESSAGE = "Delete confirmation dialog is unavailable. Refresh the page and try again."
+
+
+def _require_ui_env():  # skips the calling test when the UI environment is not configured
+    if not BASE_URL:
+        pytest.skip("Set SIMPLECHAT_UI_BASE_URL to run this UI test.")
+    if not (STORAGE_STATE and Path(STORAGE_STATE).exists()):
+        pytest.skip("Set SIMPLECHAT_UI_STORAGE_STATE to a valid authenticated Playwright storage state file.")
+
+
+def _assert_delete_modal(page, page_path, ready_selector, trigger_script, modal_selector):
+    """Check that triggering a delete on page_path opens the revision delete modal.
+
+    Returns False when the page responds with a status in SKIP_RESPONSE_CODES, else True.
+    """
+    seen_dialogs = []
+
+    def record_and_dismiss(dialog):
+        seen_dialogs.append(dialog.message)
+        dialog.dismiss()
+
+    page.on("dialog", record_and_dismiss)
+    response = page.goto(f"{BASE_URL}{page_path}", wait_until="networkidle")
+    assert response is not None, f"Expected a navigation response when loading {page_path}."
+    if response.status in SKIP_RESPONSE_CODES:
+        return False
+    assert response.ok, f"Expected {page_path} to load successfully, got HTTP {response.status}."
+    expect(page.locator(ready_selector)).to_be_visible()
+    page.evaluate(trigger_script)
+
+    modal = page.locator(modal_selector)
+    expect(modal).to_be_visible()
+    for button_name in ("Delete Current Version", "Delete All Versions"):
+        expect(modal.get_by_role("button", name=button_name)).to_be_visible()
+    assert seen_dialogs == [], f"Expected {page_path} to use a Bootstrap modal instead of a browser dialog. Saw: {seen_dialogs}"
+
+    modal.get_by_role("button", name="Cancel").click()
+    expect(modal).to_be_hidden()
+    return True
+
+
+def _assert_delete_modal_fails_closed(page, page_path, ready_selector, modal_remove_script, trigger_script):
+    """Check a delete on page_path with its modal removed shows the unavailable message and makes no fetch call."""
+    seen_dialogs = []
+
+    def record_and_dismiss(dialog):
+        seen_dialogs.append(dialog.message)
+        dialog.dismiss()
+
+    page.on("dialog", record_and_dismiss)
+    response = page.goto(f"{BASE_URL}{page_path}", wait_until="networkidle")
+    assert response is not None, f"Expected a navigation response when loading {page_path}."
+    if response.status in SKIP_RESPONSE_CODES:
+        # Page is unavailable in this environment; report it as not checked.
+        return False
+    assert response.ok, f"Expected {page_path} to load successfully, got HTTP {response.status}."
+    expect(page.locator(ready_selector)).to_be_visible()
+
+    # Wrap window.fetch so every fetch call made from here on (not only deletes) is counted.
+    page.evaluate(
+        """
+        () => {
+            window.__deleteRequestCount = 0;
+            const originalFetch = window.fetch.bind(window);
+            window.fetch = (...args) => {
+                window.__deleteRequestCount += 1;
+                return originalFetch(...args);
+            };
+        }
+        """
+    )
+    page.evaluate(modal_remove_script)
+    page.evaluate(trigger_script)
+
+    expect(page.get_by_text(DELETE_MODAL_UNAVAILABLE_MESSAGE)).to_be_visible()
+    assert seen_dialogs == [], f"Expected {page_path} to fail closed without opening a browser dialog. Saw: {seen_dialogs}"
+    assert page.evaluate("() => window.__deleteRequestCount") == 0
+    return True
+
+
+@pytest.mark.ui
+def test_workspace_family_document_revision_delete_modal(playwright):
+    """Check the personal, group, and public workspace pages open a revision-choice delete modal."""
+    _require_ui_env()
+
+    # Each scenario: (page path, ready selector, delete trigger script, modal selector).
+    scenarios = [
+        (
+            "/workspace",
+            "#documents-tab",
+            "() => { window.deleteDocument('doc-1'); }",
+            "#documentDeleteModal",
+        ),
+        (
+            "/group_workspaces",
+            "#groupWorkspaceTabContent",
+            "() => { userRoleInActiveGroup = 'Owner'; window.deleteGroupDocument('doc-1'); }",
+            "#groupDocumentDeleteModal",
+        ),
+        (
+            "/public_workspaces",
+            "#publicWorkspaceTabContent",
+            "() => { window.deletePublicDocument('doc-1'); }",
+            "#publicDocumentDeleteModal",
+        ),
+    ]
+
+    chromium = playwright.chromium.launch()
+    context = chromium.new_context(storage_state=STORAGE_STATE, viewport={"width": 1440, "height": 900})
+    pages_checked = 0
+    try:
+        for scenario in scenarios:
+            page = context.new_page()
+            try:
+                if _assert_delete_modal(page, *scenario):
+                    pages_checked += 1
+            finally:
+                page.close()
+
+        # Every page answered with a skip status, so nothing was actually verified.
+        if pages_checked == 0:
+            pytest.skip("No workspace-family pages were available in this environment.")
+    finally:
+        context.close()
+        chromium.close()
+
+
+@pytest.mark.ui
+def test_workspace_family_document_revision_delete_modal_fails_closed_when_modal_missing(playwright):
+    """Check the workspace-family delete flows fail closed once their delete modal is removed from the page."""
+    _require_ui_env()
+
+    # Each scenario: (page path, ready selector, modal removal script, delete trigger script).
+    scenarios = [
+        (
+            "/workspace",
+            "#documents-tab",
+            "() => { document.getElementById('documentDeleteModal')?.remove(); }",
+            "() => window.deleteDocument('doc-1')",
+        ),
+        (
+            "/group_workspaces",
+            "#groupWorkspaceTabContent",
+            "() => { document.getElementById('groupDocumentDeleteModal')?.remove(); }",
+            "() => { userRoleInActiveGroup = 'Owner'; return window.deleteGroupDocument('doc-1'); }",
+        ),
+        (
+            "/public_workspaces",
+            "#publicWorkspaceTabContent",
+            "() => { document.getElementById('publicDocumentDeleteModal')?.remove(); }",
+            "() => window.deletePublicDocument('doc-1')",
+        ),
+    ]
+
+    chromium = playwright.chromium.launch()
+    context = chromium.new_context(storage_state=STORAGE_STATE, viewport={"width": 1440, "height": 900})
+    pages_checked = 0
+    try:
+        for scenario in scenarios:
+            page = context.new_page()
+            try:
+                if _assert_delete_modal_fails_closed(page, *scenario):
+                    pages_checked += 1
+            finally:
+                page.close()
+
+        # Every page answered with a skip status, so nothing was actually verified.
+        if pages_checked == 0:
+            pytest.skip("No workspace-family pages were available in this environment.")
+    finally:
+        context.close()
+        chromium.close()
\ No newline at end of file