From 0625e66ca96a83f3e088390844e65fb989c3574f Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Sat, 13 Dec 2025 08:27:11 +0000
Subject: [PATCH 1/4] Initial plan


From 86c69e93d743ad8e2cab31ef3275f344d514d4c4 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Sat, 13 Dec 2025 08:34:13 +0000
Subject: [PATCH 2/4] Fix duplicate citations and malformed brackets in Azure
 AI responses

- Strip context.citations and context.all_retrieved_documents from SSE JSON
  chunks to prevent OpenWebUI from displaying duplicate unfiltered citations
- Only emit filtered citation events for documents referenced in content
- Add _strip_context_from_response method for streaming and non-streaming paths
- Add _clean_malformed_brackets method to fix bracket patterns from
  Azure AI followup generation (e.g., [[[doc1]](url)]] -> [[doc1]](url))
- Remove empty brackets [] from response content

Co-authored-by: owndev <69784886+owndev@users.noreply.github.com>
---
 pipelines/azure/azure_ai_foundry.py | 213 ++++++++++++++++++++--------
 1 file changed, 156 insertions(+), 57 deletions(-)

diff --git a/pipelines/azure/azure_ai_foundry.py b/pipelines/azure/azure_ai_foundry.py
index 0a87638..794d106 100644
--- a/pipelines/azure/azure_ai_foundry.py
+++ b/pipelines/azure/azure_ai_foundry.py
@@ -149,6 +149,13 @@ class Pipe:
     # Regex pattern for matching [docX] citation references
     DOC_REF_PATTERN = re.compile(r"\[doc(\d+)\]")
 
+    # Regex patterns for cleaning malformed bracket patterns from followup generation
+    # These can occur when Azure AI followup generation doesn't format citations properly
+    # Pattern 1: Extra brackets around valid links [+[[docX]](url)]+ -> [[docX]](url)
+    EXTRA_BRACKETS_PATTERN = re.compile(r"\[+(\[\[doc\d+\]\]\([^)]+\))\]+")
+    # Pattern 2: Empty brackets [] -> (removed)
+    EMPTY_BRACKETS_PATTERN = re.compile(r"\[\]")
+
     # Environment variables for API key, endpoint, and optional model
     class Valves(BaseModel):
         # Custom prefix for pipeline display name
@@ -802,6 +809,80 @@ def _build_citation_urls_map(
 
         return citation_urls
 
+    def _strip_context_from_response(
+        self, response_data: Dict[str, Any]
+    ) -> Dict[str, Any]:
+        """
+        Strip citations and all_retrieved_documents from the response context.
+
+        This prevents OpenWebUI from displaying duplicate citations from both
+        the raw SSE JSON and the emitted citation events. The citation events
+        are filtered to only include referenced documents, but the raw context
+        would show all documents.
+
+        Args:
+            response_data: Response data dict (modified in-place)
+
+        Returns:
+            The modified response data with context stripped
+        """
+        if not isinstance(response_data, dict) or "choices" not in response_data:
+            return response_data
+
+        for choice in response_data.get("choices", []):
+            # Handle delta (streaming) context
+            if "delta" in choice and isinstance(choice["delta"], dict):
+                context = choice["delta"].get("context")
+                if context and isinstance(context, dict):
+                    context.pop("citations", None)
+                    context.pop("all_retrieved_documents", None)
+                    # Remove empty context
+                    if not context:
+                        del choice["delta"]["context"]
+
+            # Handle message (non-streaming) context
+            if "message" in choice and isinstance(choice["message"], dict):
+                context = choice["message"].get("context")
+                if context and isinstance(context, dict):
+                    context.pop("citations", None)
+                    context.pop("all_retrieved_documents", None)
+                    # Remove empty context
+                    if not context:
+                        del choice["message"]["context"]
+
+        return response_data
+
+    def _clean_malformed_brackets(self, content: str) -> str:
+        """
+        Clean up malformed bracket patterns from followup generation.
+
+        Azure AI followup generation can produce malformed citations like:
+        - [[[doc3]](url)]] - extra brackets around link
+        - [] - empty brackets
+        - [[[doc1]](url)] - inconsistent bracket counts
+
+        This method normalizes these patterns to ensure proper markdown rendering.
+
+        Args:
+            content: The response content to clean
+
+        Returns:
+            Content with malformed brackets cleaned up
+        """
+        if not content:
+            return content
+
+        result = content
+
+        # Fix extra outer brackets: [[[doc1]](url)]] -> [[doc1]](url)
+        # Uses capture group to preserve the valid inner markdown link
+        result = self.EXTRA_BRACKETS_PATTERN.sub(r"\1", result)
+
+        # Remove empty brackets
+        result = self.EMPTY_BRACKETS_PATTERN.sub("", result)
+
+        return result
+
     def _format_citation_link(self, doc_num: int, url: Optional[str] = None) -> str:
         """
         Format a markdown link for a [docX] reference.
@@ -957,13 +1038,14 @@ async def _emit_openwebui_citation_events(
     def enhance_azure_search_response(self, response: Dict[str, Any]) -> Dict[str, Any]:
         """
         Enhance Azure AI Search responses by converting [docX] references to markdown links.
+        Also cleans up malformed brackets and strips context to prevent duplicate citations.
         Modifies the response in-place and returns it.
 
         Args:
             response: The original response from Azure AI (modified in-place)
 
         Returns:
-            The enhanced response with markdown links for citations
+            The enhanced response with markdown links for citations and cleaned content
         """
         if not isinstance(response, dict):
             return response
@@ -988,9 +1070,17 @@ def enhance_azure_search_response(self, response: Dict[str, Any]) -> Dict[str, A
             # Convert [docX] references to markdown links
             enhanced_content = self._convert_doc_refs_to_links(content, citations)
 
+            # Clean up malformed brackets from followup generation
+            if "[[" in enhanced_content or "[]" in enhanced_content:
+                enhanced_content = self._clean_malformed_brackets(enhanced_content)
+
             # Update the message content
             message["content"] = enhanced_content
 
+            # Strip context to prevent OpenWebUI from showing duplicate citations
+            # The citations are emitted separately via _emit_openwebui_citation_events
+            self._strip_context_from_response(response)
+
             return response
 
         except Exception as e:
@@ -1334,38 +1424,32 @@ def replace_ref(m, urls_map):
                     except Exception as parse_error:
                         log.debug(f"Error parsing citations from chunk: {parse_error}")
 
-                # Convert [docX] references to markdown links in the chunk content
-                # This creates clickable links to source documents in streaming responses
+                # Process SSE chunk to:
+                # 1. Strip context (citations, all_retrieved_documents) to prevent duplicate display
+                # 2. Convert [docX] references to markdown links
+                # 3. Clean up malformed bracket patterns from followup generation
                 chunk_modified = False
-                if "[doc" in chunk_str and citation_urls:
-                    try:
-                        # Parse and modify each SSE data line
-                        modified_lines = []
-                        chunk_lines = chunk_str.split("\n")
+                try:
+                    modified_lines = []
+                    chunk_lines = chunk_str.split("\n")
 
-                        for line in chunk_lines:
-                            # Early exit: skip lines without [doc references
-                            if "[doc" not in line:
-                                modified_lines.append(line)
-                                continue
+                    for line in chunk_lines:
+                        # Process only SSE data lines
+                        if line.startswith("data: ") and line.strip() != "data: [DONE]":
+                            json_str = line[6:].strip()
+                            if json_str and json_str != "[DONE]":
+                                try:
+                                    data = json.loads(json_str)
+                                    if isinstance(data, dict):
+                                        line_modified = False
 
-                            # Process only SSE data lines
-                            if (
-                                line.startswith("data: ")
-                                and line.strip() != "data: [DONE]"
-                            ):
-                                json_str = line[6:].strip()
-                                if json_str and json_str != "[DONE]":
-                                    try:
-                                        data = json.loads(json_str)
-                                        if (
-                                            isinstance(data, dict)
-                                            and "choices" in data
-                                            and data["choices"]
-                                        ):
-                                            line_modified = False
-                                            # Process choices until we find and modify content
-                                            for choice in data["choices"]:
+                                        # Strip context to prevent OpenWebUI from showing unfiltered citations
+                                        if "choices" in data:
+                                            self._strip_context_from_response(data)
+                                            line_modified = True
+
+                                            # Process content in choices
+                                            for choice in data.get("choices", []):
                                                 if (
                                                     "delta" in choice
                                                     and "content" in choice["delta"]
@@ -1373,50 +1457,65 @@ def replace_ref(m, urls_map):
                                                     content_val = choice["delta"][
                                                         "content"
                                                     ]
-                                                    if "[doc" in content_val:
-                                                        # Convert [docX] to markdown link using pre-compiled pattern
-                                                        # Use lambda to pass citation_urls to pre-defined function
-                                                        choice["delta"]["content"] = (
+                                                    modified_content = content_val
+
+                                                    # Convert [docX] to markdown links
+                                                    if (
+                                                        "[doc" in content_val
+                                                        and citation_urls
+                                                    ):
+                                                        modified_content = (
                                                             self.DOC_REF_PATTERN.sub(
                                                                 lambda m: replace_ref(
                                                                     m, citation_urls
                                                                 ),
-                                                                content_val,
+                                                                modified_content,
                                                             )
                                                         )
+
+                                                    # Clean malformed brackets from followup generation
+                                                    if (
+                                                        "[[" in modified_content
+                                                        or "[]" in modified_content
+                                                    ):
+                                                        modified_content = self._clean_malformed_brackets(
+                                                            modified_content
+                                                        )
+
+                                                    if modified_content != content_val:
+                                                        choice["delta"]["content"] = (
+                                                            modified_content
+                                                        )
                                                         line_modified = True
-                                                        # Early exit: content found and modified
-                                                        break
 
-                                            if line_modified:
-                                                modified_lines.append(
-                                                    f"data: {json.dumps(data)}"
-                                                )
-                                                chunk_modified = True
-                                            else:
-                                                modified_lines.append(line)
+                                        if line_modified:
+                                            modified_lines.append(
+                                                f"data: {json.dumps(data)}"
+                                            )
+                                            chunk_modified = True
                                         else:
                                             modified_lines.append(line)
-                                    except json.JSONDecodeError:
+                                    else:
                                         modified_lines.append(line)
-                                else:
+                                except json.JSONDecodeError:
                                     modified_lines.append(line)
                             else:
                                 modified_lines.append(line)
+                        else:
+                            modified_lines.append(line)
 
-                        # Reconstruct the chunk only if something was modified
-                        if chunk_modified:
-                            modified_chunk_str = "\n".join(modified_lines)
-                            log.debug(
-                                "Converted [docX] references to markdown links in streaming chunk"
-                            )
-                            chunk = modified_chunk_str.encode("utf-8")
-
-                    except Exception as convert_err:
+                    # Reconstruct the chunk if modified
+                    if chunk_modified:
+                        chunk_str = "\n".join(modified_lines)
+                        chunk = chunk_str.encode("utf-8")
                         log.debug(
-                            f"Error converting [docX] to markdown links: {convert_err}"
+                            "Processed streaming chunk: stripped context, converted links, cleaned brackets"
                         )
-                        # Fall through to yield original chunk
+
+                except Exception as process_err:
+                    log.debug(f"Error processing streaming chunk: {process_err}")
+                    # Fall through to yield original chunk
+                    # Fall through to yield original chunk
 
                 # Yield the (possibly modified) chunk
                 yield chunk

From 7d6778116f8092a55a6da88fcbf6dfb74cbfc998 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Sat, 13 Dec 2025 08:36:40 +0000
Subject: [PATCH 3/4] Address code review feedback: remove duplicate comment,
 simplify assignment

Co-authored-by: owndev <69784886+owndev@users.noreply.github.com>
---
 pipelines/azure/azure_ai_foundry.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/pipelines/azure/azure_ai_foundry.py b/pipelines/azure/azure_ai_foundry.py
index 794d106..2dddae3 100644
--- a/pipelines/azure/azure_ai_foundry.py
+++ b/pipelines/azure/azure_ai_foundry.py
@@ -1515,7 +1515,6 @@ def replace_ref(m, urls_map):
                 except Exception as process_err:
                     log.debug(f"Error processing streaming chunk: {process_err}")
                     # Fall through to yield original chunk
-                    # Fall through to yield original chunk
 
                 # Yield the (possibly modified) chunk
                 yield chunk

From f5d80825fa4b78d3951429653113337c06b68719 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Sat, 13 Dec 2025 08:45:07 +0000
Subject: [PATCH 4/4] Fix duplicate URL in markdown links during followup
 generation

- Add negative lookahead to DOC_REF_PATTERN to skip [docX] already followed by (url)
- Add DUPLICATE_URL_PATTERN to clean [[docX]](url)(url) -> [[docX]](url)
- Update cleanup condition to also check for '](' pattern

Co-authored-by: owndev <69784886+owndev@users.noreply.github.com>
---
 pipelines/azure/azure_ai_foundry.py | 17 +++++++++++++++--
 1 file changed, 15 insertions(+), 2 deletions(-)

diff --git a/pipelines/azure/azure_ai_foundry.py b/pipelines/azure/azure_ai_foundry.py
index 2dddae3..bdaa3dd 100644
--- a/pipelines/azure/azure_ai_foundry.py
+++ b/pipelines/azure/azure_ai_foundry.py
@@ -147,7 +147,8 @@ async def cleanup_response(
 
 class Pipe:
     # Regex pattern for matching [docX] citation references
-    DOC_REF_PATTERN = re.compile(r"\[doc(\d+)\]")
+    # Uses negative lookahead to avoid matching [docX] already followed by (url)
+    DOC_REF_PATTERN = re.compile(r"\[doc(\d+)\](?!\()")
 
     # Regex patterns for cleaning malformed bracket patterns from followup generation
     # These can occur when Azure AI followup generation doesn't format citations properly
@@ -155,6 +156,8 @@ class Pipe:
     EXTRA_BRACKETS_PATTERN = re.compile(r"\[+(\[\[doc\d+\]\]\([^)]+\))\]+")
     # Pattern 2: Empty brackets [] -> (removed)
     EMPTY_BRACKETS_PATTERN = re.compile(r"\[\]")
+    # Pattern 3: Duplicate URL after markdown link [[docX]](url)(url) -> [[docX]](url)
+    DUPLICATE_URL_PATTERN = re.compile(r"(\[\[doc\d+\]\]\([^)]+\))\([^)]+\)")
 
     # Environment variables for API key, endpoint, and optional model
     class Valves(BaseModel):
@@ -860,6 +863,7 @@ def _clean_malformed_brackets(self, content: str) -> str:
         - [[[doc3]](url)]] - extra brackets around link
         - [] - empty brackets
         - [[[doc1]](url)] - inconsistent bracket counts
+        - [[doc2]](url)(url) - duplicate URL after markdown link
 
         This method normalizes these patterns to ensure proper markdown rendering.
 
@@ -881,6 +885,10 @@ def _clean_malformed_brackets(self, content: str) -> str:
         # Remove empty brackets
         result = self.EMPTY_BRACKETS_PATTERN.sub("", result)
 
+        # Remove duplicate URLs: [[doc1]](url)(url) -> [[doc1]](url)
+        # This can occur when Azure AI adds a URL that we also added during conversion
+        result = self.DUPLICATE_URL_PATTERN.sub(r"\1", result)
+
         return result
 
     def _format_citation_link(self, doc_num: int, url: Optional[str] = None) -> str:
@@ -1071,7 +1079,11 @@ def enhance_azure_search_response(self, response: Dict[str, Any]) -> Dict[str, A
             enhanced_content = self._convert_doc_refs_to_links(content, citations)
 
             # Clean up malformed brackets from followup generation
-            if "[[" in enhanced_content or "[]" in enhanced_content:
+            if (
+                "[[" in enhanced_content
+                or "[]" in enhanced_content
+                or "](" in enhanced_content
+            ):
                 enhanced_content = self._clean_malformed_brackets(enhanced_content)
 
             # Update the message content
@@ -1477,6 +1489,7 @@ def replace_ref(m, urls_map):
                                                     if (
                                                         "[[" in modified_content
                                                         or "[]" in modified_content
+                                                        or "](" in modified_content
                                                     ):
                                                         modified_content = self._clean_malformed_brackets(
                                                             modified_content