From 5bc6cce779bbe56e59b1785e9e3c669baa73baa9 Mon Sep 17 00:00:00 2001
From: Pavel Tisnovsky <ptisnovs@redhat.com>
Date: Sun, 14 Dec 2025 11:47:37 +0100
Subject: [PATCH 1/5] Docstrings for common.py and endpoints.py

---
 src/utils/common.py    |  15 ++++++
 src/utils/endpoints.py | 113 ++++++++++++++++++++++++++++++++++++++---
 2 files changed, 120 insertions(+), 8 deletions(-)

diff --git a/src/utils/common.py b/src/utils/common.py
index 744a6b503..7129d3ec6 100644
--- a/src/utils/common.py
+++ b/src/utils/common.py
@@ -69,6 +69,14 @@ async def _register_mcp_toolgroups_async(
     This function performs network calls against the provided async client and does not
     catch exceptions raised by those calls — any exceptions from the client (e.g., RPC
     or HTTP errors) will propagate to the caller.
+
+    Parameters:
+        client (AsyncLlamaStackClient): The LlamaStack async client used to
+                                        query and register toolgroups.
+        mcp_servers (List[ModelContextProtocolServer]): MCP server descriptors
+                                                        to ensure are registered.
+        logger (Logger): Logger used for debug messages about registration
+                         progress.
     """
     # Get registered tools
     registered_toolgroups = await client.toolgroups.list()
@@ -101,6 +109,10 @@ def run_once_async(func: Callable) -> Callable:
     Later invocations return/await the same Task, receiving the same result or
     propagated exception. Requires an active running event loop when the
     wrapped function is first called.
+
+    Returns:
+        Callable: An async wrapper that runs `func` once as a shared Task and
+                  returns its result (or re-raises its exception) on every call.
     """
     task = None
 
@@ -114,6 +126,9 @@ async def wrapper(*args: Any, **kwargs: Any) -> Any:
         Subsequent calls return the same awaited task result. Exceptions raised
         by the task propagate to callers. Requires an active running event loop
         when first called.
+
+        Returns:
+            The awaited result of the wrapped coroutine.
         """
         nonlocal task
         if task is None:
diff --git a/src/utils/endpoints.py b/src/utils/endpoints.py
index b6d5ff735..127bcbf01 100644
--- a/src/utils/endpoints.py
+++ b/src/utils/endpoints.py
@@ -205,7 +205,17 @@ def get_system_prompt(query_request: QueryRequest, config: AppConfig) -> str:
 
 
 def get_topic_summary_system_prompt(config: AppConfig) -> str:
-    """Get the topic summary system prompt."""
+    """
+    Get the topic summary system prompt.
+
+    Parameters:
+        config (AppConfig): Application configuration from which to read
+                            customization/profile settings.
+
+    Returns:
+        str: The topic summary system prompt from the active custom profile if
+             set, otherwise the default prompt.
+    """
     # profile takes precedence for setting prompt
     if (
         config.customization is not None
@@ -223,8 +233,9 @@ def validate_model_provider_override(
 ) -> None:
     """Validate whether model/provider overrides are allowed by RBAC.
 
-    Raises HTTP 403 if the request includes model or provider and the caller
-    lacks Action.MODEL_OVERRIDE permission.
+    Raises:
+        HTTP 403 if the request includes model or provider and the caller
+        lacks Action.MODEL_OVERRIDE permission.
     """
     if (query_request.model is not None or query_request.provider is not None) and (
         Action.MODEL_OVERRIDE not in authorized_actions
@@ -242,7 +253,24 @@ def store_conversation_into_cache(
     _skip_userid_check: bool,
     topic_summary: str | None,
 ) -> None:
-    """Store one part of conversation into conversation history cache."""
+    """
+    Store one part of conversation into conversation history cache.
+
+    If a conversation cache type is configured but the cache instance is not
+    initialized, the function logs a warning and returns without persisting
+    anything.
+
+    Parameters:
+        config (AppConfig): Application configuration that may contain
+                            conversation cache settings and instance.
+        user_id (str): Owner identifier used as the cache key.
+        conversation_id (str): Conversation identifier used as the cache key.
+        cache_entry (CacheEntry): Entry to insert or append to the conversation history.
+        _skip_userid_check (bool): When true, bypasses enforcing that the cache
+                                   operation must match the user id.
+        topic_summary (str | None): Optional topic summary to store alongside
+                                    the conversation; ignored if None or empty.
+    """
     if config.conversation_cache_configuration.type is not None:
         cache = config.conversation_cache
         if cache is None:
@@ -366,10 +394,12 @@ async def get_temp_agent(
     This function creates a new agent without persistence, shields, or tools.
     Useful for temporary operations or one-off queries, such as validating a
     question or generating a summary.
-    Args:
+
+    Parameters:
         client: The AsyncLlamaStackClient to use for the request.
         model_id: The ID of the model to use.
         system_prompt: The system prompt/instructions for the agent.
+
     Returns:
         tuple[AsyncAgent, str]: A tuple containing the agent and session_id.
     """
@@ -412,7 +442,23 @@ def create_rag_chunks_dict(summary: TurnSummary) -> list[dict[str, Any]]:
 def _process_http_source(
     src: str, doc_urls: set[str]
 ) -> tuple[AnyUrl | None, str] | None:
-    """Process HTTP source and return (doc_url, doc_title) tuple."""
+    """
+    Process HTTP source and return (doc_url, doc_title) tuple.
+
+    Parameters:
+        src (str): The source URL string to process.
+        doc_urls (set[str]): Set of already-seen source strings; the function
+                             will add `src` to this set when it is new.
+
+    Returns:
+        tuple[AnyUrl | None, str] | None: A tuple (validated_url, doc_title)
+            when `src` was not previously seen:
+            - `validated_url`: an `AnyUrl` instance if `src` is a valid URL, or
+              `None` if validation failed.
+            - `doc_title`: the last path segment of the URL or `src` if no path
+              segment is present.
+        Returns `None` if `src` was already present in `doc_urls`.
+    """
     if src not in doc_urls:
         doc_urls.add(src)
         try:
@@ -433,7 +479,29 @@ def _process_document_id(
     metas_by_id: dict[str, dict[str, Any]],
     metadata_map: dict[str, Any] | None,
 ) -> tuple[AnyUrl | None, str] | None:
-    """Process document ID and return (doc_url, doc_title) tuple."""
+    """
+    Process document ID and return (doc_url, doc_title) tuple.
+
+    Parameters:
+        src (str): Document identifier to process.
+        doc_ids (set[str]): Set of already-seen document IDs; the function adds `src` to this set.
+        doc_urls (set[str]): Set of already-seen document URLs; the function
+                             adds discovered URLs to this set to avoid duplicates.
+        metas_by_id (dict[str, dict[str, Any]]): Mapping of document IDs to
+                                                 metadata dicts that may
+                                                 contain `docs_url` and
+                                                 `title`.
+        metadata_map (dict[str, Any] | None): If provided (truthy), indicates
+                                              metadata is available and enables
+                                              metadata lookup; when falsy,
+                                              metadata lookup is skipped.
+
+    Returns:
+        tuple[AnyUrl | None, str] | None: `(validated_url, doc_title)` where
+        `validated_url` is a validated `AnyUrl` or `None` and `doc_title` is
+        the chosen title string; returns `None` if the `src` or its URL was
+        already processed.
+    """
     if src in doc_ids:
         return None
     doc_ids.add(src)
@@ -500,6 +568,17 @@ def _process_rag_chunks_for_documents(
     Process RAG chunks and return a list of (doc_url, doc_title) tuples.
 
     This is the core logic shared between both return formats.
+
+    Parameters:
+        rag_chunks (list): Iterable of RAG chunk objects; each chunk must
+            provide a `source` attribute (e.g., an HTTP URL or a document ID).
+        metadata_map (dict[str, Any] | None): Optional mapping of document IDs
+            to metadata dictionaries used to resolve titles and document URLs.
+
+    Returns:
+        list[tuple[AnyUrl | None, str]]: Ordered list of tuples where the first
+        element is a validated URL object or `None` (if no URL is available)
+        and the second element is the document title.
     """
     doc_urls: set[str] = set()
     doc_ids: set[str] = set()
@@ -547,7 +626,7 @@ def create_referenced_documents(
     optional metadata enrichment, deduplication, and proper URL handling. It can return
     either ReferencedDocument objects (for query endpoint) or dictionaries (for streaming).
 
-    Args:
+    Parameters:
         rag_chunks: List of RAG chunks with source information
         metadata_map: Optional mapping containing metadata about referenced documents
         return_dict_format: If True, returns list of dicts; if False, returns list of
@@ -580,6 +659,16 @@ def create_referenced_documents_with_metadata(
     Create referenced documents from RAG chunks with metadata enrichment for streaming.
 
     This function now returns ReferencedDocument objects for consistency with the query endpoint.
+
+    Parameters:
+        summary (TurnSummary): Summary object containing `rag_chunks` to be processed.
+        metadata_map (dict[str, Any]): Metadata keyed by document id used to
+                                       derive or enrich document `doc_url` and `doc_title`.
+
+    Returns:
+        list[ReferencedDocument]: ReferencedDocument objects with `doc_url` and
+        `doc_title` populated; `doc_url` may be `None` if no valid URL could be
+        determined.
     """
     document_entries = _process_rag_chunks_for_documents(
         summary.rag_chunks, metadata_map
@@ -598,6 +687,14 @@ def create_referenced_documents_from_chunks(
 
     This is a backward compatibility wrapper around the unified
     create_referenced_documents function.
+
+    Parameters:
+        rag_chunks (list): List of RAG chunk entries containing source and metadata information.
+
+    Returns:
+        list[ReferencedDocument]: ReferencedDocument instances created from the
+        chunks; each contains `doc_url` (validated URL or `None`) and
+        `doc_title`.
     """
     document_entries = _process_rag_chunks_for_documents(rag_chunks)
     return [

From d171fcdd286198f3ad7aa23be1e1283138dbceb5 Mon Sep 17 00:00:00 2001
From: Pavel Tisnovsky <ptisnovs@redhat.com>
Date: Sun, 14 Dec 2025 11:55:32 +0100
Subject: [PATCH 2/5] Docstrings updated in llama_stack_version.py and
 mcp_headers.py

---
 src/utils/endpoints.py           | 4 ++--
 src/utils/llama_stack_version.py | 4 ++++
 src/utils/mcp_headers.py         | 4 ++--
 3 files changed, 8 insertions(+), 4 deletions(-)

diff --git a/src/utils/endpoints.py b/src/utils/endpoints.py
index 127bcbf01..372e3b4ea 100644
--- a/src/utils/endpoints.py
+++ b/src/utils/endpoints.py
@@ -234,8 +234,8 @@ def validate_model_provider_override(
     """Validate whether model/provider overrides are allowed by RBAC.
 
     Raises:
-        HTTP 403 if the request includes model or provider and the caller
-        lacks Action.MODEL_OVERRIDE permission.
+        HTTPException: HTTP 403 if the request includes model or provider and
+            the caller lacks Action.MODEL_OVERRIDE permission.
     """
     if (query_request.model is not None or query_request.provider is not None) and (
         Action.MODEL_OVERRIDE not in authorized_actions
diff --git a/src/utils/llama_stack_version.py b/src/utils/llama_stack_version.py
index 4352b1d45..7ac543bfc 100644
--- a/src/utils/llama_stack_version.py
+++ b/src/utils/llama_stack_version.py
@@ -31,6 +31,10 @@ async def check_llama_stack_version(
     and maximal supported versions. Raises
     InvalidLlamaStackVersionException if the detected version is
     outside the supported range.
+
+    Raises:
+        InvalidLlamaStackVersionException: If the detected version is outside
+            the supported range or cannot be parsed.
     """
     version_info = await client.inspect.version()
     compare_versions(
diff --git a/src/utils/mcp_headers.py b/src/utils/mcp_headers.py
index 52ac73f93..46bd0d5cd 100644
--- a/src/utils/mcp_headers.py
+++ b/src/utils/mcp_headers.py
@@ -17,7 +17,7 @@ async def mcp_headers_dependency(request: Request) -> dict[str, dict[str, str]]:
 
     mcp headers is a json dictionary or mcp url paths and their respective headers
 
-    Args:
+    Parameters:
         request (Request): The FastAPI request object.
 
     Returns:
@@ -32,7 +32,7 @@ def extract_mcp_headers(request: Request) -> dict[str, dict[str, str]]:
     If the header is missing, contains invalid JSON, or the decoded
     value is not a dictionary, an empty dictionary is returned.
 
-    Args:
+    Parameters:
         request: The FastAPI request object
 
     Returns:

From 72717ad6fe7a7394274368cba59fa5a9ee5fb811 Mon Sep 17 00:00:00 2001
From: Pavel Tisnovsky <ptisnovs@redhat.com>
Date: Sun, 14 Dec 2025 12:00:53 +0100
Subject: [PATCH 3/5] Docstrings for quota.py and responses.py

---
 src/utils/quota.py     | 4 ++--
 src/utils/responses.py | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/utils/quota.py b/src/utils/quota.py
index d7fcc7a15..a08b37741 100644
--- a/src/utils/quota.py
+++ b/src/utils/quota.py
@@ -19,7 +19,7 @@ def consume_tokens(
 ) -> None:
     """Consume tokens from cluster and/or user quotas.
 
-    Args:
+    Parameters:
         quota_limiters: List of quota limiter instances to consume tokens from.
         user_id: Identifier of the user consuming tokens.
         input_tokens: Number of input tokens to consume.
@@ -40,7 +40,7 @@ def consume_tokens(
 def check_tokens_available(quota_limiters: list[QuotaLimiter], user_id: str) -> None:
     """Check if tokens are available for user.
 
-    Args:
+    Parameters:
         quota_limiters: List of quota limiter instances to check.
         user_id: Identifier of the user to check quota for.
 
diff --git a/src/utils/responses.py b/src/utils/responses.py
index e430b8eeb..88437af07 100644
--- a/src/utils/responses.py
+++ b/src/utils/responses.py
@@ -11,7 +11,7 @@ def extract_text_from_response_output_item(output_item: Any) -> str:
     formats including string content, content arrays with text parts, and refusal
     messages.
 
-    Args:
+    Parameters:
         output_item: A Responses API output item (typically from response.output array).
             Expected to have attributes like type, role, and content.
 

From 10010f633dd90c6e9d188720069145ba68d379dc Mon Sep 17 00:00:00 2001
From: Pavel Tisnovsky <ptisnovs@redhat.com>
Date: Sun, 14 Dec 2025 12:09:02 +0100
Subject: [PATCH 4/5] Docstrings for shields.py, token_counter.py, and
 tool_formatter.py

---
 src/utils/shields.py        |  8 ++++----
 src/utils/token_counter.py  | 16 +++++++++++-----
 src/utils/tool_formatter.py | 16 ++++++++++++----
 3 files changed, 27 insertions(+), 13 deletions(-)

diff --git a/src/utils/shields.py b/src/utils/shields.py
index f9c96831e..38730fb7a 100644
--- a/src/utils/shields.py
+++ b/src/utils/shields.py
@@ -14,11 +14,11 @@ async def get_available_shields(client: AsyncLlamaStackClient) -> list[str]:
     """
     Discover and return available shield identifiers.
 
-    Args:
+    Parameters:
         client: The Llama Stack client to query for available shields.
 
     Returns:
-        List of shield identifiers that are available.
+        list[str]: List of available shield identifiers; empty if no shields are available.
     """
     available_shields = [shield.identifier for shield in await client.shields.list()]
     if not available_shields:
@@ -36,11 +36,11 @@ def detect_shield_violations(output_items: list[Any]) -> bool:
     attributes. If a refusal is found, increments the validation error
     metric and logs a warning.
 
-    Args:
+    Parameters:
         output_items: List of output items from the LLM response to check.
 
     Returns:
-        True if a shield violation was detected, False otherwise.
+        bool: True if a shield violation was detected, False otherwise.
     """
     for output_item in output_items:
         item_type = getattr(output_item, "type", None)
diff --git a/src/utils/token_counter.py b/src/utils/token_counter.py
index b14cf2ac2..ba9b79463 100644
--- a/src/utils/token_counter.py
+++ b/src/utils/token_counter.py
@@ -31,7 +31,13 @@ class TokenCounter:
     llm_calls: int = 0
 
     def __str__(self) -> str:
-        """Textual representation of TokenCounter instance."""
+        """
+        Return a human-readable summary of the token usage stored in this TokenCounter.
+
+        Returns:
+            str: A formatted string containing `input_tokens`,
+                 `output_tokens`, `input_tokens_counted`, and `llm_calls`.
+        """
         return (
             f"{self.__class__.__name__}: "
             + f"input_tokens: {self.input_tokens} "
@@ -47,9 +53,9 @@ def extract_token_usage_from_turn(turn: Turn, system_prompt: str = "") -> TokenC
     This function uses the same tokenizer and logic as the metrics system
     to ensure consistency between API responses and Prometheus metrics.
 
-    Args:
-        turn: The turn object containing token usage information
-        system_prompt: The system prompt used for the turn
+    Parameters:
+        turn (Turn): The turn object containing token usage information
+        system_prompt (str): The system prompt used for the turn
 
     Returns:
         TokenCounter: Token usage information
@@ -102,7 +108,7 @@ def extract_and_update_token_metrics(
     This function combines the token counting logic with the metrics system
     to ensure both API responses and Prometheus metrics are updated consistently.
 
-    Args:
+    Parameters:
         turn: The turn object containing token usage information
         model: The model identifier for metrics labeling
         provider: The provider identifier for metrics labeling
diff --git a/src/utils/tool_formatter.py b/src/utils/tool_formatter.py
index 67bf1a848..8fd22d336 100644
--- a/src/utils/tool_formatter.py
+++ b/src/utils/tool_formatter.py
@@ -19,7 +19,14 @@ def format_tool_response(tool_dict: dict[str, Any]) -> dict[str, Any]:
         tool_dict: Raw tool dictionary from Llama Stack
 
     Returns:
-        Formatted tool dictionary with only required fields
+        dict[str, Any]: Formatted tool dictionary containing the following keys:
+            - identifier: tool identifier string (defaults to "").
+            - description: cleaned or original description string.
+            - parameters: list of parameter definitions (defaults to empty list).
+            - provider_id: provider identifier string (defaults to "").
+            - toolgroup_id: tool group identifier string (defaults to "").
+            - server_source: server source string (defaults to "").
+            - type: tool type string (defaults to "").
     """
     # Clean up description if it contains structured metadata
     description = tool_dict.get("description", "")
@@ -116,10 +123,11 @@ def format_tools_list(tools: list[dict[str, Any]]) -> list[dict[str, Any]]:
     """
     Format a list of tools with structured description parsing.
 
-    Args:
-        tools: List of raw tool dictionaries
+    Parameters:
+        tools (list[dict[str, Any]]): List of raw tool dictionaries
 
     Returns:
-        List of formatted tool dictionaries
+        list[dict[str, Any]]: Formatted tool dictionaries with normalized
+                              fields and cleaned descriptions.
     """
     return [format_tool_response(tool) for tool in tools]

From d0e0c32c7076ede6e5bb99a113f3874e41a667a1 Mon Sep 17 00:00:00 2001
From: Pavel Tisnovsky <ptisnovs@redhat.com>
Date: Sun, 14 Dec 2025 12:14:35 +0100
Subject: [PATCH 5/5] Docstrings for transcripts.py and types.py

---
 src/utils/transcripts.py | 25 +++++++++++++++++++++++--
 src/utils/types.py       | 29 +++++++++++++++++++++++++----
 2 files changed, 48 insertions(+), 6 deletions(-)

diff --git a/src/utils/transcripts.py b/src/utils/transcripts.py
index 551080ee9..6b0d93c7d 100644
--- a/src/utils/transcripts.py
+++ b/src/utils/transcripts.py
@@ -25,7 +25,23 @@ def _hash_user_id(user_id: str) -> str:
 
 
 def construct_transcripts_path(user_id: str, conversation_id: str) -> Path:
-    """Construct path to transcripts."""
+    """
+    Construct the filesystem path where transcripts for a given user and conversation are stored.
+
+    The returned path is built from the configured transcripts storage base
+    directory, a filesystem-safe directory derived from a hash of `user_id`,
+    and a filesystem-safe form of `conversation_id`.
+
+    Parameters:
+        user_id (str): The identifier for the user; a hashed form of this value
+                       is used as a path component.
+        conversation_id (str): The conversation identifier; this value is
+                               normalized for use as a path component.
+
+    Returns:
+        Path: A Path pointing to the directory where transcripts for the
+        specified user and conversation should be stored.
+    """
     # these two normalizations are required by Snyk as it detects
     # this Path sanitization pattern
     hashed_user_id = _hash_user_id(user_id)
@@ -52,9 +68,11 @@ def store_transcript(  # pylint: disable=too-many-arguments,too-many-positional-
 ) -> None:
     """Store transcript in the local filesystem.
 
-    Args:
+    Parameters:
         user_id: The user ID (UUID).
         conversation_id: The conversation ID (UUID).
+        model_id: Identifier of the model used to generate the LLM response.
+        provider_id: Optional provider identifier for the model.
         query_is_valid: The result of the query validation.
         query: The query (without attachments).
         query_request: The request containing a query.
@@ -62,6 +80,9 @@ def store_transcript(  # pylint: disable=too-many-arguments,too-many-positional-
         rag_chunks: The list of serialized `RAGChunk` dictionaries.
         truncated: The flag indicating if the history was truncated.
         attachments: The list of `Attachment` objects.
+
+    Raises:
+        OSError: If creating the directory or writing the transcript file fails.
     """
     transcripts_path = construct_transcripts_path(user_id, conversation_id)
     transcripts_path.mkdir(parents=True, exist_ok=True)
diff --git a/src/utils/types.py b/src/utils/types.py
index c528bd1b0..070869da5 100644
--- a/src/utils/types.py
+++ b/src/utils/types.py
@@ -20,11 +20,12 @@
 def content_to_str(content: Any) -> str:
     """Convert content (str, TextContentItem, ImageContentItem, or list) to string.
 
-    Args:
-        content: Content to convert to string.
+    Parameters:
+        content: Value to normalize into a string (may be None,
+                 str, content item, list, or any other object).
 
     Returns:
-        str: String representation of the content.
+        str: The normalized string representation of the content.
     """
     if content is None:
         return ""
@@ -141,7 +142,27 @@ class TurnSummary(BaseModel):
     rag_chunks: list[RAGChunk]
 
     def append_tool_calls_from_llama(self, tec: ToolExecutionStep) -> None:
-        """Append the tool calls from a llama tool execution step."""
+        """
+        Append the tool calls from a llama tool execution step.
+
+        For each tool call in `tec.tool_calls` the method appends a
+        ToolCallSummary to `self.tool_calls` and a corresponding
+        ToolResultSummary to `self.tool_results`. Arguments are preserved if
+        already a dict; otherwise they are converted to {"args":
+        str(arguments)}.
+
+        A result's `status` is "success" when a matching response (by call_id)
+        exists in `tec.tool_responses`, and "failure" when no response is
+        found.
+
+        If a call's tool name equals DEFAULT_RAG_TOOL and its response has
+        content, the method extracts and appends RAG chunks to
+        `self.rag_chunks` by calling _extract_rag_chunks_from_response.
+
+        Parameters:
+            tec (ToolExecutionStep): The execution step containing tool_calls
+                                     and tool_responses to summarize.
+        """
         calls_by_id = {tc.call_id: tc for tc in tec.tool_calls}
         responses_by_id = {tc.call_id: tc for tc in tec.tool_responses}
         for call_id, tc in calls_by_id.items():