lightspeed-core · JslYoon · Feb 3, 2026 · Feb 3, 2026 · coderabbitai · Feb 3, 2026
diff --git a/src/app/endpoints/a2a.py b/src/app/endpoints/a2a.py
@@ -312,6 +312,7 @@ async def _process_task_streaming(  # pylint: disable=too-many-locals
             generate_topic_summary=True,
             media_type=None,
             vector_store_ids=vector_store_ids,
+            shield_ids=None,
         )
 
         # Get LLM client and select model

diff --git a/src/app/endpoints/query_v2.py b/src/app/endpoints/query_v2.py
@@ -401,7 +401,9 @@ async def retrieve_response(  # pylint: disable=too-many-locals,too-many-branche
         )
 
     # Run shield moderation before calling LLM
-    moderation_result = await run_shield_moderation(client, input_text)
+    moderation_result = await run_shield_moderation(
+        client, input_text, query_request.shield_ids
+    )
     if moderation_result.blocked:
         violation_message = moderation_result.message or ""
         await append_turn_to_conversation(

diff --git a/src/app/endpoints/streaming_query_v2.py b/src/app/endpoints/streaming_query_v2.py
@@ -451,7 +451,9 @@ async def retrieve_response(  # pylint: disable=too-many-locals
         )
 
     # Run shield moderation before calling LLM
-    moderation_result = await run_shield_moderation(client, input_text)
+    moderation_result = await run_shield_moderation(
+        client, input_text, query_request.shield_ids
+    )
     if moderation_result.blocked:
         violation_message = moderation_result.message or ""
         await append_turn_to_conversation(

diff --git a/src/models/requests.py b/src/models/requests.py
@@ -83,6 +83,7 @@ class QueryRequest(BaseModel):
         generate_topic_summary: Whether to generate topic summary for new conversations.
         media_type: The optional media type for response format (application/json or text/plain).
         vector_store_ids: The optional list of specific vector store IDs to query for RAG.
+        shield_ids: The optional list of safety shield IDs to apply.
 
     Example:
         ```python
@@ -166,6 +167,14 @@ class QueryRequest(BaseModel):
         examples=["ocp_docs", "knowledge_base", "vector_db_1"],
     )
 
+    shield_ids: Optional[list[str]] = Field(
+        None,
+        description="Optional list of safety shield IDs to apply. "
+        "If None, all configured shields are used. "
+        "If empty list, all shields are skipped.",
+        examples=["llama-guard", "custom-shield"],
+    )
+
     # provides examples for /docs endpoint
     model_config = {
         "extra": "forbid",

diff --git a/src/utils/shields.py b/src/utils/shields.py
@@ -1,7 +1,7 @@
 """Utility functions for working with Llama Stack shields."""
 
 import logging
-from typing import Any, cast
+from typing import Any, Optional, cast
 
 from fastapi import HTTPException
 from llama_stack_client import AsyncLlamaStackClient, BadRequestError
@@ -63,26 +63,48 @@ def detect_shield_violations(output_items: list[Any]) -> bool:
 async def run_shield_moderation(
     client: AsyncLlamaStackClient,
     input_text: str,
+    shield_ids: Optional[list[str]] = None,
 ) -> ShieldModerationResult:
     """
     Run shield moderation on input text.
 
-    Iterates through all configured shields and runs moderation checks.
+    Iterates through configured shields and runs moderation checks.
     Raises HTTPException if shield model is not found.
 
     Parameters:
         client: The Llama Stack client.
         input_text: The text to moderate.
+        shield_ids: Optional list of shield IDs to use. If None, uses all shields.
+                   If empty list, skips all shields.
 
     Returns:
         ShieldModerationResult: Result indicating if content was blocked and the message.
 
     Raises:
         HTTPException: If shield's provider_resource_id is not configured or model not found.
     """
-    """
-    Run shield moderation on input text.
-
-    Iterates through all configured shields and runs moderation checks.
-    Iterates through configured shields and runs moderation checks.
-    Raises HTTPException if shield model is not found.
-
-    Parameters:
-        client: The Llama Stack client.
-        input_text: The text to moderate.
-        shield_ids: Optional list of shield IDs to use. If None, uses all shields.
-                   If empty list, skips all shields.
-
-    Returns:
-        ShieldModerationResult: Result indicating if content was blocked and the message.
-
-    Raises:
-        HTTPException: If shield's provider_resource_id is not configured or model not found.
-    """
+    """
+    Run shield moderation on input text.
+
+    Iterates through configured shields and runs moderation checks.
+    Raises HTTPException if shield model is not found.
+
+    Parameters:
+        client: The Llama Stack client.
+        input_text: The text to moderate.
+        shield_ids: Optional list of shield IDs to use. If None, uses all shields.
+                   If empty list, skips all shields.
+
+    Returns:
+        ShieldModerationResult: Result indicating if content was blocked and the message.
+
+    Raises:
+        HTTPException: If shield's provider_resource_id is not configured or model not found.
+            Requested shield_ids that match no available shield are only logged as a warning.
+    """
-    """
-    Run shield moderation on input text.
-
-    Iterates through all configured shields and runs moderation checks.
-    Iterates through configured shields and runs moderation checks.
-    Raises HTTPException if shield model is not found.
-
-    Parameters:
-        client: The Llama Stack client.
-        input_text: The text to moderate.
-        shield_ids: Optional list of shield IDs to use. If None, uses all shields.
-                   If empty list, skips all shields.
-
-    Returns:
-        ShieldModerationResult: Result indicating if content was blocked and the message.
-
-    Raises:
-        HTTPException: If shield's provider_resource_id is not configured or model not found.
-    """
+    """
+    Run shield moderation on input text.
+
+    Iterates through configured shields and runs moderation checks.
+    Raises HTTPException if shield model is not found.
+
+    Parameters:
+        client: The Llama Stack client.
+        input_text: The text to moderate.
+        shield_ids: Optional list of shield IDs to use. If None, uses all shields.
+                   If empty list, skips all shields.
+
+    Returns:
+        ShieldModerationResult: Result indicating if content was blocked and the message.
+
+    Raises:
+        HTTPException: If shield's provider_resource_id is not configured or model not found.
+            Requested shield_ids that match no available shield are only logged as a warning.
+    """
+    all_shields = await client.shields.list()
+
+    # Filter shields based on shield_ids parameter
+    if shield_ids is not None:
+        if len(shield_ids) == 0:
+            logger.info("shield_ids=[] provided, skipping all shields")
+            return ShieldModerationResult(blocked=False)
+
+        shields_to_run = [s for s in all_shields if s.identifier in shield_ids]
+
+        # Log warning if requested shield not found
+        requested = set(shield_ids)
+        available = {s.identifier for s in shields_to_run}
+        missing = requested - available
+        if missing:
+            logger.warning("Requested shields not found: %s", missing)
+    else:
+        shields_to_run = list(all_shields)
+
     available_models = {model.id for model in await client.models.list()}
 
-    for shield in await client.shields.list():
+    for shield in shields_to_run:
         if (
             not shield.provider_resource_id
             or shield.provider_resource_id not in available_models