From e7801fe44f4b48f12c272490d6496f4406b54a15 Mon Sep 17 00:00:00 2001
From: Sunil Sattiraju <sunilsattiraju@gmail.com>
Date: Tue, 26 Mar 2024 02:07:06 +0800
Subject: [PATCH] add support for promptflow endpoint (#709)

---
 .env.sample      |   9 +-
 README.md        |   6 +
 app.py           | 954 +++++++++++++++++++++++++++++++++--------------
 backend/utils.py | 129 +++++--
 4 files changed, 785 insertions(+), 313 deletions(-)

diff --git a/.env.sample b/.env.sample
index bdf667a194..b8623c708c 100644
--- a/.env.sample
+++ b/.env.sample
@@ -100,4 +100,11 @@ AZURE_MLINDEX_FILENAME_COLUMN=
 AZURE_MLINDEX_TITLE_COLUMN= 
 AZURE_MLINDEX_URL_COLUMN= 
 AZURE_MLINDEX_VECTOR_COLUMNS=
-AZURE_MLINDEX_QUERY_TYPE=
\ No newline at end of file
+AZURE_MLINDEX_QUERY_TYPE=
+# Chat with data: Prompt flow API
+USE_PROMPTFLOW=False
+PROMPTFLOW_ENDPOINT=
+PROMPTFLOW_API_KEY=
+PROMPTFLOW_RESPONSE_TIMEOUT=120
+PROMPTFLOW_REQUEST_FIELD_NAME=question
+PROMPTFLOW_RESPONSE_FIELD_NAME=answer
\ No newline at end of file
diff --git a/README.md b/README.md
index fae0ccc633..5b77b8f37f 100644
--- a/README.md
+++ b/README.md
@@ -230,6 +230,12 @@ Note: settings starting with `AZURE_SEARCH` are only needed when using Azure Ope
 |UI_FAVICON|| Defaults to Contoso favicon. Configure the URL to your favicon to modify.
 |UI_SHOW_SHARE_BUTTON|True|Share button (right-top)
 |SANITIZE_ANSWER|False|Whether to sanitize the answer from Azure OpenAI. Set to True to remove any HTML tags from the response.|
+|USE_PROMPTFLOW|False|Use existing Promptflow deployed endpoint. If set to `True` then both `PROMPTFLOW_ENDPOINT` and `PROMPTFLOW_API_KEY` also need to be set.|
+|PROMPTFLOW_ENDPOINT||URL of the deployed Promptflow endpoint e.g. https://pf-deployment-name.region.inference.ml.azure.com/score|
+|PROMPTFLOW_API_KEY||Auth key for deployed Promptflow endpoint. Note: only Key-based authentication is supported.|
+|PROMPTFLOW_RESPONSE_TIMEOUT|120|Timeout value in seconds for the Promptflow endpoint to respond.|
+|PROMPTFLOW_REQUEST_FIELD_NAME|question|Default field name to construct Promptflow request. Note: chat_history is auto constucted based on the interaction, if your API expects other mandatory field you will need to change the request parameters under `promptflow_request` function.|
+|PROMPTFLOW_RESPONSE_FIELD_NAME|answer|Default field name to process the response from Promptflow request.|
 
 ## Contributing
 
diff --git a/app.py b/app.py
index 2691de9b30..7d265bdd82 100644
--- a/app.py
+++ b/app.py
@@ -4,7 +4,7 @@
 import logging
 import uuid
 from dotenv import load_dotenv
-
+import httpx
 from quart import (
     Blueprint,
     Quart,
@@ -12,7 +12,7 @@
     make_response,
     request,
     send_from_directory,
-    render_template
+    render_template,
 )
 
 from openai import AsyncAzureOpenAI
@@ -20,22 +20,34 @@
 from backend.auth.auth_utils import get_authenticated_user_details
 from backend.history.cosmosdbservice import CosmosConversationClient
 
-from backend.utils import format_as_ndjson, format_stream_response, generateFilterString, parse_multi_columns, format_non_streaming_response
+from backend.utils import (
+    format_as_ndjson,
+    format_stream_response,
+    generateFilterString,
+    parse_multi_columns,
+    format_non_streaming_response,
+    convert_to_pf_format,
+    format_pf_non_streaming_response,
+)
 
 bp = Blueprint("routes", __name__, static_folder="static", template_folder="static")
 
 # Current minimum Azure OpenAI version supported
-MINIMUM_SUPPORTED_AZURE_OPENAI_PREVIEW_API_VERSION="2024-02-15-preview"
+MINIMUM_SUPPORTED_AZURE_OPENAI_PREVIEW_API_VERSION = "2024-02-15-preview"
 
 # UI configuration (optional)
 UI_TITLE = os.environ.get("UI_TITLE") or "Contoso"
 UI_LOGO = os.environ.get("UI_LOGO")
 UI_CHAT_LOGO = os.environ.get("UI_CHAT_LOGO")
 UI_CHAT_TITLE = os.environ.get("UI_CHAT_TITLE") or "Start chatting"
-UI_CHAT_DESCRIPTION = os.environ.get("UI_CHAT_DESCRIPTION") or "This chatbot is configured to answer your questions"
+UI_CHAT_DESCRIPTION = (
+    os.environ.get("UI_CHAT_DESCRIPTION")
+    or "This chatbot is configured to answer your questions"
+)
 UI_FAVICON = os.environ.get("UI_FAVICON") or "/favicon.ico"
 UI_SHOW_SHARE_BUTTON = os.environ.get("UI_SHOW_SHARE_BUTTON", "true").lower() == "true"
 
+
 def create_app():
     app = Quart(__name__)
     app.register_blueprint(bp)
@@ -47,14 +59,17 @@ def create_app():
 async def index():
     return await render_template("index.html", title=UI_TITLE, favicon=UI_FAVICON)
 
+
 @bp.route("/favicon.ico")
 async def favicon():
     return await bp.send_static_file("favicon.ico")
 
+
 @bp.route("/assets/<path:path>")
 async def assets(path):
     return await send_from_directory("static/assets", path)
 
+
 load_dotenv()
 
 # Debug settings
@@ -74,17 +89,25 @@ async def assets(path):
 AZURE_SEARCH_SERVICE = os.environ.get("AZURE_SEARCH_SERVICE")
 AZURE_SEARCH_INDEX = os.environ.get("AZURE_SEARCH_INDEX")
 AZURE_SEARCH_KEY = os.environ.get("AZURE_SEARCH_KEY", None)
-AZURE_SEARCH_USE_SEMANTIC_SEARCH = os.environ.get("AZURE_SEARCH_USE_SEMANTIC_SEARCH", "false")
-AZURE_SEARCH_SEMANTIC_SEARCH_CONFIG = os.environ.get("AZURE_SEARCH_SEMANTIC_SEARCH_CONFIG", "default")
+AZURE_SEARCH_USE_SEMANTIC_SEARCH = os.environ.get(
+    "AZURE_SEARCH_USE_SEMANTIC_SEARCH", "false"
+)
+AZURE_SEARCH_SEMANTIC_SEARCH_CONFIG = os.environ.get(
+    "AZURE_SEARCH_SEMANTIC_SEARCH_CONFIG", "default"
+)
 AZURE_SEARCH_TOP_K = os.environ.get("AZURE_SEARCH_TOP_K", SEARCH_TOP_K)
-AZURE_SEARCH_ENABLE_IN_DOMAIN = os.environ.get("AZURE_SEARCH_ENABLE_IN_DOMAIN", SEARCH_ENABLE_IN_DOMAIN)
+AZURE_SEARCH_ENABLE_IN_DOMAIN = os.environ.get(
+    "AZURE_SEARCH_ENABLE_IN_DOMAIN", SEARCH_ENABLE_IN_DOMAIN
+)
 AZURE_SEARCH_CONTENT_COLUMNS = os.environ.get("AZURE_SEARCH_CONTENT_COLUMNS")
 AZURE_SEARCH_FILENAME_COLUMN = os.environ.get("AZURE_SEARCH_FILENAME_COLUMN")
 AZURE_SEARCH_TITLE_COLUMN = os.environ.get("AZURE_SEARCH_TITLE_COLUMN")
 AZURE_SEARCH_URL_COLUMN = os.environ.get("AZURE_SEARCH_URL_COLUMN")
 AZURE_SEARCH_VECTOR_COLUMNS = os.environ.get("AZURE_SEARCH_VECTOR_COLUMNS")
 AZURE_SEARCH_QUERY_TYPE = os.environ.get("AZURE_SEARCH_QUERY_TYPE")
-AZURE_SEARCH_PERMITTED_GROUPS_COLUMN = os.environ.get("AZURE_SEARCH_PERMITTED_GROUPS_COLUMN")
+AZURE_SEARCH_PERMITTED_GROUPS_COLUMN = os.environ.get(
+    "AZURE_SEARCH_PERMITTED_GROUPS_COLUMN"
+)
 AZURE_SEARCH_STRICTNESS = os.environ.get("AZURE_SEARCH_STRICTNESS", SEARCH_STRICTNESS)
 
 # AOAI Integration Settings
@@ -96,36 +119,70 @@ async def assets(path):
 AZURE_OPENAI_TOP_P = os.environ.get("AZURE_OPENAI_TOP_P", 1.0)
 AZURE_OPENAI_MAX_TOKENS = os.environ.get("AZURE_OPENAI_MAX_TOKENS", 1000)
 AZURE_OPENAI_STOP_SEQUENCE = os.environ.get("AZURE_OPENAI_STOP_SEQUENCE")
-AZURE_OPENAI_SYSTEM_MESSAGE = os.environ.get("AZURE_OPENAI_SYSTEM_MESSAGE", "You are an AI assistant that helps people find information.")
-AZURE_OPENAI_PREVIEW_API_VERSION = os.environ.get("AZURE_OPENAI_PREVIEW_API_VERSION", MINIMUM_SUPPORTED_AZURE_OPENAI_PREVIEW_API_VERSION)
+AZURE_OPENAI_SYSTEM_MESSAGE = os.environ.get(
+    "AZURE_OPENAI_SYSTEM_MESSAGE",
+    "You are an AI assistant that helps people find information.",
+)
+AZURE_OPENAI_PREVIEW_API_VERSION = os.environ.get(
+    "AZURE_OPENAI_PREVIEW_API_VERSION",
+    MINIMUM_SUPPORTED_AZURE_OPENAI_PREVIEW_API_VERSION,
+)
 AZURE_OPENAI_STREAM = os.environ.get("AZURE_OPENAI_STREAM", "true")
-AZURE_OPENAI_MODEL_NAME = os.environ.get("AZURE_OPENAI_MODEL_NAME", "gpt-35-turbo-16k") # Name of the model, e.g. 'gpt-35-turbo-16k' or 'gpt-4'
+AZURE_OPENAI_MODEL_NAME = os.environ.get(
+    "AZURE_OPENAI_MODEL_NAME", "gpt-35-turbo-16k"
+)  # Name of the model, e.g. 'gpt-35-turbo-16k' or 'gpt-4'
 AZURE_OPENAI_EMBEDDING_ENDPOINT = os.environ.get("AZURE_OPENAI_EMBEDDING_ENDPOINT")
 AZURE_OPENAI_EMBEDDING_KEY = os.environ.get("AZURE_OPENAI_EMBEDDING_KEY")
 AZURE_OPENAI_EMBEDDING_NAME = os.environ.get("AZURE_OPENAI_EMBEDDING_NAME", "")
 
 # CosmosDB Mongo vcore vector db Settings
-AZURE_COSMOSDB_MONGO_VCORE_CONNECTION_STRING = os.environ.get("AZURE_COSMOSDB_MONGO_VCORE_CONNECTION_STRING")  #This has to be secure string
-AZURE_COSMOSDB_MONGO_VCORE_DATABASE = os.environ.get("AZURE_COSMOSDB_MONGO_VCORE_DATABASE")
-AZURE_COSMOSDB_MONGO_VCORE_CONTAINER = os.environ.get("AZURE_COSMOSDB_MONGO_VCORE_CONTAINER")
+AZURE_COSMOSDB_MONGO_VCORE_CONNECTION_STRING = os.environ.get(
+    "AZURE_COSMOSDB_MONGO_VCORE_CONNECTION_STRING"
+)  # This has to be secure string
+AZURE_COSMOSDB_MONGO_VCORE_DATABASE = os.environ.get(
+    "AZURE_COSMOSDB_MONGO_VCORE_DATABASE"
+)
+AZURE_COSMOSDB_MONGO_VCORE_CONTAINER = os.environ.get(
+    "AZURE_COSMOSDB_MONGO_VCORE_CONTAINER"
+)
 AZURE_COSMOSDB_MONGO_VCORE_INDEX = os.environ.get("AZURE_COSMOSDB_MONGO_VCORE_INDEX")
-AZURE_COSMOSDB_MONGO_VCORE_TOP_K = os.environ.get("AZURE_COSMOSDB_MONGO_VCORE_TOP_K", AZURE_SEARCH_TOP_K)
-AZURE_COSMOSDB_MONGO_VCORE_STRICTNESS = os.environ.get("AZURE_COSMOSDB_MONGO_VCORE_STRICTNESS", AZURE_SEARCH_STRICTNESS)  
-AZURE_COSMOSDB_MONGO_VCORE_ENABLE_IN_DOMAIN = os.environ.get("AZURE_COSMOSDB_MONGO_VCORE_ENABLE_IN_DOMAIN", AZURE_SEARCH_ENABLE_IN_DOMAIN)
-AZURE_COSMOSDB_MONGO_VCORE_CONTENT_COLUMNS = os.environ.get("AZURE_COSMOSDB_MONGO_VCORE_CONTENT_COLUMNS", "")
-AZURE_COSMOSDB_MONGO_VCORE_FILENAME_COLUMN = os.environ.get("AZURE_COSMOSDB_MONGO_VCORE_FILENAME_COLUMN")
-AZURE_COSMOSDB_MONGO_VCORE_TITLE_COLUMN = os.environ.get("AZURE_COSMOSDB_MONGO_VCORE_TITLE_COLUMN")
-AZURE_COSMOSDB_MONGO_VCORE_URL_COLUMN = os.environ.get("AZURE_COSMOSDB_MONGO_VCORE_URL_COLUMN")
-AZURE_COSMOSDB_MONGO_VCORE_VECTOR_COLUMNS = os.environ.get("AZURE_COSMOSDB_MONGO_VCORE_VECTOR_COLUMNS")
+AZURE_COSMOSDB_MONGO_VCORE_TOP_K = os.environ.get(
+    "AZURE_COSMOSDB_MONGO_VCORE_TOP_K", AZURE_SEARCH_TOP_K
+)
+AZURE_COSMOSDB_MONGO_VCORE_STRICTNESS = os.environ.get(
+    "AZURE_COSMOSDB_MONGO_VCORE_STRICTNESS", AZURE_SEARCH_STRICTNESS
+)
+AZURE_COSMOSDB_MONGO_VCORE_ENABLE_IN_DOMAIN = os.environ.get(
+    "AZURE_COSMOSDB_MONGO_VCORE_ENABLE_IN_DOMAIN", AZURE_SEARCH_ENABLE_IN_DOMAIN
+)
+AZURE_COSMOSDB_MONGO_VCORE_CONTENT_COLUMNS = os.environ.get(
+    "AZURE_COSMOSDB_MONGO_VCORE_CONTENT_COLUMNS", ""
+)
+AZURE_COSMOSDB_MONGO_VCORE_FILENAME_COLUMN = os.environ.get(
+    "AZURE_COSMOSDB_MONGO_VCORE_FILENAME_COLUMN"
+)
+AZURE_COSMOSDB_MONGO_VCORE_TITLE_COLUMN = os.environ.get(
+    "AZURE_COSMOSDB_MONGO_VCORE_TITLE_COLUMN"
+)
+AZURE_COSMOSDB_MONGO_VCORE_URL_COLUMN = os.environ.get(
+    "AZURE_COSMOSDB_MONGO_VCORE_URL_COLUMN"
+)
+AZURE_COSMOSDB_MONGO_VCORE_VECTOR_COLUMNS = os.environ.get(
+    "AZURE_COSMOSDB_MONGO_VCORE_VECTOR_COLUMNS"
+)
 
 SHOULD_STREAM = True if AZURE_OPENAI_STREAM.lower() == "true" else False
 
 # Chat History CosmosDB Integration Settings
 AZURE_COSMOSDB_DATABASE = os.environ.get("AZURE_COSMOSDB_DATABASE")
 AZURE_COSMOSDB_ACCOUNT = os.environ.get("AZURE_COSMOSDB_ACCOUNT")
-AZURE_COSMOSDB_CONVERSATIONS_CONTAINER = os.environ.get("AZURE_COSMOSDB_CONVERSATIONS_CONTAINER")
+AZURE_COSMOSDB_CONVERSATIONS_CONTAINER = os.environ.get(
+    "AZURE_COSMOSDB_CONVERSATIONS_CONTAINER"
+)
 AZURE_COSMOSDB_ACCOUNT_KEY = os.environ.get("AZURE_COSMOSDB_ACCOUNT_KEY")
-AZURE_COSMOSDB_ENABLE_FEEDBACK = os.environ.get("AZURE_COSMOSDB_ENABLE_FEEDBACK", "false").lower() == "true"
+AZURE_COSMOSDB_ENABLE_FEEDBACK = (
+    os.environ.get("AZURE_COSMOSDB_ENABLE_FEEDBACK", "false").lower() == "true"
+)
 
 # Elasticsearch Integration Settings
 ELASTICSEARCH_ENDPOINT = os.environ.get("ELASTICSEARCH_ENDPOINT")
@@ -133,7 +190,9 @@ async def assets(path):
 ELASTICSEARCH_INDEX = os.environ.get("ELASTICSEARCH_INDEX")
 ELASTICSEARCH_QUERY_TYPE = os.environ.get("ELASTICSEARCH_QUERY_TYPE", "simple")
 ELASTICSEARCH_TOP_K = os.environ.get("ELASTICSEARCH_TOP_K", SEARCH_TOP_K)
-ELASTICSEARCH_ENABLE_IN_DOMAIN = os.environ.get("ELASTICSEARCH_ENABLE_IN_DOMAIN", SEARCH_ENABLE_IN_DOMAIN)
+ELASTICSEARCH_ENABLE_IN_DOMAIN = os.environ.get(
+    "ELASTICSEARCH_ENABLE_IN_DOMAIN", SEARCH_ENABLE_IN_DOMAIN
+)
 ELASTICSEARCH_CONTENT_COLUMNS = os.environ.get("ELASTICSEARCH_CONTENT_COLUMNS")
 ELASTICSEARCH_FILENAME_COLUMN = os.environ.get("ELASTICSEARCH_FILENAME_COLUMN")
 ELASTICSEARCH_TITLE_COLUMN = os.environ.get("ELASTICSEARCH_TITLE_COLUMN")
@@ -147,8 +206,10 @@ async def assets(path):
 PINECONE_API_KEY = os.environ.get("PINECONE_API_KEY")
 PINECONE_INDEX_NAME = os.environ.get("PINECONE_INDEX_NAME")
 PINECONE_TOP_K = os.environ.get("PINECONE_TOP_K", SEARCH_TOP_K)
-PINECONE_STRICTNESS = os.environ.get("PINECONE_STRICTNESS", SEARCH_STRICTNESS)  
-PINECONE_ENABLE_IN_DOMAIN = os.environ.get("PINECONE_ENABLE_IN_DOMAIN", SEARCH_ENABLE_IN_DOMAIN)
+PINECONE_STRICTNESS = os.environ.get("PINECONE_STRICTNESS", SEARCH_STRICTNESS)
+PINECONE_ENABLE_IN_DOMAIN = os.environ.get(
+    "PINECONE_ENABLE_IN_DOMAIN", SEARCH_ENABLE_IN_DOMAIN
+)
 PINECONE_CONTENT_COLUMNS = os.environ.get("PINECONE_CONTENT_COLUMNS", "")
 PINECONE_FILENAME_COLUMN = os.environ.get("PINECONE_FILENAME_COLUMN")
 PINECONE_TITLE_COLUMN = os.environ.get("PINECONE_TITLE_COLUMN")
@@ -158,24 +219,40 @@ async def assets(path):
 # Azure AI MLIndex Integration Settings - for use with MLIndex data assets created in Azure AI Studio
 AZURE_MLINDEX_NAME = os.environ.get("AZURE_MLINDEX_NAME")
 AZURE_MLINDEX_VERSION = os.environ.get("AZURE_MLINDEX_VERSION")
-AZURE_ML_PROJECT_RESOURCE_ID = os.environ.get("AZURE_ML_PROJECT_RESOURCE_ID") # /subscriptions/{sub ID}/resourceGroups/{rg name}/providers/Microsoft.MachineLearningServices/workspaces/{AML project name}
+AZURE_ML_PROJECT_RESOURCE_ID = os.environ.get(
+    "AZURE_ML_PROJECT_RESOURCE_ID"
+)  # /subscriptions/{sub ID}/resourceGroups/{rg name}/providers/Microsoft.MachineLearningServices/workspaces/{AML project name}
 AZURE_MLINDEX_TOP_K = os.environ.get("AZURE_MLINDEX_TOP_K", SEARCH_TOP_K)
-AZURE_MLINDEX_STRICTNESS = os.environ.get("AZURE_MLINDEX_STRICTNESS", SEARCH_STRICTNESS)  
-AZURE_MLINDEX_ENABLE_IN_DOMAIN = os.environ.get("AZURE_MLINDEX_ENABLE_IN_DOMAIN", SEARCH_ENABLE_IN_DOMAIN)
+AZURE_MLINDEX_STRICTNESS = os.environ.get("AZURE_MLINDEX_STRICTNESS", SEARCH_STRICTNESS)
+AZURE_MLINDEX_ENABLE_IN_DOMAIN = os.environ.get(
+    "AZURE_MLINDEX_ENABLE_IN_DOMAIN", SEARCH_ENABLE_IN_DOMAIN
+)
 AZURE_MLINDEX_CONTENT_COLUMNS = os.environ.get("AZURE_MLINDEX_CONTENT_COLUMNS", "")
 AZURE_MLINDEX_FILENAME_COLUMN = os.environ.get("AZURE_MLINDEX_FILENAME_COLUMN")
 AZURE_MLINDEX_TITLE_COLUMN = os.environ.get("AZURE_MLINDEX_TITLE_COLUMN")
 AZURE_MLINDEX_URL_COLUMN = os.environ.get("AZURE_MLINDEX_URL_COLUMN")
 AZURE_MLINDEX_VECTOR_COLUMNS = os.environ.get("AZURE_MLINDEX_VECTOR_COLUMNS")
 AZURE_MLINDEX_QUERY_TYPE = os.environ.get("AZURE_MLINDEX_QUERY_TYPE")
-
-
+# Promptflow Integration Settings
+USE_PROMPTFLOW = os.environ.get("USE_PROMPTFLOW", "false").lower() == "true"
+PROMPTFLOW_ENDPOINT = os.environ.get("PROMPTFLOW_ENDPOINT")
+PROMPTFLOW_API_KEY = os.environ.get("PROMPTFLOW_API_KEY")
+PROMPTFLOW_RESPONSE_TIMEOUT = os.environ.get("PROMPTFLOW_RESPONSE_TIMEOUT", 30.0)
+# default request and response field names are input -> 'query' and output -> 'reply'
+PROMPTFLOW_REQUEST_FIELD_NAME = os.environ.get("PROMPTFLOW_REQUEST_FIELD_NAME", "query")
+PROMPTFLOW_RESPONSE_FIELD_NAME = os.environ.get(
+    "PROMPTFLOW_RESPONSE_FIELD_NAME", "reply"
+)
 # Frontend Settings via Environment Variables
 AUTH_ENABLED = os.environ.get("AUTH_ENABLED", "true").lower() == "true"
-CHAT_HISTORY_ENABLED = AZURE_COSMOSDB_ACCOUNT and AZURE_COSMOSDB_DATABASE and AZURE_COSMOSDB_CONVERSATIONS_CONTAINER
+CHAT_HISTORY_ENABLED = (
+    AZURE_COSMOSDB_ACCOUNT
+    and AZURE_COSMOSDB_DATABASE
+    and AZURE_COSMOSDB_CONVERSATIONS_CONTAINER
+)
 SANITIZE_ANSWER = os.environ.get("SANITIZE_ANSWER", "false").lower() == "true"
-frontend_settings = { 
-    "auth_enabled": AUTH_ENABLED, 
+frontend_settings = {
+    "auth_enabled": AUTH_ENABLED,
     "feedback_enabled": AZURE_COSMOSDB_ENABLE_FEEDBACK and CHAT_HISTORY_ENABLED,
     "ui": {
         "title": UI_TITLE,
@@ -183,33 +260,39 @@ async def assets(path):
         "chat_logo": UI_CHAT_LOGO or UI_LOGO,
         "chat_title": UI_CHAT_TITLE,
         "chat_description": UI_CHAT_DESCRIPTION,
-        "show_share_button": UI_SHOW_SHARE_BUTTON
+        "show_share_button": UI_SHOW_SHARE_BUTTON,
     },
-    "sanitize_answer": SANITIZE_ANSWER
+    "sanitize_answer": SANITIZE_ANSWER,
 }
 
+
 def should_use_data():
     global DATASOURCE_TYPE
     if AZURE_SEARCH_SERVICE and AZURE_SEARCH_INDEX:
         DATASOURCE_TYPE = "AzureCognitiveSearch"
         logging.debug("Using Azure Cognitive Search")
         return True
-    
-    if AZURE_COSMOSDB_MONGO_VCORE_DATABASE and AZURE_COSMOSDB_MONGO_VCORE_CONTAINER and AZURE_COSMOSDB_MONGO_VCORE_INDEX and AZURE_COSMOSDB_MONGO_VCORE_CONNECTION_STRING:
+
+    if (
+        AZURE_COSMOSDB_MONGO_VCORE_DATABASE
+        and AZURE_COSMOSDB_MONGO_VCORE_CONTAINER
+        and AZURE_COSMOSDB_MONGO_VCORE_INDEX
+        and AZURE_COSMOSDB_MONGO_VCORE_CONNECTION_STRING
+    ):
         DATASOURCE_TYPE = "AzureCosmosDB"
         logging.debug("Using Azure CosmosDB Mongo vcore")
         return True
-    
+
     if ELASTICSEARCH_ENDPOINT and ELASTICSEARCH_ENCODED_API_KEY and ELASTICSEARCH_INDEX:
         DATASOURCE_TYPE = "Elasticsearch"
         logging.debug("Using Elasticsearch")
         return True
-    
+
     if PINECONE_ENVIRONMENT and PINECONE_API_KEY and PINECONE_INDEX_NAME:
         DATASOURCE_TYPE = "Pinecone"
         logging.debug("Using Pinecone")
         return True
-    
+
     if AZURE_MLINDEX_NAME and AZURE_MLINDEX_VERSION and AZURE_ML_PROJECT_RESOURCE_ID:
         DATASOURCE_TYPE = "AzureMLIndex"
         logging.debug("Using Azure ML Index")
@@ -217,28 +300,43 @@ def should_use_data():
 
     return False
 
+
 SHOULD_USE_DATA = should_use_data()
 
+
 # Initialize Azure OpenAI Client
 def init_openai_client(use_data=SHOULD_USE_DATA):
     azure_openai_client = None
     try:
         # API version check
-        if AZURE_OPENAI_PREVIEW_API_VERSION < MINIMUM_SUPPORTED_AZURE_OPENAI_PREVIEW_API_VERSION:
-            raise Exception(f"The minimum supported Azure OpenAI preview API version is '{MINIMUM_SUPPORTED_AZURE_OPENAI_PREVIEW_API_VERSION}'")
-        
+        if (
+            AZURE_OPENAI_PREVIEW_API_VERSION
+            < MINIMUM_SUPPORTED_AZURE_OPENAI_PREVIEW_API_VERSION
+        ):
+            raise Exception(
+                f"The minimum supported Azure OpenAI preview API version is '{MINIMUM_SUPPORTED_AZURE_OPENAI_PREVIEW_API_VERSION}'"
+            )
+
         # Endpoint
         if not AZURE_OPENAI_ENDPOINT and not AZURE_OPENAI_RESOURCE:
-            raise Exception("AZURE_OPENAI_ENDPOINT or AZURE_OPENAI_RESOURCE is required")
-        
-        endpoint = AZURE_OPENAI_ENDPOINT if AZURE_OPENAI_ENDPOINT else f"https://{AZURE_OPENAI_RESOURCE}.openai.azure.com/"
-        
+            raise Exception(
+                "AZURE_OPENAI_ENDPOINT or AZURE_OPENAI_RESOURCE is required"
+            )
+
+        endpoint = (
+            AZURE_OPENAI_ENDPOINT
+            if AZURE_OPENAI_ENDPOINT
+            else f"https://{AZURE_OPENAI_RESOURCE}.openai.azure.com/"
+        )
+
         # Authentication
         aoai_api_key = AZURE_OPENAI_KEY
         ad_token_provider = None
         if not aoai_api_key:
             logging.debug("No AZURE_OPENAI_KEY found, using Azure AD auth")
-            ad_token_provider = get_bearer_token_provider(DefaultAzureCredential(), "https://cognitiveservices.azure.com/.default")
+            ad_token_provider = get_bearer_token_provider(
+                DefaultAzureCredential(), "https://cognitiveservices.azure.com/.default"
+            )
 
         # Deployment
         deployment = AZURE_OPENAI_MODEL
@@ -246,18 +344,16 @@ def init_openai_client(use_data=SHOULD_USE_DATA):
             raise Exception("AZURE_OPENAI_MODEL is required")
 
         # Default Headers
-        default_headers = {
-            'x-ms-useragent': USER_AGENT
-        }
+        default_headers = {"x-ms-useragent": USER_AGENT}
 
         azure_openai_client = AsyncAzureOpenAI(
             api_version=AZURE_OPENAI_PREVIEW_API_VERSION,
             api_key=aoai_api_key,
             azure_ad_token_provider=ad_token_provider,
             default_headers=default_headers,
-            azure_endpoint=endpoint
+            azure_endpoint=endpoint,
         )
-            
+
         return azure_openai_client
     except Exception as e:
         logging.exception("Exception in Azure OpenAI initialization", e)
@@ -269,7 +365,9 @@ def init_cosmosdb_client():
     cosmos_conversation_client = None
     if CHAT_HISTORY_ENABLED:
         try:
-            cosmos_endpoint = f'https://{AZURE_COSMOSDB_ACCOUNT}.documents.azure.com:443/'
+            cosmos_endpoint = (
+                f"https://{AZURE_COSMOSDB_ACCOUNT}.documents.azure.com:443/"
+            )
 
             if not AZURE_COSMOSDB_ACCOUNT_KEY:
                 credential = DefaultAzureCredential()
@@ -277,11 +375,11 @@ def init_cosmosdb_client():
                 credential = AZURE_COSMOSDB_ACCOUNT_KEY
 
             cosmos_conversation_client = CosmosConversationClient(
-                cosmosdb_endpoint=cosmos_endpoint, 
-                credential=credential, 
+                cosmosdb_endpoint=cosmos_endpoint,
+                credential=credential,
                 database_name=AZURE_COSMOSDB_DATABASE,
                 container_name=AZURE_COSMOSDB_CONVERSATIONS_CONTAINER,
-                enable_message_feedback=AZURE_COSMOSDB_ENABLE_FEEDBACK
+                enable_message_feedback=AZURE_COSMOSDB_ENABLE_FEEDBACK,
             )
         except Exception as e:
             logging.exception("Exception in CosmosDB initialization", e)
@@ -289,7 +387,7 @@ def init_cosmosdb_client():
             raise e
     else:
         logging.debug("CosmosDB not configured")
-        
+
     return cosmos_conversation_client
 
 
@@ -300,83 +398,143 @@ def get_configured_data_source():
         # Set query type
         if AZURE_SEARCH_QUERY_TYPE:
             query_type = AZURE_SEARCH_QUERY_TYPE
-        elif AZURE_SEARCH_USE_SEMANTIC_SEARCH.lower() == "true" and AZURE_SEARCH_SEMANTIC_SEARCH_CONFIG:
+        elif (
+            AZURE_SEARCH_USE_SEMANTIC_SEARCH.lower() == "true"
+            and AZURE_SEARCH_SEMANTIC_SEARCH_CONFIG
+        ):
             query_type = "semantic"
 
         # Set filter
         filter = None
         userToken = None
         if AZURE_SEARCH_PERMITTED_GROUPS_COLUMN:
-            userToken = request.headers.get('X-MS-TOKEN-AAD-ACCESS-TOKEN', "")
+            userToken = request.headers.get("X-MS-TOKEN-AAD-ACCESS-TOKEN", "")
             logging.debug(f"USER TOKEN is {'present' if userToken else 'not present'}")
             if not userToken:
-                raise Exception("Document-level access control is enabled, but user access token could not be fetched.")
+                raise Exception(
+                    "Document-level access control is enabled, but user access token could not be fetched."
+                )
 
             filter = generateFilterString(userToken)
             logging.debug(f"FILTER: {filter}")
-        
+
         # Set authentication
         authentication = {}
         if AZURE_SEARCH_KEY:
-            authentication = {
-                "type": "api_key",
-                "api_key": AZURE_SEARCH_KEY
-            }
+            authentication = {"type": "api_key", "api_key": AZURE_SEARCH_KEY}
         else:
             # If key is not provided, assume AOAI resource identity has been granted access to the search service
-            authentication = {
-                "type": "system_assigned_managed_identity"
-            }
+            authentication = {"type": "system_assigned_managed_identity"}
 
         data_source = {
-                "type": "azure_search",
-                "parameters": {
-                    "endpoint": f"https://{AZURE_SEARCH_SERVICE}.search.windows.net",
-                    "authentication": authentication,
-                    "index_name": AZURE_SEARCH_INDEX,
-                    "fields_mapping": {
-                        "content_fields": parse_multi_columns(AZURE_SEARCH_CONTENT_COLUMNS) if AZURE_SEARCH_CONTENT_COLUMNS else [],
-                        "title_field": AZURE_SEARCH_TITLE_COLUMN if AZURE_SEARCH_TITLE_COLUMN else None,
-                        "url_field": AZURE_SEARCH_URL_COLUMN if AZURE_SEARCH_URL_COLUMN else None,
-                        "filepath_field": AZURE_SEARCH_FILENAME_COLUMN if AZURE_SEARCH_FILENAME_COLUMN else None,
-                        "vector_fields": parse_multi_columns(AZURE_SEARCH_VECTOR_COLUMNS) if AZURE_SEARCH_VECTOR_COLUMNS else []
-                    },
-                    "in_scope": True if AZURE_SEARCH_ENABLE_IN_DOMAIN.lower() == "true" else False,
-                    "top_n_documents": int(AZURE_SEARCH_TOP_K) if AZURE_SEARCH_TOP_K else int(SEARCH_TOP_K),
-                    "query_type": query_type,
-                    "semantic_configuration": AZURE_SEARCH_SEMANTIC_SEARCH_CONFIG if AZURE_SEARCH_SEMANTIC_SEARCH_CONFIG else "",
-                    "role_information": AZURE_OPENAI_SYSTEM_MESSAGE,
-                    "filter": filter,
-                    "strictness": int(AZURE_SEARCH_STRICTNESS) if AZURE_SEARCH_STRICTNESS else int(SEARCH_STRICTNESS)
-                }
-            }
+            "type": "azure_search",
+            "parameters": {
+                "endpoint": f"https://{AZURE_SEARCH_SERVICE}.search.windows.net",
+                "authentication": authentication,
+                "index_name": AZURE_SEARCH_INDEX,
+                "fields_mapping": {
+                    "content_fields": (
+                        parse_multi_columns(AZURE_SEARCH_CONTENT_COLUMNS)
+                        if AZURE_SEARCH_CONTENT_COLUMNS
+                        else []
+                    ),
+                    "title_field": (
+                        AZURE_SEARCH_TITLE_COLUMN if AZURE_SEARCH_TITLE_COLUMN else None
+                    ),
+                    "url_field": (
+                        AZURE_SEARCH_URL_COLUMN if AZURE_SEARCH_URL_COLUMN else None
+                    ),
+                    "filepath_field": (
+                        AZURE_SEARCH_FILENAME_COLUMN
+                        if AZURE_SEARCH_FILENAME_COLUMN
+                        else None
+                    ),
+                    "vector_fields": (
+                        parse_multi_columns(AZURE_SEARCH_VECTOR_COLUMNS)
+                        if AZURE_SEARCH_VECTOR_COLUMNS
+                        else []
+                    ),
+                },
+                "in_scope": (
+                    True if AZURE_SEARCH_ENABLE_IN_DOMAIN.lower() == "true" else False
+                ),
+                "top_n_documents": (
+                    int(AZURE_SEARCH_TOP_K) if AZURE_SEARCH_TOP_K else int(SEARCH_TOP_K)
+                ),
+                "query_type": query_type,
+                "semantic_configuration": (
+                    AZURE_SEARCH_SEMANTIC_SEARCH_CONFIG
+                    if AZURE_SEARCH_SEMANTIC_SEARCH_CONFIG
+                    else ""
+                ),
+                "role_information": AZURE_OPENAI_SYSTEM_MESSAGE,
+                "filter": filter,
+                "strictness": (
+                    int(AZURE_SEARCH_STRICTNESS)
+                    if AZURE_SEARCH_STRICTNESS
+                    else int(SEARCH_STRICTNESS)
+                ),
+            },
+        }
     elif DATASOURCE_TYPE == "AzureCosmosDB":
         query_type = "vector"
 
         data_source = {
-                "type": "azure_cosmos_db",
-                "parameters": {
-                    "authentication": {
-                        "type": "connection_string",
-                        "connection_string": AZURE_COSMOSDB_MONGO_VCORE_CONNECTION_STRING
-                    },
-                    "index_name": AZURE_COSMOSDB_MONGO_VCORE_INDEX,
-                    "database_name": AZURE_COSMOSDB_MONGO_VCORE_DATABASE,
-                    "container_name": AZURE_COSMOSDB_MONGO_VCORE_CONTAINER,                    
-                    "fields_mapping": {
-                        "content_fields": parse_multi_columns(AZURE_COSMOSDB_MONGO_VCORE_CONTENT_COLUMNS) if AZURE_COSMOSDB_MONGO_VCORE_CONTENT_COLUMNS else [],
-                        "title_field": AZURE_COSMOSDB_MONGO_VCORE_TITLE_COLUMN if AZURE_COSMOSDB_MONGO_VCORE_TITLE_COLUMN else None,
-                        "url_field": AZURE_COSMOSDB_MONGO_VCORE_URL_COLUMN if AZURE_COSMOSDB_MONGO_VCORE_URL_COLUMN else None,
-                        "filepath_field": AZURE_COSMOSDB_MONGO_VCORE_FILENAME_COLUMN if AZURE_COSMOSDB_MONGO_VCORE_FILENAME_COLUMN else None,
-                        "vector_fields": parse_multi_columns(AZURE_COSMOSDB_MONGO_VCORE_VECTOR_COLUMNS) if AZURE_COSMOSDB_MONGO_VCORE_VECTOR_COLUMNS else []
-                    },
-                    "in_scope": True if AZURE_COSMOSDB_MONGO_VCORE_ENABLE_IN_DOMAIN.lower() == "true" else False,
-                    "top_n_documents": int(AZURE_COSMOSDB_MONGO_VCORE_TOP_K) if AZURE_COSMOSDB_MONGO_VCORE_TOP_K else int(SEARCH_TOP_K),
-                    "strictness": int(AZURE_COSMOSDB_MONGO_VCORE_STRICTNESS) if AZURE_COSMOSDB_MONGO_VCORE_STRICTNESS else int(SEARCH_STRICTNESS),
-                    "query_type": query_type,
-                    "role_information": AZURE_OPENAI_SYSTEM_MESSAGE
-                }
-            }
+            "type": "azure_cosmos_db",
+            "parameters": {
+                "authentication": {
+                    "type": "connection_string",
+                    "connection_string": AZURE_COSMOSDB_MONGO_VCORE_CONNECTION_STRING,
+                },
+                "index_name": AZURE_COSMOSDB_MONGO_VCORE_INDEX,
+                "database_name": AZURE_COSMOSDB_MONGO_VCORE_DATABASE,
+                "container_name": AZURE_COSMOSDB_MONGO_VCORE_CONTAINER,
+                "fields_mapping": {
+                    "content_fields": (
+                        parse_multi_columns(AZURE_COSMOSDB_MONGO_VCORE_CONTENT_COLUMNS)
+                        if AZURE_COSMOSDB_MONGO_VCORE_CONTENT_COLUMNS
+                        else []
+                    ),
+                    "title_field": (
+                        AZURE_COSMOSDB_MONGO_VCORE_TITLE_COLUMN
+                        if AZURE_COSMOSDB_MONGO_VCORE_TITLE_COLUMN
+                        else None
+                    ),
+                    "url_field": (
+                        AZURE_COSMOSDB_MONGO_VCORE_URL_COLUMN
+                        if AZURE_COSMOSDB_MONGO_VCORE_URL_COLUMN
+                        else None
+                    ),
+                    "filepath_field": (
+                        AZURE_COSMOSDB_MONGO_VCORE_FILENAME_COLUMN
+                        if AZURE_COSMOSDB_MONGO_VCORE_FILENAME_COLUMN
+                        else None
+                    ),
+                    "vector_fields": (
+                        parse_multi_columns(AZURE_COSMOSDB_MONGO_VCORE_VECTOR_COLUMNS)
+                        if AZURE_COSMOSDB_MONGO_VCORE_VECTOR_COLUMNS
+                        else []
+                    ),
+                },
+                "in_scope": (
+                    True
+                    if AZURE_COSMOSDB_MONGO_VCORE_ENABLE_IN_DOMAIN.lower() == "true"
+                    else False
+                ),
+                "top_n_documents": (
+                    int(AZURE_COSMOSDB_MONGO_VCORE_TOP_K)
+                    if AZURE_COSMOSDB_MONGO_VCORE_TOP_K
+                    else int(SEARCH_TOP_K)
+                ),
+                "strictness": (
+                    int(AZURE_COSMOSDB_MONGO_VCORE_STRICTNESS)
+                    if AZURE_COSMOSDB_MONGO_VCORE_STRICTNESS
+                    else int(SEARCH_STRICTNESS)
+                ),
+                "query_type": query_type,
+                "role_information": AZURE_OPENAI_SYSTEM_MESSAGE,
+            },
+        }
     elif DATASOURCE_TYPE == "Elasticsearch":
         if ELASTICSEARCH_QUERY_TYPE:
             query_type = ELASTICSEARCH_QUERY_TYPE
@@ -387,22 +545,50 @@ def get_configured_data_source():
                 "endpoint": ELASTICSEARCH_ENDPOINT,
                 "authentication": {
                     "type": "encoded_api_key",
-                    "encoded_api_key": ELASTICSEARCH_ENCODED_API_KEY
+                    "encoded_api_key": ELASTICSEARCH_ENCODED_API_KEY,
                 },
                 "index_name": ELASTICSEARCH_INDEX,
                 "fields_mapping": {
-                    "content_fields": parse_multi_columns(ELASTICSEARCH_CONTENT_COLUMNS) if ELASTICSEARCH_CONTENT_COLUMNS else [],
-                    "title_field": ELASTICSEARCH_TITLE_COLUMN if ELASTICSEARCH_TITLE_COLUMN else None,
-                    "url_field": ELASTICSEARCH_URL_COLUMN if ELASTICSEARCH_URL_COLUMN else None,
-                    "filepath_field": ELASTICSEARCH_FILENAME_COLUMN if ELASTICSEARCH_FILENAME_COLUMN else None,
-                    "vector_fields": parse_multi_columns(ELASTICSEARCH_VECTOR_COLUMNS) if ELASTICSEARCH_VECTOR_COLUMNS else []
+                    "content_fields": (
+                        parse_multi_columns(ELASTICSEARCH_CONTENT_COLUMNS)
+                        if ELASTICSEARCH_CONTENT_COLUMNS
+                        else []
+                    ),
+                    "title_field": (
+                        ELASTICSEARCH_TITLE_COLUMN
+                        if ELASTICSEARCH_TITLE_COLUMN
+                        else None
+                    ),
+                    "url_field": (
+                        ELASTICSEARCH_URL_COLUMN if ELASTICSEARCH_URL_COLUMN else None
+                    ),
+                    "filepath_field": (
+                        ELASTICSEARCH_FILENAME_COLUMN
+                        if ELASTICSEARCH_FILENAME_COLUMN
+                        else None
+                    ),
+                    "vector_fields": (
+                        parse_multi_columns(ELASTICSEARCH_VECTOR_COLUMNS)
+                        if ELASTICSEARCH_VECTOR_COLUMNS
+                        else []
+                    ),
                 },
-                "in_scope": True if ELASTICSEARCH_ENABLE_IN_DOMAIN.lower() == "true" else False,
-                "top_n_documents": int(ELASTICSEARCH_TOP_K) if ELASTICSEARCH_TOP_K else int(SEARCH_TOP_K),
+                "in_scope": (
+                    True if ELASTICSEARCH_ENABLE_IN_DOMAIN.lower() == "true" else False
+                ),
+                "top_n_documents": (
+                    int(ELASTICSEARCH_TOP_K)
+                    if ELASTICSEARCH_TOP_K
+                    else int(SEARCH_TOP_K)
+                ),
                 "query_type": query_type,
                 "role_information": AZURE_OPENAI_SYSTEM_MESSAGE,
-                "strictness": int(ELASTICSEARCH_STRICTNESS) if ELASTICSEARCH_STRICTNESS else int(SEARCH_STRICTNESS)
-            }
+                "strictness": (
+                    int(ELASTICSEARCH_STRICTNESS)
+                    if ELASTICSEARCH_STRICTNESS
+                    else int(SEARCH_STRICTNESS)
+                ),
+            },
         }
     elif DATASOURCE_TYPE == "AzureMLIndex":
         if AZURE_MLINDEX_QUERY_TYPE:
@@ -415,18 +601,46 @@ def get_configured_data_source():
                 "version": AZURE_MLINDEX_VERSION,
                 "project_resource_id": AZURE_ML_PROJECT_RESOURCE_ID,
                 "fieldsMapping": {
-                    "content_fields": parse_multi_columns(AZURE_MLINDEX_CONTENT_COLUMNS) if AZURE_MLINDEX_CONTENT_COLUMNS else [],
-                    "title_field": AZURE_MLINDEX_TITLE_COLUMN if AZURE_MLINDEX_TITLE_COLUMN else None,
-                    "url_field": AZURE_MLINDEX_URL_COLUMN if AZURE_MLINDEX_URL_COLUMN else None,
-                    "filepath_field": AZURE_MLINDEX_FILENAME_COLUMN if AZURE_MLINDEX_FILENAME_COLUMN else None,
-                    "vector_fields": parse_multi_columns(AZURE_MLINDEX_VECTOR_COLUMNS) if AZURE_MLINDEX_VECTOR_COLUMNS else []
+                    "content_fields": (
+                        parse_multi_columns(AZURE_MLINDEX_CONTENT_COLUMNS)
+                        if AZURE_MLINDEX_CONTENT_COLUMNS
+                        else []
+                    ),
+                    "title_field": (
+                        AZURE_MLINDEX_TITLE_COLUMN
+                        if AZURE_MLINDEX_TITLE_COLUMN
+                        else None
+                    ),
+                    "url_field": (
+                        AZURE_MLINDEX_URL_COLUMN if AZURE_MLINDEX_URL_COLUMN else None
+                    ),
+                    "filepath_field": (
+                        AZURE_MLINDEX_FILENAME_COLUMN
+                        if AZURE_MLINDEX_FILENAME_COLUMN
+                        else None
+                    ),
+                    "vector_fields": (
+                        parse_multi_columns(AZURE_MLINDEX_VECTOR_COLUMNS)
+                        if AZURE_MLINDEX_VECTOR_COLUMNS
+                        else []
+                    ),
                 },
-                "in_scope": True if AZURE_MLINDEX_ENABLE_IN_DOMAIN.lower() == "true" else False,
-                "top_n_documents": int(AZURE_MLINDEX_TOP_K) if AZURE_MLINDEX_TOP_K else int(SEARCH_TOP_K),
+                "in_scope": (
+                    True if AZURE_MLINDEX_ENABLE_IN_DOMAIN.lower() == "true" else False
+                ),
+                "top_n_documents": (
+                    int(AZURE_MLINDEX_TOP_K)
+                    if AZURE_MLINDEX_TOP_K
+                    else int(SEARCH_TOP_K)
+                ),
                 "query_type": query_type,
                 "role_information": AZURE_OPENAI_SYSTEM_MESSAGE,
-                "strictness": int(AZURE_MLINDEX_STRICTNESS) if AZURE_MLINDEX_STRICTNESS else int(SEARCH_STRICTNESS)
-            }
+                "strictness": (
+                    int(AZURE_MLINDEX_STRICTNESS)
+                    if AZURE_MLINDEX_STRICTNESS
+                    else int(SEARCH_STRICTNESS)
+                ),
+            },
         }
     elif DATASOURCE_TYPE == "Pinecone":
         query_type = "vector"
@@ -435,34 +649,53 @@ def get_configured_data_source():
             "type": "pinecone",
             "parameters": {
                 "environment": PINECONE_ENVIRONMENT,
-                "authentication": {
-                    "type": "api_key",
-                    "key": PINECONE_API_KEY
-                },
+                "authentication": {"type": "api_key", "key": PINECONE_API_KEY},
                 "index_name": PINECONE_INDEX_NAME,
                 "fields_mapping": {
-                    "content_fields": parse_multi_columns(PINECONE_CONTENT_COLUMNS) if PINECONE_CONTENT_COLUMNS else [],
-                    "title_field": PINECONE_TITLE_COLUMN if PINECONE_TITLE_COLUMN else None,
+                    "content_fields": (
+                        parse_multi_columns(PINECONE_CONTENT_COLUMNS)
+                        if PINECONE_CONTENT_COLUMNS
+                        else []
+                    ),
+                    "title_field": (
+                        PINECONE_TITLE_COLUMN if PINECONE_TITLE_COLUMN else None
+                    ),
                     "url_field": PINECONE_URL_COLUMN if PINECONE_URL_COLUMN else None,
-                    "filepath_field": PINECONE_FILENAME_COLUMN if PINECONE_FILENAME_COLUMN else None,
-                    "vector_fields": parse_multi_columns(PINECONE_VECTOR_COLUMNS) if PINECONE_VECTOR_COLUMNS else []
+                    "filepath_field": (
+                        PINECONE_FILENAME_COLUMN if PINECONE_FILENAME_COLUMN else None
+                    ),
+                    "vector_fields": (
+                        parse_multi_columns(PINECONE_VECTOR_COLUMNS)
+                        if PINECONE_VECTOR_COLUMNS
+                        else []
+                    ),
                 },
-                "in_scope": True if PINECONE_ENABLE_IN_DOMAIN.lower() == "true" else False,
-                "top_n_documents": int(PINECONE_TOP_K) if PINECONE_TOP_K else int(SEARCH_TOP_K),
-                "strictness": int(PINECONE_STRICTNESS) if PINECONE_STRICTNESS else int(SEARCH_STRICTNESS),
+                "in_scope": (
+                    True if PINECONE_ENABLE_IN_DOMAIN.lower() == "true" else False
+                ),
+                "top_n_documents": (
+                    int(PINECONE_TOP_K) if PINECONE_TOP_K else int(SEARCH_TOP_K)
+                ),
+                "strictness": (
+                    int(PINECONE_STRICTNESS)
+                    if PINECONE_STRICTNESS
+                    else int(SEARCH_STRICTNESS)
+                ),
                 "query_type": query_type,
                 "role_information": AZURE_OPENAI_SYSTEM_MESSAGE,
-            }
+            },
         }
     else:
-        raise Exception(f"DATASOURCE_TYPE is not configured or unknown: {DATASOURCE_TYPE}")
+        raise Exception(
+            f"DATASOURCE_TYPE is not configured or unknown: {DATASOURCE_TYPE}"
+        )
 
     if "vector" in query_type.lower() and DATASOURCE_TYPE != "AzureMLIndex":
         embeddingDependency = {}
         if AZURE_OPENAI_EMBEDDING_NAME:
             embeddingDependency = {
                 "type": "deployment_name",
-                "deployment_name": AZURE_OPENAI_EMBEDDING_NAME
+                "deployment_name": AZURE_OPENAI_EMBEDDING_NAME,
             }
         elif AZURE_OPENAI_EMBEDDING_ENDPOINT and AZURE_OPENAI_EMBEDDING_KEY:
             embeddingDependency = {
@@ -470,73 +703,122 @@ def get_configured_data_source():
                 "endpoint": AZURE_OPENAI_EMBEDDING_ENDPOINT,
                 "authentication": {
                     "type": "api_key",
-                    "key": AZURE_OPENAI_EMBEDDING_KEY
-                }
+                    "key": AZURE_OPENAI_EMBEDDING_KEY,
+                },
             }
         elif DATASOURCE_TYPE == "Elasticsearch" and ELASTICSEARCH_EMBEDDING_MODEL_ID:
             embeddingDependency = {
                 "type": "model_id",
-                "model_id": ELASTICSEARCH_EMBEDDING_MODEL_ID
+                "model_id": ELASTICSEARCH_EMBEDDING_MODEL_ID,
             }
         else:
-            raise Exception(f"Vector query type ({query_type}) is selected for data source type {DATASOURCE_TYPE} but no embedding dependency is configured")
+            raise Exception(
+                f"Vector query type ({query_type}) is selected for data source type {DATASOURCE_TYPE} but no embedding dependency is configured"
+            )
         data_source["parameters"]["embedding_dependency"] = embeddingDependency
 
     return data_source
 
+
 def prepare_model_args(request_body):
     request_messages = request_body.get("messages", [])
     messages = []
     if not SHOULD_USE_DATA:
-        messages = [
-            {
-                "role": "system",
-                "content": AZURE_OPENAI_SYSTEM_MESSAGE
-            }
-        ]
+        messages = [{"role": "system", "content": AZURE_OPENAI_SYSTEM_MESSAGE}]
 
     for message in request_messages:
         if message:
-            messages.append({
-                "role": message["role"] ,
-                "content": message["content"]
-            })
+            messages.append({"role": message["role"], "content": message["content"]})
 
     model_args = {
         "messages": messages,
         "temperature": float(AZURE_OPENAI_TEMPERATURE),
         "max_tokens": int(AZURE_OPENAI_MAX_TOKENS),
         "top_p": float(AZURE_OPENAI_TOP_P),
-        "stop": parse_multi_columns(AZURE_OPENAI_STOP_SEQUENCE) if AZURE_OPENAI_STOP_SEQUENCE else None,
+        "stop": (
+            parse_multi_columns(AZURE_OPENAI_STOP_SEQUENCE)
+            if AZURE_OPENAI_STOP_SEQUENCE
+            else None
+        ),
         "stream": SHOULD_STREAM,
         "model": AZURE_OPENAI_MODEL,
     }
 
     if SHOULD_USE_DATA:
-        model_args["extra_body"] = {
-            "data_sources": [get_configured_data_source()]
-        }
+        model_args["extra_body"] = {"data_sources": [get_configured_data_source()]}
 
     model_args_clean = copy.deepcopy(model_args)
     if model_args_clean.get("extra_body"):
-        secret_params = ["key", "connection_string", "embedding_key", "encoded_api_key", "api_key"]
+        secret_params = [
+            "key",
+            "connection_string",
+            "embedding_key",
+            "encoded_api_key",
+            "api_key",
+        ]
         for secret_param in secret_params:
-            if model_args_clean["extra_body"]["data_sources"][0]["parameters"].get(secret_param):
-                model_args_clean["extra_body"]["data_sources"][0]["parameters"][secret_param] = "*****"
-        authentication = model_args_clean["extra_body"]["data_sources"][0]["parameters"].get("authentication", {})
+            if model_args_clean["extra_body"]["data_sources"][0]["parameters"].get(
+                secret_param
+            ):
+                model_args_clean["extra_body"]["data_sources"][0]["parameters"][
+                    secret_param
+                ] = "*****"
+        authentication = model_args_clean["extra_body"]["data_sources"][0][
+            "parameters"
+        ].get("authentication", {})
         for field in authentication:
             if field in secret_params:
-                model_args_clean["extra_body"]["data_sources"][0]["parameters"]["authentication"][field] = "*****"
-        embeddingDependency = model_args_clean["extra_body"]["data_sources"][0]["parameters"].get("embedding_dependency", {})
+                model_args_clean["extra_body"]["data_sources"][0]["parameters"][
+                    "authentication"
+                ][field] = "*****"
+        embeddingDependency = model_args_clean["extra_body"]["data_sources"][0][
+            "parameters"
+        ].get("embedding_dependency", {})
         if "authentication" in embeddingDependency:
             for field in embeddingDependency["authentication"]:
                 if field in secret_params:
-                    model_args_clean["extra_body"]["data_sources"][0]["parameters"]["embedding_dependency"]["authentication"][field] = "*****"
-        
+                    model_args_clean["extra_body"]["data_sources"][0]["parameters"][
+                        "embedding_dependency"
+                    ]["authentication"][field] = "*****"
+
     logging.debug(f"REQUEST BODY: {json.dumps(model_args_clean, indent=4)}")
-    
+
     return model_args
 
+
+async def promptflow_request(request):
+    try:
+        headers = {
+            "Content-Type": "application/json",
+            "Authorization": f"Bearer {PROMPTFLOW_API_KEY}",
+        }
+        # Adding timeout for scenarios where response takes longer to come back
+        logging.debug(f"Setting timeout to {PROMPTFLOW_RESPONSE_TIMEOUT}")
+        async with httpx.AsyncClient(
+            timeout=float(PROMPTFLOW_RESPONSE_TIMEOUT)
+        ) as client:
+            pf_formatted_obj = convert_to_pf_format(
+                request, PROMPTFLOW_REQUEST_FIELD_NAME, PROMPTFLOW_RESPONSE_FIELD_NAME
+            )
+            # NOTE: This only support question and chat_history parameters
+            # If you need to add more parameters, you need to modify the request body
+            response = await client.post(
+                PROMPTFLOW_ENDPOINT,
+                json={
+                    f"{PROMPTFLOW_REQUEST_FIELD_NAME}": pf_formatted_obj[-1]["inputs"][
+                        PROMPTFLOW_REQUEST_FIELD_NAME
+                    ],
+                    "chat_history": pf_formatted_obj[:-1],
+                },
+                headers=headers,
+            )
+        resp = response.json()
+        resp["id"] = request["messages"][-1]["id"]
+        return resp
+    except Exception as e:
+        logging.error(f"An error occurred while making promptflow_request: {e}")
+
+
 async def send_chat_request(request):
     model_args = prepare_model_args(request)
 
@@ -550,11 +832,19 @@ async def send_chat_request(request):
 
     return response
 
+
 async def complete_chat_request(request_body):
-    response = await send_chat_request(request_body)
-    history_metadata = request_body.get("history_metadata", {})
+    if USE_PROMPTFLOW and PROMPTFLOW_ENDPOINT and PROMPTFLOW_API_KEY:
+        response = await promptflow_request(request_body)
+        history_metadata = request_body.get("history_metadata", {})
+        return format_pf_non_streaming_response(
+            response, history_metadata, PROMPTFLOW_RESPONSE_FIELD_NAME
+        )
+    else:
+        response = await send_chat_request(request_body)
+        history_metadata = request_body.get("history_metadata", {})
+        return format_non_streaming_response(response, history_metadata)
 
-    return format_non_streaming_response(response, history_metadata)
 
 async def stream_chat_request(request_body):
     response = await send_chat_request(request_body)
@@ -566,6 +856,7 @@ async def generate():
 
     return generate()
 
+
 async def conversation_internal(request_body):
     try:
         if SHOULD_STREAM:
@@ -577,7 +868,7 @@ async def conversation_internal(request_body):
         else:
             result = await complete_chat_request(request_body)
             return jsonify(result)
-    
+
     except Exception as ex:
         logging.exception(ex)
         if hasattr(ex, "status_code"):
@@ -591,26 +882,28 @@ async def conversation():
     if not request.is_json:
         return jsonify({"error": "request must be json"}), 415
     request_json = await request.get_json()
-    
+
     return await conversation_internal(request_json)
 
-@bp.route("/frontend_settings", methods=["GET"])  
+
+@bp.route("/frontend_settings", methods=["GET"])
 def get_frontend_settings():
     try:
         return jsonify(frontend_settings), 200
     except Exception as e:
         logging.exception("Exception in /frontend_settings")
-        return jsonify({"error": str(e)}), 500  
+        return jsonify({"error": str(e)}), 500
 
-## Conversation History API ## 
+
+## Conversation History API ##
 @bp.route("/history/generate", methods=["POST"])
 async def add_conversation():
     authenticated_user = get_authenticated_user_details(request_headers=request.headers)
-    user_id = authenticated_user['user_principal_id']
+    user_id = authenticated_user["user_principal_id"]
 
     ## check request for conversation_id
     request_json = await request.get_json()
-    conversation_id = request_json.get('conversation_id', None)
+    conversation_id = request_json.get("conversation_id", None)
 
     try:
         # make sure cosmos is configured
@@ -622,34 +915,40 @@ async def add_conversation():
         history_metadata = {}
         if not conversation_id:
             title = await generate_title(request_json["messages"])
-            conversation_dict = await cosmos_conversation_client.create_conversation(user_id=user_id, title=title)
-            conversation_id = conversation_dict['id']
-            history_metadata['title'] = title
-            history_metadata['date'] = conversation_dict['createdAt']
-            
+            conversation_dict = await cosmos_conversation_client.create_conversation(
+                user_id=user_id, title=title
+            )
+            conversation_id = conversation_dict["id"]
+            history_metadata["title"] = title
+            history_metadata["date"] = conversation_dict["createdAt"]
+
         ## Format the incoming message object in the "chat/completions" messages format
         ## then write it to the conversation history in cosmos
         messages = request_json["messages"]
-        if len(messages) > 0 and messages[-1]['role'] == "user":
+        if len(messages) > 0 and messages[-1]["role"] == "user":
             createdMessageValue = await cosmos_conversation_client.create_message(
                 uuid=str(uuid.uuid4()),
                 conversation_id=conversation_id,
                 user_id=user_id,
-                input_message=messages[-1]
+                input_message=messages[-1],
             )
             if createdMessageValue == "Conversation not found":
-                raise Exception("Conversation not found for the given conversation ID: " + conversation_id + ".")
+                raise Exception(
+                    "Conversation not found for the given conversation ID: "
+                    + conversation_id
+                    + "."
+                )
         else:
             raise Exception("No user message found")
-        
+
         await cosmos_conversation_client.cosmosdb_client.close()
-        
+
         # Submit request to Chat Completions for response
         request_body = await request.get_json()
-        history_metadata['conversation_id'] = conversation_id
-        request_body['history_metadata'] = history_metadata
+        history_metadata["conversation_id"] = conversation_id
+        request_body["history_metadata"] = history_metadata
         return await conversation_internal(request_body)
-       
+
     except Exception as e:
         logging.exception("Exception in /history/generate")
         return jsonify({"error": str(e)}), 500
@@ -658,11 +957,11 @@ async def add_conversation():
 @bp.route("/history/update", methods=["POST"])
 async def update_conversation():
     authenticated_user = get_authenticated_user_details(request_headers=request.headers)
-    user_id = authenticated_user['user_principal_id']
+    user_id = authenticated_user["user_principal_id"]
 
     ## check request for conversation_id
     request_json = await request.get_json()
-    conversation_id = request_json.get('conversation_id', None)
+    conversation_id = request_json.get("conversation_id", None)
 
     try:
         # make sure cosmos is configured
@@ -673,62 +972,80 @@ async def update_conversation():
         # check for the conversation_id, if the conversation is not set, we will create a new one
         if not conversation_id:
             raise Exception("No conversation_id found")
-            
+
         ## Format the incoming message object in the "chat/completions" messages format
         ## then write it to the conversation history in cosmos
         messages = request_json["messages"]
-        if len(messages) > 0 and messages[-1]['role'] == "assistant":
-            if len(messages) > 1 and messages[-2].get('role', None) == "tool":
+        if len(messages) > 0 and messages[-1]["role"] == "assistant":
+            if len(messages) > 1 and messages[-2].get("role", None) == "tool":
                 # write the tool message first
                 await cosmos_conversation_client.create_message(
                     uuid=str(uuid.uuid4()),
                     conversation_id=conversation_id,
                     user_id=user_id,
-                    input_message=messages[-2]
+                    input_message=messages[-2],
                 )
             # write the assistant message
             await cosmos_conversation_client.create_message(
-                uuid=messages[-1]['id'],
+                uuid=messages[-1]["id"],
                 conversation_id=conversation_id,
                 user_id=user_id,
-                input_message=messages[-1]
+                input_message=messages[-1],
             )
         else:
             raise Exception("No bot messages found")
-        
+
         # Submit request to Chat Completions for response
         await cosmos_conversation_client.cosmosdb_client.close()
-        response = {'success': True}
+        response = {"success": True}
         return jsonify(response), 200
-       
+
     except Exception as e:
         logging.exception("Exception in /history/update")
         return jsonify({"error": str(e)}), 500
 
+
 @bp.route("/history/message_feedback", methods=["POST"])
 async def update_message():
     authenticated_user = get_authenticated_user_details(request_headers=request.headers)
-    user_id = authenticated_user['user_principal_id']
+    user_id = authenticated_user["user_principal_id"]
     cosmos_conversation_client = init_cosmosdb_client()
 
     ## check request for message_id
     request_json = await request.get_json()
-    message_id = request_json.get('message_id', None)
+    message_id = request_json.get("message_id", None)
     message_feedback = request_json.get("message_feedback", None)
     try:
         if not message_id:
             return jsonify({"error": "message_id is required"}), 400
-        
+
         if not message_feedback:
             return jsonify({"error": "message_feedback is required"}), 400
-        
+
         ## update the message in cosmos
-        updated_message = await cosmos_conversation_client.update_message_feedback(user_id, message_id, message_feedback)
+        updated_message = await cosmos_conversation_client.update_message_feedback(
+            user_id, message_id, message_feedback
+        )
         if updated_message:
-            return jsonify({"message": f"Successfully updated message with feedback {message_feedback}", "message_id": message_id}), 200
+            return (
+                jsonify(
+                    {
+                        "message": f"Successfully updated message with feedback {message_feedback}",
+                        "message_id": message_id,
+                    }
+                ),
+                200,
+            )
         else:
-            return jsonify({"error": f"Unable to update message {message_id}. It either does not exist or the user does not have access to it."}), 404
-        
+            return (
+                jsonify(
+                    {
+                        "error": f"Unable to update message {message_id}. It either does not exist or the user does not have access to it."
+                    }
+                ),
+                404,
+            )
+
     except Exception as e:
         logging.exception("Exception in /history/message_feedback")
         return jsonify({"error": str(e)}), 500
@@ -738,30 +1055,42 @@ async def update_message():
 async def delete_conversation():
     ## get the user id from the request headers
     authenticated_user = get_authenticated_user_details(request_headers=request.headers)
-    user_id = authenticated_user['user_principal_id']
-    
+    user_id = authenticated_user["user_principal_id"]
+
     ## check request for conversation_id
     request_json = await request.get_json()
-    conversation_id = request_json.get('conversation_id', None)
+    conversation_id = request_json.get("conversation_id", None)
 
-    try: 
+    try:
         if not conversation_id:
             return jsonify({"error": "conversation_id is required"}), 400
-        
+
         ## make sure cosmos is configured
         cosmos_conversation_client = init_cosmosdb_client()
         if not cosmos_conversation_client:
             raise Exception("CosmosDB is not configured or not working")
 
         ## delete the conversation messages from cosmos first
-        deleted_messages = await cosmos_conversation_client.delete_messages(conversation_id, user_id)
+        deleted_messages = await cosmos_conversation_client.delete_messages(
+            conversation_id, user_id
+        )
 
-        ## Now delete the conversation 
-        deleted_conversation = await cosmos_conversation_client.delete_conversation(user_id, conversation_id)
+        ## Now delete the conversation
+        deleted_conversation = await cosmos_conversation_client.delete_conversation(
+            user_id, conversation_id
+        )
 
         await cosmos_conversation_client.cosmosdb_client.close()
 
-        return jsonify({"message": "Successfully deleted conversation and messages", "conversation_id": conversation_id}), 200
+        return (
+            jsonify(
+                {
+                    "message": "Successfully deleted conversation and messages",
+                    "conversation_id": conversation_id,
+                }
+            ),
+            200,
+        )
     except Exception as e:
         logging.exception("Exception in /history/delete")
         return jsonify({"error": str(e)}), 500
@@ -771,7 +1100,7 @@ async def delete_conversation():
 async def list_conversations():
     offset = request.args.get("offset", 0)
     authenticated_user = get_authenticated_user_details(request_headers=request.headers)
-    user_id = authenticated_user['user_principal_id']
+    user_id = authenticated_user["user_principal_id"]
 
     ## make sure cosmos is configured
     cosmos_conversation_client = init_cosmosdb_client()
@@ -779,7 +1108,9 @@ async def list_conversations():
         raise Exception("CosmosDB is not configured or not working")
 
     ## get the conversations from cosmos
-    conversations = await cosmos_conversation_client.get_conversations(user_id, offset=offset, limit=25)
+    conversations = await cosmos_conversation_client.get_conversations(
+        user_id, offset=offset, limit=25
+    )
     await cosmos_conversation_client.cosmosdb_client.close()
     if not isinstance(conversations, list):
         return jsonify({"error": f"No conversations for {user_id} were found"}), 404
@@ -792,72 +1123,105 @@ async def list_conversations():
 @bp.route("/history/read", methods=["POST"])
 async def get_conversation():
     authenticated_user = get_authenticated_user_details(request_headers=request.headers)
-    user_id = authenticated_user['user_principal_id']
+    user_id = authenticated_user["user_principal_id"]
 
     ## check request for conversation_id
     request_json = await request.get_json()
-    conversation_id = request_json.get('conversation_id', None)
-    
+    conversation_id = request_json.get("conversation_id", None)
+
     if not conversation_id:
         return jsonify({"error": "conversation_id is required"}), 400
-    
+
     ## make sure cosmos is configured
     cosmos_conversation_client = init_cosmosdb_client()
     if not cosmos_conversation_client:
         raise Exception("CosmosDB is not configured or not working")
 
     ## get the conversation object and the related messages from cosmos
-    conversation = await cosmos_conversation_client.get_conversation(user_id, conversation_id)
+    conversation = await cosmos_conversation_client.get_conversation(
+        user_id, conversation_id
+    )
     ## return the conversation id and the messages in the bot frontend format
     if not conversation:
-        return jsonify({"error": f"Conversation {conversation_id} was not found. It either does not exist or the logged in user does not have access to it."}), 404
-    
+        return (
+            jsonify(
+                {
+                    "error": f"Conversation {conversation_id} was not found. It either does not exist or the logged in user does not have access to it."
+                }
+            ),
+            404,
+        )
+
     # get the messages for the conversation from cosmos
-    conversation_messages = await cosmos_conversation_client.get_messages(user_id, conversation_id)
+    conversation_messages = await cosmos_conversation_client.get_messages(
+        user_id, conversation_id
+    )
 
     ## format the messages in the bot frontend format
-    messages = [{'id': msg['id'], 'role': msg['role'], 'content': msg['content'], 'createdAt': msg['createdAt'], 'feedback': msg.get('feedback')} for msg in conversation_messages]
+    messages = [
+        {
+            "id": msg["id"],
+            "role": msg["role"],
+            "content": msg["content"],
+            "createdAt": msg["createdAt"],
+            "feedback": msg.get("feedback"),
+        }
+        for msg in conversation_messages
+    ]
 
     await cosmos_conversation_client.cosmosdb_client.close()
     return jsonify({"conversation_id": conversation_id, "messages": messages}), 200
 
+
 @bp.route("/history/rename", methods=["POST"])
 async def rename_conversation():
     authenticated_user = get_authenticated_user_details(request_headers=request.headers)
-    user_id = authenticated_user['user_principal_id']
+    user_id = authenticated_user["user_principal_id"]
 
     ## check request for conversation_id
     request_json = await request.get_json()
-    conversation_id = request_json.get('conversation_id', None)
-    
+    conversation_id = request_json.get("conversation_id", None)
+
     if not conversation_id:
         return jsonify({"error": "conversation_id is required"}), 400
-    
+
     ## make sure cosmos is configured
     cosmos_conversation_client = init_cosmosdb_client()
     if not cosmos_conversation_client:
         raise Exception("CosmosDB is not configured or not working")
-    
+
     ## get the conversation from cosmos
-    conversation = await cosmos_conversation_client.get_conversation(user_id, conversation_id)
+    conversation = await cosmos_conversation_client.get_conversation(
+        user_id, conversation_id
+    )
     if not conversation:
-        return jsonify({"error": f"Conversation {conversation_id} was not found. It either does not exist or the logged in user does not have access to it."}), 404
+        return (
+            jsonify(
+                {
+                    "error": f"Conversation {conversation_id} was not found. It either does not exist or the logged in user does not have access to it."
+                }
+            ),
+            404,
+        )
 
     ## update the title
     title = request_json.get("title", None)
     if not title:
         return jsonify({"error": "title is required"}), 400
-    conversation['title'] = title
-    updated_conversation = await cosmos_conversation_client.upsert_conversation(conversation)
+    conversation["title"] = title
+    updated_conversation = await cosmos_conversation_client.upsert_conversation(
+        conversation
+    )
 
     await cosmos_conversation_client.cosmosdb_client.close()
     return jsonify(updated_conversation), 200
 
+
 @bp.route("/history/delete_all", methods=["DELETE"])
 async def delete_all_conversations():
     ## get the user id from the request headers
     authenticated_user = get_authenticated_user_details(request_headers=request.headers)
-    user_id = authenticated_user['user_principal_id']
+    user_id = authenticated_user["user_principal_id"]
 
     # get conversations for user
     try:
@@ -866,47 +1230,71 @@ async def delete_all_conversations():
         if not cosmos_conversation_client:
             raise Exception("CosmosDB is not configured or not working")
 
-        conversations = await cosmos_conversation_client.get_conversations(user_id, offset=0, limit=None)
+        conversations = await cosmos_conversation_client.get_conversations(
+            user_id, offset=0, limit=None
+        )
         if not conversations:
             return jsonify({"error": f"No conversations for {user_id} were found"}), 404
-        
+
         # delete each conversation
         for conversation in conversations:
             ## delete the conversation messages from cosmos first
-            deleted_messages = await cosmos_conversation_client.delete_messages(conversation['id'], user_id)
+            deleted_messages = await cosmos_conversation_client.delete_messages(
+                conversation["id"], user_id
+            )
 
-            ## Now delete the conversation 
-            deleted_conversation = await cosmos_conversation_client.delete_conversation(user_id, conversation['id'])
+            ## Now delete the conversation
+            deleted_conversation = await cosmos_conversation_client.delete_conversation(
+                user_id, conversation["id"]
+            )
         await cosmos_conversation_client.cosmosdb_client.close()
-        return jsonify({"message": f"Successfully deleted conversation and messages for user {user_id}"}), 200
-    
+        return (
+            jsonify(
+                {
+                    "message": f"Successfully deleted conversation and messages for user {user_id}"
+                }
+            ),
+            200,
+        )
+
     except Exception as e:
         logging.exception("Exception in /history/delete_all")
         return jsonify({"error": str(e)}), 500
 
+
 @bp.route("/history/clear", methods=["POST"])
 async def clear_messages():
     ## get the user id from the request headers
     authenticated_user = get_authenticated_user_details(request_headers=request.headers)
-    user_id = authenticated_user['user_principal_id']
-    
+    user_id = authenticated_user["user_principal_id"]
+
     ## check request for conversation_id
     request_json = await request.get_json()
-    conversation_id = request_json.get('conversation_id', None)
+    conversation_id = request_json.get("conversation_id", None)
 
-    try: 
+    try:
         if not conversation_id:
             return jsonify({"error": "conversation_id is required"}), 400
-        
+
         ## make sure cosmos is configured
         cosmos_conversation_client = init_cosmosdb_client()
         if not cosmos_conversation_client:
             raise Exception("CosmosDB is not configured or not working")
 
         ## delete the conversation messages from cosmos
-        deleted_messages = await cosmos_conversation_client.delete_messages(conversation_id, user_id)
+        deleted_messages = await cosmos_conversation_client.delete_messages(
+            conversation_id, user_id
+        )
 
-        return jsonify({"message": "Successfully deleted messages in conversation", "conversation_id": conversation_id}), 200
+        return (
+            jsonify(
+                {
+                    "message": "Successfully deleted messages in conversation",
+                    "conversation_id": conversation_id,
+                }
+            ),
+            200,
+        )
     except Exception as e:
         logging.exception("Exception in /history/clear_messages")
         return jsonify({"error": str(e)}), 500
@@ -916,7 +1304,7 @@ async def clear_messages():
 async def ensure_cosmos():
     if not AZURE_COSMOSDB_ACCOUNT:
         return jsonify({"error": "CosmosDB is not configured"}), 404
-    
+
     try:
         cosmos_conversation_client = init_cosmosdb_client()
         success, err = await cosmos_conversation_client.ensure()
@@ -924,7 +1312,7 @@ async def ensure_cosmos():
             if err:
                 return jsonify({"error": err}), 422
             return jsonify({"error": "CosmosDB is not configured or not working"}), 500
-        
+
         await cosmos_conversation_client.cosmosdb_client.close()
         return jsonify({"message": "CosmosDB is configured and working"}), 200
     except Exception as e:
@@ -933,9 +1321,23 @@ async def ensure_cosmos():
         if "Invalid credentials" in cosmos_exception:
             return jsonify({"error": cosmos_exception}), 401
         elif "Invalid CosmosDB database name" in cosmos_exception:
-            return jsonify({"error": f"{cosmos_exception} {AZURE_COSMOSDB_DATABASE} for account {AZURE_COSMOSDB_ACCOUNT}"}), 422
+            return (
+                jsonify(
+                    {
+                        "error": f"{cosmos_exception} {AZURE_COSMOSDB_DATABASE} for account {AZURE_COSMOSDB_ACCOUNT}"
+                    }
+                ),
+                422,
+            )
         elif "Invalid CosmosDB container name" in cosmos_exception:
-            return jsonify({"error": f"{cosmos_exception}: {AZURE_COSMOSDB_CONVERSATIONS_CONTAINER}"}), 422
+            return (
+                jsonify(
+                    {
+                        "error": f"{cosmos_exception}: {AZURE_COSMOSDB_CONVERSATIONS_CONTAINER}"
+                    }
+                ),
+                422,
+            )
         else:
             return jsonify({"error": "CosmosDB is not working"}), 500
 
@@ -944,22 +1346,22 @@ async def generate_title(conversation_messages):
     ## make sure the messages are sorted by _ts descending
     title_prompt = 'Summarize the conversation so far into a 4-word or less title. Do not use any quotation marks or punctuation. Respond with a json object in the format {{"title": string}}. Do not include any other commentary or description.'
 
-    messages = [{'role': msg['role'], 'content': msg['content']} for msg in conversation_messages]
-    messages.append({'role': 'user', 'content': title_prompt})
+    messages = [
+        {"role": msg["role"], "content": msg["content"]}
+        for msg in conversation_messages
+    ]
+    messages.append({"role": "user", "content": title_prompt})
 
     try:
         azure_openai_client = init_openai_client(use_data=False)
         response = await azure_openai_client.chat.completions.create(
-            model=AZURE_OPENAI_MODEL,
-            messages=messages,
-            temperature=1,
-            max_tokens=64
+            model=AZURE_OPENAI_MODEL, messages=messages, temperature=1, max_tokens=64
         )
-        
-        title = json.loads(response.choices[0].message.content)['title']
+
+        title = json.loads(response.choices[0].message.content)["title"]
         return title
     except Exception as e:
-        return messages[-2]['content']
+        return messages[-2]["content"]
 
 
-app = create_app()
\ No newline at end of file
+app = create_app()
diff --git a/backend/utils.py b/backend/utils.py
index 45ccd8dc3e..3b2a856c9d 100644
--- a/backend/utils.py
+++ b/backend/utils.py
@@ -8,7 +8,10 @@
 if DEBUG.lower() == "true":
     logging.basicConfig(level=logging.DEBUG)
 
-AZURE_SEARCH_PERMITTED_GROUPS_COLUMN = os.environ.get("AZURE_SEARCH_PERMITTED_GROUPS_COLUMN")
+AZURE_SEARCH_PERMITTED_GROUPS_COLUMN = os.environ.get(
+    "AZURE_SEARCH_PERMITTED_GROUPS_COLUMN"
+)
+
 
 class JSONEncoder(json.JSONEncoder):
     def default(self, o):
@@ -16,6 +19,7 @@ def default(self, o):
             return dataclasses.asdict(o)
         return super().default(o)
 
+
 async def format_as_ndjson(r):
     try:
         async for event in r:
@@ -24,6 +28,7 @@ async def format_as_ndjson(r):
         logging.exception("Exception while generating response stream: %s", error)
         yield json.dumps({"error": str(error)})
 
+
 def parse_multi_columns(columns: str) -> list:
     if "|" in columns:
         return columns.split("|")
@@ -37,22 +42,20 @@ def fetchUserGroups(userToken, nextLink=None):
         endpoint = nextLink
     else:
         endpoint = "https://graph.microsoft.com/v1.0/me/transitiveMemberOf?$select=id"
-    
-    headers = {
-        'Authorization': "bearer " + userToken
-    }
-    try :
+
+    headers = {"Authorization": "bearer " + userToken}
+    try:
         r = requests.get(endpoint, headers=headers)
         if r.status_code != 200:
             logging.error(f"Error fetching user groups: {r.status_code} {r.text}")
             return []
-        
+
         r = r.json()
         if "@odata.nextLink" in r:
             nextLinkData = fetchUserGroups(userToken, r["@odata.nextLink"])
-            r['value'].extend(nextLinkData)
-        
-        return r['value']
+            r["value"].extend(nextLinkData)
+
+        return r["value"]
     except Exception as e:
         logging.error(f"Exception in fetchUserGroups: {e}")
         return []
@@ -66,59 +69,56 @@ def generateFilterString(userToken):
     if not userGroups:
         logging.debug("No user groups found")
 
-    group_ids = ", ".join([obj['id'] for obj in userGroups])
+    group_ids = ", ".join([obj["id"] for obj in userGroups])
     return f"{AZURE_SEARCH_PERMITTED_GROUPS_COLUMN}/any(g:search.in(g, '{group_ids}'))"
 
+
 def format_non_streaming_response(chatCompletion, history_metadata, message_uuid=None):
     response_obj = {
         "id": chatCompletion.id,
         "model": chatCompletion.model,
         "created": chatCompletion.created,
         "object": chatCompletion.object,
-        "choices": [
-            {
-                "messages": []
-            }
-        ],
-        "history_metadata": history_metadata
+        "choices": [{"messages": []}],
+        "history_metadata": history_metadata,
     }
 
     if len(chatCompletion.choices) > 0:
         message = chatCompletion.choices[0].message
         if message:
             if hasattr(message, "context"):
-                response_obj["choices"][0]["messages"].append({
-                    "role": "tool",
-                    "content": json.dumps(message.context),
-                })
-            response_obj["choices"][0]["messages"].append({
-                "role": "assistant",
-                "content": message.content,
-            })
+                response_obj["choices"][0]["messages"].append(
+                    {
+                        "role": "tool",
+                        "content": json.dumps(message.context),
+                    }
+                )
+            response_obj["choices"][0]["messages"].append(
+                {
+                    "role": "assistant",
+                    "content": message.content,
+                }
+            )
             return response_obj
-    
+
     return {}
 
+
 def format_stream_response(chatCompletionChunk, history_metadata, message_uuid=None):
     response_obj = {
         "id": chatCompletionChunk.id,
         "model": chatCompletionChunk.model,
         "created": chatCompletionChunk.created,
         "object": chatCompletionChunk.object,
-        "choices": [{
-            "messages": []
-        }],
-        "history_metadata": history_metadata
+        "choices": [{"messages": []}],
+        "history_metadata": history_metadata,
     }
 
     if len(chatCompletionChunk.choices) > 0:
         delta = chatCompletionChunk.choices[0].delta
         if delta:
             if hasattr(delta, "context"):
-                messageObj = {
-                    "role": "tool",
-                    "content": json.dumps(delta.context)
-                }
+                messageObj = {"role": "tool", "content": json.dumps(delta.context)}
                 response_obj["choices"][0]["messages"].append(messageObj)
                 return response_obj
             if delta.role == "assistant" and hasattr(delta, "context"):
@@ -136,5 +136,62 @@ def format_stream_response(chatCompletionChunk, history_metadata, message_uuid=N
                     }
                     response_obj["choices"][0]["messages"].append(messageObj)
                     return response_obj
-    
-    return {}
\ No newline at end of file
+
+    return {}
+
+
+def format_pf_non_streaming_response(
+    chatCompletion, history_metadata, response_field_name, message_uuid=None
+):
+    if chatCompletion is None:
+        logging.error(
+            "chatCompletion object is None - Increase PROMPTFLOW_RESPONSE_TIMEOUT parameter"
+        )
+        return {
+            "error": "No response received from promptflow endpoint increase PROMPTFLOW_RESPONSE_TIMEOUT parameter or check the promptflow endpoint."
+        }
+    if "error" in chatCompletion:
+        logging.error(f"Error in promptflow response api: {chatCompletion['error']}")
+        return {"error": chatCompletion["error"]}
+
+    logging.debug(f"chatCompletion: {chatCompletion}")
+    try:
+        response_obj = {
+            "id": chatCompletion["id"],
+            "model": "",
+            "created": "",
+            "object": "",
+            "choices": [
+                {
+                    "messages": [
+                        {
+                            "role": "assistant",
+                            "content": chatCompletion[response_field_name],
+                        }
+                    ]
+                }
+            ],
+            "history_metadata": history_metadata,
+        }
+        return response_obj
+    except Exception as e:
+        logging.error(f"Exception in format_pf_non_streaming_response: {e}")
+        return {}
+
+
+def convert_to_pf_format(input_json, request_field_name, response_field_name):
+    output_json = []
+    logging.debug(f"Input json: {input_json}")
+    # align the input json to the format expected by promptflow chat flow
+    for message in input_json["messages"]:
+        if message:
+            if message["role"] == "user":
+                new_obj = {
+                    "inputs": {request_field_name: message["content"]},
+                    "outputs": {response_field_name: ""},
+                }
+                output_json.append(new_obj)
+            elif message["role"] == "assistant" and len(output_json) > 0:
+                output_json[-1]["outputs"][response_field_name] = message["content"]
+    logging.debug(f"PF formatted response: {output_json}")
+    return output_json