From 6998ab09f1f7d922f7c30b118d1c2d0e74f161e0 Mon Sep 17 00:00:00 2001 From: Roopan-Microsoft <168007406+Roopan-Microsoft@users.noreply.github.com> Date: Tue, 17 Sep 2024 02:13:10 +0530 Subject: [PATCH] fix: Psl 6635 - BYOD workflow implementation (#1265) Co-authored-by: Ajit Padhi (Persistent Systems Inc) Co-authored-by: Francia Riesco --- code/backend/Admin.py | 1 + .../utilities/helpers/config/config_helper.py | 20 +- .../utilities/helpers/config/default.json | 3 +- .../batch/utilities/helpers/env_helper.py | 13 +- code/backend/pages/04_Configuration.py | 21 ++ code/create_app.py | 62 +++++- .../src/components/Answer/AnswerParser.tsx | 2 +- .../backend_api/default/test_conversation.py | 13 +- .../with_byod/test_conversation_flow.py | 32 ++- .../test_azure_byod_without_data.py | 33 ++- code/tests/test_app.py | 205 +++++++++++++++--- .../utilities/helpers/test_config_helper.py | 3 +- 12 files changed, 341 insertions(+), 67 deletions(-) diff --git a/code/backend/Admin.py b/code/backend/Admin.py index 627996263..373560ffc 100644 --- a/code/backend/Admin.py +++ b/code/backend/Admin.py @@ -51,6 +51,7 @@ def load_css(file_path): """ * If you want to ingest data (pdf, websites, etc.), then use the `Ingest Data` tab * If you want to explore how your data was chunked, check the `Explore Data` tab + * If you want to delete your data, check the `Delete Data` tab * If you want to adapt the underlying prompts, logging settings and others, use the `Configuration` tab """ ) diff --git a/code/backend/batch/utilities/helpers/config/config_helper.py b/code/backend/batch/utilities/helpers/config/config_helper.py index 71772131e..60b4b7432 100644 --- a/code/backend/batch/utilities/helpers/config/config_helper.py +++ b/code/backend/batch/utilities/helpers/config/config_helper.py @@ -12,6 +12,7 @@ from ...orchestrator import OrchestrationSettings from ..env_helper import EnvHelper from .assistant_strategy import AssistantStrategy +from .conversation_flow import ConversationFlow CONFIG_CONTAINER_NAME = "config" CONFIG_FILE_NAME = "active.json" @@ -90,6 +91,9 @@ def get_available_orchestration_strategies(self): def get_available_ai_assistant_types(self): return [c.value for c in AssistantStrategy] + def get_available_conversational_flows(self): + return [c.value for c in ConversationFlow] + # TODO: Change to AnsweringChain or something, Prompts is not a good name class Prompts: @@ -102,6 +106,7 @@ def __init__(self, prompts: dict): self.enable_post_answering_prompt = prompts["enable_post_answering_prompt"] self.enable_content_safety = prompts["enable_content_safety"] self.ai_assistant_type = prompts["ai_assistant_type"] + self.conversational_flow = prompts["conversational_flow"] class Example: @@ -166,13 +171,20 @@ def _set_new_config_properties(config: dict, default_config: dict): config["example"] = default_config["example"] if config["prompts"].get("ai_assistant_type") is None: - config["prompts"]["ai_assistant_type"] = default_config["prompts"]["ai_assistant_type"] + config["prompts"]["ai_assistant_type"] = default_config["prompts"][ + "ai_assistant_type" + ] if config.get("integrated_vectorization_config") is None: config["integrated_vectorization_config"] = default_config[ "integrated_vectorization_config" ] + if config["prompts"].get("conversational_flow") is None: + config["prompts"]["conversational_flow"] = default_config["prompts"][ + "conversational_flow" + ] + @staticmethod @functools.cache def get_active_config_or_default(): @@ -247,12 +259,14 @@ def get_default_config(): @staticmethod @functools.cache def get_default_contract_assistant(): - contract_file_path = os.path.join(os.path.dirname(__file__), "default_contract_assistant_prompt.txt") + contract_file_path = os.path.join( + os.path.dirname(__file__), "default_contract_assistant_prompt.txt" + ) contract_assistant = "" with open(contract_file_path, encoding="utf-8") as f: contract_assistant = f.readlines() - return ''.join([str(elem) for elem in contract_assistant]) + return "".join([str(elem) for elem in contract_assistant]) @staticmethod def clear_config(): diff --git a/code/backend/batch/utilities/helpers/config/default.json b/code/backend/batch/utilities/helpers/config/default.json index cf3999ab7..9bfa9c813 100644 --- a/code/backend/batch/utilities/helpers/config/default.json +++ b/code/backend/batch/utilities/helpers/config/default.json @@ -8,7 +8,8 @@ "use_on_your_data_format": true, "enable_post_answering_prompt": false, "ai_assistant_type": "default", - "enable_content_safety": true + "enable_content_safety": true, + "conversational_flow": "custom" }, "example": { "documents": "{\n \"retrieved_documents\": [\n {\n \"[doc1]\": {\n \"content\": \"Dual Transformer Encoder (DTE) DTE (https://dev.azure.com/TScience/TSciencePublic/_wiki/wikis/TSciencePublic.wiki/82/Dual-Transformer-Encoder) DTE is a general pair-oriented sentence representation learning framework based on transformers. It provides training, inference and evaluation for sentence similarity models. Model Details DTE can be used to train a model for sentence similarity with the following features: - Build upon existing transformer-based text representations (e.g.TNLR, BERT, RoBERTa, BAG-NLR) - Apply smoothness inducing technology to improve the representation robustness - SMART (https://arxiv.org/abs/1911.03437) SMART - Apply NCE (Noise Contrastive Estimation) based similarity learning to speed up training of 100M pairs We use pretrained DTE model\"\n }\n },\n {\n \"[doc2]\": {\n \"content\": \"trained on internal data. You can find more details here - Models.md (https://dev.azure.com/TScience/_git/TSciencePublic?path=%2FDualTransformerEncoder%2FMODELS.md&version=GBmaster&_a=preview) Models.md DTE-pretrained for In-context Learning Research suggests that finetuned transformers can be used to retrieve semantically similar exemplars for e.g. KATE (https://arxiv.org/pdf/2101.06804.pdf) KATE . They show that finetuned models esp. tuned on related tasks give the maximum boost to GPT-3 in-context performance. DTE have lot of pretrained models that are trained on intent classification tasks. We can use these model embedding to find natural language utterances which are similar to our test utterances at test time. The steps are: 1. Embed\"\n }\n },\n {\n \"[doc3]\": {\n \"content\": \"train and test utterances using DTE model 2. For each test embedding, find K-nearest neighbors. 3. Prefix the prompt with nearest embeddings. The following diagram from the above paper (https://arxiv.org/pdf/2101.06804.pdf) the above paper visualizes this process: DTE-Finetuned This is an extension of DTE-pretrained method where we further finetune the embedding models for prompt crafting task. In summary, we sample random prompts from our training data and use them for GPT-3 inference for the another part of training data. Some prompts work better and lead to right results whereas other prompts lead\"\n }\n },\n {\n \"[doc4]\": {\n \"content\": \"to wrong completions. We finetune the model on the downstream task of whether a prompt is good or not based on whether it leads to right or wrong completion. This approach is similar to this paper: Learning To Retrieve Prompts for In-Context Learning (https://arxiv.org/pdf/2112.08633.pdf) this paper: Learning To Retrieve Prompts for In-Context Learning . This method is very general but it may require a lot of data to actually finetune a model to learn how to retrieve examples suitable for the downstream inference model like GPT-3.\"\n }\n }\n ]\n}", diff --git a/code/backend/batch/utilities/helpers/env_helper.py b/code/backend/batch/utilities/helpers/env_helper.py index 0cff6b52d..873bce6ec 100644 --- a/code/backend/batch/utilities/helpers/env_helper.py +++ b/code/backend/batch/utilities/helpers/env_helper.py @@ -4,7 +4,6 @@ from dotenv import load_dotenv from azure.identity import DefaultAzureCredential, get_bearer_token_provider from azure.keyvault.secrets import SecretClient -from .config.conversation_flow import ConversationFlow logger = logging.getLogger(__name__) @@ -69,9 +68,13 @@ def __load_config(self, **kwargs) -> None: self.AZURE_SEARCH_FIELDS_METADATA = os.getenv( "AZURE_SEARCH_FIELDS_METADATA", "metadata" ) - self.AZURE_SEARCH_SOURCE_COLUMN = os.getenv("AZURE_SEARCH_SOURCE_COLUMN", "source") + self.AZURE_SEARCH_SOURCE_COLUMN = os.getenv( + "AZURE_SEARCH_SOURCE_COLUMN", "source" + ) self.AZURE_SEARCH_CHUNK_COLUMN = os.getenv("AZURE_SEARCH_CHUNK_COLUMN", "chunk") - self.AZURE_SEARCH_OFFSET_COLUMN = os.getenv("AZURE_SEARCH_OFFSET_COLUMN", "offset") + self.AZURE_SEARCH_OFFSET_COLUMN = os.getenv( + "AZURE_SEARCH_OFFSET_COLUMN", "offset" + ) self.AZURE_SEARCH_CONVERSATIONS_LOG_INDEX = os.getenv( "AZURE_SEARCH_CONVERSATIONS_LOG_INDEX", "conversations" ) @@ -211,10 +214,6 @@ def __load_config(self, **kwargs) -> None: self.ORCHESTRATION_STRATEGY = os.getenv( "ORCHESTRATION_STRATEGY", "openai_function" ) - # Conversation Type - which chooses between custom or byod - self.CONVERSATION_FLOW = os.getenv( - "CONVERSATION_FLOW", ConversationFlow.CUSTOM.value - ) # Speech Service self.AZURE_SPEECH_SERVICE_NAME = os.getenv("AZURE_SPEECH_SERVICE_NAME", "") self.AZURE_SPEECH_SERVICE_REGION = os.getenv("AZURE_SPEECH_SERVICE_REGION") diff --git a/code/backend/pages/04_Configuration.py b/code/backend/pages/04_Configuration.py index 1a6bd53a7..cfb5f64e0 100644 --- a/code/backend/pages/04_Configuration.py +++ b/code/backend/pages/04_Configuration.py @@ -7,6 +7,7 @@ from batch.utilities.helpers.config.config_helper import ConfigHelper from azure.core.exceptions import ResourceNotFoundError from batch.utilities.helpers.config.assistant_strategy import AssistantStrategy +from batch.utilities.helpers.config.conversation_flow import ConversationFlow sys.path.append(os.path.join(os.path.dirname(__file__), "..")) env_helper: EnvHelper = EnvHelper() @@ -65,6 +66,8 @@ def load_css(file_path): st.session_state["orchestrator_strategy"] = config.orchestrator.strategy.value if "ai_assistant_type" not in st.session_state: st.session_state["ai_assistant_type"] = config.prompts.ai_assistant_type +if "conversational_flow" not in st.session_state: + st.session_state["conversational_flow"] = config.prompts.conversational_flow if env_helper.AZURE_SEARCH_USE_INTEGRATED_VECTORIZATION: if "max_page_length" not in st.session_state: @@ -163,6 +166,17 @@ def validate_documents(): try: + conversational_flow_help = "Whether to use the custom conversational flow or byod conversational flow. Refer to the Conversational flow options README for more details." + with st.expander("Conversational flow configuration", expanded=True): + cols = st.columns([2, 4]) + with cols[0]: + conv_flow = st.selectbox( + "Conversational flow", + key="conversational_flow", + options=config.get_available_conversational_flows(), + help=conversational_flow_help, + ) + with st.expander("Orchestrator configuration", expanded=True): cols = st.columns([2, 4]) with cols[0]: @@ -170,6 +184,12 @@ def validate_documents(): "Orchestrator strategy", key="orchestrator_strategy", options=config.get_available_orchestration_strategies(), + disabled=( + True + if st.session_state["conversational_flow"] + == ConversationFlow.BYOD.value + else False + ), ) # # # condense_question_prompt_help = "This prompt is used to convert the user's input to a standalone question, using the context of the chat history." @@ -377,6 +397,7 @@ def validate_documents(): ], "enable_content_safety": st.session_state["enable_content_safety"], "ai_assistant_type": st.session_state["ai_assistant_type"], + "conversational_flow": st.session_state["conversational_flow"], }, "messages": { "post_answering_filter": st.session_state[ diff --git a/code/create_app.py b/code/create_app.py index a01d37832..896db501c 100644 --- a/code/create_app.py +++ b/code/create_app.py @@ -8,23 +8,67 @@ import mimetypes from os import path import sys +import re import requests from openai import AzureOpenAI, Stream, APIStatusError from openai.types.chat import ChatCompletionChunk from flask import Flask, Response, request, Request, jsonify from dotenv import load_dotenv +from urllib.parse import quote from backend.batch.utilities.helpers.env_helper import EnvHelper from backend.batch.utilities.helpers.orchestrator_helper import Orchestrator from backend.batch.utilities.helpers.config.config_helper import ConfigHelper from backend.batch.utilities.helpers.config.conversation_flow import ConversationFlow from azure.mgmt.cognitiveservices import CognitiveServicesManagementClient from azure.identity import DefaultAzureCredential +from backend.batch.utilities.helpers.azure_blob_storage_client import ( + AzureBlobStorageClient, +) ERROR_429_MESSAGE = "We're currently experiencing a high number of requests for the service you're trying to access. Please wait a moment and try again." ERROR_GENERIC_MESSAGE = "An error occurred. Please try again. If the problem persists, please contact the site administrator." logger = logging.getLogger(__name__) +def get_markdown_url(source, title, container_sas): + """Get Markdown URL for a citation""" + + url = quote(source, safe=":/") + if "_SAS_TOKEN_PLACEHOLDER_" in url: + url = url.replace("_SAS_TOKEN_PLACEHOLDER_", container_sas) + return f"[{title}]({url})" + + +def get_citations(citation_list): + """Returns Formated Citations""" + blob_client = AzureBlobStorageClient() + container_sas = blob_client.get_container_sas() + citations_dict = {"citations": []} + for citation in citation_list.get("citations"): + metadata = ( + json.loads(citation["url"]) + if isinstance(citation["url"], str) + else citation["url"] + ) + title = citation["title"] + url = get_markdown_url(metadata["source"], title, container_sas) + citations_dict["citations"].append( + { + "content": url + "\n\n\n" + citation["content"], + "id": metadata["id"], + "chunk_id": ( + re.findall(r"\d+", metadata["chunk_id"])[-1] + if metadata["chunk_id"] is not None + else metadata["chunk"] + ), + "title": title, + "filepath": title.split("/")[-1], + "url": url, + } + ) + return citations_dict + + def stream_with_data(response: Stream[ChatCompletionChunk]): """This function streams the response from Azure OpenAI with data.""" response_obj = { @@ -67,8 +111,9 @@ def stream_with_data(response: Stream[ChatCompletionChunk]): role = delta.role if role == "assistant": + citations = get_citations(delta.model_extra["context"]) response_obj["choices"][0]["messages"][0]["content"] = json.dumps( - delta.model_extra["context"], + citations, ensure_ascii=False, ) else: @@ -135,7 +180,8 @@ def conversation_with_data(conversation: Request, env_helper: EnvHelper): env_helper.AZURE_SEARCH_CONTENT_VECTOR_COLUMN ], "title_field": env_helper.AZURE_SEARCH_TITLE_COLUMN or None, - "url_field": env_helper.AZURE_SEARCH_URL_COLUMN or None, + "url_field": env_helper.AZURE_SEARCH_FIELDS_METADATA + or None, "filepath_field": ( env_helper.AZURE_SEARCH_FILENAME_COLUMN or None ), @@ -166,6 +212,7 @@ def conversation_with_data(conversation: Request, env_helper: EnvHelper): ) if not env_helper.SHOULD_STREAM: + citations = get_citations(response.choices[0].message.model_extra["context"]) response_obj = { "id": response.id, "model": response.model, @@ -176,7 +223,7 @@ def conversation_with_data(conversation: Request, env_helper: EnvHelper): "messages": [ { "content": json.dumps( - response.choices[0].message.model_extra["context"], + citations, ensure_ascii=False, ), "end_turn": False, @@ -194,10 +241,7 @@ def conversation_with_data(conversation: Request, env_helper: EnvHelper): return response_obj - return Response( - stream_with_data(response), - mimetype="application/json-lines", - ) + return Response(stream_with_data(response), mimetype="application/json-lines") def stream_without_data(response: Stream[ChatCompletionChunk]): @@ -405,7 +449,9 @@ async def conversation_custom(): @app.route("/api/conversation", methods=["POST"]) async def conversation(): - conversation_flow = env_helper.CONVERSATION_FLOW + ConfigHelper.get_active_config_or_default.cache_clear() + result = ConfigHelper.get_active_config_or_default() + conversation_flow = result.prompts.conversational_flow if conversation_flow == ConversationFlow.CUSTOM.value: return await conversation_custom() elif conversation_flow == ConversationFlow.BYOD.value: diff --git a/code/frontend/src/components/Answer/AnswerParser.tsx b/code/frontend/src/components/Answer/AnswerParser.tsx index 4238ab8eb..57dd791a0 100644 --- a/code/frontend/src/components/Answer/AnswerParser.tsx +++ b/code/frontend/src/components/Answer/AnswerParser.tsx @@ -11,7 +11,7 @@ let filteredCitations = [] as Citation[]; // Define a function to check if a citation with the same Chunk_Id already exists in filteredCitations const isDuplicate = (citation: Citation,citationIndex:string) => { - return filteredCitations.some((c) => c.chunk_id === citation.chunk_id) && !filteredCitations.find((c) => c.id === citationIndex) ; + return filteredCitations.some((c) => c.chunk_id === citation.chunk_id) ; }; export function parseAnswer(answer: AskResponse): ParsedAnswer { diff --git a/code/tests/functional/tests/backend_api/default/test_conversation.py b/code/tests/functional/tests/backend_api/default/test_conversation.py index 70d567e14..645529fe7 100644 --- a/code/tests/functional/tests/backend_api/default/test_conversation.py +++ b/code/tests/functional/tests/backend_api/default/test_conversation.py @@ -2,6 +2,7 @@ import re import pytest from pytest_httpserver import HTTPServer +from unittest.mock import patch import requests from tests.request_matching import ( @@ -176,7 +177,9 @@ def test_post_makes_correct_calls_to_openai_embeddings_to_embed_question_to_sear def test_post_makes_correct_calls_to_openai_embeddings_to_embed_question_to_store_in_conversation_log( - app_url: str, app_config: AppConfig, httpserver: HTTPServer + app_url: str, + app_config: AppConfig, + httpserver: HTTPServer, ): # when requests.post(f"{app_url}{path}", json=body) @@ -649,9 +652,15 @@ def test_post_makes_correct_call_to_store_conversation_in_search( ) +@patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" +) def test_post_returns_error_when_downstream_fails( - app_url: str, app_config: AppConfig, httpserver: HTTPServer + get_active_config_or_default_mock, app_url: str, httpserver: HTTPServer ): + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "custom" + ) httpserver.expect_oneshot_request( re.compile(".*"), ).respond_with_json({}, status=403) diff --git a/code/tests/functional/tests/backend_api/with_byod/test_conversation_flow.py b/code/tests/functional/tests/backend_api/with_byod/test_conversation_flow.py index b9ea5e7f0..c0e5537fe 100644 --- a/code/tests/functional/tests/backend_api/with_byod/test_conversation_flow.py +++ b/code/tests/functional/tests/backend_api/with_byod/test_conversation_flow.py @@ -1,6 +1,7 @@ import json import pytest from pytest_httpserver import HTTPServer +from unittest.mock import patch import requests from string import Template @@ -30,7 +31,7 @@ def setup_default_mocking(httpserver: HTTPServer, app_config: AppConfig): method="POST", ).respond_with_data( Template( - r"""data: {"id":"92f715be-cfc4-4ae6-80f8-c86b7955f6af","model":"$model","created":1712077271,"object":"extensions.chat.completion.chunk","choices":[{"index":0,"delta":{"role":"assistant","context":{"citations":[{"content":"document","title":"/documents/doc.pdf","url":null,"filepath":null,"chunk_id":"0"}],"intent":"[\"intent\"]"}},"end_turn":false,"finish_reason":null}]} + r"""data: {"id":"92f715be-cfc4-4ae6-80f8-c86b7955f6af","model":"$model","created":1712077271,"object":"extensions.chat.completion.chunk","choices":[{"index":0,"delta":{"role":"assistant","context":{"citations":[{"content":"document","title":"/documents/doc.pdf","url":{"id": "id", "source": "source", "title": "title", "chunk": 46, "chunk_id": null},"filepath":null,"chunk_id":"0"}],"intent":"[\"intent\"]"}},"end_turn":false,"finish_reason":null}]} data: {"id":"92f715be-cfc4-4ae6-80f8-c86b7955f6af","model":"$model","created":1712077271,"object":"extensions.chat.completion.chunk","choices":[{"index":0,"delta":{"content":"42 is the meaning of life"},"end_turn":false,"finish_reason":null}],"system_fingerprint":"fp_68a7d165bf"} @@ -46,9 +47,16 @@ def setup_default_mocking(httpserver: HTTPServer, app_config: AppConfig): httpserver.check() +@patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" +) def test_azure_byod_responds_successfully_when_streaming( - app_url: str, app_config: AppConfig, httpserver: HTTPServer + get_active_config_or_default_mock, + app_url: str, + app_config: AppConfig, ): + get_active_config_or_default_mock.return_value.prompts.conversational_flow = "byod" + # when response = requests.post(f"{app_url}{path}", json=body) @@ -69,7 +77,7 @@ def test_azure_byod_responds_successfully_when_streaming( { "messages": [ { - "content": r'{"citations": [{"content": "document", "title": "/documents/doc.pdf", "url": null, "filepath": null, "chunk_id": "0"}], "intent": "[\"intent\"]"}', + "content": '{"citations": [{"content": "[/documents/doc.pdf](source)\\n\\n\\ndocument", "id": "id", "chunk_id": 46, "title": "/documents/doc.pdf", "filepath": "doc.pdf", "url": "[/documents/doc.pdf](source)"}]}', "end_turn": False, "role": "tool", }, @@ -84,9 +92,17 @@ def test_azure_byod_responds_successfully_when_streaming( } +@patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" +) def test_post_makes_correct_call_to_azure_openai( - app_url: str, app_config: AppConfig, httpserver: HTTPServer + get_active_config_or_default_mock, + app_url: str, + app_config: AppConfig, + httpserver: HTTPServer, ): + get_active_config_or_default_mock.return_value.prompts.conversational_flow = "byod" + # when requests.post(f"{app_url}{path}", json=body) @@ -113,12 +129,12 @@ def test_post_makes_correct_call_to_azure_openai( "fields_mapping": { "content_fields": ["content"], "vector_fields": [ - app_config.get( - "AZURE_SEARCH_CONTENT_VECTOR_COLUMN" - ) + app_config.get("AZURE_SEARCH_CONTENT_VECTOR_COLUMN") ], "title_field": "title", - "url_field": "url", + "url_field": app_config.get( + "AZURE_SEARCH_FIELDS_METADATA" + ), "filepath_field": "filepath", }, "filter": app_config.get("AZURE_SEARCH_FILTER"), diff --git a/code/tests/functional/tests/backend_api/without_data/test_azure_byod_without_data.py b/code/tests/functional/tests/backend_api/without_data/test_azure_byod_without_data.py index f453e8ec0..c903b8eb3 100644 --- a/code/tests/functional/tests/backend_api/without_data/test_azure_byod_without_data.py +++ b/code/tests/functional/tests/backend_api/without_data/test_azure_byod_without_data.py @@ -3,6 +3,7 @@ from pytest_httpserver import HTTPServer import requests from string import Template +from unittest.mock import patch, MagicMock from tests.request_matching import ( RequestMatcher, @@ -48,9 +49,28 @@ def setup_default_mocking(httpserver: HTTPServer, app_config: AppConfig): httpserver.check() +@pytest.fixture(autouse=True) +def env_helper_mock(): + with patch("backend.batch.utilities.helpers.env_helper.EnvHelper") as mock: + env_helper = mock.return_value + + yield env_helper + + +@patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" +) def test_azure_byod_responds_successfully_when_streaming( - app_url: str, app_config: AppConfig, httpserver: HTTPServer + get_active_config_or_default_mock, + app_url: str, + app_config: AppConfig, + env_helper_mock: MagicMock, ): + # given + env_helper_mock.AZURE_SEARCH_KEY = None + env_helper_mock.should_use_data.return_value = False + get_active_config_or_default_mock.return_value.prompts.conversational_flow = "byod" + # when response = requests.post(f"{app_url}{path}", json=body) @@ -80,9 +100,18 @@ def test_azure_byod_responds_successfully_when_streaming( } +@patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" +) def test_post_makes_correct_call_to_azure_openai( - app_url: str, app_config: AppConfig, httpserver: HTTPServer + get_active_config_or_default_mock, + app_url: str, + app_config: AppConfig, + httpserver: HTTPServer, ): + # given + get_active_config_or_default_mock.return_value.prompts.conversational_flow = "byod" + # when requests.post(f"{app_url}{path}", json=body) diff --git a/code/tests/test_app.py b/code/tests/test_app.py index 75deba2ce..776e48bef 100644 --- a/code/tests/test_app.py +++ b/code/tests/test_app.py @@ -26,7 +26,7 @@ AZURE_SEARCH_CONTENT_VECTOR_COLUMN = "vector-column" AZURE_SEARCH_TITLE_COLUMN = "title" AZURE_SEARCH_FILENAME_COLUMN = "filename" -AZURE_SEARCH_URL_COLUMN = "url" +AZURE_SEARCH_URL_COLUMN = "metadata" AZURE_SEARCH_FILTER = "filter" AZURE_SEARCH_ENABLE_IN_DOMAIN = "true" AZURE_SEARCH_TOP_K = 5 @@ -110,7 +110,7 @@ def test_returns_speech_token_using_keys( "token": "speech-token", "region": AZURE_SPEECH_SERVICE_REGION, "languages": AZURE_SPEECH_RECOGNIZER_LANGUAGES, - "key": "mock-speech-key" + "key": "mock-speech-key", } requests.post.assert_called_once_with( @@ -154,7 +154,7 @@ def test_returns_speech_token_using_rbac( "token": "speech-token", "region": AZURE_SPEECH_SERVICE_REGION, "languages": AZURE_SPEECH_RECOGNIZER_LANGUAGES, - "key": "mock-key1" + "key": "mock-key1", } requests.post.assert_called_once_with( @@ -245,6 +245,9 @@ def test_conversation_custom_returns_correct_response( ): """Test that the custom conversation endpoint returns the correct response.""" # given + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "custom" + ) get_active_config_or_default_mock.return_value.orchestrator.return_value = ( self.orchestrator_config ) @@ -274,8 +277,12 @@ def test_conversation_custom_returns_correct_response( @patch("create_app.get_message_orchestrator") @patch("create_app.get_orchestrator_config") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) def test_conversation_custom_calls_message_orchestrator_correctly( self, + get_active_config_or_default_mock, get_orchestrator_config_mock, get_message_orchestrator_mock, env_helper_mock, @@ -283,6 +290,9 @@ def test_conversation_custom_calls_message_orchestrator_correctly( ): """Test that the custom conversation endpoint calls the message orchestrator correctly.""" # given + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "custom" + ) get_orchestrator_config_mock.return_value = self.orchestrator_config message_orchestrator_mock = AsyncMock() @@ -307,11 +317,17 @@ def test_conversation_custom_calls_message_orchestrator_correctly( ) @patch("create_app.get_orchestrator_config") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) def test_conversaation_custom_returns_error_response_on_exception( - self, get_orchestrator_config_mock, env_helper_mock, client + self, get_active_config_or_default_mock, get_orchestrator_config_mock, client ): """Test that an error response is returned when an exception occurs.""" # given + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "custom" + ) get_orchestrator_config_mock.side_effect = Exception("An error occurred") # when @@ -328,11 +344,17 @@ def test_conversaation_custom_returns_error_response_on_exception( } @patch("create_app.get_orchestrator_config") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) def test_conversation_custom_returns_error_response_on_rate_limit_error( - self, get_orchestrator_config_mock, env_helper_mock, client + self, get_active_config_or_default_mock, get_orchestrator_config_mock, client ): """Test that a 429 response is returned on RateLimitError.""" # given + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "custom" + ) response_mock = Mock() response_mock.status_code = 429 response_mock.json.return_value = { @@ -366,11 +388,17 @@ def test_conversation_custom_returns_error_response_on_rate_limit_error( } @patch("create_app.get_orchestrator_config") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) def test_conversation_custom_returns_500_when_internalservererror_occurs( - self, get_orchestrator_config_mock, env_helper_mock, client + self, get_active_config_or_default_mock, get_orchestrator_config_mock, client ): """Test that an error response is returned when an exception occurs.""" # given + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "custom" + ) response_mock = MagicMock() response_mock.status_code = 500 get_orchestrator_config_mock.side_effect = InternalServerError( @@ -393,16 +421,22 @@ def test_conversation_custom_returns_500_when_internalservererror_occurs( @patch("create_app.get_message_orchestrator") @patch("create_app.get_orchestrator_config") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) def test_conversation_custom_allows_multiple_messages_from_user( self, + get_active_config_or_default_mock, get_orchestrator_config_mock, get_message_orchestrator_mock, - env_helper_mock, client, ): """This can happen if there was an error getting a response from the assistant for the previous user message.""" # given + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "custom" + ) get_orchestrator_config_mock.return_value = self.orchestrator_config message_orchestrator_mock = AsyncMock() @@ -438,11 +472,18 @@ def test_conversation_custom_allows_multiple_messages_from_user( orchestrator=self.orchestrator_config, ) + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) def test_conversation_returns_error_response_on_incorrect_conversation_flow_input( - self, env_helper_mock, client + self, + get_active_config_or_default_mock, + client, ): # given - env_helper_mock.CONVERSATION_FLOW = "bob" + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "bob" + ) # when response = client.post( @@ -487,6 +528,7 @@ def setup_method(self): { "content": "content", "title": "title", + "url": '{"id": "doc_id", "source": "source", "title": "title", "chunk": 46, "chunk_id": null}', } ], "intent": "intent", @@ -513,6 +555,7 @@ def setup_method(self): { "content": "content", "title": "title", + "url": '{"id": "doc_id", "source": "source", "title": "title", "chunk": 46, "chunk_id": null}', } ], "intent": "intent", @@ -557,8 +600,16 @@ def setup_method(self): ] @patch("create_app.AzureOpenAI") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) + @patch( + "backend.batch.utilities.helpers.azure_blob_storage_client.generate_container_sas" + ) def test_conversation_azure_byod_returns_correct_response_when_streaming_with_data_keys( self, + generate_container_sas_mock: MagicMock, + get_active_config_or_default_mock, azure_openai_mock: MagicMock, env_helper_mock: MagicMock, client: FlaskClient, @@ -570,7 +621,10 @@ def test_conversation_azure_byod_returns_correct_response_when_streaming_with_da self.mock_streamed_response ) - env_helper_mock.CONVERSATION_FLOW = ConversationFlow.BYOD.value + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "byod" + ) + generate_container_sas_mock.return_value = "mock-sas" # when response = client.post( @@ -586,9 +640,9 @@ def test_conversation_azure_byod_returns_correct_response_when_streaming_with_da data = str(response.data, "utf-8") assert ( data - == r"""{"id": "response.id", "model": "mock-openai-model", "created": 0, "object": "response.object", "choices": [{"messages": [{"content": "{\"citations\": [{\"content\": \"content\", \"title\": \"title\"}], \"intent\": \"intent\"}", "end_turn": false, "role": "tool"}, {"content": "", "end_turn": false, "role": "assistant"}]}]} -{"id": "response.id", "model": "mock-openai-model", "created": 0, "object": "response.object", "choices": [{"messages": [{"content": "{\"citations\": [{\"content\": \"content\", \"title\": \"title\"}], \"intent\": \"intent\"}", "end_turn": false, "role": "tool"}, {"content": "A question\n?", "end_turn": false, "role": "assistant"}]}]} -{"id": "response.id", "model": "mock-openai-model", "created": 0, "object": "response.object", "choices": [{"messages": [{"content": "{\"citations\": [{\"content\": \"content\", \"title\": \"title\"}], \"intent\": \"intent\"}", "end_turn": false, "role": "tool"}, {"content": "A question\n?", "end_turn": true, "role": "assistant"}]}]} + == r"""{"id": "response.id", "model": "mock-openai-model", "created": 0, "object": "response.object", "choices": [{"messages": [{"content": "{\"citations\": [{\"content\": \"[title](source)\\n\\n\\ncontent\", \"id\": \"doc_id\", \"chunk_id\": 46, \"title\": \"title\", \"filepath\": \"title\", \"url\": \"[title](source)\"}]}", "end_turn": false, "role": "tool"}, {"content": "", "end_turn": false, "role": "assistant"}]}]} +{"id": "response.id", "model": "mock-openai-model", "created": 0, "object": "response.object", "choices": [{"messages": [{"content": "{\"citations\": [{\"content\": \"[title](source)\\n\\n\\ncontent\", \"id\": \"doc_id\", \"chunk_id\": 46, \"title\": \"title\", \"filepath\": \"title\", \"url\": \"[title](source)\"}]}", "end_turn": false, "role": "tool"}, {"content": "A question\n?", "end_turn": false, "role": "assistant"}]}]} +{"id": "response.id", "model": "mock-openai-model", "created": 0, "object": "response.object", "choices": [{"messages": [{"content": "{\"citations\": [{\"content\": \"[title](source)\\n\\n\\ncontent\", \"id\": \"doc_id\", \"chunk_id\": 46, \"title\": \"title\", \"filepath\": \"title\", \"url\": \"[title](source)\"}]}", "end_turn": false, "role": "tool"}, {"content": "A question\n?", "end_turn": true, "role": "assistant"}]}]} """ ) @@ -621,7 +675,7 @@ def test_conversation_azure_byod_returns_correct_response_when_streaming_with_da "content_fields": ["field1", "field2"], "vector_fields": [AZURE_SEARCH_CONTENT_VECTOR_COLUMN], "title_field": AZURE_SEARCH_TITLE_COLUMN, - "url_field": AZURE_SEARCH_URL_COLUMN, + "url_field": env_helper_mock.AZURE_SEARCH_FIELDS_METADATA, "filepath_field": AZURE_SEARCH_FILENAME_COLUMN, }, "filter": AZURE_SEARCH_FILTER, @@ -641,8 +695,16 @@ def test_conversation_azure_byod_returns_correct_response_when_streaming_with_da ) @patch("create_app.AzureOpenAI") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) + @patch( + "backend.batch.utilities.helpers.azure_blob_storage_client.generate_container_sas" + ) def test_conversation_azure_byod_returns_correct_response_when_streaming_with_data_rbac( self, + generate_container_sas_mock: MagicMock, + get_active_config_or_default_mock, azure_openai_mock: MagicMock, env_helper_mock: MagicMock, client: FlaskClient, @@ -650,7 +712,10 @@ def test_conversation_azure_byod_returns_correct_response_when_streaming_with_da """Test that the Azure BYOD conversation endpoint returns the correct response.""" # given env_helper_mock.is_auth_type_keys.return_value = False - env_helper_mock.CONVERSATION_FLOW = ConversationFlow.BYOD.value + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "byod" + ) + generate_container_sas_mock.return_value = "mock-sas" openai_client_mock = azure_openai_mock.return_value openai_client_mock.chat.completions.create.return_value = ( self.mock_streamed_response @@ -670,9 +735,9 @@ def test_conversation_azure_byod_returns_correct_response_when_streaming_with_da data = str(response.data, "utf-8") assert ( data - == r"""{"id": "response.id", "model": "mock-openai-model", "created": 0, "object": "response.object", "choices": [{"messages": [{"content": "{\"citations\": [{\"content\": \"content\", \"title\": \"title\"}], \"intent\": \"intent\"}", "end_turn": false, "role": "tool"}, {"content": "", "end_turn": false, "role": "assistant"}]}]} -{"id": "response.id", "model": "mock-openai-model", "created": 0, "object": "response.object", "choices": [{"messages": [{"content": "{\"citations\": [{\"content\": \"content\", \"title\": \"title\"}], \"intent\": \"intent\"}", "end_turn": false, "role": "tool"}, {"content": "A question\n?", "end_turn": false, "role": "assistant"}]}]} -{"id": "response.id", "model": "mock-openai-model", "created": 0, "object": "response.object", "choices": [{"messages": [{"content": "{\"citations\": [{\"content\": \"content\", \"title\": \"title\"}], \"intent\": \"intent\"}", "end_turn": false, "role": "tool"}, {"content": "A question\n?", "end_turn": true, "role": "assistant"}]}]} + == r"""{"id": "response.id", "model": "mock-openai-model", "created": 0, "object": "response.object", "choices": [{"messages": [{"content": "{\"citations\": [{\"content\": \"[title](source)\\n\\n\\ncontent\", \"id\": \"doc_id\", \"chunk_id\": 46, \"title\": \"title\", \"filepath\": \"title\", \"url\": \"[title](source)\"}]}", "end_turn": false, "role": "tool"}, {"content": "", "end_turn": false, "role": "assistant"}]}]} +{"id": "response.id", "model": "mock-openai-model", "created": 0, "object": "response.object", "choices": [{"messages": [{"content": "{\"citations\": [{\"content\": \"[title](source)\\n\\n\\ncontent\", \"id\": \"doc_id\", \"chunk_id\": 46, \"title\": \"title\", \"filepath\": \"title\", \"url\": \"[title](source)\"}]}", "end_turn": false, "role": "tool"}, {"content": "A question\n?", "end_turn": false, "role": "assistant"}]}]} +{"id": "response.id", "model": "mock-openai-model", "created": 0, "object": "response.object", "choices": [{"messages": [{"content": "{\"citations\": [{\"content\": \"[title](source)\\n\\n\\ncontent\", \"id\": \"doc_id\", \"chunk_id\": 46, \"title\": \"title\", \"filepath\": \"title\", \"url\": \"[title](source)\"}]}", "end_turn": false, "role": "tool"}, {"content": "A question\n?", "end_turn": true, "role": "assistant"}]}]} """ ) @@ -691,8 +756,16 @@ def test_conversation_azure_byod_returns_correct_response_when_streaming_with_da } @patch("create_app.AzureOpenAI") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) + @patch( + "backend.batch.utilities.helpers.azure_blob_storage_client.generate_container_sas" + ) def test_conversation_azure_byod_returns_correct_response_when_not_streaming_with_data( self, + generate_container_sas_mock: MagicMock, + get_active_config_or_default_mock, azure_openai_mock: MagicMock, env_helper_mock: MagicMock, client: FlaskClient, @@ -700,7 +773,10 @@ def test_conversation_azure_byod_returns_correct_response_when_not_streaming_wit """Test that the Azure BYOD conversation endpoint returns the correct response.""" # given env_helper_mock.SHOULD_STREAM = False - env_helper_mock.CONVERSATION_FLOW = ConversationFlow.BYOD.value + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "byod" + ) + generate_container_sas_mock.return_value = "mock-sas" openai_client_mock = azure_openai_mock.return_value openai_client_mock.chat.completions.create.return_value = self.mock_response @@ -723,7 +799,7 @@ def test_conversation_azure_byod_returns_correct_response_when_not_streaming_wit { "messages": [ { - "content": '{"citations": [{"content": "content", "title": "title"}], "intent": "intent"}', + "content": '{"citations": [{"content": "[title](source)\\n\\n\\ncontent", "id": "doc_id", "chunk_id": 46, "title": "title", "filepath": "title", "url": "[title](source)"}]}', "end_turn": False, "role": "tool", }, @@ -738,13 +814,21 @@ def test_conversation_azure_byod_returns_correct_response_when_not_streaming_wit } @patch("create_app.conversation_with_data") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) def test_conversation_azure_byod_returns_500_when_exception_occurs( - self, conversation_with_data_mock, env_helper_mock, client + self, + get_active_config_or_default_mock, + conversation_with_data_mock, + client, ): """Test that an error response is returned when an exception occurs.""" # given conversation_with_data_mock.side_effect = Exception("Test exception") - env_helper_mock.CONVERSATION_FLOW = ConversationFlow.BYOD.value + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "byod" + ) # when response = client.post( @@ -760,8 +844,14 @@ def test_conversation_azure_byod_returns_500_when_exception_occurs( } @patch("create_app.conversation_with_data") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) def test_conversation_azure_byod_returns_500_when_internalservererror_occurs( - self, conversation_with_data_mock, env_helper_mock, client + self, + get_active_config_or_default_mock, + conversation_with_data_mock, + client, ): """Test that an error response is returned when an exception occurs.""" # given @@ -770,7 +860,9 @@ def test_conversation_azure_byod_returns_500_when_internalservererror_occurs( conversation_with_data_mock.side_effect = InternalServerError( "Test exception", response=response_mock, body="" ) - env_helper_mock.CONVERSATION_FLOW = ConversationFlow.BYOD.value + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "byod" + ) # when response = client.post( @@ -787,8 +879,14 @@ def test_conversation_azure_byod_returns_500_when_internalservererror_occurs( } @patch("create_app.conversation_with_data") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) def test_conversation_azure_byod_returns_429_on_rate_limit_error( - self, conversation_with_data_mock, env_helper_mock, client + self, + get_active_config_or_default_mock, + conversation_with_data_mock, + client, ): """Test that a 429 response is returned on RateLimitError for BYOD conversation.""" # given @@ -807,7 +905,9 @@ def test_conversation_azure_byod_returns_429_on_rate_limit_error( conversation_with_data_mock.side_effect = BadRequestError( message="Error code: 400", response=response_mock, body="" ) - env_helper_mock.CONVERSATION_FLOW = ConversationFlow.BYOD.value + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "byod" + ) # when response = client.post( @@ -824,14 +924,23 @@ def test_conversation_azure_byod_returns_429_on_rate_limit_error( } @patch("create_app.AzureOpenAI") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) def test_conversation_azure_byod_returns_correct_response_when_not_streaming_without_data_keys( - self, azure_openai_mock, env_helper_mock, client + self, + get_active_config_or_default_mock, + azure_openai_mock, + env_helper_mock, + client, ): """Test that the Azure BYOD conversation endpoint returns the correct response.""" # given env_helper_mock.should_use_data.return_value = False env_helper_mock.SHOULD_STREAM = False - env_helper_mock.CONVERSATION_FLOW = ConversationFlow.BYOD.value + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "byod" + ) openai_client_mock = MagicMock() azure_openai_mock.return_value = openai_client_mock @@ -889,8 +998,15 @@ def test_conversation_azure_byod_returns_correct_response_when_not_streaming_wit ) @patch("create_app.AzureOpenAI") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) def test_conversation_azure_byod_returns_correct_response_when_not_streaming_without_data_rbac( - self, azure_openai_mock, env_helper_mock, client + self, + get_active_config_or_default_mock, + azure_openai_mock, + env_helper_mock, + client, ): """Test that the Azure BYOD conversation endpoint returns the correct response.""" # given @@ -898,7 +1014,9 @@ def test_conversation_azure_byod_returns_correct_response_when_not_streaming_wit env_helper_mock.SHOULD_STREAM = False env_helper_mock.AZURE_AUTH_TYPE = "rbac" env_helper_mock.AZURE_OPENAI_STOP_SEQUENCE = "" - env_helper_mock.CONVERSATION_FLOW = ConversationFlow.BYOD.value + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "byod" + ) openai_client_mock = MagicMock() azure_openai_mock.return_value = openai_client_mock @@ -956,13 +1074,22 @@ def test_conversation_azure_byod_returns_correct_response_when_not_streaming_wit ) @patch("create_app.AzureOpenAI") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) def test_conversation_azure_byod_returns_correct_response_when_streaming_without_data( - self, azure_openai_mock, env_helper_mock, client + self, + get_active_config_or_default_mock, + azure_openai_mock, + env_helper_mock, + client, ): """Test that the Azure BYOD conversation endpoint returns the correct response.""" # given env_helper_mock.should_use_data.return_value = False - env_helper_mock.CONVERSATION_FLOW = ConversationFlow.BYOD.value + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "byod" + ) openai_client_mock = MagicMock() azure_openai_mock.return_value = openai_client_mock @@ -994,19 +1121,29 @@ def test_conversation_azure_byod_returns_correct_response_when_streaming_without ) @patch("create_app.AzureOpenAI") + @patch( + "backend.batch.utilities.helpers.config.config_helper.ConfigHelper.get_active_config_or_default" + ) + @patch( + "backend.batch.utilities.helpers.azure_blob_storage_client.generate_container_sas" + ) def test_conversation_azure_byod_uses_semantic_config( self, + generate_container_sas_mock: MagicMock, + get_active_config_or_default_mock, azure_openai_mock: MagicMock, - env_helper_mock: MagicMock, client: FlaskClient, ): """Test that the Azure BYOD conversation endpoint uses the semantic configuration.""" # given + get_active_config_or_default_mock.return_value.prompts.conversational_flow = ( + "byod" + ) + generate_container_sas_mock.return_value = "mock-sas" openai_client_mock = azure_openai_mock.return_value openai_client_mock.chat.completions.create.return_value = ( self.mock_streamed_response ) - env_helper_mock.CONVERSATION_FLOW = ConversationFlow.BYOD.value # when response = client.post( diff --git a/code/tests/utilities/helpers/test_config_helper.py b/code/tests/utilities/helpers/test_config_helper.py index 0c2f0cb3d..8c35dedce 100644 --- a/code/tests/utilities/helpers/test_config_helper.py +++ b/code/tests/utilities/helpers/test_config_helper.py @@ -19,7 +19,8 @@ def config_dict(): "post_answering_prompt": "mock_post_answering_prompt", "enable_post_answering_prompt": False, "enable_content_safety": True, - "ai_assistant_type": "default" + "ai_assistant_type": "default", + "conversational_flow": "custom", }, "messages": { "post_answering_filter": "mock_post_answering_filter",