Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add test for backend functions #644

Merged
merged 22 commits into from
Apr 15, 2024
Merged
Show file tree
Hide file tree
Changes from 13 commits
Commits
Show all changes
22 commits
Select commit Hold shift + click to select a range
af6cf8f
Add test for batch processing function
tanya-borisova Apr 9, 2024
2ddc45e
Remove comment
tanya-borisova Apr 9, 2024
4295e5d
Merge branch 'main' of github.com:Azure-Samples/chat-with-your-data-s…
tanya-borisova Apr 9, 2024
f37d719
Try to remove sys path modifications
tanya-borisova Apr 9, 2024
1461250
Fix imports
tanya-borisova Apr 9, 2024
1ecc1f5
Fix sys path append statements by making paths absolute
tanya-borisova Apr 10, 2024
36faa21
Merge branch 'main' into 584-add-unit-tests-for-the-batch-function-app
tanya-borisova Apr 10, 2024
cc55b1a
Remove extra sys.path.append that isnt necessary
tanya-borisova Apr 10, 2024
6e9abf2
Merge branch '584-add-unit-tests-for-the-batch-function-app' of githu…
tanya-borisova Apr 10, 2024
4b0cf90
Apply suggestions from code review
tanya-borisova Apr 11, 2024
3ecdb85
Rename test file, add a test for no url in request
tanya-borisova Apr 11, 2024
642e619
Make sure ConfigHelper etc are mocked out
tanya-borisova Apr 11, 2024
4278eae
Mock out config helper
tanya-borisova Apr 11, 2024
4bed86c
Improve sys.path.append
tanya-borisova Apr 12, 2024
c313534
Merge branch 'main' of github.com:Azure-Samples/chat-with-your-data-s…
tanya-borisova Apr 12, 2024
59bf150
Mock EnvHelper as well to speed up test execution time
tanya-borisova Apr 12, 2024
691912d
Utilise get_user_function() method to enable tests
tanya-borisova Apr 12, 2024
9a805f1
re-add env sample
tanya-borisova Apr 12, 2024
c139155
Merge branch 'main' into 584-add-unit-tests-for-the-batch-function-app
tanya-borisova Apr 12, 2024
de3bf93
Init log level from os environ
tanya-borisova Apr 12, 2024
833f107
Merge branch '584-add-unit-tests-for-the-batch-function-app' of githu…
tanya-borisova Apr 12, 2024
b3a8081
Merge branch 'main' into 584-add-unit-tests-for-the-batch-function-app
tanya-borisova Apr 12, 2024
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
57 changes: 0 additions & 57 deletions .env.sample

This file was deleted.

7 changes: 4 additions & 3 deletions code/backend/batch/AddURLEmbeddings.py
Original file line number Diff line number Diff line change
@@ -1,20 +1,21 @@
import logging
import traceback
import azure.functions as func
import sys

from utilities.helpers.DocumentProcessorHelper import DocumentProcessor
from utilities.helpers.ConfigHelper import ConfigHelper
adamdougal marked this conversation as resolved.
Show resolved Hide resolved

sys.path.append("..")
adamdougal marked this conversation as resolved.
Show resolved Hide resolved

bp_add_url_embeddings = func.Blueprint()

logger = logging.getLogger(__name__)


@bp_add_url_embeddings.route(route="AddURLEmbeddings")
def add_url_embeddings(req: func.HttpRequest) -> func.HttpResponse:
return do_add_url_embeddings(req)
adamdougal marked this conversation as resolved.
Show resolved Hide resolved


def do_add_url_embeddings(req: func.HttpRequest) -> func.HttpResponse:
logger.info("Python HTTP trigger function processed a request.")
# Get Url from request
url = req.params.get("url")
Expand Down
12 changes: 8 additions & 4 deletions code/backend/batch/BatchPushResults.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,16 +2,15 @@
import json
import azure.functions as func
from urllib.parse import urlparse
import sys

from utilities.helpers.AzureBlobStorageHelper import AzureBlobStorageClient
from utilities.helpers.AzureBlobStorageHelper import (
AzureBlobStorageClient,
)
from utilities.helpers.DocumentProcessorHelper import DocumentProcessor
from utilities.helpers.ConfigHelper import ConfigHelper

sys.path.append("..")

bp_batch_push_results = func.Blueprint()

logger = logging.getLogger(__name__)


Expand All @@ -29,6 +28,10 @@ def _get_file_name_from_message(msg: func.QueueMessage) -> str:
arg_name="msg", queue_name="doc-processing", connection="AzureWebJobsStorage"
)
def batch_push_results(msg: func.QueueMessage) -> None:
do_batch_push_results(msg)


def do_batch_push_results(msg: func.QueueMessage) -> None:
logger.info(
"Python queue trigger function processed a queue item: %s",
msg.get_body().decode("utf-8"),
Expand All @@ -41,6 +44,7 @@ def batch_push_results(msg: func.QueueMessage) -> None:
file_sas = blob_client.get_blob_sas(file_name)
# Get file extension's processors
file_extension = file_name.split(".")[-1]

processors = list(
filter(
lambda x: x.document_type.lower() == file_extension.lower(),
Expand Down
8 changes: 5 additions & 3 deletions code/backend/batch/BatchStartProcessing.py
Original file line number Diff line number Diff line change
@@ -1,22 +1,24 @@
import logging
import json
import azure.functions as func
import sys

from utilities.helpers.EnvHelper import EnvHelper
from utilities.helpers.AzureBlobStorageHelper import (
AzureBlobStorageClient,
create_queue_client,
)

sys.path.append("..")
bp_batch_start_processing = func.Blueprint()
env_helper: EnvHelper = EnvHelper()

logger = logging.getLogger(__name__)


@bp_batch_start_processing.route(route="BatchStartProcessing")
def batch_start_processing(req: func.HttpRequest) -> func.HttpResponse:
return do_batch_start_processing(req)


def do_batch_start_processing(req: func.HttpRequest) -> func.HttpResponse:
logger.info("Requested to start processing all documents received")
# Set up Blob Storage Client
azure_blob_storage_client = AzureBlobStorageClient()
Expand Down
10 changes: 6 additions & 4 deletions code/backend/batch/GetConversationResponse.py
Original file line number Diff line number Diff line change
@@ -1,20 +1,23 @@
import azure.functions as func
import logging
import json
import sys

from utilities.helpers.EnvHelper import EnvHelper
from utilities.helpers.OrchestratorHelper import Orchestrator
from utilities.helpers.ConfigHelper import ConfigHelper

sys.path.append("..")

bp_get_conversation_response = func.Blueprint()
env_helper: EnvHelper = EnvHelper()

logger = logging.getLogger(__name__)


@bp_get_conversation_response.route(route="GetConversationResponse")
def get_conversation_response(req: func.HttpRequest) -> func.HttpResponse:
return do_get_conversation_response(req)


def do_get_conversation_response(req: func.HttpRequest) -> func.HttpResponse:
logger.info("Python HTTP trigger function processed a request.")

message_orchestrator = Orchestrator()
Expand All @@ -37,7 +40,6 @@ def get_conversation_response(req: func.HttpRequest) -> func.HttpResponse:
user_assistant_messages[i + 1]["content"],
)
)
from utilities.helpers.ConfigHelper import ConfigHelper

messages = message_orchestrator.handle_message(
user_message=user_message,
Expand Down
Empty file.
58 changes: 58 additions & 0 deletions code/tests/test_AddURLEmbeddings.py
tanya-borisova marked this conversation as resolved.
Show resolved Hide resolved
Original file line number Diff line number Diff line change
@@ -0,0 +1,58 @@
import sys
import os
from unittest.mock import patch
import azure.functions as func


function_app_path = os.path.abspath(
os.path.join(os.path.dirname(__file__), "../backend/batch")
)
sys.path.append(function_app_path)

from backend.batch.AddURLEmbeddings import do_add_url_embeddings # noqa: E402


@patch("backend.batch.AddURLEmbeddings.ConfigHelper")
@patch("backend.batch.AddURLEmbeddings.DocumentProcessor")
def test_add_url_embeddings_when_url_set_in_body(_, __):
fake_request = func.HttpRequest(
method="POST",
url="",
body=b'{"url": "https://example.com"}',
headers={"Content-Type": "application/json"},
)

response = do_add_url_embeddings(fake_request)

assert response.status_code == 200


@patch("backend.batch.AddURLEmbeddings.ConfigHelper")
@patch("backend.batch.AddURLEmbeddings.DocumentProcessor")
def test_add_url_embeddings_when_url_set_in_param(_, __):
fake_request = func.HttpRequest(
method="POST",
url="",
body=b"",
headers={"Content-Type": "application/json"},
params={"url": "https://example.com"},
)

response = do_add_url_embeddings(fake_request)

assert response.status_code == 200


@patch("backend.batch.AddURLEmbeddings.ConfigHelper")
@patch("backend.batch.AddURLEmbeddings.DocumentProcessor")
def test_add_url_embeddings_returns_400_when_url_not_set(_, __):
fake_request = func.HttpRequest(
method="POST",
url="",
body=b"",
params={},
)

response = do_add_url_embeddings(fake_request)

assert response.status_code == 400
67 changes: 67 additions & 0 deletions code/tests/test_BatchPushResults.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,67 @@
import sys
import os
from unittest.mock import patch, Mock
from azure.functions import QueueMessage


function_app_path = os.path.abspath(
os.path.join(os.path.dirname(__file__), "../backend/batch")
)
sys.path.append(function_app_path)

from backend.batch.BatchPushResults import do_batch_push_results # noqa: E402
from backend.batch.BatchPushResults import _get_file_name_from_message # noqa: E402
tanya-borisova marked this conversation as resolved.
Show resolved Hide resolved


def test_get_file_name_from_message():
mock_queue_message = QueueMessage(
body='{"message": "test message", "filename": "test_filename.md"}'
)

file_name = _get_file_name_from_message(mock_queue_message)

assert file_name == "test_filename.md"


def test_get_file_name_from_message_no_filename():
mock_queue_message = QueueMessage(
body='{"data": { "url": "test/test/test_filename.md"} }'
)

file_name = _get_file_name_from_message(mock_queue_message)

assert file_name == "test_filename.md"


@patch("backend.batch.BatchPushResults.ConfigHelper")
@patch("backend.batch.BatchPushResults.AzureBlobStorageClient")
@patch("backend.batch.BatchPushResults.DocumentProcessor")
def test_do_batch_push_results(
mock_document_processor, mock_azure_blob_storage_client, mock_config_helper
):
mock_queue_message = QueueMessage(
body='{"message": "test message", "filename": "test/test/test_filename.md"}'
)

mock_blob_client_instance = mock_azure_blob_storage_client.return_value
mock_blob_client_instance.get_blob_sas.return_value = "test_blob_sas"

mock_document_processor_instance = mock_document_processor.return_value

md_processor = Mock()
md_processor.document_type.lower.return_value = "md"
txt_processor = Mock()
txt_processor.document_type.lower.return_value = "txt"
mock_processors = [md_processor, txt_processor]
mock_config_helper.get_active_config_or_default.return_value.document_processors = (
mock_processors
)

do_batch_push_results(mock_queue_message)

mock_document_processor_instance.process.assert_called_once_with(
source_url="test_blob_sas", processors=[md_processor]
)
mock_blob_client_instance.upsert_blob_metadata.assert_called_once_with(
"test/test/test_filename.md", {"embeddings_added": "true"}
)
63 changes: 63 additions & 0 deletions code/tests/test_BatchStartProcessing.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,63 @@
import sys
import os
from unittest.mock import patch, Mock

function_app_path = os.path.abspath(
os.path.join(os.path.dirname(__file__), "../backend/batch")
)
sys.path.append(function_app_path)

from backend.batch.BatchStartProcessing import do_batch_start_processing # noqa: E402


@patch("backend.batch.BatchStartProcessing.create_queue_client")
@patch("backend.batch.BatchStartProcessing.AzureBlobStorageClient")
def test_batch_start_processing_processes_all(
mock_blob_storage_client, mock_create_queue_client
):
mock_http_request = Mock()
mock_http_request.params = dict()
mock_http_request.params["process_all"] = "true"

mock_queue_client = Mock()
mock_create_queue_client.return_value = mock_queue_client

mock_blob_storage_client.return_value.get_all_files.return_value = [
{"filename": "file_name_one", "embeddings_added": False}
]

response = do_batch_start_processing(mock_http_request)

assert response.status_code == 200

mock_queue_client.send_message.assert_called_once_with(
b'{"filename": "file_name_one"}',
)


@patch("backend.batch.BatchStartProcessing.create_queue_client")
@patch("backend.batch.BatchStartProcessing.AzureBlobStorageClient")
def test_batch_start_processing_filters_filter_no_embeddings(
mock_blob_storage_client, mock_create_queue_client
):
mock_http_request = Mock()
mock_http_request.params = dict()
mock_http_request.params["process_all"] = "false"

mock_queue_client = Mock()
mock_create_queue_client.return_value = mock_queue_client

mock_blob_storage_client.return_value.get_all_files.return_value = [
{
"filename": "file_name_one",
"embeddings_added": True, # will get filtered out
},
{"filename": "file_name_two", "embeddings_added": False},
]
response = do_batch_start_processing(mock_http_request)

assert response.status_code == 200

mock_queue_client.send_message.assert_called_once_with(
b'{"filename": "file_name_two"}',
)
Loading
Loading