tests: added tests (#250)

2023-07-16 02:28:51 +02:00
parent d12aeec1ff
commit 3f71050c47
9 changed files with 388 additions and 29 deletions
--- a/tests/chunkers/test_text.py
+++ b/tests/chunkers/test_text.py
@@ -0,0 +1,42 @@
 # ruff: noqa: E501
 import unittest
 from embedchain.chunkers.text import TextChunker
 class TestTextChunker(unittest.TestCase):
    """Smoke test for ``TextChunker.create_chunks``."""

    def test_chunks(self):
        """
        Chunk a short sentence with a small chunk size and check the chunk count.

        The chunker is configured with a chunk size of 10, no overlap and ``len`` as the
        length function. The test only requires that at least five documents come back.
        # TODO: Not a very precise test.
        """
        sample_text = "Lorem ipsum dolor sit amet, consectetur adipiscing elit."
        chunker = TextChunker(
            config={
                "chunk_size": 10,
                "chunk_overlap": 0,
                "length_function": len,
            }
        )

        chunked = chunker.create_chunks(MockLoader(), sample_text)

        self.assertGreaterEqual(len(chunked["documents"]), 5)
    # Additional test cases can be added to cover different scenarios
 class MockLoader:
    """Stand-in loader that hands its input straight back as a single document."""

    def load_data(self, src):
        """
        Wrap ``src`` in the list-of-dictionaries structure returned by this mock.

        Returns a one-element list; the entry stores ``src`` under "content" and a
        placeholder URL under "meta_data". Change the returned data here to test other inputs.
        """
        document = {"content": src, "meta_data": {"url": "none"}}
        return [document]
--- a/tests/embedchain/test_add.py
+++ b/tests/embedchain/test_add.py
@@ -0,0 +1,26 @@
 import os
 import unittest
 from unittest.mock import MagicMock, patch
 from embedchain import App
 class TestApp(unittest.TestCase):
    """Tests for the ``add`` method of ``App``."""

    # Dummy key, set when the class body runs, i.e. before ``setUp`` constructs an ``App``.
    os.environ["OPENAI_API_KEY"] = "test_key"

    def setUp(self):
        """Create a fresh ``App`` instance for each test."""
        self.app = App()

    # Patch with a mock *instance*. Passing the ``MagicMock`` class itself would make every
    # ``Collection.add(...)`` call construct a new mock from the call arguments instead of
    # invoking a mock.
    @patch("chromadb.api.models.Collection.Collection.add", MagicMock())
    def test_add(self):
        """
        Check that ``add`` records what was added in the ``user_asks`` attribute.

        A web page URL is added together with a metadata dictionary. Afterwards ``user_asks``
        must hold exactly one entry made of the data type, the URL and the metadata.
        ``Collection.add`` from chromadb is replaced by a mock for the duration of the test so
        that the behavior of ``App.add`` is isolated from the vector database.
        """
        self.app.add("web_page", "https://example.com", {"meta": "meta-data"})
        self.assertEqual(self.app.user_asks, [["web_page", "https://example.com", {"meta": "meta-data"}]])
--- a/tests/embedchain/test_chat.py
+++ b/tests/embedchain/test_chat.py
@@ -0,0 +1,48 @@
 import os
 import unittest
 from unittest.mock import patch
 from embedchain import App
 class TestApp(unittest.TestCase):
    """Tests for how ``App.chat`` writes to the chat history memory."""

    os.environ["OPENAI_API_KEY"] = "test_key"

    def setUp(self):
        """Create a fresh ``App`` instance for each test."""
        self.app = App()

    def _assert_turn_recorded(self, memory, query, answer):
        """Assert that exactly one user message and one AI message were stored for a turn."""
        memory.chat_memory.add_user_message.assert_called_once_with(query)
        memory.chat_memory.add_ai_message.assert_called_once_with(answer)

    @patch("embedchain.embedchain.memory", autospec=True)
    @patch.object(App, "retrieve_from_database", return_value=["Test context"])
    @patch.object(App, "get_answer_from_llm", return_value="Test answer")
    def test_chat_with_memory(self, mock_answer, mock_retrieve, mock_memory):
        """
        Call ``chat`` twice and verify what is written to the (mocked) memory each time.

        Checked for each of the two calls:
        - ``chat`` returns the mocked LLM answer.
        - ``memory.chat_memory.add_user_message`` is called once with the query.
        - ``memory.chat_memory.add_ai_message`` is called once with the answer.
        The recorded calls are cleared between the two turns so each turn is checked separately.
        ``retrieve_from_database``, ``get_answer_from_llm`` and the module-level ``memory``
        object are all mocked to isolate ``chat``.
        """
        mock_memory.load_memory_variables.return_value = {"history": []}
        app = App()

        # First turn
        self.assertEqual(app.chat("Test query 1"), "Test answer")
        self._assert_turn_recorded(mock_memory, "Test query 1", "Test answer")

        # Drop the calls recorded so far; the second turn must produce its own single call.
        mock_memory.chat_memory.add_user_message.reset_mock()
        mock_memory.chat_memory.add_ai_message.reset_mock()

        # Second turn
        self.assertEqual(app.chat("Test query 2"), "Test answer")
        self._assert_turn_recorded(mock_memory, "Test query 2", "Test answer")
--- a/tests/embedchain/test_dryrun.py
+++ b/tests/embedchain/test_dryrun.py
@@ -0,0 +1,52 @@
 import os
 import unittest
 from string import Template
 from unittest.mock import patch
 from embedchain import App
 from embedchain.embedchain import QueryConfig
 class TestApp(unittest.TestCase):
    """Tests comparing the prompt logged by ``dry_run`` with the one logged by ``query``."""

    os.environ["OPENAI_API_KEY"] = "test_key"

    def setUp(self):
        """Create a fresh ``App`` instance for each test."""
        self.app = App()

    @patch("logging.info")
    def test_query_logs_same_prompt_as_dry_run(self, mock_logging_info):
        """
        Check that ``query`` and ``dry_run`` log the same prompt.

        ``query`` does not return its prompt, so the prompt is read from the messages passed
        to the patched ``logging.info``: the first message is attributed to ``dry_run`` and the
        second one to ``query``.
        """
        input_query = "Test query"
        retrieve_patch = patch.object(self.app, "retrieve_from_database", return_value=["Test context"])
        with retrieve_patch:
            config = QueryConfig(
                number_documents=3,
                template=Template("Question: $query, context: $context, history: $history"),
                history=["Past context 1", "Past context 2"],
            )
            with patch.object(self.app, "get_answer_from_llm"):
                self.app.dry_run(input_query, config)
                self.app.query(input_query, config)

            # First positional argument of every ``logging.info`` call made so far
            messages = [entry[0][0] for entry in mock_logging_info.call_args_list]

            # Compare the prompt portions of the first two log messages
            self.assertEqual(self.extract_prompt(messages[0]), self.extract_prompt(messages[1]))

    def extract_prompt(self, log_message):
        """
        Return the part of ``log_message`` that follows the first "Prompt: " marker.

        Adapt the marker if the log message format of the implementation changes.
        """
        marker = "Prompt: "
        pieces = log_message.split(marker, 1)
        return pieces[1]
--- a/tests/embedchain/test_embedchain.py
+++ b/tests/embedchain/test_embedchain.py
@@ -0,0 +1,39 @@
 import os
 import unittest
 from unittest.mock import patch
 from embedchain import App
 from embedchain.config import InitConfig
 class TestChromaDbHostsLoglevel(unittest.TestCase):
    """End-to-end style test of ``App`` with the database and LLM calls mocked out."""

    # Dummy key, set when the class body runs, i.e. before the test constructs an ``App``.
    os.environ["OPENAI_API_KEY"] = "test_key"

    @patch("chromadb.api.models.Collection.Collection.add")
    @patch("chromadb.api.models.Collection.Collection.get")
    @patch("embedchain.embedchain.EmbedChain.retrieve_from_database")
    @patch("embedchain.embedchain.EmbedChain.get_answer_from_llm")
    @patch("embedchain.embedchain.EmbedChain.get_llm_model_answer")
    def test_whole_app(
        self,
        _mock_ec_get_llm_model_answer,
        _mock_ec_get_answer_from_llm,
        _mock_ec_retrieve_from_database,
        _mock_collection_get,
        mock_collection_add,
    ):
        """
        Run ``add_local``, ``query`` and ``chat`` on an ``App`` created with a DEBUG log level.

        Stacked ``patch`` decorators are applied bottom-up, so the mocks are injected in the
        reverse order of the decorator list: the first mock argument belongs to the decorator
        closest to the function and the last one to ``Collection.add``.

        The assertion inspects the keyword arguments of the most recent ``Collection.add`` call
        and expects its ``documents`` to be exactly the text passed to ``add_local``.
        """
        config = InitConfig(log_level="DEBUG")
        app = App(config)
        knowledge = "lorem ipsum dolor sit amet, consectetur adipiscing"
        app.add_local("text", knowledge)
        app.query("What text did I give you?")
        app.chat("What text did I give you?")
        self.assertEqual(mock_collection_add.call_args[1]["documents"], [knowledge])
--- a/tests/embedchain/test_generate_prompt.py
+++ b/tests/embedchain/test_generate_prompt.py
@@ -0,0 +1,66 @@
 import unittest
 from string import Template
 from embedchain import App
 from embedchain.embedchain import QueryConfig
 class TestGeneratePrompt(unittest.TestCase):
    """Tests for ``App.generate_prompt``."""

    def setUp(self):
        """Create a fresh ``App`` instance for each test."""
        # The sibling test modules set a dummy OPENAI_API_KEY before constructing ``App``.
        # Do the same here so this module does not depend on the ambient environment or on
        # another test module having been imported first. ``setdefault`` keeps an existing key.
        import os

        os.environ.setdefault("OPENAI_API_KEY", "test_key")
        self.app = App()

    def test_generate_prompt_with_template(self):
        """
        Tests that the generate_prompt method correctly formats the prompt using
        a custom template provided in the QueryConfig instance.

        An input query, a list of three contexts and a custom template are passed to
        generate_prompt. The returned prompt must contain the contexts joined by " | "
        and the query, placed as specified by the template.
        """
        # Setup
        input_query = "Test query"
        contexts = ["Context 1", "Context 2", "Context 3"]
        template = "You are a bot. Context: ${context} - Query: ${query} - Helpful answer:"
        config = QueryConfig(template=Template(template))

        # Execute
        result = self.app.generate_prompt(input_query, contexts, config)

        # Assert
        expected_result = (
            "You are a bot. Context: Context 1 | Context 2 | Context 3 - Query: Test query - Helpful answer:"
        )
        self.assertEqual(result, expected_result)

    def test_generate_prompt_with_contexts_list(self):
        """
        Tests that the generate_prompt method correctly handles a list of contexts.

        With a default QueryConfig, the returned prompt must equal the config's own template
        filled with the " | "-joined contexts and the query.
        """
        # Setup
        input_query = "Test query"
        contexts = ["Context 1", "Context 2", "Context 3"]
        config = QueryConfig()

        # Execute
        result = self.app.generate_prompt(input_query, contexts, config)

        # Assert
        expected_result = config.template.substitute(context="Context 1 | Context 2 | Context 3", query=input_query)
        self.assertEqual(result, expected_result)

    def test_generate_prompt_with_history(self):
        """
        Test the 'generate_prompt' method with QueryConfig containing a history attribute.

        The expected prompt contains the history rendered as the string form of the list.
        """
        config = QueryConfig(history=["Past context 1", "Past context 2"])
        config.template = Template("Context: $context | Query: $query | History: $history")
        prompt = self.app.generate_prompt("Test query", ["Test context"], config)
        expected_prompt = "Context: Test context | Query: Test query | History: ['Past context 1', 'Past context 2']"
        self.assertEqual(prompt, expected_prompt)
--- a/tests/embedchain/test_query.py
+++ b/tests/embedchain/test_query.py
@@ -0,0 +1,43 @@
 import os
 import unittest
 from unittest.mock import MagicMock, patch
 from embedchain import App
 from embedchain.embedchain import QueryConfig
 class TestApp(unittest.TestCase):
    """Tests for the ``query`` method of ``App``."""

    # Dummy key, set when the class body runs, i.e. before ``setUp`` constructs an ``App``.
    os.environ["OPENAI_API_KEY"] = "test_key"

    def setUp(self):
        """Create a fresh ``App`` instance for each test."""
        self.app = App()

    # Patch with a mock *instance*. Passing the ``MagicMock`` class itself would make every
    # ``Collection.add(...)`` call construct a new mock from the call arguments instead of
    # invoking a mock.
    @patch("chromadb.api.models.Collection.Collection.add", MagicMock())
    def test_query(self):
        """
        Check that ``query`` retrieves context, asks the LLM and returns its answer.

        ``retrieve_from_database`` is mocked to return a context list and
        ``get_llm_model_answer`` is mocked to return a fixed answer string.
        Key assumptions tested:
        - The last call to 'retrieve_from_database' received "Test query" and an instance of
            QueryConfig as its first two positional arguments.
        - 'get_llm_model_answer' is called exactly once. The specific arguments are not checked in this test.
        - 'query' returns the value it received from 'get_llm_model_answer'.
        """
        retrieve_patch = patch.object(self.app, "retrieve_from_database", return_value=["Test context"])
        answer_patch = patch.object(self.app, "get_llm_model_answer", return_value="Test answer")
        with retrieve_patch as mock_retrieve, answer_patch as mock_answer:
            answer = self.app.query("Test query")

        self.assertEqual(answer, "Test answer")
        self.assertEqual(mock_retrieve.call_args[0][0], "Test query")
        self.assertIsInstance(mock_retrieve.call_args[0][1], QueryConfig)
        mock_answer.assert_called_once()
--- a/tests/test_embedchain.py
+++ b/tests/test_embedchain.py
@@ -1,29 +0,0 @@
 import os
 import unittest
 from unittest.mock import MagicMock, patch
 from embedchain import App
 class TestApp(unittest.TestCase):
    """Tests for the ``add`` and ``query`` methods of ``App``."""

    os.environ["OPENAI_API_KEY"] = "test_key"

    def setUp(self):
        """Create a fresh ``App`` instance for each test."""
        self.app = App()

    @patch("chromadb.api.models.Collection.Collection.add", MagicMock)
    def test_add(self):
        """Adding a web page must record its data type and URL in ``user_asks``."""
        source = ["web_page", "https://example.com"]
        self.app.add(*source)
        self.assertEqual(self.app.user_asks, [source])

    @patch("chromadb.api.models.Collection.Collection.add", MagicMock)
    def test_query(self):
        """``query`` must retrieve context for the query once and return the mocked LLM answer."""
        retrieve_patch = patch.object(self.app, "retrieve_from_database", return_value="Test context")
        answer_patch = patch.object(self.app, "get_llm_model_answer", return_value="Test answer")
        with retrieve_patch as mock_retrieve, answer_patch as mock_answer:
            answer = self.app.query("Test query")

        self.assertEqual(answer, "Test answer")
        mock_retrieve.assert_called_once_with("Test query")
        mock_answer.assert_called_once()
--- a/tests/vectordb/test_chroma_db.py
+++ b/tests/vectordb/test_chroma_db.py
@@ -0,0 +1,72 @@
 # ruff: noqa: E501
 import unittest
 from unittest.mock import patch
 from embedchain import App
 from embedchain.config import InitConfig
 from embedchain.vectordb.chroma_db import ChromaDB, chromadb
 class TestChromaDbHosts(unittest.TestCase):
    """Tests for constructing ``ChromaDB`` directly with a host and port."""

    def test_init_with_host_and_port(self):
        """
        Check that ``ChromaDB`` creates its chromadb client with REST settings for the given host and port.

        ``chromadb.Client`` is mocked; it must be called exactly once with a ``Settings`` object
        equal to the expected one.
        """
        server = {"host": "test-host", "port": "1234"}

        with patch.object(chromadb, "Client") as mock_client:
            _db = ChromaDB(**server)

        mock_client.assert_called_once_with(
            chromadb.config.Settings(
                chroma_api_impl="rest",
                chroma_server_host=server["host"],
                chroma_server_http_port=server["port"],
            )
        )
 class TestChromaDbHostsInit(unittest.TestCase):
    """Tests that host and port from ``InitConfig`` reach the chromadb client."""

    # The sibling test modules set a dummy OPENAI_API_KEY before constructing ``App``.
    # Do the same here, scoped to this test, instead of relying on the ambient environment
    # or on another test module having been imported first.
    @patch.dict("os.environ", {"OPENAI_API_KEY": "test_key"})
    @patch("embedchain.vectordb.chroma_db.chromadb.Client")
    def test_init_with_host_and_port(self, mock_client):
        """
        Test if the `App` instance is initialized with the correct host and port values.

        The first positional argument of the most recent (mocked) ``chromadb.Client`` call is
        the settings object; its server host and HTTP port must match the config.
        """
        host = "test-host"
        port = "1234"
        config = InitConfig(host=host, port=port)
        _app = App(config)
        client_settings = mock_client.call_args[0][0]
        self.assertEqual(client_settings.chroma_server_host, host)
        self.assertEqual(client_settings.chroma_server_http_port, port)
 class TestChromaDbHostsNone(unittest.TestCase):
    """Tests the chromadb client settings when ``App`` is created without any config."""

    # The sibling test modules set a dummy OPENAI_API_KEY before constructing ``App``.
    # Do the same here, scoped to this test, instead of relying on the ambient environment
    # or on another test module having been imported first.
    @patch.dict("os.environ", {"OPENAI_API_KEY": "test_key"})
    @patch("embedchain.vectordb.chroma_db.chromadb.Client")
    def test_init_with_host_and_port(self, mock_client):
        """
        Test that an `App` created without a config passes no server host or port to chromadb.

        The first positional argument of the most recent (mocked) ``chromadb.Client`` call is
        the settings object; its server host and HTTP port must both be ``None``.
        """
        _app = App()
        client_settings = mock_client.call_args[0][0]
        self.assertEqual(client_settings.chroma_server_host, None)
        self.assertEqual(client_settings.chroma_server_http_port, None)
 class TestChromaDbHostsLoglevel(unittest.TestCase):
    """Tests the chromadb client settings when the config only sets a log level."""

    # The sibling test modules set a dummy OPENAI_API_KEY before constructing ``App``.
    # Do the same here, scoped to this test, instead of relying on the ambient environment
    # or on another test module having been imported first.
    @patch.dict("os.environ", {"OPENAI_API_KEY": "test_key"})
    @patch("embedchain.vectordb.chroma_db.chromadb.Client")
    def test_init_with_host_and_port(self, mock_client):
        """
        Test that an `App` created with a config that sets only the log level (no host, no port)
        passes no server host or port to chromadb.

        The first positional argument of the most recent (mocked) ``chromadb.Client`` call is
        the settings object; its server host and HTTP port must both be ``None``.
        """
        config = InitConfig(log_level="DEBUG")
        _app = App(config)
        client_settings = mock_client.call_args[0][0]
        self.assertEqual(client_settings.chroma_server_host, None)
        self.assertEqual(client_settings.chroma_server_http_port, None)