From 2b4e9a3efaa231588f586398f6f8e892310fe95a Mon Sep 17 00:00:00 2001
From: Roma
Date: Tue, 25 Apr 2023 14:02:59 -0300
Subject: [PATCH] Add unit test for _merge_splits function (#3513)

This commit adds a new unit test for the _merge_splits function in the
text splitter. The new test verifies that the function merges text into
chunks of the correct size and overlap, using a specified separator. The
test passes on the current implementation of the function.
---
 tests/unit_tests/test_text_splitter.py | 9 +++++++++
 1 file changed, 9 insertions(+)

diff --git a/tests/unit_tests/test_text_splitter.py b/tests/unit_tests/test_text_splitter.py
index dbfb9b5f..40f3c2bc 100644
--- a/tests/unit_tests/test_text_splitter.py
+++ b/tests/unit_tests/test_text_splitter.py
@@ -68,6 +68,15 @@ def test_character_text_splitting_args() -> None:
         CharacterTextSplitter(chunk_size=2, chunk_overlap=4)
 
 
+def test_merge_splits() -> None:
+    """Test merging splits with a given separator."""
+    splitter = CharacterTextSplitter(separator=" ", chunk_size=9, chunk_overlap=2)
+    splits = ["foo", "bar", "baz"]
+    expected_output = ["foo bar", "baz"]
+    output = splitter._merge_splits(splits, separator=" ")
+    assert output == expected_output
+
+
 def test_create_documents() -> None:
     """Test create documents method."""
     texts = ["foo bar", "baz"]