feat: Add embedding manager (#570)

This commit is contained in:
Taranjeet Singh
2023-09-11 23:43:53 -07:00
committed by GitHub
parent ba208f5b48
commit 2bd6881361
16 changed files with 311 additions and 73 deletions

View File

@@ -69,9 +69,12 @@ class MockLoader:
Mock loader that returns a dictionary with a "doc_id" and a "data" list of data dictionaries.
Adjust this method to return different data for testing.
"""
return [
{
"content": src,
"meta_data": {"url": "none"},
}
]
return {
"doc_id": "123",
"data": [
{
"content": src,
"meta_data": {"url": "none"},
}
]
}

View File

@@ -29,18 +29,19 @@ def test_load_data(delimiter):
# Loading CSV using CsvLoader
loader = CsvLoader()
result = loader.load_data(filename)
data = result["data"]
# Assertions
assert len(result) == 3
assert result[0]["content"] == "Name: Alice, Age: 28, Occupation: Engineer"
assert result[0]["meta_data"]["url"] == filename
assert result[0]["meta_data"]["row"] == 1
assert result[1]["content"] == "Name: Bob, Age: 35, Occupation: Doctor"
assert result[1]["meta_data"]["url"] == filename
assert result[1]["meta_data"]["row"] == 2
assert result[2]["content"] == "Name: Charlie, Age: 22, Occupation: Student"
assert result[2]["meta_data"]["url"] == filename
assert result[2]["meta_data"]["row"] == 3
assert len(data) == 3
assert data[0]["content"] == "Name: Alice, Age: 28, Occupation: Engineer"
assert data[0]["meta_data"]["url"] == filename
assert data[0]["meta_data"]["row"] == 1
assert data[1]["content"] == "Name: Bob, Age: 35, Occupation: Doctor"
assert data[1]["meta_data"]["url"] == filename
assert data[1]["meta_data"]["row"] == 2
assert data[2]["content"] == "Name: Charlie, Age: 22, Occupation: Student"
assert data[2]["meta_data"]["url"] == filename
assert data[2]["meta_data"]["row"] == 3
# Cleaning up the temporary file
os.unlink(filename)
@@ -67,18 +68,19 @@ def test_load_data_with_file_uri(delimiter):
# Loading CSV using CsvLoader
loader = CsvLoader()
result = loader.load_data(filename)
data = result["data"]
# Assertions
assert len(result) == 3
assert result[0]["content"] == "Name: Alice, Age: 28, Occupation: Engineer"
assert result[0]["meta_data"]["url"] == filename
assert result[0]["meta_data"]["row"] == 1
assert result[1]["content"] == "Name: Bob, Age: 35, Occupation: Doctor"
assert result[1]["meta_data"]["url"] == filename
assert result[1]["meta_data"]["row"] == 2
assert result[2]["content"] == "Name: Charlie, Age: 22, Occupation: Student"
assert result[2]["meta_data"]["url"] == filename
assert result[2]["meta_data"]["row"] == 3
assert len(data) == 3
assert data[0]["content"] == "Name: Alice, Age: 28, Occupation: Engineer"
assert data[0]["meta_data"]["url"] == filename
assert data[0]["meta_data"]["row"] == 1
assert data[1]["content"] == "Name: Bob, Age: 35, Occupation: Doctor"
assert data[1]["meta_data"]["url"] == filename
assert data[1]["meta_data"]["row"] == 2
assert data[2]["content"] == "Name: Charlie, Age: 22, Occupation: Student"
assert data[2]["meta_data"]["url"] == filename
assert data[2]["meta_data"]["row"] == 3
# Cleaning up the temporary file
os.unlink(tmpfile.name)