[Bug fix] Avoid saving the duplicated docs (#1326)
This commit is contained in:
@@ -146,7 +146,7 @@ class QdrantDB(BaseVectorDB):
|
|||||||
qdrant_ids = []
|
qdrant_ids = []
|
||||||
for id, document, metadata in zip(ids, documents, metadatas):
|
for id, document, metadata in zip(ids, documents, metadatas):
|
||||||
metadata["text"] = document
|
metadata["text"] = document
|
||||||
qdrant_ids.append(str(uuid.uuid4()))
|
qdrant_ids.append(id)
|
||||||
payloads.append({"identifier": id, "text": document, "metadata": copy.deepcopy(metadata)})
|
payloads.append({"identifier": id, "text": document, "metadata": copy.deepcopy(metadata)})
|
||||||
|
|
||||||
for i in tqdm(range(0, len(qdrant_ids), self.BATCH_SIZE), desc="Adding data in batches"):
|
for i in tqdm(range(0, len(qdrant_ids), self.BATCH_SIZE), desc="Adding data in batches"):
|
||||||
|
|||||||
Reference in New Issue
Block a user