diff --git a/phi/knowledge/base.py b/phi/knowledge/base.py index 556b1a8aa8..8c71f1fc3b 100644 --- a/phi/knowledge/base.py +++ b/phi/knowledge/base.py @@ -84,6 +84,7 @@ def load( else: # Filter out documents which already exist in the vector db if skip_existing: + document_list = {document.content: document for document in document_list}.values() documents_to_load = [ document for document in document_list if not self.vector_db.doc_exists(document) ]