diff --git a/langchain/document_loaders/confluence.py b/langchain/document_loaders/confluence.py index f02eb77493..f20ed5f366 100644 --- a/langchain/document_loaders/confluence.py +++ b/langchain/document_loaders/confluence.py @@ -219,9 +219,11 @@ class ConfluenceLoader(BaseLoader): max_pages=max_pages, expand="body.storage.value", ) - docs += self.process_pages( - pages, include_restricted_content, include_attachments, include_comments - ) + ids_by_label = [page["id"] for page in pages] + if page_ids: + page_ids = list(set(page_ids + ids_by_label)) + else: + page_ids = list(set(ids_by_label)) if cql: pages = self.paginate_request(