From 49b3d6c78c60815a4d0bc83fcccfafa125873355 Mon Sep 17 00:00:00 2001
From: Harrison Chase
Date: Sun, 15 Jan 2023 16:45:16 -0800
Subject: [PATCH] Harrison/wiki update (#622)

Co-authored-by: Rubens Mau
---
 langchain/docstore/wikipedia.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/langchain/docstore/wikipedia.py b/langchain/docstore/wikipedia.py
index 2325ffd9..5575b8c7 100644
--- a/langchain/docstore/wikipedia.py
+++ b/langchain/docstore/wikipedia.py
@@ -30,7 +30,10 @@ class Wikipedia(Docstore):
 
         try:
             page_content = wikipedia.page(search).content
-            result: Union[str, Document] = Document(page_content=page_content)
+            url = wikipedia.page(search).url
+            result: Union[str, Document] = Document(
+                page_content=page_content, metadata={"page": url}
+            )
         except wikipedia.PageError:
             result = f"Could not find [{search}]. Similar: {wikipedia.search(search)}"
         except wikipedia.DisambiguationError: