mirror of
https://github.com/hwchase17/langchain
synced 2024-11-08 07:10:35 +00:00
CR feedback
This commit is contained in:
parent
5919c0f4a2
commit
5cd244e9b7
@ -19,18 +19,10 @@
|
||||
"metadata": {
|
||||
"tags": []
|
||||
},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"Requirement already satisfied: lxml in /root/Source/github/docugami.langchain/libs/langchain/.venv/lib/python3.9/site-packages (4.9.3)\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"# You need the lxml package to use the DocugamiLoader\n",
|
||||
"!poetry run pip install lxml"
|
||||
"!poetry run pip install lxml --quiet"
|
||||
]
|
||||
},
|
||||
{
|
||||
|
@ -147,6 +147,7 @@ class DocugamiLoader(BaseLoader, BaseModel):
|
||||
metadata = {
|
||||
XPATH_KEY: _xpath_for_chunk(node),
|
||||
DOCUMENT_ID_KEY: document[DOCUMENT_ID_KEY],
|
||||
DOCUMENT_NAME_KEY: document[DOCUMENT_NAME_KEY],
|
||||
DOCUMENT_SOURCE_KEY: document[DOCUMENT_NAME_KEY],
|
||||
STRUCTURE_KEY: node.attrib.get("structure", ""),
|
||||
TAG_KEY: re.sub(r"\{.*\}", "", node.tag),
|
||||
|
Loading…
Reference in New Issue
Block a user