mirror of
https://github.com/hwchase17/langchain
synced 2024-11-02 09:40:22 +00:00
37 lines
1.1 KiB
Python
37 lines
1.1 KiB
Python
from typing import Iterator
|
|
|
|
from langchain_core.documents import Document
|
|
|
|
from langchain_community.document_loaders.base import BaseLoader
|
|
|
|
|
|
class AirtableLoader(BaseLoader):
|
|
"""Load the `Airtable` tables."""
|
|
|
|
def __init__(self, api_token: str, table_id: str, base_id: str):
|
|
"""Initialize with API token and the IDs for table and base"""
|
|
self.api_token = api_token
|
|
"""Airtable API token."""
|
|
self.table_id = table_id
|
|
"""Airtable table ID."""
|
|
self.base_id = base_id
|
|
"""Airtable base ID."""
|
|
|
|
def lazy_load(self) -> Iterator[Document]:
|
|
"""Lazy load Documents from table."""
|
|
|
|
from pyairtable import Table
|
|
|
|
table = Table(self.api_token, self.base_id, self.table_id)
|
|
records = table.all()
|
|
for record in records:
|
|
# Need to convert record from dict to str
|
|
yield Document(
|
|
page_content=str(record),
|
|
metadata={
|
|
"source": self.base_id + "_" + self.table_id,
|
|
"base_id": self.base_id,
|
|
"table_id": self.table_id,
|
|
},
|
|
)
|