forked from Archives/langchain
You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
15 lines
405 B
Python
15 lines
405 B
Python
import tokenize
|
|
|
|
from langchain.document_loaders.text import TextLoader
|
|
|
|
|
|
class PythonLoader(TextLoader):
    """Text loader for Python source files that honours the file's own encoding.

    The encoding is sniffed from the file with ``tokenize.detect_encoding``
    (the same detection the Python tokenizer applies to source files) and
    handed to ``TextLoader``, so a file that declares a non-default encoding
    is decoded with that encoding.
    """

    def __init__(self, file_path: str):
        """Detect the encoding of ``file_path`` and set up the parent loader.

        Args:
            file_path: Path of the Python file to load. The file is opened
                here in binary mode, so it must exist and be readable when
                the loader is constructed.
        """
        # Binary mode is required: detect_encoding expects a readline
        # callable that yields bytes.
        with open(file_path, "rb") as raw_source:
            detection = tokenize.detect_encoding(raw_source.readline)

        # detect_encoding returns (encoding, lines_consumed); only the
        # encoding name is needed.
        source_encoding = detection[0]
        super().__init__(file_path=file_path, encoding=source_encoding)
|