{ "cells": [ { "cell_type": "markdown", "id": "e229e34c", "metadata": {}, "source": [ "# AsyncHtmlLoader\n", "\n", "AsyncHtmlLoader loads raw HTML from a list of URLs concurrently." ] }, { "cell_type": "code", "execution_count": 4, "id": "4c8e4dab", "metadata": {}, "outputs": [], "source": [ "from langchain.document_loaders import AsyncHtmlLoader" ] }, { "cell_type": "code", "execution_count": 5, "id": "e76b5ddc", "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "Fetching pages: 100%|############| 2/2 [00:00<00:00, 9.96it/s]\n" ] } ], "source": [ "urls = [\"https://www.espn.com\", \"https://lilianweng.github.io/posts/2023-06-23-agent/\"]\n", "loader = AsyncHtmlLoader(urls)\n", "docs = loader.load()" ] }, { "cell_type": "code", "execution_count": 6, "id": "5dca1c0c", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "' news. Stream exclusive games on ESPN+ and play fantasy sports.\" />\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n