diff --git a/libs/community/langchain_community/document_loaders/url_playwright.py b/libs/community/langchain_community/document_loaders/url_playwright.py index 3f350615401b9..8e06ce4be0e7e 100644 --- a/libs/community/langchain_community/document_loaders/url_playwright.py +++ b/libs/community/langchain_community/document_loaders/url_playwright.py @@ -177,6 +177,8 @@ def lazy_load(self) -> Iterator[Document]: if response is None: raise ValueError(f"page.goto() returned None for url {url}") + page.wait_for_load_state("load") + text = self.evaluator.evaluate(page, browser, response) metadata = {"source": url} yield Document(page_content=text, metadata=metadata) @@ -216,6 +218,8 @@ async def alazy_load(self) -> AsyncIterator[Document]: if response is None: raise ValueError(f"page.goto() returned None for url {url}") + await page.wait_for_load_state("load") + text = await self.evaluator.evaluate_async(page, browser, response) metadata = {"source": url} yield Document(page_content=text, metadata=metadata)