class BrowserbaseLoader(BaseLoader):
    """Load pre-rendered web pages using a headless browser hosted on Browserbase.

    Depends on `browserbase` package.
    Get your API key from https://browserbase.com
    """

    def __init__(
        self,
        urls: Sequence[str],
        text_content: bool = False,
        api_key: Optional[str] = None,
        project_id: Optional[str] = None,
        session_id: Optional[str] = None,
        proxy: Optional[bool] = None,
    ):
        """Store the load options and create the Browserbase client.

        Args:
            urls: URLs of the pages to load. Each yielded document is tagged
                with the URL at the same position in this sequence.
            text_content: Forwarded unchanged to ``Browserbase.load_urls``.
                NOTE(review): presumably selects text-only extraction instead
                of raw HTML -- confirm against the browserbase SDK.
            api_key: Passed as the first positional argument to
                ``Browserbase``.
            project_id: Passed as the second positional argument to
                ``Browserbase``.
            session_id: Forwarded unchanged to ``Browserbase.load_urls``.
                NOTE(review): presumably reuses an existing browser session --
                confirm against the browserbase SDK.
            proxy: Forwarded unchanged to ``Browserbase.load_urls``.
                NOTE(review): presumably toggles Browserbase's proxy --
                confirm against the browserbase SDK.

        Raises:
            ImportError: If the ``browserbase`` package is not installed.
        """
        self.urls = urls
        self.text_content = text_content
        self.session_id = session_id
        self.proxy = proxy

        # Imported lazily so that `browserbase` stays an optional dependency
        # that is only required once this loader is actually instantiated.
        try:
            from browserbase import Browserbase
        except ImportError as exc:
            # Chain the original error so the underlying import failure
            # remains visible in the traceback as the direct cause.
            raise ImportError(
                "You must run "
                "`pip install --upgrade "
                "browserbase` "
                "to use the Browserbase loader."
            ) from exc

        self.browserbase = Browserbase(api_key, project_id)

    def lazy_load(self) -> Iterator[Document]:
        """Load pages from URLs.

        Yields:
            One ``Document`` per item returned by ``Browserbase.load_urls``,
            with the item as ``page_content`` and the URL at the same index
            in ``self.urls`` stored under the ``"url"`` metadata key.
        """
        pages = self.browserbase.load_urls(
            self.urls, self.text_content, self.session_id, self.proxy
        )

        # Pages are matched to URLs by position; this relies on `load_urls`
        # returning results in the same order as the URLs it was given.
        for i, page in enumerate(pages):
            yield Document(
                page_content=page,
                metadata={
                    "url": self.urls[i],
                },
            )