Skip to content

Commit e21d461

Browse files
committed
push
1 parent d03eedc commit e21d461

File tree

2 files changed

+9
-8
lines changed

2 files changed

+9
-8
lines changed

scrapegraphai/docloaders/broswer_base.py renamed to scrapegraphai/docloaders/browser_base.py

Lines changed: 5 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -2,8 +2,9 @@
22
browserbase integration module
33
"""
44
from browserbase import Browserbase
5+
from typing import List
56

6-
def browser_base_fetch(api_key: str, project_id: str, link: str) -> object:
7+
def browser_base_fetch(api_key: str, project_id: str, link: List[str]) -> List[str]:
78
"""
89
BrowserBase Fetch
910
@@ -15,7 +16,8 @@ def browser_base_fetch(api_key: str, project_id: str, link: str) -> object:
1516
- `link`: The URL or link that you want to fetch data from.
1617
1718
It initializes a Browserbase object with the given API key and project ID,
18-
then uses this object to load the specified link. It returns the result of the loading operation.
19+
then uses this object to load the specified link.
20+
It returns the result of the loading operation.
1921
2022
Example usage:
2123
@@ -41,6 +43,6 @@ def browser_base_fetch(api_key: str, project_id: str, link: str) -> object:
4143

4244
browserbase = Browserbase(api_key=api_key, project_id=project_id)
4345

44-
result = browserbase.load(link)
46+
result = browserbase.load([link])
4547

4648
return result

scrapegraphai/nodes/fetch_node.py

Lines changed: 4 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -202,11 +202,10 @@ def execute(self, state):
202202
loader_kwargs = self.node_config.get("loader_kwargs", {})
203203

204204
if self.browser_base is not None:
205-
document = [
206-
Document(page_content= browser_base_fetch(self.browser_base.get("api_key"),
207-
self.browser_base.get("project_id"), source),
208-
metadata={})
209-
]
205+
data = browser_base_fetch(self.browser_base.get("api_key"),
206+
self.browser_base.get("project_id"), source)
207+
208+
document = [Document(page_content= data, metadata={"source": "html file"})]
210209
else:
211210
loader = ChromiumLoader([source], headless=self.headless, **loader_kwargs)
212211
document = loader.load()

0 commit comments

Comments
 (0)