mirror of
https://github.com/langgenius/dify.git
synced 2026-05-03 17:08:03 +08:00
add old auth transform
This commit is contained in:
@ -24,7 +24,6 @@ class FirecrawlWebExtractor(BaseExtractor):
|
||||
tenant_id: str,
|
||||
mode: str = "crawl",
|
||||
only_main_content: bool = True,
|
||||
credential_id: Optional[str] = None,
|
||||
):
|
||||
"""Initialize with url, api_key, base_url and mode."""
|
||||
self._url = url
|
||||
@ -32,14 +31,13 @@ class FirecrawlWebExtractor(BaseExtractor):
|
||||
self.tenant_id = tenant_id
|
||||
self.mode = mode
|
||||
self.only_main_content = only_main_content
|
||||
self.credential_id = credential_id
|
||||
|
||||
def extract(self) -> list[Document]:
|
||||
"""Extract content from the URL."""
|
||||
documents = []
|
||||
if self.mode == "crawl":
|
||||
crawl_data = WebsiteService.get_crawl_url_data(
|
||||
self.job_id, "firecrawl", self._url, self.tenant_id, self.credential_id
|
||||
self.job_id, "firecrawl", self._url, self.tenant_id
|
||||
)
|
||||
if crawl_data is None:
|
||||
return []
|
||||
@ -54,7 +52,7 @@ class FirecrawlWebExtractor(BaseExtractor):
|
||||
documents.append(document)
|
||||
elif self.mode == "scrape":
|
||||
scrape_data = WebsiteService.get_scrape_url_data(
|
||||
"firecrawl", self._url, self.tenant_id, self.only_main_content, self.credential_id
|
||||
"firecrawl", self._url, self.tenant_id, self.only_main_content
|
||||
)
|
||||
|
||||
document = Document(
|
||||
|
||||
Reference in New Issue
Block a user