Fix crawler (#2591)

This commit is contained in:
bogdankostic 2022-05-24 12:34:31 +02:00 committed by GitHub
parent 867695ad0c
commit 1ab2b977c0
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -280,7 +280,7 @@ class Crawler(BaseComponent):
self, base_url: str, filter_urls: Optional[List] = None, existed_links: List = None
) -> set:
self.driver.get(base_url)
-a_elements = self.driver.find_elements_by_tag_name("a")
+a_elements = self.driver.find_elements_by_xpath("//a[@href]")
sub_links = set()
if not (existed_links and base_url in existed_links):
if filter_urls: