Skip to content

Commit

Permalink
fix and update test
Browse files Browse the repository at this point in the history
  • Loading branch information
saraswatpuneet committed Sep 2, 2023
1 parent 2450b79 commit 1810c97
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 1 deletion.
1 change: 1 addition & 0 deletions querent/tools/web_page_extractor.py
Original file line number Diff line number Diff line change
Expand Up @@ -271,6 +271,7 @@ def extract_links(self, url):
if (
link_href.startswith(url)
and link_href not in self.crawled_urls
+ and link_href != url
):
links.append(link_href)
return links
Expand Down
2 changes: 1 addition & 1 deletion tests/test_webscrapper.py
Original file line number Diff line number Diff line change
Expand Up @@ -23,7 +23,7 @@ def test_fs_collector_factory():


def test_scrapping_data():
- uri = Uri("https://asecuritysite.com/")
+ uri = Uri("https://protocolstreams.xyz/")
resolver = CollectorResolver()
webscrapperConfig = WebScraperConfig(website_url=uri.uri)
collector = resolver.resolve(uri, webscrapperConfig)
Expand Down

0 comments on commit 1810c97

Please sign in to comment.