diff --git a/internal/scraper/avaz.go b/internal/scraper/avaz.go index 51f19f7..906fb80 100644 --- a/internal/scraper/avaz.go +++ b/internal/scraper/avaz.go @@ -37,7 +37,7 @@ func visitAvazApprovedPages(crArticlePage *colly.Collector) { func setupAvazHomepageCrawler(crHomePage *colly.Collector, crArticlePage *colly.Collector) { articleUrlR, _ := regexp.Compile("/\\d\\d+/([a-z0-9-]+)") - articleBlacklist, _ := regexp.Compile("(info-vodic|foto-data)") + articleBlacklist, _ := regexp.Compile("(english)") crHomePage.OnHTML("a", func(e *colly.HTMLElement) { url := e.Attr("href") completeUrl := url diff --git a/spider b/spider index 8b778c0..714b07c 100755 Binary files a/spider and b/spider differ