Fix scrapers
This commit is contained in:
@@ -80,7 +80,7 @@ func setupBljesakArticlePageCrawler(crArticlePage *colly.Collector) {
|
||||
|
||||
text := ""
|
||||
|
||||
e.ForEach("div.col-xs-12, article.b-article-detail, div.col-article-content, div.intro, div.s-main-content", func(_ int, el *colly.HTMLElement) {
|
||||
e.ForEach("div.intro, div#infiniteLoadBreakpoint", func(_ int, el *colly.HTMLElement) {
|
||||
text += extractJustText(el.DOM)
|
||||
})
|
||||
|
||||
|
||||
@@ -79,7 +79,7 @@ func setupSiArticlePageCrawler(crArticlePage *colly.Collector) {
|
||||
|
||||
text := ""
|
||||
|
||||
e.ForEach("div.article__top-content, div.article__content, h4, h3, h2, div.article__content", func(_ int, el *colly.HTMLElement) {
|
||||
e.ForEach("div.article__top-content, div.article__content", func(_ int, el *colly.HTMLElement) {
|
||||
text += extractJustText(el.DOM)
|
||||
})
|
||||
|
||||
|
||||
Reference in New Issue
Block a user