Promise pool
This commit is contained in:
@@ -4,6 +4,7 @@ const fetch = require("../../helpers/fetchWrapper");
|
||||
const cheerio = require("cheerio");
|
||||
const Promise = require("bluebird");
|
||||
const moment = require("moment-timezone");
|
||||
const PromisePool = require('@supercharge/promise-pool');
|
||||
|
||||
const {
|
||||
AD_TYPE,
|
||||
@@ -224,6 +225,14 @@ class OlxCrawler {
|
||||
asyncScraping.push(this.scrapeAd(hrefs[i]));
|
||||
}
|
||||
|
||||
|
||||
const { scrapedData, errors } = await PromisePool
|
||||
.withConcurrency(2)
|
||||
.for(asyncScraping)
|
||||
.process(async data => {
|
||||
return await data
|
||||
})
|
||||
|
||||
const scrapedData = await Promise.all(asyncScraping);
|
||||
const filteredScrapedData = scrapedData.filter(adData => !!adData);
|
||||
return filteredScrapedData;
|
||||
|
||||
@@ -25,8 +25,6 @@ const fetch = async (url, options = {}) => {
|
||||
const urlAdaptedForScraping = USE_SCRAPER_API
|
||||
? `${SCRAPER_API_BASE_URL}?api_key=${SCRAPER_API_KEY}&url=${urlToFetchThroughAPI}`
|
||||
: url;
|
||||
const randomPauseMS = Math.floor(Math.random() * Math.floor(1500)) + 500;
|
||||
await timeout(randomPauseMS);
|
||||
return nodeFetch(urlAdaptedForScraping, newOptions);
|
||||
};
|
||||
|
||||
|
||||
15
package-lock.json
generated
15
package-lock.json
generated
@@ -40,6 +40,21 @@
|
||||
"@sendgrid/helpers": "^6.3.0"
|
||||
}
|
||||
},
|
||||
"@supercharge/goodies": {
|
||||
"version": "1.4.0",
|
||||
"resolved": "https://registry.npmjs.org/@supercharge/goodies/-/goodies-1.4.0.tgz",
|
||||
"integrity": "sha512-Np6u2qjRwiA3wTgzz4n2yduydIjSXqtJWP5cOnNqjdlCR/EUAK86LAOhEcU+YW211D1ksugns3GqpARJDoXQ7g==",
|
||||
"dev": true
|
||||
},
|
||||
"@supercharge/promise-pool": {
|
||||
"version": "1.3.0",
|
||||
"resolved": "https://registry.npmjs.org/@supercharge/promise-pool/-/promise-pool-1.3.0.tgz",
|
||||
"integrity": "sha512-9/EVrJevSPEqI4i/gRH8Dt7C+FQT65wRRYuu0MDaGmSLZ2aTel0jOGu8Ae84fPiQ+Ah0B80RPFUxk+K+Cz48DA==",
|
||||
"dev": true,
|
||||
"requires": {
|
||||
"@supercharge/goodies": "~1.4.0"
|
||||
}
|
||||
},
|
||||
"@types/caseless": {
|
||||
"version": "0.12.2",
|
||||
"resolved": "https://registry.npmjs.org/@types/caseless/-/caseless-0.12.2.tgz",
|
||||
|
||||
@@ -55,6 +55,7 @@
|
||||
"sequelize-cli": "^5.5.0"
|
||||
},
|
||||
"devDependencies": {
|
||||
"@supercharge/promise-pool": "^1.3.0",
|
||||
"nodemon": "^1.19.0"
|
||||
}
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user