Compare commits
1 Commits
saljic-cra
...
include-in
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
81fa3f046d |
@@ -218,7 +218,7 @@ class SaljicCrawler {
|
||||
}
|
||||
|
||||
async scrapeAd(url, adType) {
|
||||
console.log("[SALJIC] Scraping : ", url);
|
||||
// console.log("[SALJIC] Scraping : ", url);
|
||||
try {
|
||||
const adPageSource = await fetch(url);
|
||||
const body = await adPageSource.text();
|
||||
@@ -227,9 +227,7 @@ class SaljicCrawler {
|
||||
// No information for status ex. PRODAN
|
||||
const status = AD_STATUS.STATUS_NORMAL;
|
||||
//Extracting agency ID from url
|
||||
const agencyObjectId = url
|
||||
? parseInt(url.substring(46, url.length))
|
||||
: null;
|
||||
const agencyObjectId = parseInt(url.substring(46, url.length));
|
||||
|
||||
//Extracting main properties
|
||||
const propertySelectors = {
|
||||
@@ -274,10 +272,14 @@ class SaljicCrawler {
|
||||
.trim();
|
||||
|
||||
const latAndLongSrc = $(propertySelectors.latAndLong).attr("src");
|
||||
const tmpLatLong = latAndLongSrc.split("marker=")[1];
|
||||
const latText = tmpLatLong.split("%2C")[0];
|
||||
const longText = tmpLatLong.split("%2C")[1];
|
||||
|
||||
const latText = latAndLongSrc.substring(
|
||||
latAndLongSrc.indexOf("marker=") + 7,
|
||||
latAndLongSrc.indexOf("%2C", latAndLongSrc.indexOf("marker="))
|
||||
);
|
||||
const longText = latAndLongSrc.substring(
|
||||
latAndLongSrc.indexOf("%2C", latAndLongSrc.indexOf("marker=")) + 3,
|
||||
latAndLongSrc.length
|
||||
);
|
||||
const locationLat = parseFloat(latText) || null;
|
||||
const locationLong = parseFloat(longText) || null;
|
||||
|
||||
@@ -326,10 +328,11 @@ class SaljicCrawler {
|
||||
let numberOfViewsKivi = null;
|
||||
let streetNumber = 0;
|
||||
let adStatus = status;
|
||||
let shortDescription = descriptions
|
||||
? descriptions.substring(0, descriptions.indexOf("."))
|
||||
: "";
|
||||
let longDescription = descriptions || "";
|
||||
let shortDescription = descriptions.substring(
|
||||
0,
|
||||
descriptions.indexOf(".")
|
||||
);
|
||||
let longDescription = descriptions;
|
||||
//Extracting data - Glavne karakteristike
|
||||
let mainFieldIndex = 1;
|
||||
do {
|
||||
@@ -340,14 +343,10 @@ class SaljicCrawler {
|
||||
.replace(/[\n\r\t]/gm, "")
|
||||
.trim();
|
||||
|
||||
const mainFieldTitle = mainField
|
||||
? mainField.substring(0, mainField.indexOf(" "))
|
||||
: "";
|
||||
const mainFieldTitle = mainField.substring(0, mainField.indexOf(" "));
|
||||
const mainFieldValue = mainField
|
||||
? mainField
|
||||
.substring(mainField.indexOf(" "), mainField.length)
|
||||
.trim()
|
||||
: "";
|
||||
.substring(mainField.indexOf(" "), mainField.length)
|
||||
.trim();
|
||||
|
||||
switch (mainFieldTitle) {
|
||||
case "Površina":
|
||||
|
||||
@@ -332,10 +332,14 @@ const findRealEstatesForSearchRequest = async (searchRequest, maxResults) => {
|
||||
};
|
||||
}
|
||||
|
||||
//When includeIncompleteAds are not defined - null it will consider it true
|
||||
const order = [["updatedAt", "desc"]];
|
||||
|
||||
return db.RealEstate.findAll({
|
||||
where: includeIncompleteAds ? queryIncludeIncomplete : query,
|
||||
where:
|
||||
includeIncompleteAds || includeIncompleteAds == null
|
||||
? queryIncludeIncomplete
|
||||
: query,
|
||||
limit: maxResults,
|
||||
order
|
||||
});
|
||||
|
||||
@@ -157,7 +157,7 @@ const findSearchRequestsForRealEstate = async realEstate => {
|
||||
} else {
|
||||
// If real estate dont have defined number of rooms ex. null
|
||||
//It returns requests that didn't choose number of rooms - also null
|
||||
//Or ones that picked some values but also picked to includeIncomplete ads
|
||||
//Or ones that picked some values but also picked to includeIncomplete ads (or default)
|
||||
numberOfRoomsQuery = {
|
||||
[Op.or]: [
|
||||
{
|
||||
@@ -176,7 +176,10 @@ const findSearchRequestsForRealEstate = async realEstate => {
|
||||
},
|
||||
{
|
||||
includeIncompleteAds: {
|
||||
[Op.eq]: true
|
||||
[Op.or]: {
|
||||
[Op.eq]: true,
|
||||
[Op.is]: null
|
||||
}
|
||||
}
|
||||
}
|
||||
]
|
||||
@@ -226,7 +229,10 @@ const findSearchRequestsForRealEstate = async realEstate => {
|
||||
},
|
||||
{
|
||||
includeIncompleteAds: {
|
||||
[Op.eq]: true
|
||||
[Op.or]: {
|
||||
[Op.eq]: true,
|
||||
[Op.is]: null
|
||||
}
|
||||
}
|
||||
}
|
||||
]
|
||||
@@ -275,7 +281,10 @@ const findSearchRequestsForRealEstate = async realEstate => {
|
||||
},
|
||||
{
|
||||
includeIncompleteAds: {
|
||||
[Op.eq]: true
|
||||
[Op.or]: {
|
||||
[Op.eq]: true,
|
||||
[Op.is]: null
|
||||
}
|
||||
}
|
||||
}
|
||||
]
|
||||
@@ -313,7 +322,10 @@ const findSearchRequestsForRealEstate = async realEstate => {
|
||||
},
|
||||
{
|
||||
includeIncompleteAds: {
|
||||
[Op.eq]: true
|
||||
[Op.or]: {
|
||||
[Op.eq]: true,
|
||||
[Op.is]: null
|
||||
}
|
||||
}
|
||||
}
|
||||
]
|
||||
@@ -347,7 +359,10 @@ const findSearchRequestsForRealEstate = async realEstate => {
|
||||
},
|
||||
{
|
||||
includeIncompleteAds: {
|
||||
[Op.eq]: true
|
||||
[Op.or]: {
|
||||
[Op.eq]: true,
|
||||
[Op.is]: null
|
||||
}
|
||||
}
|
||||
}
|
||||
]
|
||||
@@ -381,7 +396,10 @@ const findSearchRequestsForRealEstate = async realEstate => {
|
||||
},
|
||||
{
|
||||
includeIncompleteAds: {
|
||||
[Op.eq]: true
|
||||
[Op.or]: {
|
||||
[Op.eq]: true,
|
||||
[Op.is]: null
|
||||
}
|
||||
}
|
||||
}
|
||||
]
|
||||
@@ -423,10 +441,13 @@ const findSearchRequestsForRealEstate = async realEstate => {
|
||||
[Op.eq]: "ANY"
|
||||
};
|
||||
}
|
||||
//Tag to check if incomplete ads are accepted in query
|
||||
//Tag to check if incomplete ads are accepted in query which is default
|
||||
if (checkForIncompleteWanted) {
|
||||
query.includeIncompleteAds = {
|
||||
[Op.eq]: true
|
||||
[Op.or]: {
|
||||
[Op.eq]: true,
|
||||
[Op.is]: null
|
||||
}
|
||||
};
|
||||
}
|
||||
|
||||
|
||||
@@ -61,9 +61,8 @@
|
||||
<p class="distinguished">
|
||||
<label class="checkbox-label">
|
||||
<input type="checkbox" class="filled-in" name="includeIncompleteAds"
|
||||
<% if (includeIncompleteAds) { %>
|
||||
checked
|
||||
<% } %>>
|
||||
>
|
||||
<span>Uključi i oglase bez potpunih informacija</span>
|
||||
</label>
|
||||
</p>
|
||||
|
||||
Reference in New Issue
Block a user