Complete filter #2
@@ -1,20 +1,20 @@
|
|||||||
var config = {};
|
var config = {};
|
||||||
|
|
||||||
/*
|
|
||||||
config.domainList = [
|
config.domainList = [
|
||||||
'https://www.iis.se/data/bardate_domains_nu.txt',
|
'https://www.iis.se/data/bardate_domains_nu.txt',
|
||||||
'https://www.iis.se/data/bardate_domains.txt'];
|
'https://www.iis.se/data/bardate_domains.txt'];
|
||||||
|
|
||||||
*/
|
|
||||||
|
|
||||||
config.domainList = ['/home/bilal/Saburly/domene-svedska/crawler/bardate_domains.txt'];
|
|
||||||
|
//config.domainList = ['/home/bilal/Saburly/domene-svedska/crawler/bardate_domains.txt'];
|
||||||
|
|
||||||
config.wordList = __dirname + '/words.txt';
|
config.wordList = __dirname + '/words.txt';
|
||||||
|
|
||||||
config.lettersOnlyRegex = /^[A-Za-z]+$/;
|
config.lettersOnlyRegex = /^[A-Za-z]+$/;
|
||||||
config.swedishLettersOnly = /^[A-Za-zÅåÄäÖöüÜáÁèÈàÀéÉëËíÍÆæøØçÇ]+$/;
|
config.swedishLettersOnly = /^[A-Za-zÅåÄäÖöüÜáÁèÈàÀéÉëËíÍÆæøØçÇ]+$/;
|
||||||
|
|
||||||
config.databaseURL = 'mongodb://localhost:27017/kivi';
|
config.databaseURL = 'mongodb://localhost:27017/domains';
|
||||||
|
|
||||||
|
|
||||||
//====
|
//====
|
||||||
|
|||||||
@@ -21,7 +21,6 @@ module.exports = {
|
|||||||
}
|
}
|
||||||
});
|
});
|
||||||
applyFilter(result, callback);
|
applyFilter(result, callback);
|
||||||
console.log("Result Len : " + result.length);
|
|
||||||
});
|
});
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
|
|||||||
2893
crawler/izlaz.txt
Normal file
2893
crawler/izlaz.txt
Normal file
File diff suppressed because it is too large
Load Diff
@@ -1,3 +1,4 @@
|
|||||||
|
skålar
|
||||||
A-aktie
|
A-aktie
|
||||||
A-aktien
|
A-aktien
|
||||||
A-aktiens
|
A-aktiens
|
||||||
|
|||||||
Reference in New Issue
Block a user