Complete filter #2

Merged
senaduka merged 11 commits from complete-filter into master 2017-12-14 14:22:32 +01:00
4 changed files with 2898 additions and 5 deletions
Showing only changes of commit b634bfd300 - Show all commits

View File

@@ -1,20 +1,20 @@
var config = {}; var config = {};
/*
config.domainList = [ config.domainList = [
'https://www.iis.se/data/bardate_domains_nu.txt', 'https://www.iis.se/data/bardate_domains_nu.txt',
'https://www.iis.se/data/bardate_domains.txt']; 'https://www.iis.se/data/bardate_domains.txt'];
*/
config.domainList = ['/home/bilal/Saburly/domene-svedska/crawler/bardate_domains.txt'];
//config.domainList = ['/home/bilal/Saburly/domene-svedska/crawler/bardate_domains.txt'];
config.wordList = __dirname + '/words.txt'; config.wordList = __dirname + '/words.txt';
config.lettersOnlyRegex = /^[A-Za-z]+$/; config.lettersOnlyRegex = /^[A-Za-z]+$/;
config.swedishLettersOnly = /^[A-Za-zÅåÄäÖöüÜáÁèÈàÀéÉëËíÍÆæøØçÇ]+$/; config.swedishLettersOnly = /^[A-Za-zÅåÄäÖöüÜáÁèÈàÀéÉëËíÍÆæøØçÇ]+$/;
config.databaseURL = 'mongodb://localhost:27017/kivi'; config.databaseURL = 'mongodb://localhost:27017/domains';
//==== //====

View File

@@ -21,7 +21,6 @@ module.exports = {
} }
}); });
applyFilter(result, callback); applyFilter(result, callback);
console.log("Result Len : " + result.length);
}); });
} }
}; };

2893
crawler/izlaz.txt Normal file

File diff suppressed because it is too large. [Load Diff]

View File

@@ -1,3 +1,4 @@
skålar
A-aktie A-aktie
A-aktien A-aktien
A-aktiens A-aktiens