Merge pull request #2940 from ntimo/task/split-bad-words

[RSPAMD] Split bad words into multiple files per language
This commit is contained in:
André Peters 2019-09-18 18:35:11 +02:00 committed by GitHub
commit 1bbe1a2367
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
4 changed files with 31 additions and 21 deletions

View File

@ -1,9 +1,6 @@
/\ssex\s/i
/\svagina\s/i
/\serotic\s/i /\serotic\s/i
/\serection\s/i /\serection\s/i
/\ssexy\s/i /\ssexy\s/i
/\spenis\s/i
/\sass\s/i /\sass\s/i
/\sviagra\s/i /\sviagra\s/i
/\stits\s/i /\stits\s/i
@ -17,28 +14,16 @@
/\spharma\s/i /\spharma\s/i
/\spharmacy\s/i /\spharmacy\s/i
/\sseo\s/i /\sseo\s/i
/\smarketing\s/i
/\sjackpot\s/i /\sjackpot\s/i
/\slotto\s/i
/\slottery\s/i /\slottery\s/i
/pillenversand/i
/\skredithilfe\s/i
/\skapital\s/i
/\skrankenversicherung\s/i
/bitcoin/i /bitcoin/i
/pädophil/i
/paedophil/i
/freiberufler/i
/unternehmer/i
/masturbieren/i
/trojaner/i /trojaner/i
/malware/i /malware/i
/\sscooter\s/i /\sscooter\s/i
/\sescooter\s/i
/\se-scooter\s/i
/testost/i /testost/i
/\spotenz\s/i
/potenzmittel/i
/rezeptfrei/i
/apotheke/i
/web\sdevelopment/i /web\sdevelopment/i
/\slottery\s/i
/\ssex\s/i
/\svagina\s/i
/\spenis\s/i
/\smarketing\s/i

View File

@ -0,0 +1,17 @@
/\slotto\s/i
/pillenversand/i
/\skredithilfe\s/i
/\skapital\s/i
/\skrankenversicherung\s/i
/pädophil/i
/paedophil/i
/freiberufler/i
/unternehmer/i
/masturbieren/i
/\sescooter\s/i
/\se-scooter\s/i
/testost/i
/\spotenz\s/i
/potenzmittel/i
/rezeptfrei/i
/apotheke/i

View File

@ -27,6 +27,6 @@ OLEFY_MACRO {
policy = "remove_weight"; policy = "remove_weight";
} }
BAD_WORD_BAD_TLD { BAD_WORD_BAD_TLD {
expression = "FISHY_TLD & BAD_WORDS" expression = "FISHY_TLD & ( BAD_WORDS | BAD_WORDS_DE )"
score = 10.0; score = 10.0;
} }

View File

@ -119,3 +119,11 @@ BAD_WORDS {
regexp = true; regexp = true;
score = 0.1; score = 0.1;
} }
# German-language counterpart of the BAD_WORDS rule, backed by its own map file.
# Referenced together with BAD_WORDS by the BAD_WORD_BAD_TLD composite, which
# requires FISHY_TLD to match as well.
BAD_WORDS_DE {
  # Map entries are interpreted as regular expressions, not literal strings.
  regexp = true;
  map = "${LOCAL_CONFDIR}/custom/bad_words_de.map";
  # Content map using the "text" filter.
  type = "content";
  filter = "text";
  # Small weight per hit; same score as the BAD_WORDS rule.
  score = 0.1;
}