/
enwiki.py
64 lines (57 loc) · 2.48 KB
/
enwiki.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
from revscoring.features import wikitext as wikitext_features
from revscoring.features import revision_oriented
from revscoring.features.modifiers import sub
from revscoring.languages import english
from . import mediawiki, wikipedia, wikitext
# English-Wikipedia-specific features.  Each one carries an explicit
# "enwiki."-prefixed name.
local_wiki = [
    # Regex-based features over the revision comment.
    revision_oriented.revision.comment_matches(
        r"copy|edit|npov|wp:?el",
        name="enwiki.revision.comment.has_known_word",
    ),
    # The pattern below is the escaped literal wikilink "[[WP:AES|←]]"
    # (presumably the marker left by automatic edit summaries -- confirm).
    revision_oriented.revision.comment_matches(
        r"\[\[WP:AES\|←\]\]",
        name="enwiki.revision.comment.is_aes",
    ),
] + [
    # `sub` modifier applied to the revision's and the parent revision's
    # `template_names_matching(r"^cite")` features, in that operand order.
    sub(
        wikitext_features.revision.template_names_matching(r"^cite"),
        wikitext_features.revision.parent.template_names_matching(r"^cite"),
        name="enwiki.revision.diff.cite_templates_added",
    ),
]
# Diff-level features taken from `english.badwords`.  Order is significant
# for anything that consumes this list positionally, so it is preserved:
# the three `match_delta_*` features first, then the three
# `match_prop_delta_*` features.
badwords = [
    # match_delta_*: sum / increase / decrease
    english.badwords.revision.diff.match_delta_sum,
    english.badwords.revision.diff.match_delta_increase,
    english.badwords.revision.diff.match_delta_decrease,
] + [
    # match_prop_delta_*: sum / increase / decrease
    # ("prop" presumably means proportional -- confirm against revscoring)
    english.badwords.revision.diff.match_prop_delta_sum,
    english.badwords.revision.diff.match_prop_delta_increase,
    english.badwords.revision.diff.match_prop_delta_decrease,
]
# Diff-level features taken from `english.informals`, laid out the same way
# as the other word-list feature groups in this module: the three
# `match_delta_*` features first, then the three `match_prop_delta_*` ones.
informals = [
    # match_delta_*: sum / increase / decrease
    english.informals.revision.diff.match_delta_sum,
    english.informals.revision.diff.match_delta_increase,
    english.informals.revision.diff.match_delta_decrease,
] + [
    # match_prop_delta_*: sum / increase / decrease
    # ("prop" presumably means proportional -- confirm against revscoring)
    english.informals.revision.diff.match_prop_delta_sum,
    english.informals.revision.diff.match_prop_delta_increase,
    english.informals.revision.diff.match_prop_delta_decrease,
]
# Diff-level features taken from `english.dictionary`.  The first group holds
# the six `dict_word_*` features, the second the six `non_dict_word_*`
# features; within each group the order is delta sum / increase / decrease
# followed by the matching `prop_delta` trio.
dict_words = [
    # dict_word_*
    english.dictionary.revision.diff.dict_word_delta_sum,
    english.dictionary.revision.diff.dict_word_delta_increase,
    english.dictionary.revision.diff.dict_word_delta_decrease,
    english.dictionary.revision.diff.dict_word_prop_delta_sum,
    english.dictionary.revision.diff.dict_word_prop_delta_increase,
    english.dictionary.revision.diff.dict_word_prop_delta_decrease,
] + [
    # non_dict_word_*
    english.dictionary.revision.diff.non_dict_word_delta_sum,
    english.dictionary.revision.diff.non_dict_word_delta_increase,
    english.dictionary.revision.diff.non_dict_word_delta_decrease,
    english.dictionary.revision.diff.non_dict_word_prop_delta_sum,
    english.dictionary.revision.diff.non_dict_word_prop_delta_increase,
    english.dictionary.revision.diff.non_dict_word_prop_delta_decrease,
]
# The `damaging` feature list: shared feature groups from the sibling
# `wikipedia`, `wikitext` and `mediawiki` modules, followed by the
# English-language word-list groups defined in this module.  Concatenation
# order is kept exactly as before.
# NOTE(review): `local_wiki` is defined in this module but is not part of
# this sum -- confirm whether that omission is intentional before changing it,
# since adding features alters the feature vector.
damaging = (
    wikipedia.page
    + wikitext.parent
    + wikitext.diff
    + mediawiki.user_rights
    + mediawiki.protected_user
    + mediawiki.comment
    + badwords
    + informals
    + dict_words
)
"Damaging Features"

# `reverted` and `goodfaith` are bound to the very same object as `damaging`
# (no copy is made), so an in-place change to one is visible through all
# three names.
reverted = goodfaith = damaging