This repository has been archived by the owner on Dec 21, 2017. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Makefile
66 lines (60 loc) · 2.47 KB
/
Makefile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
# Target: datasets/wikidata.rev_reverted.20k_balanced_2015.tsv
# Feeds the sampled-revisions TSV on stdin to `editquality label_reverted`
# (host https://wikidata.org, revert radius 3) and stores its stdout as the
# target.
#
# The output goes to a temporary file that is renamed onto the target only
# when the command succeeds; otherwise a failed run would leave a truncated
# target that make considers up to date on the next invocation.
# The automatic variables refer to the first prerequisite and the target.
datasets/wikidata.rev_reverted.20k_balanced_2015.tsv: \
    datasets/wikidata.sampled_revisions.20k_balanced_2015.tsv
	editquality label_reverted \
		--host https://wikidata.org \
		--revert-radius 3 \
		--verbose < $< > $@.tmp && \
	mv $@.tmp $@
# Target: datasets/wikidata.features_reverted.20k_balanced_2015.tsv
# Feeds the rev_reverted TSV on stdin to `revscoring extract_features` with
# the feature list wb_vandalism.feature_lists.wikidata.reverted (host
# https://wikidata.org, --include-revid) and stores its stdout as the target.
#
# The output goes to a temporary file that is renamed onto the target only
# when the command succeeds; otherwise a failed run would leave a truncated
# target that make considers up to date on the next invocation.
# The automatic variables refer to the first prerequisite and the target.
datasets/wikidata.features_reverted.20k_balanced_2015.tsv: \
    datasets/wikidata.rev_reverted.20k_balanced_2015.tsv
	revscoring extract_features \
		wb_vandalism.feature_lists.wikidata.reverted \
		--host https://wikidata.org \
		--verbose \
		--include-revid < $< > $@.tmp && \
	mv $@.tmp $@
# Target: models/wikidata.reverted.rf.model
# Drops the first tab-separated column of the features TSV (presumably the
# revision id emitted by --include-revid; confirm against the extract step)
# and pipes the rest into `revscoring train_test` using
# revscoring.scorer_models.RF with the parameters listed below. The command's
# stdout is stored as the target.
#
# `cut` options are placed before the file operand: option-after-operand is a
# GNU extension and is rejected by POSIX/BSD cut.
# The output goes to a temporary file that is renamed onto the target only
# when the pipeline succeeds, so a failed run cannot leave a truncated model
# that make considers up to date.
models/wikidata.reverted.rf.model: \
    datasets/wikidata.features_reverted.20k_balanced_2015.tsv
	cut -f2- $< | \
	revscoring train_test \
		revscoring.scorer_models.RF \
		wb_vandalism.feature_lists.wikidata.reverted \
		--version 0.0.4 \
		-p 'max_features="log2"' \
		-p 'criterion="entropy"' \
		-p 'min_samples_leaf=1' \
		-p 'n_estimators=80' \
		--label-type=bool > $@.tmp && \
	mv $@.tmp $@
# Target: datasets/wikidata.prelabeled_revisions.20k_balanced_2015.tsv
# Feeds the sampled-revisions TSV on stdin to `editquality prelabel` for
# https://wikidata.org, passing the trusted user groups and the trusted-edits
# value of 1000 shown below, and stores its stdout as the target.
#
# The output goes to a temporary file that is renamed onto the target only
# when the command succeeds; otherwise a failed run would leave a truncated
# target that make considers up to date on the next invocation.
# The automatic variables refer to the first prerequisite and the target.
datasets/wikidata.prelabeled_revisions.20k_balanced_2015.tsv: \
    datasets/wikidata.sampled_revisions.20k_balanced_2015.tsv
	editquality prelabel https://wikidata.org \
		--trusted-groups=abusefilter,arbcom,bureaucrat,checkuser,rollbacker,sysop,bot \
		--trusted-edits=1000 \
		--verbose < $< > $@.tmp && \
	mv $@.tmp $@
# Target: tuning_reports/wikidata.reverted.roc_auc.md
# Drops the first tab-separated column of the features TSV (presumably the
# revision id; confirm against the extract step) and pipes the rest into
# `revscoring tune` with config/damaging_classifiers.params.yaml, the
# wb_vandalism.feature_lists.wikidata.reverted feature list and
# --scoring=roc_auc. The command's stdout is stored as the report.
#
# `cut` reads the file directly instead of through `cat`.
# The output goes to a temporary file that is renamed onto the target only
# when the pipeline succeeds, so a failed or timed-out run cannot leave a
# truncated report that make considers up to date.
tuning_reports/wikidata.reverted.roc_auc.md: \
    datasets/wikidata.features_reverted.20k_balanced_2015.tsv
	cut -f2- $< | \
	revscoring tune \
		config/damaging_classifiers.params.yaml \
		wb_vandalism.feature_lists.wikidata.reverted \
		--cv-timeout=60 \
		--debug \
		--scoring=roc_auc \
		--label-type=bool > $@.tmp && \
	mv $@.tmp $@
# Target: tuning_reports/wikidata.reverted.pr_auc.md
# Drops the first tab-separated column of the features TSV (presumably the
# revision id; confirm against the extract step) and pipes the rest into
# `revscoring tune` with config/damaging_classifiers.params.yaml, the
# wb_vandalism.feature_lists.wikidata.reverted feature list and
# --scoring=pr_auc. The command's stdout is stored as the report.
#
# `cut` reads the file directly instead of through `cat`.
# The output goes to a temporary file that is renamed onto the target only
# when the pipeline succeeds, so a failed or timed-out run cannot leave a
# truncated report that make considers up to date.
tuning_reports/wikidata.reverted.pr_auc.md: \
    datasets/wikidata.features_reverted.20k_balanced_2015.tsv
	cut -f2- $< | \
	revscoring tune \
		config/damaging_classifiers.params.yaml \
		wb_vandalism.feature_lists.wikidata.reverted \
		--cv-timeout=60 \
		--debug \
		--scoring=pr_auc \
		--label-type=bool > $@.tmp && \
	mv $@.tmp $@