-
Notifications
You must be signed in to change notification settings - Fork 140
/
Copy pathmediawiki
26 lines (24 loc) · 1.46 KB
/
mediawiki
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
# This ignore set avoids grabbing the full history of each page, because there
# are generally far too many ?oldid= pages to crawl completely.
#
# Each non-comment line is one regular expression matched against a URL.
# {any_start_netloc} is a placeholder filled in by whatever loads this file
# (presumably the host of a start URL -- confirm against the loader).
#
# Query parameters naming a single revision or page ID, or that only change
# the paging/filtering of a listing.
^https?://{any_start_netloc}/.+[\?&]oldid=\d+
^https?://{any_start_netloc}/.+[\?&]curid=\d+
^https?://{any_start_netloc}/.+[\?&]limit=(20|100|250|500)
^https?://{any_start_netloc}/.+[\?&]hide(minor|bots|anons|liu|myself|redirs|links|trans|patrolled)=
# Special: pages, reached either as a path segment (/Special:...) or through
# a title=Special:... query parameter.
^https?://{any_start_netloc}/.+([\?&]title=|/)Special:(UserLogin|UserLogout|Translate|MobileFeedback|MobileOptions|RecentChangesLinked|Diff|MobileDiff)
^https?://{any_start_netloc}/.+([\?&]title=|/)Special:RecentChanges&from=\d+
^https?://{any_start_netloc}/.+([\?&]title=|/)Special:ListFiles&dir=prev&offset=\d+
^https?://{any_start_netloc}/.+([\?&]title=|/)Special:(ListFiles|PrefixIndex).*&
^https?://{any_start_netloc}/.+([\?&]title=|/)Special:ListFiles.*&user=
^https?://{any_start_netloc}/.+([\?&]title=|/)Special:Log/
# Section edit forms: action=edit followed by &section=<number> or
# &section=new. The separator must be a literal "&section="; a "§ion=" here
# is the "&sect" HTML entity decoded by mistake and never matches a real URL.
^https?://{any_start_netloc}/.+[\?&]action=edit&section=(\d+|new)
# Feeds, alternate renderings of a page, undo links and lqt_method links.
^https?://{any_start_netloc}/.+[\?&]feed(format)?=atom
^https?://{any_start_netloc}/.+[\?&]printable=yes
^https?://{any_start_netloc}/.+[\?&]mobileaction=
^https?://{any_start_netloc}/.+[\?&]undo(after)?=\d+
^https?://{any_start_netloc}/.+[\?&]lqt_method=
# Links to pages that don't exist: any URL carrying a redlink=1 query
# parameter (as the first parameter after "?" or a later one after "&").
^https?://{any_start_netloc}/.+[\?&]redlink=1
# Loops: URLs in which a User_talk:, User_blog: or User: prefix is followed,
# after at least one character and a slash, by the same prefix again
# (e.g. .../User:A/User:B).
^https?://{any_start_netloc}/.*User_talk:.+/User_talk:
^https?://{any_start_netloc}/.*User_blog:.+/User_blog:
^https?://{any_start_netloc}/.*User:.+/User: