Revision: 4792
Author: wikipedian
Date: 2008-01-02 20:18:54 +0000 (Wed, 02 Jan 2008)
Log Message:
-----------
fixed bug: [ 1862171 ] How to hide Links from weblinkchcker.py ?
Modified Paths:
--------------
trunk/pywikipedia/weblinkchecker.py
Modified: trunk/pywikipedia/weblinkchecker.py
===================================================================
--- trunk/pywikipedia/weblinkchecker.py 2008-01-02 16:19:31 UTC (rev 4791)
+++ trunk/pywikipedia/weblinkchecker.py 2008-01-02 20:18:54 UTC (rev 4792)
@@ -145,12 +145,22 @@
}
ignorelist = [
- re.compile('.*[\./@]example.com(/.*)?'), # reserved for documentation
- re.compile('.*[\./@]example.net(/.*)?'), # reserved for documentation
- re.compile('.*[\./@]example.org(/.*)?'), # reserved for documentation
- re.compile('.*[\./@]gso.gbv.de(/.*)?'), # bot somehow can't handle their redirects
- re.compile('.*[\./@]berlinonline.de(/.*)?'), # a de: user wants to fix them by hand and doesn't want them to be deleted, see [[de:Benutzer:BLueFiSH.as/BZ]].
- re.compile('.*[\./@]bodo.kommune.no(/.*)?'), # bot can't handle their redirects
+ # Officialy reserved for testing, documentation, etc. in
+ # http://tools.ietf.org/html/rfc2606#page-2
+ # top-level domains:
+ re.compile('.*[\./@]test(/.*)?'),
+ re.compile('.*[\./@]example(/.*)?'),
+ re.compile('.*[\./@]invalid(/.*)?'),
+ re.compile('.*[\./@]localhost(/.*)?'),
+ # second-level domains:
+ re.compile('.*[\./@]example\.com(/.*)?'),
+ re.compile('.*[\./@]example\.net(/.*)?'),
+ re.compile('.*[\./@]example\.org(/.*)?'),
+
+ # Other special cases
+ re.compile('.*[\./@]gso\.gbv\.de(/.*)?'), # bot somehow can't handle their redirects
+ re.compile('.*[\./@]berlinonline\.de(/.*)?'), # a de: user wants to fix them by hand and doesn't want them to be deleted, see [[de:Benutzer:BLueFiSH.as/BZ]].
+ re.compile('.*[\./@]bodo\.kommune\.no(/.*)?'), # bot can't handle their redirects
]
def compileLinkR(withoutBracketed = False, onlyBracketed = False):