Revision: 5349
Author:   nicdumz
Date:     2008-05-10 18:38:59 +0000 (Sat, 10 May 2008)
Log Message:
-----------
Fixing badtitles regex
Modified Paths:
--------------
    trunk/pywikipedia/reflinks.py
Modified: trunk/pywikipedia/reflinks.py =================================================================== --- trunk/pywikipedia/reflinks.py 2008-05-10 17:39:28 UTC (rev 5348) +++ trunk/pywikipedia/reflinks.py 2008-05-10 18:38:59 UTC (rev 5349) @@ -67,7 +67,7 @@ domain = re.compile(ur'^(\w+)://(?:www.|)([^/]+)') badtitles = {'en': # is - ur'(?is) (test|' + ur'(?is)(test|' # starts with +'^\W*(register|registration|(sign|log)[ -]?in|subscribe|sign[ -]?up|log[ -]?on|untitled *(document|page|$))' # anywhere @@ -77,9 +77,9 @@ +')', 'fr': #is - ur'(?is) (test|' + ur'(?is)(test|' # starts with - ur'^\W*(register|registration|(sign|log)[ -]?in|subscribe|sign[ -]?up|log[ -]?on|untitled *(document|page|$))' + + ur'^\W*(register|registration|(sign|log)[ -]?in|subscribe|sign[ -]?up|log[ -]?on|untitled *(document|page|$))' # anywhere +'|(404|page|file|site).*(not *found|en +travaux)' # ends with