Revision: 4791 Author: filnik Date: 2008-01-02 16:19:31 +0000 (Wed, 02 Jan 2008)
Log Message: ----------- Important BugFix, the whiteTemplates for a strange reason, weren't recognised! Update as soon as possible!
Modified Paths: -------------- trunk/pywikipedia/checkimages.py
Modified: trunk/pywikipedia/checkimages.py =================================================================== --- trunk/pywikipedia/checkimages.py 2008-01-02 15:14:56 UTC (rev 4790) +++ trunk/pywikipedia/checkimages.py 2008-01-02 16:19:31 UTC (rev 4791) @@ -22,6 +22,8 @@
-time[:#] - Time in seconds between repeat runs (default: 30)
+ -wait[:#] - Wait x second before check the images (default: 0) + -skip[:#] - The bot skip the first [:#] images (default: 0)
-start[:#] - Use allpages() as generator (it starts already form Image:[:#]) @@ -585,6 +587,7 @@ limit = 80 time_sleep = 30 skip_number = 0 + wait_number = 0 commonsActive = False normal = False urlUsed = False @@ -614,6 +617,13 @@ elif len(arg) > 5: skip = True skip_number = int(arg[6:]) + elif arg.startswith('-wait'): + if len(arg) == 5: + wait = True + wait_number = int(wikipedia.input(u'How many time do you want to wait before checking the images?')) + elif len(arg) > 5: + wait = True + wait_number = int(arg[6:]) elif arg.startswith('-start'): if len(arg) == 6: firstPageTitle = str(wikipedia.input(u'From witch page do you want to start?')) @@ -698,7 +708,9 @@ hiddentemplate.append('%s' % langK)
if skip_number == 0: - skip = False + skip = False + if wait_number == 0: + wait = False # nothing = Defining an empty image description nothing = ['', ' ', ' ', ' ', '\n', '\n ', '\n ', '\n\n', '\n \n', ' \n', ' \n ', ' \n \n'] # something = Minimal requirements for an image description. @@ -761,7 +773,12 @@ wikipedia.output(u'Skipping the first %s images:\n' % skip_number) else: wikipedia.output(u'\t\t>> No images to skip...<<') - skipok = False + skipok = False + if wait: + + + wikipedia.output(u'\tWaiting %s seconds before checking the images, %s' % (wait_number, time.strftime("%d %b %Y %H:%M:%S (UTC)", time.localtime()))) + time.sleep(wait_number) for image in generator: if normal == False and regexGen == False: if image_namespace.lower() not in image.title().lower() and \ @@ -798,24 +815,26 @@ continue except wikipedia.IsRedirectPage: wikipedia.output(u"The file description for %s is a redirect?!" % imageName ) - continue + continue + for i in TextFind: + if i.lower() in g: + tagged = True for l in hiddentemplate: - res = re.findall(r'{{(?:[Tt]emplate:|)%s(?: |||\n|\W)' % l.lower(), g.lower()) - if res != []: - #print res - wikipedia.output(u'A white template found, skipping the template...') - # I don't delete the template, because if there is something to change the image page - # will be reloaded. I delete it only for the next check part. - g = g.lower().replace(l, '') + if tagged == False: + res = re.findall(r'{{(?:[Tt]emplate:|)%s(?: \n|||\n)' % l.lower(), g.lower()) + if res != []: + #print res + wikipedia.output(u'A white template found, skipping the template...') + # I don't delete the template, because if there is something to change the image page + # will be reloaded. I delete it only for the next check part. + if l != '' and l != ' ': + g = g.lower().replace('{{%s' % l, '') for a_word in something: if a_word in g: parentesi = True for parl in notallowed: if parl.lower() in extension.lower(): delete = True - for i in TextFind: - if i.lower() in g: - tagged = True some_problem = False if tupla_written != None: for tupla in tuplaList:
pywikipedia-l@lists.wikimedia.org