jenkins-bot has submitted this change and it was merged.
Change subject: PEP8-ify most of imagerecat.py
......................................................................
PEP8-ify most of imagerecat.py
Change-Id: I5a4a7dd85eadf7233fe7e388644dadd5ba1e5ffc
---
M scripts/imagerecat.py
1 file changed, 105 insertions(+), 92 deletions(-)
Approvals:
Merlijn van Deen: Looks good to me, approved
jenkins-bot: Verified
diff --git a/scripts/imagerecat.py b/scripts/imagerecat.py
index 9a6ee16..df04190 100644
--- a/scripts/imagerecat.py
+++ b/scripts/imagerecat.py
@@ -45,13 +45,14 @@
category_blacklist = []
countries = []
-search_wikis=u'_20'
-hint_wiki=u''
+search_wikis = u'_20'
+hint_wiki = u''
+
def initLists():
- '''
+ """
Get the list of countries & the blacklist from Commons.
- '''
+ """
global category_blacklist
global countries
@@ -66,18 +67,19 @@
countries.append(country.title(withNamespace=False))
return
+
def categorizeImages(generator, onlyFilter, onlyUncat):
- ''' Loop over all images in generator and try to categorize them. Get
+ """ Loop over all images in generator and try to categorize them. Get
category suggestions from CommonSense.
- '''
+ """
for page in generator:
if page.exists() and (page.namespace() == 6) and \
(not page.isRedirectPage()):
imagepage = pywikibot.ImagePage(page.site(), page.title())
pywikibot.output(u'Working on ' + imagepage.title())
- if (onlyUncat and not(u'Uncategorized' in imagepage.templates())):
+ if onlyUncat and not(u'Uncategorized' in imagepage.templates()):
pywikibot.output(u'No Uncategorized template found')
else:
currentCats = getCurrentCats(imagepage)
@@ -87,26 +89,28 @@
galleries = []
else:
(commonshelperCats, usage, galleries) = getCommonshelperCats(imagepage)
- newcats = applyAllFilters(commonshelperCats+currentCats)
+ newcats = applyAllFilters(commonshelperCats + currentCats)
- if (len(newcats) > 0 and not(set(currentCats)==set(newcats))):
+ if len(newcats) > 0 and not(set(currentCats) == set(newcats)):
for cat in newcats:
- pywikibot.output(u' Found new cat: ' + cat);
+ pywikibot.output(u' Found new cat: ' + cat)
saveImagePage(imagepage, newcats, usage, galleries,
onlyFilter)
+
def getCurrentCats(imagepage):
- ''' Get the categories currently on the image '''
+ """ Get the categories currently on the image """
result = []
for cat in imagepage.categories():
result.append(cat.title(withNamespace=False))
return list(set(result))
+
def getCommonshelperCats(imagepage):
- ''' Get category suggestions from CommonSense. Parse them and return a list
+ """ Get category suggestions from CommonSense. Parse them and return a list
of suggestions.
- '''
+ """
commonshelperCats = []
usage = []
galleries = []
@@ -116,35 +120,35 @@
site = imagepage.site
lang = site.language()
family = site.family.name
- if lang==u'commons' and family==u'commons':
+ if lang == u'commons' and family == u'commons':
parameters = urllib.urlencode(
- {'i' : imagepage.title(withNamespace=False).encode('utf-8'),
- 'r' : 'on',
- 'go-clean' : 'Find+Categories',
- 'p' : search_wikis,
- 'cl' : hint_wiki})
- elif family==u'wikipedia':
+ {'i': imagepage.title(withNamespace=False).encode('utf-8'),
+ 'r': 'on',
+ 'go-clean': 'Find+Categories',
+ 'p': search_wikis,
+ 'cl': hint_wiki})
+ elif family == u'wikipedia':
parameters = urllib.urlencode(
- {'i' : imagepage.title(withNamespace=False).encode('utf-8'),
- 'r' : 'on',
- 'go-move' : 'Find+Categories',
- 'p' : search_wikis,
- 'cl' : hint_wiki,
- 'w' : lang})
+ {'i': imagepage.title(withNamespace=False).encode('utf-8'),
+ 'r': 'on',
+ 'go-move': 'Find+Categories',
+ 'p': search_wikis,
+ 'cl': hint_wiki,
+ 'w': lang})
else:
#Can't handle other sites atm
- return ([], [], [])
+ return [], [], []
- commonsenseRe = re.compile('^#COMMONSENSE(.*)#USAGE(\s)+\((?P<usagenum>(\d)+)\)\s(?P<usage>(.*))\s#KEYWORDS(\s)+\((?P<keywords>(\d)+)\)(.*)#CATEGORIES(\s)+\((?P<catnum>(\d)+)\)\s(?P<cats>(.*))\s#GALLERIES(\s)+\((?P<galnum>(\d)+)\)\s(?P<gals>(.*))\s(.*)#EOF$', re.MULTILINE + re.DOTALL)
+ commonsenseRe = re.compile('^#COMMONSENSE(.*)#USAGE(\s)+\((?P<usagenum>(\d)+)\)\s(?P<usage>(.*))\s#KEYWORDS(\s)+\((?P<keywords>(\d)+)\)(.*)#CATEGORIES(\s)+\((?P<catnum>(\d)+)\)\s(?P<cats>(.*))\s#GALLERIES(\s)+\((?P<galnum>(\d)+)\)\s(?P<gals>(.*))\s(.*)#EOF$', re.MULTILINE + re.DOTALL) # noqa
gotInfo = False
matches = None
maxtries = 10
tries = 0
- while(not gotInfo):
+ while not gotInfo:
try:
- if ( tries < maxtries ):
- tries = tries + 1
+ if tries < maxtries:
+ tries += 1
commonsHelperPage = urllib.urlopen(
"http://toolserver.org/~daniel/WikiSense/CommonSense.php?%s" % parameters)
matches = commonsenseRe.search(
@@ -157,18 +161,18 @@
except socket.timeout:
pywikibot.output(u'Got a timeout, let\'s try again')
- if (matches and gotInfo):
- if (matches.group('usagenum') > 0):
+ if matches and gotInfo:
+ if matches.group('usagenum') > 0:
used = matches.group('usage').splitlines()
for use in used:
- usage= usage + getUsage(use)
+ usage = usage + getUsage(use)
#pywikibot.output(use)
- if (matches.group('catnum') > 0):
+ if matches.group('catnum') > 0:
cats = matches.group('cats').splitlines()
for cat in cats:
commonshelperCats.append(cat.replace('_', ' '))
pywikibot.output(u'category : ' + cat)
- if (matches.group('galnum') > 0):
+ if matches.group('galnum') > 0:
gals = matches.group('gals').splitlines()
for gal in gals:
galleries.append(gal.replace('_', ' '))
@@ -177,41 +181,45 @@
galleries = list(set(galleries))
for (lang, project, article) in usage:
pywikibot.output(lang + project + article)
- return (commonshelperCats, usage, galleries)
+ return commonshelperCats, usage, galleries
+
def getOpenStreetMapCats(latitude, longitude):
- '''
+ """
Get a list of location categories based on the OSM Nominatim tool
- '''
+ """
result = []
locationList = getOpenStreetMap(latitude, longitude)
for i in range(0, len(locationList)):
#print 'Working on ' + locationList[i]
- if i <= len(locationList)-3:
- category = getCategoryByName(name=locationList[i], parent=locationList[i+1], grandparent=locationList[i+2])
- elif i == len(locationList)-2:
- category = getCategoryByName(name=locationList[i], parent=locationList[i+1])
+ if i <= len(locationList) - 3:
+ category = getCategoryByName(name=locationList[i],
+ parent=locationList[i + 1],
+ grandparent=locationList[i + 2])
+ elif i == len(locationList) - 2:
+ category = getCategoryByName(name=locationList[i],
+ parent=locationList[i + 1])
else:
category = getCategoryByName(name=locationList[i])
- if category and not category==u'':
+ if category and not category == u'':
result.append(category)
#print result
return result
def getOpenStreetMap(latitude, longitude):
- '''
+ """
Get the result from http://nominatim.openstreetmap.org/reverse
and put it in a list of tuples to play around with
- '''
+ """
result = []
gotInfo = False
- parameters = urllib.urlencode({'lat' : latitude, 'lon' : longitude, 'accept-language' : 'en'})
- while(not gotInfo):
+ parameters = urllib.urlencode({'lat': latitude, 'lon': longitude, 'accept-language': 'en'})
+ while not gotInfo:
try:
page = urllib.urlopen("http://nominatim.openstreetmap.org/reverse?format=xml&%s" % parameters)
et = xml.etree.ElementTree.parse(page)
- gotInfo=True
+ gotInfo = True
except IOError:
pywikibot.output(u'Got an IOError, let\'s try again')
time.sleep(30)
@@ -233,30 +241,28 @@
#print result
return result
+
def getCategoryByName(name, parent=u'', grandparent=u''):
- if not parent==u'':
+ if not parent == u'':
workname = name.strip() + u',_' + parent.strip()
- workcat = pywikibot.Category(
- pywikibot.Site(u'commons', u'commons'), workname)
+ workcat = pywikibot.Category(pywikibot.Site(u'commons', u'commons'), workname)
if workcat.exists():
return workname
- if not grandparent==u'':
+ if not grandparent == u'':
workname = name.strip() + u',_' + grandparent.strip()
- workcat = pywikibot.Category(
- pywikibot.Site(u'commons', u'commons'), workname)
+ workcat = pywikibot.Category(pywikibot.Site(u'commons', u'commons'), workname)
if workcat.exists():
return workname
workname = name.strip()
- workcat = pywikibot.Category(
- pywikibot.Site(u'commons', u'commons'), workname)
+ workcat = pywikibot.Category(pywikibot.Site(u'commons', u'commons'), workname)
if workcat.exists():
return workname
return u''
def getUsage(use):
- ''' Parse the Commonsense output to get the usage '''
+ """ Parse the Commonsense output to get the usage """
result = []
lang = ''
project = ''
@@ -265,21 +271,22 @@
'^(?P<lang>([\w-]+))\.(?P<project>([\w]+))\.org:(?P<articles>\s(.*))')
matches = usageRe.search(use)
if matches:
- if (matches.group('lang')):
+ if matches.group('lang'):
lang = matches.group('lang')
#pywikibot.output(lang)
- if (matches.group('project')):
+ if matches.group('project'):
project = matches.group('project')
#pywikibot.output(project)
- if (matches.group('articles')):
+ if matches.group('articles'):
articles = matches.group('articles')
#pywikibot.output(articles)
for article in articles.split():
result.append((lang, project, article))
return result
+
def applyAllFilters(categories):
- ''' Apply all filters on categories. '''
+ """ Apply all filters on categories. """
result = []
result = filterDisambiguation(categories)
result = followRedirects(result)
@@ -288,17 +295,19 @@
result = filterParents(result)
return result
+
def filterBlacklist(categories):
- ''' Filter out categories which are on the blacklist. '''
+ """ Filter out categories which are on the blacklist. """
result = []
for cat in categories:
cat = cat.replace('_', ' ')
- if (cat not in category_blacklist):
+ if not (cat in category_blacklist):
result.append(cat)
return list(set(result))
+
def filterDisambiguation(categories):
- ''' Filter out disambiguation categories. '''
+ """ Filter out disambiguation categories. """
result = []
for cat in categories:
if (not pywikibot.Page(pywikibot.Site(u'commons', u'commons'),
@@ -306,8 +315,9 @@
result.append(cat)
return result
+
def followRedirects(categories):
- ''' If a category is a redirect, replace the category with the target. '''
+ """ If a category is a redirect, replace the category with the target. """
result = []
for cat in categories:
categoryPage = pywikibot.Page(pywikibot.getSite(u'commons', u'commons'),
@@ -320,19 +330,20 @@
result.append(cat)
return result
+
def filterCountries(categories):
- ''' Try to filter out ...by country categories.
+ """ Try to filter out ...by country categories.
First make a list of any ...by country categories and try to find some
countries. If a by country category has a subcategory containing one of the
countries found, add it. The ...by country categories remain in the set and
should be filtered out by filterParents.
- '''
+ """
result = categories
listByCountry = []
listCountries = []
for cat in categories:
- if (cat.endswith(u'by country')):
+ if cat.endswith(u'by country'):
listByCountry.append(cat)
#If cat contains 'by country' add it to the list
@@ -341,27 +352,26 @@
for country in countries:
if country in cat:
listCountries.append(country)
- if(len(listByCountry) > 0):
+ if len(listByCountry) > 0:
for bc in listByCountry:
category = pywikibot.Category(
pywikibot.Site(u'commons', u'commons'), u'Category:' + bc)
for subcategory in category.subcategories():
for country in listCountries:
- if (subcategory.title(withNamespace=False).endswith(country)):
+ if subcategory.title(withNamespace=False).endswith(country):
result.append(subcategory.title(withNamespace=False))
return list(set(result))
-def filterParents(categories):
- ''' Remove all parent categories from the set to prevent overcategorization.
- '''
+def filterParents(categories):
+ """ Remove all parent categories from the set to prevent overcategorization. """
result = []
toFilter = u''
for cat in categories:
cat = cat.replace('_', ' ')
toFilter = toFilter + "[[Category:" + cat + "]]\n"
- parameters = urllib.urlencode({'source' : toFilter.encode('utf-8'),
- 'bot' : '1'})
+ parameters = urllib.urlencode({'source': toFilter.encode('utf-8'),
+ 'bot': '1'})
filterCategoriesRe = re.compile('\[\[Category:([^\]]*)\]\]')
try:
filterCategoriesPage = urllib.urlopen(
@@ -377,17 +387,18 @@
return categories
return result
+
def saveImagePage(imagepage, newcats, usage, galleries, onlyFilter):
- ''' Remove the old categories and add the new categories to the image. '''
+ """ Remove the old categories and add the new categories to the image. """
newtext = pywikibot.removeCategoryLinks(imagepage.get(), imagepage.site())
- if not(onlyFilter):
+ if not onlyFilter:
newtext = removeTemplates(newtext)
newtext = newtext + getCheckCategoriesTemplate(usage, galleries,
len(newcats))
- newtext = newtext + u'\n'
+ newtext += u'\n'
for category in newcats:
newtext = newtext + u'[[Category:' + category + u']]\n'
- if(onlyFilter):
+ if onlyFilter:
comment = u'Filtering categories'
else:
comment = u'Image is categorized by a bot using data from [[Commons:Tools#CommonSense|CommonSense]]'
@@ -395,11 +406,11 @@
imagepage.put(newtext, comment)
return
-def removeTemplates(oldtext = u''):
- '''
+
+def removeTemplates(oldtext=u''):
+ """
Remove {{Uncategorized}} and {{Check categories}} templates
- '''
- result = u''
+ """
result = re.sub(
u'\{\{\s*([Uu]ncat(egori[sz]ed( image)?)?|[Nn]ocat|[Nn]eedscategory)[^}]*\}\}', u'', oldtext)
result = re.sub(u'<!-- Remove this line once you have added categories -->',
@@ -407,10 +418,11 @@
result = re.sub(u'\{\{\s*[Cc]heck categories[^}]*\}\}', u'', result)
return result
+
def getCheckCategoriesTemplate(usage, galleries, ncats):
- '''
+ """
Build the check categories template with all parameters
- '''
+ """
result = u'{{Check categories|year={{subst:CURRENTYEAR}}|month={{subst:CURRENTMONTHNAME}}|day={{subst:CURRENTDAY}}\n'
usageCounter = 1
for (lang, project, article) in usage:
@@ -418,19 +430,20 @@
result += u'|wiki%d=%s' % (usageCounter, project)
result += u'|article%d=%s' % (usageCounter, article)
result += u'\n'
- usageCounter = usageCounter + 1
+ usageCounter += 1
galleryCounter = 1
for gallery in galleries:
result += u'|gallery%d=%s' % (galleryCounter, gallery.replace('_', ' ')) + u'\n'
- galleryCounter = galleryCounter + 1
+ galleryCounter += 1
result += u'|ncats=%d\n' % ncats
result += u'}}\n'
return result
+
def main(args):
- '''
+ """
Main loop. Get a generator and options. Work on all images in the generator.
- '''
+ """
generator = None
onlyFilter = False
onlyUncat = False
@@ -446,9 +459,9 @@
elif arg == '-onlyuncat':
onlyUncat = True
elif arg.startswith('-hint:'):
- hint_wiki = arg [len('-hint:'):]
+ hint_wiki = arg[len('-hint:'):]
elif arg.startswith('-onlyhint'):
- search_wikis = arg [len('-onlyhint:'):]
+ search_wikis = arg[len('-onlyhint:'):]
else:
genFactory.handleArg(arg)
--
To view, visit https://gerrit.wikimedia.org/r/86624
To unsubscribe, visit https://gerrit.wikimedia.org/r/settings
Gerrit-MessageType: merged
Gerrit-Change-Id: I5a4a7dd85eadf7233fe7e388644dadd5ba1e5ffc
Gerrit-PatchSet: 2
Gerrit-Project: pywikibot/core
Gerrit-Branch: master
Gerrit-Owner: Legoktm <legoktm.wikipedia(a)gmail.com>
Gerrit-Reviewer: Ladsgroup <ladsgroup(a)gmail.com>
Gerrit-Reviewer: Merlijn van Deen <valhallasw(a)arctus.nl>
Gerrit-Reviewer: jenkins-bot
jenkins-bot has submitted this change and it was merged.
Change subject: Port imagerecat.py from compat
......................................................................
Port imagerecat.py from compat
Change-Id: I9e5f5a1fb1823ec85378d3bf9d7c67592139face
---
A scripts/imagerecat.py
1 file changed, 465 insertions(+), 0 deletions(-)
Approvals:
Merlijn van Deen: Looks good to me, approved
jenkins-bot: Verified
diff --git a/scripts/imagerecat.py b/scripts/imagerecat.py
new file mode 100644
index 0000000..7c91106
--- /dev/null
+++ b/scripts/imagerecat.py
@@ -0,0 +1,465 @@
+# -*- coding: utf-8 -*-
+"""
+Program to (re)categorize images at commons.
+
+The program uses commonshelper for category suggestions.
+It takes the suggestions and the current categories. Put the categories through
+some filters and adds the result.
+
+The following command line parameters are supported:
+
+-onlyfilter Don't use Commonsense to get categories, just filter the current
+ categories
+
+-onlyuncat Only work on uncategorized images. Will prevent the bot from
+ working on an image multiple times.
+
+-hint Give Commonsense a hint.
+ For example -hint:li.wikipedia.org
+
+-onlyhint Give Commonsense a hint. And only work on this hint.
+ Syntax is the same as -hint. Some special hints are possible:
+ _20 : Work on the top 20 Wikipedias
+ _80 : Work on the top 80 Wikipedias
+ wps : Work on all Wikipedias
+
+"""
+__version__ = '$Id$'
+#
+# (C) Multichill 2008-2011
+# (C) Pywikipedia bot team, 2008-2013
+#
+# Distributed under the terms of the MIT license.
+#
+#
+import os, sys, re, codecs
+import urllib, httplib, urllib2
+import time
+import socket
+import StringIO
+import pywikibot
+from pywikibot import config
+from pywikibot import pagegenerators
+import xml.etree.ElementTree
+
+category_blacklist = []
+countries = []
+
+search_wikis=u'_20'
+hint_wiki=u''
+
+def initLists():
+ '''
+ Get the list of countries & the blacklist from Commons.
+ '''
+ global category_blacklist
+ global countries
+
+ blacklistPage = pywikibot.Page(pywikibot.Site(u'commons', u'commons'),
+ u'User:Multichill/Category_blacklist')
+ for cat in blacklistPage.linkedPages():
+ category_blacklist.append(cat.title(withNamespace=False))
+
+ countryPage = pywikibot.Page(pywikibot.Site(u'commons', u'commons'),
+ u'User:Multichill/Countries')
+ for country in countryPage.linkedPages():
+ countries.append(country.title(withNamespace=False))
+ return
+
+def categorizeImages(generator, onlyFilter, onlyUncat):
+ ''' Loop over all images in generator and try to categorize them. Get
+ category suggestions from CommonSense.
+
+ '''
+ for page in generator:
+ if page.exists() and (page.namespace() == 6) and \
+ (not page.isRedirectPage()):
+ imagepage = pywikibot.ImagePage(page.site(), page.title())
+ pywikibot.output(u'Working on ' + imagepage.title())
+
+ if (onlyUncat and not(u'Uncategorized' in imagepage.templates())):
+ pywikibot.output(u'No Uncategorized template found')
+ else:
+ currentCats = getCurrentCats(imagepage)
+ if onlyFilter:
+ commonshelperCats = []
+ usage = []
+ galleries = []
+ else:
+ (commonshelperCats, usage, galleries) = getCommonshelperCats(imagepage)
+ newcats = applyAllFilters(commonshelperCats+currentCats)
+
+ if (len(newcats) > 0 and not(set(currentCats)==set(newcats))):
+ for cat in newcats:
+ pywikibot.output(u' Found new cat: ' + cat);
+ saveImagePage(imagepage, newcats, usage, galleries,
+ onlyFilter)
+
+def getCurrentCats(imagepage):
+ ''' Get the categories currently on the image '''
+ result = []
+ for cat in imagepage.categories():
+ result.append(cat.title(withNamespace=False))
+ return list(set(result))
+
+def getCommonshelperCats(imagepage):
+ ''' Get category suggestions from CommonSense. Parse them and return a list
+ of suggestions.
+
+ '''
+ commonshelperCats = []
+ usage = []
+ galleries = []
+
+ global search_wikis
+ global hint_wiki
+ site = imagepage.site
+ lang = site.language()
+ family = site.family.name
+ if lang==u'commons' and family==u'commons':
+ parameters = urllib.urlencode(
+ {'i' : imagepage.title(withNamespace=False).encode('utf-8'),
+ 'r' : 'on',
+ 'go-clean' : 'Find+Categories',
+ 'p' : search_wikis,
+ 'cl' : hint_wiki})
+ elif family==u'wikipedia':
+ parameters = urllib.urlencode(
+ {'i' : imagepage.title(withNamespace=False).encode('utf-8'),
+ 'r' : 'on',
+ 'go-move' : 'Find+Categories',
+ 'p' : search_wikis,
+ 'cl' : hint_wiki,
+ 'w' : lang})
+ else:
+ #Can't handle other sites atm
+ return ([], [], [])
+
+ commonsenseRe = re.compile('^#COMMONSENSE(.*)#USAGE(\s)+\((?P<usagenum>(\d)+)\)\s(?P<usage>(.*))\s#KEYWORDS(\s)+\((?P<keywords>(\d)+)\)(.*)#CATEGORIES(\s)+\((?P<catnum>(\d)+)\)\s(?P<cats>(.*))\s#GALLERIES(\s)+\((?P<galnum>(\d)+)\)\s(?P<gals>(.*))\s(.*)#EOF$', re.MULTILINE + re.DOTALL)
+
+ gotInfo = False
+ matches = None
+ maxtries = 10
+ tries = 0
+ while(not gotInfo):
+ try:
+ if ( tries < maxtries ):
+ tries = tries + 1
+ commonsHelperPage = urllib.urlopen(
+ "http://toolserver.org/~daniel/WikiSense/CommonSense.php?%s" % parameters)
+ matches = commonsenseRe.search(
+ commonsHelperPage.read().decode('utf-8'))
+ gotInfo = True
+ else:
+ break
+ except IOError:
+ pywikibot.output(u'Got an IOError, let\'s try again')
+ except socket.timeout:
+ pywikibot.output(u'Got a timeout, let\'s try again')
+
+ if (matches and gotInfo):
+ if (matches.group('usagenum') > 0):
+ used = matches.group('usage').splitlines()
+ for use in used:
+ usage= usage + getUsage(use)
+ #pywikibot.output(use)
+ if (matches.group('catnum') > 0):
+ cats = matches.group('cats').splitlines()
+ for cat in cats:
+ commonshelperCats.append(cat.replace('_', ' '))
+ pywikibot.output(u'category : ' + cat)
+ if (matches.group('galnum') > 0):
+ gals = matches.group('gals').splitlines()
+ for gal in gals:
+ galleries.append(gal.replace('_', ' '))
+ pywikibot.output(u'gallery : ' + gal)
+ commonshelperCats = list(set(commonshelperCats))
+ galleries = list(set(galleries))
+ for (lang, project, article) in usage:
+ pywikibot.output(lang + project + article)
+ return (commonshelperCats, usage, galleries)
+
+def getOpenStreetMapCats(latitude, longitude):
+ '''
+ Get a list of location categories based on the OSM Nominatim tool
+ '''
+ result = []
+ locationList = getOpenStreetMap(latitude, longitude)
+ for i in range(0, len(locationList)):
+ #print 'Working on ' + locationList[i]
+ if i <= len(locationList)-3:
+ category = getCategoryByName(name=locationList[i], parent=locationList[i+1], grandparent=locationList[i+2])
+ elif i == len(locationList)-2:
+ category = getCategoryByName(name=locationList[i], parent=locationList[i+1])
+ else:
+ category = getCategoryByName(name=locationList[i])
+ if category and not category==u'':
+ result.append(category)
+ #print result
+ return result
+
+
+def getOpenStreetMap(latitude, longitude):
+ '''
+ Get the result from http://nominatim.openstreetmap.org/reverse
+ and put it in a list of tuples to play around with
+ '''
+ result = []
+ gotInfo = False
+ parameters = urllib.urlencode({'lat' : latitude, 'lon' : longitude, 'accept-language' : 'en'})
+ while(not gotInfo):
+ try:
+ page = urllib.urlopen("http://nominatim.openstreetmap.org/reverse?format=xml&%s" % parameters)
+ et = xml.etree.ElementTree.parse(page)
+ gotInfo=True
+ except IOError:
+ pywikibot.output(u'Got an IOError, let\'s try again')
+ time.sleep(30)
+ except socket.timeout:
+ pywikibot.output(u'Got a timeout, let\'s try again')
+ time.sleep(30)
+ validParts = [u'hamlet', u'village', u'city', u'county', u'country']
+ invalidParts = [u'path', u'road', u'suburb', u'state', u'country_code']
+ addressparts = et.find('addressparts')
+ #xml.etree.ElementTree.dump(et)
+
+ for addresspart in addressparts.getchildren():
+ if addresspart.tag in validParts:
+ result.append(addresspart.text)
+ elif addresspart.tag in invalidParts:
+ pywikibot.output(u'Dropping %s, %s' % (addresspart.tag, addresspart.text))
+ else:
+ pywikibot.warning(u'%s, %s is not in addressparts lists' % (addresspart.tag, addresspart.text))
+ #print result
+ return result
+
+def getCategoryByName(name, parent=u'', grandparent=u''):
+
+ if not parent==u'':
+ workname = name.strip() + u',_' + parent.strip()
+ workcat = pywikibot.Category(
+ pywikibot.Site(u'commons', u'commons'), workname)
+ if workcat.exists():
+ return workname
+ if not grandparent==u'':
+ workname = name.strip() + u',_' + grandparent.strip()
+ workcat = pywikibot.Category(
+ pywikibot.Site(u'commons', u'commons'), workname)
+ if workcat.exists():
+ return workname
+ workname = name.strip()
+ workcat = pywikibot.Category(
+ pywikibot.Site(u'commons', u'commons'), workname)
+ if workcat.exists():
+ return workname
+ return u''
+
+
+def getUsage(use):
+ ''' Parse the Commonsense output to get the usage '''
+ result = []
+ lang = ''
+ project = ''
+ article = ''
+ usageRe = re.compile(
+ '^(?P<lang>([\w-]+))\.(?P<project>([\w]+))\.org:(?P<articles>\s(.*))')
+ matches = usageRe.search(use)
+ if matches:
+ if (matches.group('lang')):
+ lang = matches.group('lang')
+ #pywikibot.output(lang)
+ if (matches.group('project')):
+ project = matches.group('project')
+ #pywikibot.output(project)
+ if (matches.group('articles')):
+ articles = matches.group('articles')
+ #pywikibot.output(articles)
+ for article in articles.split():
+ result.append((lang, project, article))
+ return result
+
+def applyAllFilters(categories):
+ ''' Apply all filters on categories. '''
+ result = []
+ result = filterDisambiguation(categories)
+ result = followRedirects(result)
+ result = filterBlacklist(result)
+ result = filterCountries(result)
+ result = filterParents(result)
+ return result
+
+def filterBlacklist(categories):
+ ''' Filter out categories which are on the blacklist. '''
+ result = []
+ for cat in categories:
+ cat = cat.replace('_', ' ')
+ if (cat not in category_blacklist):
+ result.append(cat)
+ return list(set(result))
+
+def filterDisambiguation(categories):
+ ''' Filter out disambiguation categories. '''
+ result = []
+ for cat in categories:
+ if (not pywikibot.Page(pywikibot.Site(u'commons', u'commons'),
+ cat, ns=14).isDisambig()):
+ result.append(cat)
+ return result
+
+def followRedirects(categories):
+ ''' If a category is a redirect, replace the category with the target. '''
+ result = []
+ for cat in categories:
+ categoryPage = pywikibot.Page(pywikibot.getSite(u'commons', u'commons'),
+ cat, ns=14)
+ if categoryPage.isCategoryRedirect():
+ result.append(
+ categoryPage.getCategoryRedirectTarget().title(
+ withNamespace=False))
+ else:
+ result.append(cat)
+ return result
+
+def filterCountries(categories):
+ ''' Try to filter out ...by country categories.
+ First make a list of any ...by country categories and try to find some
+ countries. If a by country category has a subcategory containing one of the
+ countries found, add it. The ...by country categories remain in the set and
+ should be filtered out by filterParents.
+
+ '''
+ result = categories
+ listByCountry = []
+ listCountries = []
+ for cat in categories:
+ if (cat.endswith(u'by country')):
+ listByCountry.append(cat)
+
+ #If cat contains 'by country' add it to the list
+ #If cat contains the name of a country add it to the list
+ else:
+ for country in countries:
+ if country in cat:
+ listCountries.append(country)
+ if(len(listByCountry) > 0):
+ for bc in listByCountry:
+ category = pywikibot.Category(
+ pywikibot.Site(u'commons', u'commons'), u'Category:' + bc)
+ for subcategory in category.subcategories():
+ for country in listCountries:
+ if (subcategory.title(withNamespace=False).endswith(country)):
+ result.append(subcategory.title(withNamespace=False))
+ return list(set(result))
+
+def filterParents(categories):
+ ''' Remove all parent categories from the set to prevent overcategorization.
+
+ '''
+ result = []
+ toFilter = u''
+ for cat in categories:
+ cat = cat.replace('_', ' ')
+ toFilter = toFilter + "[[Category:" + cat + "]]\n"
+ parameters = urllib.urlencode({'source' : toFilter.encode('utf-8'),
+ 'bot' : '1'})
+ filterCategoriesRe = re.compile('\[\[Category:([^\]]*)\]\]')
+ try:
+ filterCategoriesPage = urllib.urlopen(
+ "http://toolserver.org/~multichill/filtercats.php?%s" % parameters)
+ result = filterCategoriesRe.findall(
+ filterCategoriesPage.read().decode('utf-8'))
+ except IOError:
+ #Something is wrong, forget about this filter and just return the input
+ return categories
+
+ if not result:
+ #Is empty, don't want to remove all categories
+ return categories
+ return result
+
+def saveImagePage(imagepage, newcats, usage, galleries, onlyFilter):
+ ''' Remove the old categories and add the new categories to the image. '''
+ newtext = pywikibot.removeCategoryLinks(imagepage.get(), imagepage.site())
+ if not(onlyFilter):
+ newtext = removeTemplates(newtext)
+ newtext = newtext + getCheckCategoriesTemplate(usage, galleries,
+ len(newcats))
+ newtext = newtext + u'\n'
+ for category in newcats:
+ newtext = newtext + u'[[Category:' + category + u']]\n'
+ if(onlyFilter):
+ comment = u'Filtering categories'
+ else:
+ comment = u'Image is categorized by a bot using data from [[Commons:Tools#CommonSense|CommonSense]]'
+ pywikibot.showDiff(imagepage.get(), newtext)
+ imagepage.put(newtext, comment)
+ return
+
+def removeTemplates(oldtext = u''):
+ '''
+ Remove {{Uncategorized}} and {{Check categories}} templates
+ '''
+ result = u''
+ result = re.sub(
+ u'\{\{\s*([Uu]ncat(egori[sz]ed( image)?)?|[Nn]ocat|[Nn]eedscategory)[^}]*\}\}', u'', oldtext)
+ result = re.sub(u'<!-- Remove this line once you have added categories -->',
+ u'', result)
+ result = re.sub(u'\{\{\s*[Cc]heck categories[^}]*\}\}', u'', result)
+ return result
+
+def getCheckCategoriesTemplate(usage, galleries, ncats):
+ '''
+ Build the check categories template with all parameters
+ '''
+ result = u'{{Check categories|year={{subst:CURRENTYEAR}}|month={{subst:CURRENTMONTHNAME}}|day={{subst:CURRENTDAY}}\n'
+ usageCounter = 1
+ for (lang, project, article) in usage:
+ result += u'|lang%d=%s' % (usageCounter, lang)
+ result += u'|wiki%d=%s' % (usageCounter, project)
+ result += u'|article%d=%s' % (usageCounter, article)
+ result += u'\n'
+ usageCounter = usageCounter + 1
+ galleryCounter = 1
+ for gallery in galleries:
+ result += u'|gallery%d=%s' % (galleryCounter, gallery.replace('_', ' ')) + u'\n'
+ galleryCounter = galleryCounter + 1
+ result += u'|ncats=%d\n' % ncats
+ result += u'}}\n'
+ return result
+
+def main(args):
+ '''
+ Main loop. Get a generator and options. Work on all images in the generator.
+ '''
+ generator = None
+ onlyFilter = False
+ onlyUncat = False
+ genFactory = pagegenerators.GeneratorFactory()
+
+ global search_wikis
+ global hint_wiki
+
+ site = pywikibot.getSite(u'commons', u'commons')
+ for arg in pywikibot.handleArgs():
+ if arg == '-onlyfilter':
+ onlyFilter = True
+ elif arg == '-onlyuncat':
+ onlyUncat = True
+ elif arg.startswith('-hint:'):
+ hint_wiki = arg [len('-hint:'):]
+ elif arg.startswith('-onlyhint'):
+ search_wikis = arg [len('-onlyhint:'):]
+ else:
+ genFactory.handleArg(arg)
+
+ generator = genFactory.getCombinedGenerator()
+ if not generator:
+ generator = pagegenerators.CategorizedPageGenerator(
+ pywikibot.Category(site, u'Category:Media needing categories'),
+ recurse=True)
+ initLists()
+ categorizeImages(generator, onlyFilter, onlyUncat)
+ pywikibot.output(u'All done')
+
+if __name__ == "__main__":
+ main(sys.argv[1:])
--
To view, visit https://gerrit.wikimedia.org/r/86621
To unsubscribe, visit https://gerrit.wikimedia.org/r/settings
Gerrit-MessageType: merged
Gerrit-Change-Id: I9e5f5a1fb1823ec85378d3bf9d7c67592139face
Gerrit-PatchSet: 1
Gerrit-Project: pywikibot/core
Gerrit-Branch: master
Gerrit-Owner: Legoktm <legoktm.wikipedia(a)gmail.com>
Gerrit-Reviewer: Ladsgroup <ladsgroup(a)gmail.com>
Gerrit-Reviewer: Merlijn van Deen <valhallasw(a)arctus.nl>
Gerrit-Reviewer: jenkins-bot