Revision: 4140
Author: cydeweys
Date: 2007-08-30 01:34:57 +0000 (Thu, 30 Aug 2007)
Log Message:
-----------
Committing a quick fix to catch the NoPage exceptions raised when working on a red category page. Red categories can still contain pages, so we should not abort.
Modified Paths:
--------------
trunk/pywikipedia/wikipedia.py
Modified: trunk/pywikipedia/wikipedia.py
===================================================================
--- trunk/pywikipedia/wikipedia.py 2007-08-29 22:11:40 UTC (rev 4139)
+++ trunk/pywikipedia/wikipedia.py 2007-08-30 01:34:57 UTC (rev 4140)
@@ -1331,7 +1331,11 @@
The return value is a list of Category objects, one for each of the
category links in the page text.
"""
- return getCategoryLinks(self.get(nofollow_redirects=nofollow_redirects), self.site())
+ try:
+ category_links_to_return = getCategoryLinks(self.get(nofollow_redirects=nofollow_redirects), self.site())
+ except NoPage:
+ category_links_to_return = []
+ return category_links_to_return
def __cmp__(self, other):
"""Pseudo method to be able to use equality and inequality tests on
Revision: 4139
Author: siebrand
Date: 2007-08-29 22:11:40 +0000 (Wed, 29 Aug 2007)
Log Message:
-----------
Also revert changes to the delinker. Works again.
Modified Paths:
--------------
trunk/pywikipedia/delinker.py
trunk/pywikipedia/delinker.txt
Modified: trunk/pywikipedia/delinker.py
===================================================================
--- trunk/pywikipedia/delinker.py 2007-08-29 22:06:09 UTC (rev 4138)
+++ trunk/pywikipedia/delinker.py 2007-08-29 22:11:40 UTC (rev 4139)
@@ -396,7 +396,7 @@
http_callback = wait_callback, no_db = True)
- def check_usage(self, image, timestamp, admin, reason, replacement, namespace = None):
+ def check_usage(self, image, timestamp, admin, reason, replacement):
""" Check whether this image needs to be delinked. """
# Check whether the image still is deleted on Commons.
@@ -420,7 +420,7 @@
if self.CommonsDelinker.config['global']:
- usage = self.CheckUsage.get_usage(image, namespace = namespace)
+ usage = self.CheckUsage.get_usage(image)
usage_domains = {}
count = 0
@@ -434,15 +434,12 @@
#FIX!
usage_domains = {(self.site.lang, self.site.family.name):
list(self.CheckUsage.get_usage_live(self.site,
- image, namespace = namespace))}
+ image))}
count = len(usage_domains[(self.site.lang, self.site.family.name)])
output(u'%s %s used on %s pages' % (self, image, count))
if count:
- if count > self.CommonsDelinker.config.get('template_threshold', sys.maxint):
- output('%s Only delinking %s from template namespace' % (self, image))
- return check_usage(image, timestamp, admin, reason, replacement, 10)
# Pass the usage to the Delinker pool along with other arguments
self.CommonsDelinker.Delinkers.append((image, usage_domains,
timestamp, admin, reason, replacement))
Modified: trunk/pywikipedia/delinker.txt
===================================================================
--- trunk/pywikipedia/delinker.txt 2007-08-29 22:06:09 UTC (rev 4138)
+++ trunk/pywikipedia/delinker.txt 2007-08-29 22:11:40 UTC (rev 4139)
@@ -95,8 +95,6 @@
* ''exclude_string = "no-delink"'': If this string is included in the deletion
summary, the file is not delinked.
* ''summary_cache = 3600'': Time before on-wiki settings are updated.
-* ''template_threshold = 1000'': If more an image is used more often than this
- value, only delink from the template namespace.
=== Replacer settings ===
Those variables only need to be set if the replacer is enabled.
Revision: 4137
Author: btongminh
Date: 2007-08-29 20:01:51 +0000 (Wed, 29 Aug 2007)
Log Message:
-----------
New config setting: template_threshold.
Modified Paths:
--------------
trunk/pywikipedia/delinker.py
trunk/pywikipedia/delinker.txt
Modified: trunk/pywikipedia/delinker.py
===================================================================
--- trunk/pywikipedia/delinker.py 2007-08-29 19:56:26 UTC (rev 4136)
+++ trunk/pywikipedia/delinker.py 2007-08-29 20:01:51 UTC (rev 4137)
@@ -396,7 +396,7 @@
http_callback = wait_callback, no_db = True)
- def check_usage(self, image, timestamp, admin, reason, replacement):
+ def check_usage(self, image, timestamp, admin, reason, replacement, namespace = None):
""" Check whether this image needs to be delinked. """
# Check whether the image still is deleted on Commons.
@@ -420,7 +420,7 @@
if self.CommonsDelinker.config['global']:
- usage = self.CheckUsage.get_usage(image)
+ usage = self.CheckUsage.get_usage(image, namespace = namespace)
usage_domains = {}
count = 0
@@ -434,12 +434,15 @@
#FIX!
usage_domains = {(self.site.lang, self.site.family.name):
list(self.CheckUsage.get_usage_live(self.site,
- image))}
+ image, namespace = namespace))}
count = len(usage_domains[(self.site.lang, self.site.family.name)])
output(u'%s %s used on %s pages' % (self, image, count))
if count:
+ if count > self.CommonsDelinker.config.get('template_threshold', sys.maxint):
+ output('%s Only delinking %s from template namespace' % (self, image))
+ return check_usage(image, timestamp, admin, reason, replacement, 10)
# Pass the usage to the Delinker pool along with other arguments
self.CommonsDelinker.Delinkers.append((image, usage_domains,
timestamp, admin, reason, replacement))
Modified: trunk/pywikipedia/delinker.txt
===================================================================
--- trunk/pywikipedia/delinker.txt 2007-08-29 19:56:26 UTC (rev 4136)
+++ trunk/pywikipedia/delinker.txt 2007-08-29 20:01:51 UTC (rev 4137)
@@ -95,6 +95,8 @@
* ''exclude_string = "no-delink"'': If this string is included in the deletion
summary, the file is not delinked.
* ''summary_cache = 3600'': Time before on-wiki settings are updated.
+* ''template_threshold = 1000'': If more an image is used more often than this
+ value, only delink from the template namespace.
=== Replacer settings ===
Those variables only need to be set if the replacer is enabled.
Revision: 4135
Author: btongminh
Date: 2007-08-29 19:46:50 +0000 (Wed, 29 Aug 2007)
Log Message:
-----------
Add persistent_http as a config setting.
Modified Paths:
--------------
trunk/pywikipedia/config.py
trunk/pywikipedia/wikipedia.py
Modified: trunk/pywikipedia/config.py
===================================================================
--- trunk/pywikipedia/config.py 2007-08-29 19:43:26 UTC (rev 4134)
+++ trunk/pywikipedia/config.py 2007-08-29 19:46:50 UTC (rev 4135)
@@ -359,6 +359,12 @@
copyright_economize_query = True
+############## HTTP SETTINGS ##############
+# Use a persistent http connection. An http connection has to be established
+# only once per site object, making stuff a whole lot faster. Do NOT EVER
+# use this if you share Site objects across threads without proper locking.
+persistent_http = False
+
############## FURTHER SETTINGS ##############
# The bot can make some additional changes to each page it edits, e.g. fix
Modified: trunk/pywikipedia/wikipedia.py
===================================================================
--- trunk/pywikipedia/wikipedia.py 2007-08-29 19:43:26 UTC (rev 4134)
+++ trunk/pywikipedia/wikipedia.py 2007-08-29 19:46:50 UTC (rev 4135)
@@ -3131,6 +3131,7 @@
if not language[0].upper() + language[1:] in self.namespaces():
self._validlanguages.append(language)
+ if persistent_http is None: persistent_http = config.persistent_http
self.persistent_http = persistent_http and self.protocol() in ('http', 'https')
if persistent_http:
if self.protocol() == 'http':
Revision: 4134
Author: btongminh
Date: 2007-08-29 19:43:26 +0000 (Wed, 29 Aug 2007)
Log Message:
-----------
wikipedia.getSite now incorporates all of its arguments into its cache keys; Add support for persistent connections. An http connection has to be established only once, making stuff a whole lot faster. Do NOT EVER use this if you share Site objects across threads without proper locking. In fact you should never ever share objects between threads without locking.
Modified Paths:
--------------
trunk/pywikipedia/wikipedia.py
Modified: trunk/pywikipedia/wikipedia.py
===================================================================
--- trunk/pywikipedia/wikipedia.py 2007-08-29 18:00:33 UTC (rev 4133)
+++ trunk/pywikipedia/wikipedia.py 2007-08-29 19:43:26 UTC (rev 4134)
@@ -3090,13 +3090,18 @@
return myfamily.Family()
class Site(object):
- def __init__(self, code, fam=None, user=None):
- """Constructor takes three arguments:
+ def __init__(self, code, fam=None, user=None, persistent_http = None):
+ """Constructor takes four arguments:
code language code for Site
fam Wikimedia family (optional: defaults to configured).
Can either be a string or a Family object.
- user User to use (optional: defaults to configured)"""
+ user User to use (optional: defaults to configured)
+ persistent_http Use a persistent http connection. An http connection
+ has to be established only once, making stuff a whole lot
+ faster. Do NOT EVER use this if you share Site objects
+ across threads without proper locking.
+ """
self.lang = code.lower()
if isinstance(fam, basestring) or fam is None:
@@ -3125,6 +3130,15 @@
for language in self.languages():
if not language[0].upper() + language[1:] in self.namespaces():
self._validlanguages.append(language)
+
+ self.persistent_http = persistent_http and self.protocol() in ('http', 'https')
+ if persistent_http:
+ if self.protocol() == 'http':
+ self.conn = httplib.HTTPConnection(self.hostname())
+ elif self.protocol() == 'https':
+ self.conn = httplib.HTTPSConnection(self.hostname())
+
+
self.sandboxpage = Page(self,self.family.sandboxpage(code))
def urlEncode(self, query):
@@ -3170,28 +3184,41 @@
# TODO: add the authenticate stuff here
- # Encode all of this into a HTTP request
- if self.protocol() == 'http':
- conn = httplib.HTTPConnection(self.hostname())
- elif self.protocol() == 'https':
- conn = httplib.HTTPSConnection(self.hostname())
- # otherwise, it will crash, as other protocols are not supported
-
+ if self.persistent_http:
+ conn = self.conn
+ else:
+ # Encode all of this into a HTTP request
+ if self.protocol() == 'http':
+ conn = httplib.HTTPConnection(self.hostname())
+ elif self.protocol() == 'https':
+ conn = httplib.HTTPSConnection(self.hostname())
+ # otherwise, it will crash, as other protocols are not supported
+
conn.putrequest('POST', address)
conn.putheader('Content-Length', str(len(data)))
conn.putheader('Content-type', contentType)
conn.putheader('User-agent', useragent)
if useCookie and self.cookies(sysop = sysop):
conn.putheader('Cookie', self.cookies(sysop = sysop))
+ if self.persistent_http:
+ conn.putheader('Connection', 'Keep-Alive')
conn.endheaders()
conn.send(data)
# Prepare the return values
# Note that this can raise network exceptions which are not
# caught here.
- response = conn.getresponse()
+ try:
+ response = conn.getresponse()
+ except httplib.BadStatusLine:
+ # Blub.
+ conn.close()
+ conn.connect()
+ return self.postData(address, data, contentType, sysop, useCookie)
data = response.read().decode(self.encoding())
- conn.close()
+ response.close()
+ if not self.persistent_http:
+ conn.close()
return response, data
def forceLogin(self, sysop = False):
@@ -3278,59 +3305,92 @@
Returns the HTML text of the page converted to unicode.
"""
- if self.hostname() in config.authenticate.keys():
- uo = authenticateURLopener
- else:
- uo = MyURLopener()
- if self.cookies(sysop = sysop):
- uo.addheader('Cookie', self.cookies(sysop = sysop))
+ if self.persistent_http and not data:
+ self.conn.putrequest('GET', path)
+ self.conn.putheader('User-agent', useragent)
+ self.conn.putheader('Cookie', self.cookies(sysop = sysop))
+ self.conn.putheader('Connection', 'Keep-Alive')
if compress:
- uo.addheader('Accept-encoding', 'gzip')
-
- url = '%s://%s%s' % (self.protocol(), self.hostname(), path)
- data = self.urlEncode(data)
-
- # Try to retrieve the page until it was successfully loaded (just in
- # case the server is down or overloaded).
- # Wait for retry_idle_time minutes (growing!) between retries.
- retry_idle_time = 1
- retrieved = False
- while not retrieved:
+ self.conn.putheader('Accept-encoding', 'gzip')
+ self.conn.endheaders()
+
+ # Prepare the return values
+ # Note that this can raise network exceptions which are not
+ # caught here.
try:
- if self.hostname() in config.authenticate.keys():
- if compress:
- request = urllib2.Request(url, data)
- request.add_header('Accept-encoding', 'gzip')
- opener = urllib2.build_opener()
- f = opener.open(request)
+ response = self.conn.getresponse()
+ except httplib.BadStatusLine:
+ # Blub.
+ self.conn.close()
+ self.conn.connect()
+ return self.getUrl(path, retry, sysop, data, compress)
+
+ text = response.read()
+ contentType = response.getheader('Content-Type')
+ contentEncoding = response.getheader('Content-Encoding')
+ else:
+ if self.hostname() in config.authenticate.keys():
+ uo = authenticateURLopener
+ else:
+ uo = MyURLopener()
+ if self.cookies(sysop = sysop):
+ uo.addheader('Cookie', self.cookies(sysop = sysop))
+ if compress:
+ uo.addheader('Accept-encoding', 'gzip')
+
+ url = '%s://%s%s' % (self.protocol(), self.hostname(), path)
+ data = self.urlEncode(data)
+
+ # Try to retrieve the page until it was successfully loaded (just in
+ # case the server is down or overloaded).
+ # Wait for retry_idle_time minutes (growing!) between retries.
+ retry_idle_time = 1
+ retrieved = False
+ while not retrieved:
+ try:
+ if self.hostname() in config.authenticate.keys():
+ if compress:
+ request = urllib2.Request(url, data)
+ request.add_header('Accept-encoding', 'gzip')
+ opener = urllib2.build_opener()
+ f = opener.open(request)
+ else:
+ f = urllib2.urlopen(url, data)
else:
- f = urllib2.urlopen(url, data)
- else:
- f = uo.open(url, data)
- retrieved = True
- except KeyboardInterrupt:
- raise
- except Exception, e:
- if retry:
- # We assume that the server is down. Wait some time, then try again.
- output(u"%s" % e)
- output(u"WARNING: Could not open '%s://%s%s'. Maybe the server or your connection is down. Retrying in %i minutes..." % (self.protocol(), self.hostname(), path, retry_idle_time))
- time.sleep(retry_idle_time * 60)
- # Next time wait longer, but not longer than half an hour
- retry_idle_time *= 2
- if retry_idle_time > 30:
- retry_idle_time = 30
- else:
+ f = uo.open(url, data)
+ retrieved = True
+ except KeyboardInterrupt:
raise
- text = f.read()
- if compress and f.headers.get('Content-Encoding') == 'gzip':
- import StringIO, gzip
- compressedstream = StringIO.StringIO(text)
+ except Exception, e:
+ if retry:
+ # We assume that the server is down. Wait some time, then try again.
+ output(u"%s" % e)
+ output(u"WARNING: Could not open '%s://%s%s'. Maybe the server or your connection is down. Retrying in %i minutes..." % (self.protocol(), self.hostname(), path, retry_idle_time))
+ time.sleep(retry_idle_time * 60)
+ # Next time wait longer, but not longer than half an hour
+ retry_idle_time *= 2
+ if retry_idle_time > 30:
+ retry_idle_time = 30
+ else:
+ raise
+ text = f.read()
+
+ # Find charset in the content-type meta tag
+ contentType = f.info()['Content-Type']
+ contentEncoding = f.headers.get('Content-Encoding')
+
+ if compress and contentEncoding == 'gzip':
+ # Use cStringIO if available
+ # TODO: rewrite gzip.py such that it supports unseekable fileobjects.
+ try:
+ from cStringIO import StringIO
+ except ImportError:
+ from StringIO import StringIO
+ import gzip
+ compressedstream = StringIO(text)
gzipper = gzip.GzipFile(fileobj=compressedstream)
text = gzipper.read()
-
- # Find charset in the content-type meta tag
- contentType = f.info()['Content-Type']
+
R = re.compile('charset=([^\'\";]+)')
m = R.search(contentType)
if m:
@@ -4158,14 +4218,14 @@
_sites = {}
_namespaceCache = {}
-def getSite(code = None, fam = None, user=None):
+def getSite(code = None, fam = None, user=None, persistent_http=None):
if code == None:
code = default_code
if fam == None:
fam = default_family
- key = '%s:%s'%(fam,code)
+ key = '%s:%s:%s:%s'%(fam,code,user,persistent_http)
if not _sites.has_key(key):
- _sites[key] = Site(code=code, fam=fam, user=user)
+ _sites[key] = Site(code=code, fam=fam, user=user, persistent_http=persistent_http)
return _sites[key]
def setSite(site):
Revision: 4131
Author: btongminh
Date: 2007-08-29 17:20:31 +0000 (Wed, 29 Aug 2007)
Log Message:
-----------
Only start the put queue if there is actually work to do.
Modified Paths:
--------------
trunk/pywikipedia/wikipedia.py
Modified: trunk/pywikipedia/wikipedia.py
===================================================================
--- trunk/pywikipedia/wikipedia.py 2007-08-29 15:14:32 UTC (rev 4130)
+++ trunk/pywikipedia/wikipedia.py 2007-08-29 17:20:31 UTC (rev 4131)
@@ -1030,6 +1030,14 @@
"""Asynchronous version of put (takes the same arguments), which
places pages on a queue to be saved by a daemon thread.
"""
+ try:
+ page_put_queue.mutex.acquire()
+ try:
+ _putthread.start()
+ except AssertionError:
+ pass
+ finally:
+ page_put_queue.mutex.release()
page_put_queue.put((self, newtext, comment, watchArticle, minorEdit, force))
def put(self, newtext, comment=None, watchArticle = None, minorEdit = True, force=False):
@@ -4678,7 +4686,8 @@
# identification for debugging purposes
_putthread.setName('Put-Thread')
_putthread.setDaemon(True)
-_putthread.start()
+## Don't start the queue if it is not necessary.
+#_putthread.start()
def stopme():
"""This should be run when a bot does not interact with the Wiki, or