Revision: 5026 Author: rotem Date: 2008-02-15 18:25:03 +0000 (Fri, 15 Feb 2008)
Log Message: ----------- Changing Wikipedia and Wiktionary to use a closed list of languages rather than knownlanguages, updating languages_by_size in the other families, updating obsolete in Wikipedia and Wiktionary.
Modified Paths: -------------- trunk/pywikipedia/families/wikinews_family.py trunk/pywikipedia/families/wikipedia_family.py trunk/pywikipedia/families/wikiquote_family.py trunk/pywikipedia/families/wikisource_family.py trunk/pywikipedia/families/wiktionary_family.py
Modified: trunk/pywikipedia/families/wikinews_family.py =================================================================== --- trunk/pywikipedia/families/wikinews_family.py 2008-02-15 17:00:06 UTC (rev 5025) +++ trunk/pywikipedia/families/wikinews_family.py 2008-02-15 18:25:03 UTC (rev 5026) @@ -13,8 +13,8 @@ self.name = 'wikinews'
self.languages_by_size = [ - 'en', 'de', 'pl', 'it', 'fr', 'es', 'pt', 'sv', 'ja', 'zh', - 'ru', 'nl', 'sr', 'he', 'ca', 'uk', 'ro', 'fi', 'th', 'no', + 'en', 'pl', 'de', 'it', 'fr', 'es', 'pt', 'sv', 'ja', 'zh', + 'sr', 'ru', 'nl', 'he', 'uk', 'ca', 'fi', 'ro', 'no', 'th', 'ar', 'bs', 'bg', 'ta', 'sd', ]
Modified: trunk/pywikipedia/families/wikipedia_family.py =================================================================== --- trunk/pywikipedia/families/wikipedia_family.py 2008-02-15 17:00:06 UTC (rev 5025) +++ trunk/pywikipedia/families/wikipedia_family.py 2008-02-15 18:25:03 UTC (rev 5026) @@ -12,7 +12,35 @@ family.Family.__init__(self) self.name = 'wikipedia'
- for lang in self.knownlanguages: + self.languages_by_size = [ + 'en', 'de', 'fr', 'pl', 'ja', 'it', 'nl', 'pt', 'es', 'sv', + 'ru', 'zh', 'no', 'fi', 'vo', 'ca', 'ro', 'tr', 'eo', 'uk', + 'cs', 'sk', 'hu', 'da', 'id', 'he', 'lt', 'sr', 'sl', 'ar', + 'ko', 'bg', 'et', 'new', 'hr', 'te', 'ceb', 'gl', 'th', 'el', + 'fa', 'vi', 'nn', 'ms', 'simple', 'eu', 'bpy', 'bs', 'lb', 'ka', + 'is', 'sq', 'br', 'la', 'az', 'bn', 'hi', 'mr', 'tl', 'io', + 'sh', 'mk', 'cy', 'pms', 'su', 'lv', 'ta', 'nap', 'jv', 'nds', + 'scn', 'oc', 'ast', 'ku', 'wa', 'ht', 'be', 'af', 'tg', 'be-x-old', + 'an', 'roa-tara', 'ksh', 'vec', 'zh-yue', 'cv', 'fy', 'ur', 'sw', 'uz', + 'yo', 'mi', 'qu', 'ga', 'bat-smg', 'ml', 'co', 'kn', 'gd', 'hsb', + 'yi', 'pam', 'nah', 'lmo', 'tt', 'ia', 'sa', 'li', 'hy', 'als', + 'roa-rup', 'map-bms', 'am', 'pag', 'nrm', 'zh-min-nan', 'fo', 'vls', 'se', 'nds-nl', + 'war', 'ne', 'fur', 'bh', 'lij', 'nov', 'pi', 'dv', 'ilo', 'sco', + 'rm', 'diq', 'frp', 'zh-classical', 'kk', 'mt', 'os', 'pdc', 'lad', 'csb', + 'kw', 'wuu', 'fiu-vro', 'to', 'bar', 'ps', 'mn', 'haw', 'ang', 'ln', + 'tk', 'ie', 'km', 'jbo', 'crh', 'tpi', 'wo', 'eml', 'ig', 'or', + 'zea', 'mg', 'ty', 'kg', 'glk', 'cbk-zam', 'si', 'ky', 'ay', 'arc', + 'sc', 'gu', 'kab', 'ks', 'so', 'gn', 'cu', 'udm', 'tet', 'mzn', + 'gv', 'sd', 'pa', 'ba', 'rmy', 'na', 'iu', 'lo', 'bo', 'got', + 'chr', 'ce', 'stq', 'om', 'ug', 'sm', 'bcl', 'ee', 'ti', 'as', + 'hak', 'cdo', 'av', 'bm', 'zu', 'nv', 'dsb', 'pih', 'my', 'pap', + 'cr', 've', 'rw', 'ss', 'xh', 'kl', 'tlh', 'ik', 'dz', 'ts', + 'bi', 'kv', 'bug', 'xal', 'st', 'tn', 'ch', 'ak', 'bxr', 'tw', + 'ab', 'fj', 'ny', 'lbe', 'za', 'ff', 'tum', 'sn', 'ha', 'sg', + 'lg', 'ki', 'rn', 'chy', 'aa', 'mh', 'ng', + ] + + for lang in self.languages_by_size: self.langs[lang] = '%s.wikipedia.org' % lang
# Override defaults @@ -708,6 +736,7 @@ 'hz': None, # http://meta.wikimedia.org/wiki/Proposals_for_closing_projects/Closure_of_Her... 'ii': None, # http://meta.wikimedia.org/wiki/Proposals_for_closing_projects/Closure_of_Yi_... 'kj': None, # http://meta.wikimedia.org/wiki/Proposals_for_closing_projects/Closure_of_Kwa... + 'kr': None, # http://meta.wikimedia.org/wiki/Proposals_for_closing_projects/Closure_of_Kan... 'minnan': 'zh-min-nan', 'mo': None, # http://meta.wikimedia.org/wiki/Proposals_for_closing_projects/Closure_of_Mol... 'mus': None, # http://meta.wikimedia.org/wiki/Proposals_for_closing_projects/Closure_of_Mus... @@ -719,34 +748,6 @@ 'zh-cn': 'zh' }
- # Language codes of the largest wikis. They should be roughly sorted - # by size. - # Note: currently they have been sorted by number of pages, but with languages - # not in the Latin alphabet counted 1/3 lower - - self.languages_by_size = [ - 'en','de','fr','pl','nl','it','pt','es','ja','sv', - 'ru','fi','no','zh','tr','eo','sk','cs','ca','ro', - 'hu','da','id','vo','lt','sl','lmo','uk','he','et', - 'hr','sr','ceb','bg','ko','gl','nn','ar','te','vi', - 'ms','bs','eu','simple','new','el','th','is','lb','sq', - 'fa','az','br','io','la','bpy','su','nap','sh','cy', - 'ka','bn','scn','nds','lv','jv','oc','ku','pms','wa', - 'ast','hi','af','roa-tara','mr','mk','ta','ht','ksh','an', - 'tl','sw','uz','vec','tg','co','ga','fy','be-x-old','be', - 'gd','ur','cv','tt','yo','pam','ia','qu','nah','li', - 'bat-smg','kn','als','map-bms','zh-yue','yi','hsb','mi','zh-min-nan','nrm', - 'sa','fo','ml','se','nds-nl','pag','fur','hy','ilo','war', - 'nov','vls','sco','am','frp','lij','bh','pi','diq','csb', - 'mt','pdc','kw','fiu-vro','to','os','lad','dv','zh-classical','bar', - 'ne','ang','ln','ps','tk','kk','jbo','ty','mn','rm', - 'wo','or','roa-rup','kab','ig','tpi','zea','eml','ie','gv', - 'arc','tet','mg','sc','kg','ky','so','na','cbk-zam','ks', - 'gu','km','wuu','glk','cu','om','pa','udm','ee','rmy', - 'sm','iu','hak','bo','lo','cdo','bm','chr','si','got', - 'sd','cr','ba','ti','pap','as','nv','zu','av','ce' - ] - # Languages that used to be coded in iso-8859-1 self.latin1old = ['de', 'en', 'et', 'es', 'ia', 'la', 'af', 'cs', 'fr', 'pt', 'sl', 'bs', 'fy', 'vi', 'lt', 'fi', 'it',
Modified: trunk/pywikipedia/families/wikiquote_family.py =================================================================== --- trunk/pywikipedia/families/wikiquote_family.py 2008-02-15 17:00:06 UTC (rev 5025) +++ trunk/pywikipedia/families/wikiquote_family.py 2008-02-15 18:25:03 UTC (rev 5026) @@ -12,15 +12,15 @@ self.name = 'wikiquote'
self.languages_by_size = [ - 'en', 'de', 'it', 'pl', 'sk', 'pt', 'ru', 'bs', 'bg', 'sl', - 'es', 'tr', 'he', 'zh', 'lt', 'id', 'fr', 'cs', 'el', 'sv', - 'hu', 'ja', 'uk', 'no', 'nl', 'fa', 'fi', 'ku', 'ca', 'ar', - 'eo', 'ro', 'hr', 'gl', 'ko', 'af', 'et', 'li', 'ka', 'is', - 'sr', 'da', 'nn', 'th', 'ml', 'vi', 'simple', 'sq', 'te', - 'la', 'br', 'eu', 'hi', 'ast', 'az', 'ang', 'be', 'zh-min-nan', - 'lb', 'su', 'ur', 'mr', 'kn', 'ta', 'ky', 'wo', 'gu', 'uz', - 'cy', 'am', 'tt', 'co', 'qu', 'bm', 'ug', 'na', 'kw', 'hy', - 'tk', 'vo', 'nds', 'kr', 'cr', 'kk', 'ga', 'ks', 'za', 'als', + 'en', 'de', 'it', 'pl', 'sk', 'pt', 'ru', 'bg', 'bs', 'sl', + 'es', 'tr', 'he', 'zh', 'lt', 'fr', 'cs', 'id', 'el', 'uk', + 'sv', 'hu', 'ja', 'no', 'nl', 'fa', 'fi', 'ca', 'ku', 'ar', + 'eo', 'ro', 'hr', 'gl', 'ko', 'af', 'is', 'et', 'nn', 'li', + 'ka', 'sr', 'ml', 'da', 'th', 'simple', 'vi', 'sq', 'te', + 'la', 'br', 'eu', 'hi', 'az', 'ast', 'uz', 'be', 'ang', + 'zh-min-nan', 'lb', 'mr', 'su', 'ur', 'kn', 'ta', 'wo', 'ky', 'gu', + 'cy', 'hy', 'am', 'tt', 'co', 'qu', 'bm', 'ug', 'kw', 'na', + 'tk', 'vo', 'ga', 'kr', 'nds', 'cr', 'kk', 'ks', 'za', 'als', ]
for lang in self.languages_by_size:
Modified: trunk/pywikipedia/families/wikisource_family.py =================================================================== --- trunk/pywikipedia/families/wikisource_family.py 2008-02-15 17:00:06 UTC (rev 5025) +++ trunk/pywikipedia/families/wikisource_family.py 2008-02-15 18:25:03 UTC (rev 5026) @@ -13,8 +13,8 @@ self.languages_by_size = [ 'en', 'fr', 'es', 'zh', 'de', 'it', 'pt', 'ru', 'th', 'pl', 'ro', 'te', 'hr', 'tr', 'he', 'cs', 'fi', 'nl', 'sr', 'sv', - 'ar', 'la', 'is', 'ja', 'bs', 'uk', 'el', 'ca', 'ko', 'hu', - 'bn', 'hy', 'no', 'da', 'sl', 'ml', 'id', 'mk', 'az', 'ta', + 'hu', 'ar', 'la', 'ml', 'is', 'ja', 'bs', 'uk', 'el', 'ca', + 'ko', 'sl', 'bn', 'hy', 'no', 'da', 'id', 'ta', 'az', 'mk', 'kn', 'bg', 'fa', 'vi', 'sk', 'cy', 'et', 'lt', 'gl', 'zh-min-nan','yi', 'ht', 'fo', 'ang', ]
Modified: trunk/pywikipedia/families/wiktionary_family.py =================================================================== --- trunk/pywikipedia/families/wiktionary_family.py 2008-02-15 17:00:06 UTC (rev 5025) +++ trunk/pywikipedia/families/wiktionary_family.py 2008-02-15 18:25:03 UTC (rev 5026) @@ -12,10 +12,29 @@ family.Family.__init__(self) self.name = 'wiktionary'
- for lang in self.knownlanguages: - if lang not in ['ee','ht','ny', 'se', 'tum']: - self.langs[lang] = '%s.wiktionary.org' % lang + self.languages_by_size = [ + 'fr', 'en', 'vi', 'tr', 'ru', 'io', 'zh', 'el', 'ar', 'pl', + 'fi', 'it', 'de', 'sv', 'hu', 'pt', 'ku', 'ko', 'id', 'te', + 'es', 'nl', 'ja', 'bg', 'lt', 'vo', 'gl', 'li', 'et', 'sr', + 'fa', 'is', 'ro', 'af', 'scn', 'br', 'sl', 'ta', 'hy', 'zh-min-nan', + 'no', 'he', 'la', 'sq', 'ur', 'da', 'simple', 'ca', 'ast', 'tlh', + 'fy', 'cs', 'uk', 'hr', 'sw', 'oc', 'ang', 'kk', 'ml', 'hi', + 'ia', 'csb', 'co', 'st', 'sk', 'eo', 'kl', 'nds', 'ky', 'ms', + 'sd', 'ug', 'az', 'th', 'ga', 'tt', 'ti', 'gu', 'mk', 'tl', + 'ts', 'fo', 'qu', 'rw', 'cy', 'bs', 'mr', 'su', 'ie', 'chr', + 'an', 'am', 'yi', 'wo', 'kn', 'mn', 'nah', 'gd', 'be', 'pa', + 'lv', 'zu', 'nn', 'km', 'ps', 'mi', 'so', 'dv', 'bn', 'tg', + 'mg', 'ha', 'ka', 'na', 'sa', 'gv', 'tpi', 'ay', 'ss', 'eu', + 'ne', 'jbo', 'uz', 'tn', 'gn', 'as', 'mt', 'ch', 'jv', 'pi', + 'sh', 'lb', 'ks', 'tk', 'iu', 'sg', 'fj', 'als', 'xh', 'ik', + 'kw', 'ln', 'sm', 'si', 'za', 'roa-rup', 'mh', 'ba', 'or', 'sn', + 'ak', 'bh', 'lo', 'bm', 'yo', 'bi', 'to', 'aa', 'av', 'rn', + 'dz', 'tw', 'om', 'ab', 'my', 'wa', 'sc', 'cr', 'bo', 'rm', + ]
+ for lang in self.languages_by_size: + self.langs[lang] = '%s.wiktionary.org' % lang + # Override defaults self.namespaces[2]['pl'] = u'Wikipedysta' self.namespaces[3]['pl'] = u'Dyskusja Wikipedysty' @@ -319,6 +338,7 @@ self.obsolete = { 'dk': 'da', 'jp': 'ja', + 'mo': None, # http://meta.wikimedia.org/wiki/Proposals_for_closing_projects/Closure_of_Mol... 'minnan':'zh-min-nan', 'nb': 'no', 'tokipona': None, @@ -344,18 +364,6 @@ 'simple': self.alphabetic }
- self.languages_by_size = [ - 'en', 'fr', 'vi', 'zh', 'io', 'el', 'pl', 'it', 'de', 'hu', - 'fi', 'nl', 'bg', 'pt', 'ku', 'es', 'gl', 'sr', 'id', 'sv', - 'et', 'ru', 'ko', 'tr', 'ja', 'sl', 'scn', 'fa', 'ar', 'no', - 'la', 'ta', 'zh-min-nan', 'he', 'hy', 'af', 'ro', 'da', 'ang', 'hi', - 'cs', 'sk', 'is', 'uk', 'co', 'ca', 'simple', 'st', 'fy', 'hr', - 'nds', 'csb', 'ky', 'kk', 'ia', 'gu', 'sq', 'sd', 'eo', 'lt', - 'cy', 'vo', 'ml', 'ie', 'th', 'yi', 'mk', 'bs', 'qu', 'am', - 'mr', 'be', 'rw', 'tl', 'eu', 'ms', 'ast', 'an', 'ga', 'pa', - 'nah', 'ha', 'oc' - ] - self.interwiki_on_one_line = ['pl']
self.interwiki_attop = ['pl'] @@ -365,4 +373,3 @@
def shared_image_repository(self, code): return ('commons', 'commons') -