Xqt has submitted this change. ( https://gerrit.wikimedia.org/r/c/pywikibot/core/+/1277442?usp=email )
Change subject: Fix: Add Devanagari numerals to NON_ASCII_DIGITS
......................................................................
Fix: Add Devanagari numerals to NON_ASCII_DIGITS
Also fix timeznR in textlib.TimeStripper to match any
timezone, not only ASCII abbreviations like CEST|UTC, so that
special timezones like नेपाली समय can be found.
The regex change also solves the expected failure for
ar-wiki in TestArchiveBot.test_archivebot.
Bug: T424467
Change-Id: I84b5bc468406a90aa99e501a30f005b24b22f4e5
Signed-off-by: Xqt <info(a)gno.de>
---
M pywikibot/textlib.py
M pywikibot/userinterfaces/transliteration.py
M tests/archivebot_tests.py
3 files changed, 5 insertions(+), 16 deletions(-)
Approvals:
Xqt: Verified; Looks good to me, approved
jenkins-bot: Verified
diff --git a/pywikibot/textlib.py b/pywikibot/textlib.py
index 269f43e..0186bbe 100644
--- a/pywikibot/textlib.py
+++ b/pywikibot/textlib.py
@@ -2261,7 +2261,7 @@
timeR = (r'(?P<time>(?P<hour>([0-1]\d|2[0-3]))[:\.h]'
r'(?P<minute>[0-5]\d))')
- timeznR = r'\((?P<tzinfo>[A-Z]+)\)'
+ timeznR = r'\((?P<tzinfo>[^(){}\[\]:;#\t\n\r\f\v+-]+)\)'
yearR = r'(?P<year>(19|20)\d\d)(?:{})?'.format('\ub144')
# if months have 'digits' as names, they need to be
# removed; will be handled as digits in regex, adding d+{1,2}\.?
diff --git a/pywikibot/userinterfaces/transliteration.py b/pywikibot/userinterfaces/transliteration.py
index 7d1c38d..779370e 100644
--- a/pywikibot/userinterfaces/transliteration.py
+++ b/pywikibot/userinterfaces/transliteration.py
@@ -24,6 +24,7 @@
'kn': '೦೧೨೩೪೫೬೭೮೯',
'lo': '໐໑໒໓໔໕໖໗໘໙',
'ml': '൦൧൨൩൪൫൬൭൮൯',
+ 'ne': '०१२३४५६७८९',
'or': '୦୧୨୩୪୫୬୭୮୯',
'pa': '੦੧੨੩੪੫੬੭੮੯',
'te': '౦౧౨౩౪౫౬౭౮౯',
diff --git a/tests/archivebot_tests.py b/tests/archivebot_tests.py
index 7680ec6..088c3cd 100755
--- a/tests/archivebot_tests.py
+++ b/tests/archivebot_tests.py
@@ -121,7 +121,9 @@
sites = {code: {'family': 'wikipedia', 'code': code} for code in THREADS}
cached = True
- expected_failures = ['ar', 'scn', 'th']
+ expected_failures = ['scn', 'th']
+ # FIXME: see TestArchiveBotAfterDateUpdate()
+ # 'th': year is 2552 while regex assumes 19..|20.., might be fixed
def test_archivebot(self, code=None) -> None:
"""Test archivebot for one site."""
@@ -153,20 +155,6 @@
self.assertIsInstance(thread.content, str)
self.assertIsInstance(thread.timestamp, datetime)
- # FIXME: see TestArchiveBotAfterDateUpdate()
- # 'ar': Uses Arabic acronym for TZ
- # 'eo': changed month name setting in wiki from Sep to sep
- # Localisation updates from https://translatewiki.net.
- # Change-Id: I3d9b14ae3a5d77fea9694ef113b0180e5677c39e
- # ref: mediawiki languages/i18n/eo.json
- # for new entries it should work
- # 'pdc': changed month name setting in wiki over time (?)
- # in old posts in talk page, February is "Feb.", site message gives
- # <message name="feb" xml:space="preserve">Han.</message>.
- # for new entries it should work
- # 'th': year is 2552 while regex assumes 19..|20.., might be fixed
- # 'uz': changed month name for October (T370501)
-
class TestArchiveBotAfterDateUpdate(TestCase):
--
To view, visit https://gerrit.wikimedia.org/r/c/pywikibot/core/+/1277442?usp=email
To unsubscribe, or for help writing mail filters, visit https://gerrit.wikimedia.org/r/settings?usp=email
Gerrit-MessageType: merged
Gerrit-Project: pywikibot/core
Gerrit-Branch: master
Gerrit-Change-Id: I84b5bc468406a90aa99e501a30f005b24b22f4e5
Gerrit-Change-Number: 1277442
Gerrit-PatchSet: 11
Gerrit-Owner: Xqt <info(a)gno.de>
Gerrit-Reviewer: Saroj <Sarojoffl(a)gmail.com>
Gerrit-Reviewer: Thiemo Kreuz (WMDE) <thiemo.kreuz(a)wikimedia.de>
Gerrit-Reviewer: Xqt <info(a)gno.de>
Gerrit-Reviewer: jenkins-bot
jenkins-bot has submitted this change. ( https://gerrit.wikimedia.org/r/c/pywikibot/i18n/+/1277524?usp=email )
Change subject: Localisation updates from https://translatewiki.net.
......................................................................
Localisation updates from https://translatewiki.net.
Change-Id: I1713dc56bc23d9c9d37b32621b19f5b866701873
---
M delete/be-tarask.json
M delete/frp.json
M tracking_param_remover/ko.json
M weblinkchecker/be-tarask.json
M weblinkchecker/sv.json
5 files changed, 8 insertions(+), 3 deletions(-)
Approvals:
L10n-bot: Looks good to me, approved
jenkins-bot: Verified
diff --git a/delete/be-tarask.json b/delete/be-tarask.json
index fa96983..68a3f19 100644
--- a/delete/be-tarask.json
+++ b/delete/be-tarask.json
@@ -2,9 +2,11 @@
"@metadata": {
"authors": [
"EugeneZelenko",
- "Red Winged Duck"
+ "Red Winged Duck",
+ "Ucukor"
]
},
+ "delete-broken-redirect": "Робат: Выдаленьне перанакіроўваньня на выдаленую старонку %(page)s",
"delete-from-category": "Робат: выдаліў усе старонкі з катэгорыі %(page)s",
"delete-from-file": "Робат: выдаленьне сьпісу старонак.",
"delete-images": "Робат: выдаліў усе выявы на старонцы %(page)s",
diff --git a/delete/frp.json b/delete/frp.json
index 7d11dbb..bcaa0b4 100644
--- a/delete/frp.json
+++ b/delete/frp.json
@@ -5,6 +5,7 @@
"L'Arpetani"
]
},
+ "delete-broken-redirect": "Robot: Suprimar la redirèccion vèrs la pâge suprimâye %(page)s",
"delete-from-category": "Robot : suprime totes les pâges de la catègorie %(page)s",
"delete-from-file": "Robot : suprèssion d’una lista de pâges.",
"delete-images": "Robot : suprime totes les émâges sur la pâge %(page)s",
diff --git a/tracking_param_remover/ko.json b/tracking_param_remover/ko.json
index 12805ca..68dbce8 100644
--- a/tracking_param_remover/ko.json
+++ b/tracking_param_remover/ko.json
@@ -1,6 +1,7 @@
{
"@metadata": {
"authors": [
+ "Tensama0415",
"YeBoy371"
]
},
diff --git a/weblinkchecker/be-tarask.json b/weblinkchecker/be-tarask.json
index 000ae1f..445ec58 100644
--- a/weblinkchecker/be-tarask.json
+++ b/weblinkchecker/be-tarask.json
@@ -7,7 +7,7 @@
]
},
"weblinkchecker-archive_msg": "Ўэб-старонка была захаваная ў інтэрнэт архіве. Калі ласка, карыстайцеся спасылкай на адпаведную архіўную вэрсію: [%(URL)s].",
- "weblinkchecker-badurl": "Падобна, што пададзеная спасылка не зьяўляецца слушным URL-адрасам",
+ "weblinkchecker-badurl": "Падобна, што пададзеная спасылка не зьяўляецца слушным URL-адрасам: [%(URL)s]",
"weblinkchecker-caption": "Нядзейная спасылка",
"weblinkchecker-report": "Цягам колькіх праверак робат выявіў, што наступная вонкавая спасылка не працуе. Калі ласка, спраўдзіце спасылку і, калі яна сапраўды не працуе, выпраўце або прыбярыце яе!",
"weblinkchecker-summary": "Робат: Знойдзеная няслушная вонкавая спасылка"
diff --git a/weblinkchecker/sv.json b/weblinkchecker/sv.json
index 0b8249b..05b733b 100644
--- a/weblinkchecker/sv.json
+++ b/weblinkchecker/sv.json
@@ -3,11 +3,12 @@
"authors": [
"Jopparn",
"Lokal Profil",
+ "Sabelöga",
"Tor.klingberg"
]
},
"weblinkchecker-archive_msg": "Webbsidan har sparats av Internet Archive. Överväg att länka till en lämplig arkiverad version: [%(URL)s].",
- "weblinkchecker-badurl": "Den angedda länken verkar inte vara en giltig URL",
+ "weblinkchecker-badurl": "Den angivna länken verkar inte vara en giltig URL: [%(URL)s]",
"weblinkchecker-caption": "Död länk",
"weblinkchecker-report": "Följande externa länk har inte kunnat nås under flera försök av en automatisk bot. Var vänlig kontrollera om länken faktiskt är nere, och korrigera eller ta bort den i så fall.",
"weblinkchecker-summary": "Bot: Rapporterar otillgänglig extern länk"
--
To view, visit https://gerrit.wikimedia.org/r/c/pywikibot/i18n/+/1277524?usp=email
To unsubscribe, or for help writing mail filters, visit https://gerrit.wikimedia.org/r/settings?usp=email
Gerrit-MessageType: merged
Gerrit-Project: pywikibot/i18n
Gerrit-Branch: master
Gerrit-Change-Id: I1713dc56bc23d9c9d37b32621b19f5b866701873
Gerrit-Change-Number: 1277524
Gerrit-PatchSet: 1
Gerrit-Owner: L10n-bot <l10n-bot(a)translatewiki.net>
Gerrit-Reviewer: L10n-bot <l10n-bot(a)translatewiki.net>
Gerrit-Reviewer: jenkins-bot
Xqt has submitted this change. ( https://gerrit.wikimedia.org/r/c/pywikibot/core/+/1275263?usp=email )
Change subject: IMPR: load allpages with content flag
......................................................................
IMPR: load allpages with content flag
Also show a dot after every 100 processed pages.
Bug: T423836
Change-Id: I150d24b8f779f5caeae5346b5c27922aaf4aee79
---
M scripts/parser_function_count.py
1 file changed, 8 insertions(+), 11 deletions(-)
Approvals:
Xqt: Verified; Looks good to me, approved
diff --git a/scripts/parser_function_count.py b/scripts/parser_function_count.py
index 6c74556..9296ae4 100755
--- a/scripts/parser_function_count.py
+++ b/scripts/parser_function_count.py
@@ -116,8 +116,8 @@
@property
def generator(self):
"""Generator."""
- gen = self.site.allpages(start=self.opt.start,
- namespace=10, filterredir=False)
+ gen = self.site.allpages(start=self.opt.start, namespace=10,
+ filterredir=False, content=True)
if self.site.doc_subpage:
gen = pagegenerators.RegexFilterPageGenerator(
gen, self.site.doc_subpage, quantifier='none')
@@ -125,8 +125,7 @@
def setup(self) -> None:
"""Setup magic words, regex and result counter."""
- pywikibot.info('Hold on, this will need some time. '
- 'You will be notified by 50 templates.')
+ pywikibot.info('Hold on, this will need some time.')
magicwords = []
for magic_word in self.site.siteinfo['magicwords']:
magicwords += magic_word['aliases']
@@ -135,17 +134,14 @@
def treat(self, page) -> None:
"""Process a single template."""
- title = page.title()
- if (self.counter['read'] + 1) % 50 == 0:
+ if self.counter['read'] % 100 == 0:
# Don't let the poor user panic in front of a black screen.
- pywikibot.info('{}th template is being processed: {}'
- .format(self.counter['read'] + 1, title))
+ pywikibot.info('.', newline=False)
- text = page.text
- functions = self.regex.findall(text)
+ functions = self.regex.findall(page.text)
if functions and (self.opt.atleast is None
or self.opt.atleast <= len(functions)):
- self.results[title] = len(functions)
+ self.results[page.title()] = len(functions)
if self.opt.nosort and self.opt.first \
and len(self.results) >= self.opt.first:
@@ -157,6 +153,7 @@
f'# [[{result[0]}]] ({result[1]})'
for result in self.results.most_common(self.opt.first))
+ pywikibot.info()
pywikibot.info(resultlist)
pywikibot.info(f'{len(self.results)} templates were found.')
--
To view, visit https://gerrit.wikimedia.org/r/c/pywikibot/core/+/1275263?usp=email
To unsubscribe, or for help writing mail filters, visit https://gerrit.wikimedia.org/r/settings?usp=email
Gerrit-MessageType: merged
Gerrit-Project: pywikibot/core
Gerrit-Branch: master
Gerrit-Change-Id: I150d24b8f779f5caeae5346b5c27922aaf4aee79
Gerrit-Change-Number: 1275263
Gerrit-PatchSet: 2
Gerrit-Owner: Xqt <info(a)gno.de>
Gerrit-Reviewer: Xqt <info(a)gno.de>
Gerrit-Reviewer: jenkins-bot