import/mediawiki: more improvements

This commit is contained in:
Drew DeVault 2022-07-11 19:30:57 +02:00
parent 5689b79e13
commit 74b26cecfa

View file

@@ -51,6 +51,13 @@ for _, elem in parser:
# Skip this page when its content model is not "wikitext", when it is a
# redirect (page.redirect is set), or when it carries no markup at all.
if (page.model != "wikitext"
or page.redirect is not None
or page.markup is None):
# Clear and drop the current element before skipping to the next one.
# NOTE(review): presumably this releases the parsed element so memory stays
# bounded while streaming a large dump -- confirm against the parser setup.
elem.clear()
del elem
continue
# Skip pages whose title starts with "Wikipedia:" or "Template:".
# NOTE(review): these look like namespace prefixes for non-article pages;
# other prefixed titles are not filtered here -- confirm this is intended.
if (page.title.startswith("Wikipedia:")
or page.title.startswith("Template:")):
# Same cleanup as the skip above: clear and drop the element, then move on.
elem.clear()
del elem
continue
# Parse the page markup and strip the markup code from it, keeping the result
# as `content`.
# NOTE(review): `mw` is presumably mwparserfromhell -- verify against imports.
content = mw.parse(page.markup).strip_code()
# Create a fresh SHA-512 hash object; what is fed into it lies past this view.
sha = hashlib.sha512()