From 74b26cecfabdf5006478a940a2b2727c1f5c55e1 Mon Sep 17 00:00:00 2001
From: Drew DeVault
Date: Mon, 11 Jul 2022 19:30:57 +0200
Subject: [PATCH] import/mediawiki: more improvements

---
 import/mediawiki/main.py | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/import/mediawiki/main.py b/import/mediawiki/main.py
index bf98102..73023f7 100644
--- a/import/mediawiki/main.py
+++ b/import/mediawiki/main.py
@@ -51,6 +51,13 @@ for _, elem in parser:
     if (page.model != "wikitext"
             or page.redirect is not None
             or page.markup is None):
+        elem.clear()
+        del elem
+        continue
+    if (page.title.startswith("Wikipedia:")
+            or page.title.startswith("Template:")):
+        elem.clear()
+        del elem
         continue
     content = mw.parse(page.markup).strip_code()
     sha = hashlib.sha512()