From 7a655f0074ca1ef8cf7a3c337f0b9f378ebf5a55 Mon Sep 17 00:00:00 2001 From: Federico Leva Date: Tue, 22 May 2018 09:33:53 +0300 Subject: [PATCH] Check for sha1 presence in makeXmlFromPage() --- dumpgenerator.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/dumpgenerator.py b/dumpgenerator.py index 7aecf46..6eac8f5 100755 --- a/dumpgenerator.py +++ b/dumpgenerator.py @@ -894,10 +894,12 @@ def makeXmlFromPage(page): ), E.comment(rev['comment']), E.text(rev['*'], space="preserve", bytes=to_unicode(rev['size'])), - E.sha1(rev['sha1']), ) if 'contentmodel' in rev: - revision.append(E.model) + revision.append(E.model(rev['contentmodel'])) + # The sha1 may not have been backfilled on older wikis or may be missing for other reasons (Wikia). + if 'sha1' in rev: + revision.append(E.sha1(rev['sha1'])) p.append(revision) return etree.tostring(p, pretty_print=True)