Merge pull request #302 from nemobis/master

Wikia dumps now use 7z, not gz
pull/287/merge
nemobis 6 years ago committed by GitHub
commit f33f316500
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

@ -55,16 +55,16 @@ def main():
print dbname
first = dbname[0]
# There are one-letter dbnames; the second letter is replaced by an underscore
# http://s3.amazonaws.com/wikia_xml_dumps/n/n_/n_pages_full.xml.gz
# http://s3.amazonaws.com/wikia_xml_dumps/n/n_/n_pages_full.xml.7z
try:
second = dbname[1]
except:
second = '_'
base = 'http://s3.amazonaws.com/wikia_xml_dumps/' + first + '/' \
+ first + second + '/' + dbname
full = base + '_pages_full.xml.gz'
full = base + '_pages_full.xml.7z'
print full
current = base + '_pages_current.xml.gz'
current = base + '_pages_current.xml.7z'
images = base + '_images.tar'
try:
#subprocess.check_call(['wget', '-e', 'robots=off', '--fail', '-nc', '-a', 'wikia.log', full])

Loading…
Cancel
Save