Version 20200727.01. Use trackerproxy for dictionaries. Ignore irc: URLs.

pull/5/head
arkiver 4 years ago
parent 910687b053
commit 147c6416ed

@@ -54,9 +54,9 @@ if not WGET_AT:
#
# Update this each time you make a non-cosmetic change.
# It will be added to the WARC files and reported to the tracker.
-VERSION = '20200726.06'
+VERSION = '20200727.01'
USER_AGENT = 'Archive Team'
-TRACKER_ID = 'reddittest'
+TRACKER_ID = 'reddit'
TRACKER_HOST = 'trackerproxy.meo.ws'
@@ -161,7 +161,7 @@ class ZstdDict(object):
if cls.data is not None and time.time() - cls.created < 1800:
return cls.data
response = requests.get(
-'http://tracker.archiveteam.org:25654/dictionary',
+'http://trackerproxy.meo.ws:25654/dictionary',
params={
'project': 'reddit'
}

@@ -217,6 +217,7 @@ wget.callbacks.get_urls = function(file, url, is_css, iri)
or string.match(newurl, "^android%-app:")
or string.match(newurl, "^ios%-app:")
or string.match(newurl, "^data:")
+or string.match(newurl, "^irc:")
or string.match(newurl, "^%${")) then
check(string.match(url, "^(https?://.+/)") .. newurl)
end

Loading…
Cancel
Save