diff --git a/pipeline.py b/pipeline.py index 3ea946d..ac17d3a 100644 --- a/pipeline.py +++ b/pipeline.py @@ -69,8 +69,8 @@ if not WGET_LUA: # # Update this each time you make a non-cosmetic change. # It will be added to the WARC files and reported to the tracker. -VERSION = '20190729.01' -USER_AGENT = 'ArchiveTeam' +VERSION = '20200102.01' +USER_AGENT = 'Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.0; WOW64; Trident/4.0; SLCC1)' TRACKER_ID = 'reddit' TRACKER_HOST = 'tracker.archiveteam.org' @@ -281,7 +281,7 @@ class WgetArgs(object): post_id = self.int_to_str(i) wget_args.extend(['--warc-header', 'reddit-post: {}'.format(post_id)]) wget_args.append('https://www.reddit.com/comments/{}'.format(post_id)) - wget_args.append('https://old.reddit.com/comments/{}'.format(post_id)) + #wget_args.append('https://old.reddit.com/comments/{}'.format(post_id)) else: raise Exception('Unknown item')