Version 20200821.01. Ignore comment URL with utm_source param.

pull/5/head
arkiver 4 years ago
parent ace1a4f037
commit 2087174a5c

@@ -54,7 +54,7 @@ if not WGET_AT:
#
# Update this each time you make a non-cosmetic change.
# It will be added to the WARC files and reported to the tracker.
-VERSION = '20200805.01'
+VERSION = '20200821.01'
USER_AGENT = 'Archive Team'
TRACKER_ID = 'reddittest'
TRACKER_HOST = 'trackerproxy.meo.ws'

@@ -86,7 +86,10 @@ allowed = function(url, parenturl)
)
or (
item_type == "posts"
-and string.match(url, "^https?://[^/]*reddit%.com/r/[^/]+/comments/[0-9a-z]+/[^/]+/[0-9a-z]+/?$")
+and (
+string.match(url, "^https?://[^/]*reddit%.com/r/[^/]+/comments/[0-9a-z]+/[^/]+/[0-9a-z]+/?$")
+or string.match(url, "^https?://[^/]*reddit%.com/r/[^/]+/comments/[0-9a-z]+/[^/]+/[0-9a-z]+/?%?utm_source=")
+)
)
or (
parenturl

Loading…
Cancel
Save