Version 20200727.03. Fix handling of video URLs without an extension.

pull/5/head
arkiver 4 years ago
parent 869cdc4e6e
commit 9a6417ecbc

@@ -54,7 +54,7 @@ if not WGET_AT:
#
# Update this each time you make a non-cosmetic change.
# It will be added to the WARC files and reported to the tracker.
-VERSION = '20200727.02'
+VERSION = '20200727.03'
USER_AGENT = 'Archive Team'
TRACKER_ID = 'reddittest'
TRACKER_HOST = 'trackerproxy.meo.ws'

@@ -240,8 +240,11 @@ wget.callbacks.get_urls = function(file, url, is_css, iri)
and not string.match(url, "^https?://out%.reddit%.com/")
and not string.match(url, "^https?://[^%.]*preview%.redd%.it/")
and not string.match(url, "^https?://i%.redd%.it/")
-and not string.match(url, "^https?://v%.redd%.it/[^/]+/[^%.]*%.ts")
-and not string.match(url, "^https?://v%.redd%.it/[^/]+/[^%.]*%.mp4") then
+and not (
+string.match(url, "^https?://v%.redd%.it/")
+and not string.match(url, "%.m3u8")
+and not string.match(url, "%.mpd")
+) then
html = read_file(file)
if string.match(url, "^https?://old%.reddit%.com/api/morechildren$") then
html = string.gsub(html, '\\"', '"')

Loading…
Cancel
Save