diff --git a/pipeline.py b/pipeline.py index cf47da1..3a2cc28 100644 --- a/pipeline.py +++ b/pipeline.py @@ -59,7 +59,7 @@ if not WGET_AT: # # Update this each time you make a non-cosmetic change. # It will be added to the WARC files and reported to the tracker. -VERSION = '20230614.02' +VERSION = '20230614.03' TRACKER_ID = 'reddit' TRACKER_HOST = 'legacy-api.arpa.li' MULTI_ITEM_SIZE = 40 diff --git a/reddit.lua b/reddit.lua index e71f942..f317c81 100644 --- a/reddit.lua +++ b/reddit.lua @@ -716,7 +716,7 @@ wget.callbacks.write_to_warc = function(url, http_stat) local is_comments_comment = string.match(url["url"], "^https?://www%.reddit%.com/r/[^/]+/comments/[^/]+/comment/[^/]+/") if ( string.match(url["url"], "^https?://[^/]+/svc/") - and string.match(html, 'level%s*=') + and string.match(html, 'level%s*=%s*"') ) or ( string.match(url["url"], "^https?://old%.reddit%.com/r/") and not string.match(html, 'class="live%-timestamp"')