Update custom sites (ld_archive_is)

merge-requests/20/head
magnolia1234 4 months ago
parent 6940c36e25
commit 8e757a520c

@ -1041,7 +1041,7 @@ Additional custom options:
* unhide text amp-page
* redirect to amp-page when paywall(selector)
* load text from json when paywall|article(selector)
* load text from Google webcache when paywall|article(selector)
* load text from archive.is or Google webcache when paywall|article(selector)
* add external link to archive-site when paywall|article(selector)
* remove/unhide elements in dom (optional for dev; check examples)

@ -94,6 +94,8 @@ var ld_json;
var ld_json_next;
// load text from json (link[rel="alternate"][type="application/json"][href])
var ld_json_url;
// load text from archive.is
var ld_archive_is;
// load text from Google webcache
var ld_google_webcache;
// add external link to article
@ -130,6 +132,7 @@ function initSetRules() {
ld_json = {};
ld_json_next = {};
ld_json_url = {};
ld_archive_is = {};
ld_google_webcache = {};
add_ext_link = {};
block_js_custom = [];
@ -341,9 +344,11 @@ function addRules(domain, rule) {
ld_json_next[domain] = rule.ld_json_next;
if (rule.ld_json_url)
ld_json_url[domain] = rule.ld_json_url;
if (rule.ld_archive_is)
ld_archive_is[domain] = rule.ld_archive_is;
if (rule.ld_google_webcache)
ld_google_webcache[domain] = rule.ld_google_webcache;
if (rule.ld_json || rule.ld_json_next || rule.ld_json_url || rule.ld_google_webcache || rule.cs_dompurify)
if (rule.ld_json || rule.ld_json_next || rule.ld_json_url || rule.ld_archive_is || rule.ld_google_webcache || rule.cs_dompurify)
if (!dompurify_sites.includes(domain))
dompurify_sites.push(domain);
if (rule.add_ext_link && rule.add_ext_link_type)
@ -885,6 +890,9 @@ if (typeof browser !== 'object') {
let ld_json_url_domain = matchUrlDomain(Object.keys(ld_json_url), url);
if (ld_json_url_domain)
bg2csData.ld_json_url = ld_json_url[ld_json_url_domain];
let ld_archive_is_domain = matchUrlDomain(Object.keys(ld_archive_is), url);
if (ld_archive_is_domain)
bg2csData.ld_archive_is = ld_archive_is[ld_archive_is_domain];
let ld_google_webcache_domain = matchUrlDomain(Object.keys(ld_google_webcache), url);
if (ld_google_webcache_domain)
bg2csData.ld_google_webcache = ld_google_webcache[ld_google_webcache_domain];

@ -5,6 +5,7 @@ Updates (install signed xpi-file): https://gitlab.com/magnolia1234/bypass-paywal
Post-release
Fix Augsburger-allgemeine.de (Googlebot)
Fix Tribune Publishing Company (js)
Update custom sites (ld_archive_is)
* v3.5.3.0 (2024-01-28)
Add El Nuevo Herald (McClatchy Group)

@ -161,6 +161,21 @@ if (bg2csData.ld_json_url && dompurify_loaded) {
}
}
// custom/updated sites: load text from archive.is
// Rule string layout: 'paywall_sel|article_sel[|article_src_sel[|article_link_sel]]'.
// A rule without any '|' separator is ignored.
if (bg2csData.ld_archive_is && dompurify_loaded && bg2csData.ld_archive_is.includes('|')) {
  // Deferred by one second before calling getArchive.
  window.setTimeout(() => {
    const url = window.location.href;
    const [paywall_sel, article_sel, src_part, link_part] = bg2csData.ld_archive_is.split('|');
    // The third and fourth parts are optional; a missing or empty part falls back to article_sel.
    const article_src_sel = src_part || article_sel;
    const article_link_sel = link_part || article_sel;
    getArchive(url, paywall_sel, '', article_sel, '', article_src_sel, article_link_sel);
  }, 1000);
}
// custom/updated sites: load text from Google webcache
if (bg2csData.ld_google_webcache && dompurify_loaded) {
if (bg2csData.ld_google_webcache.includes('|')) {
@ -169,12 +184,7 @@ if (bg2csData.ld_google_webcache && dompurify_loaded) {
let ld_google_webcache_split = bg2csData.ld_google_webcache.split('|');
let paywall_sel = ld_google_webcache_split[0];
let article_sel = ld_google_webcache_split[1];
let paywall = document.querySelectorAll(paywall_sel);
if (paywall.length) {
removeDOMElement(...paywall);
let url_cache = 'https://webcache.googleusercontent.com/search?q=cache:' + url.split('?')[0];
replaceDomElementExt(url_cache, true, false, article_sel);
}
getGoogleWebcache(url, paywall_sel, '', article_sel);
}, 1000);
}
}

@ -51,5 +51,5 @@
"webRequestBlocking",
"*://*/*"
],
"version": "3.5.3.2"
"version": "3.5.3.3"
}

@ -18,11 +18,12 @@
"block_regex": "\\.acadienouvelle\\.com\\/script\\.js",
"domain": "acadienouvelle.com"
},
"Airmail.news": {
"Airmail.news (refresh)": {
"add_ext_link": "div.paywall-card|div.article-text",
"add_ext_link_type": "archive.is",
"allow_cookies": 1,
"domain": "airmail.news"
"domain": "airmail.news",
"ld_archive_is": "div.paywall-card|div.article-text|div[data-article-target='body']"
},
"Artsprofessional.co.uk": {
"allow_cookies": 1,
@ -386,7 +387,7 @@
"domain": "limerickpost.ie"
},
"Limesonline.com": {
"add_ext_link": "iframe#__limio_frame|div.sommario",
"add_ext_link": "div#account-pw-container|div.story__content",
"add_ext_link_type": "google_search_tool",
"allow_cookies": 1,
"domain": "limesonline.com"
@ -690,7 +691,8 @@
"add_ext_link": "aside.article-paywall|section.article-content",
"add_ext_link_type": "archive.is",
"allow_cookies": 1,
"domain": "suedkurier.de"
"domain": "suedkurier.de",
"ld_archive_is": "aside.article-paywall|main>article"
},
"Supchina.com": {
"allow_cookies": 1,
@ -750,9 +752,9 @@
},
"Thedispatch.com": {
"add_ext_link": "article:not(.newsletter) section.paywall-section|div.content",
"add_ext_link_type": "archive.is",
"allow_cookies": 1,
"domain": "thedispatch.com",
"ld_archive_is": "article:not(.newsletter) section.paywall-section|main>article",
"ld_json_url": "article.newsletter section.paywall-section|div.content|1"
},
"Thedriftmag.com": {
@ -794,7 +796,8 @@
"add_ext_link": "div#ao-MeteringDNAllow|div[class*='-Teaser']",
"add_ext_link_type": "archive.is",
"allow_cookies": 1,
"domain": "thestage.co.uk"
"domain": "thestage.co.uk",
"ld_archive_is": "div#ao-MeteringDNAllow|div[id^='aos-FeatureArticle2Col-']"
},
"Tijorifinance.com": {
"allow_cookies": 1,

@ -840,5 +840,5 @@
"*://archive.vn/*",
"*://webcache.googleusercontent.com/*"
],
"version": "3.5.3.2"
"version": "3.5.3.3"
}

@ -286,6 +286,7 @@ function edit_options() {
document.querySelector('input[data-key="ld_json"]').value = edit_site.ld_json || '';
document.querySelector('input[data-key="ld_json_next"]').value = edit_site.ld_json_next || '';
document.querySelector('input[data-key="ld_json_url"]').value = edit_site.ld_json_url || '';
document.querySelector('input[data-key="ld_archive_is"]').value = edit_site.ld_archive_is || '';
document.querySelector('input[data-key="ld_google_webcache"]').value = edit_site.ld_google_webcache || '';
document.querySelector('input[data-key="add_ext_link"]').value = edit_site.add_ext_link || '';
document.querySelector('select[data-key="add_ext_link_type"]').selectedIndex = add_ext_link_type_options.indexOf(edit_site.add_ext_link_type);
@ -364,6 +365,7 @@ function renderOptions() {
'ld_json': 0,
'ld_json_next': 0,
'ld_json_url': 0,
'ld_archive_is': 0,
'ld_google_webcache': 0,
'add_ext_link': 0,
'add_ext_link_type': 0,
@ -408,6 +410,7 @@ function renderOptions() {
ld_json: 'div.paywall|div.article',
ld_json_next: 'div.paywall|div.article',
ld_json_url: 'div.paywall|div.article',
ld_archive_is: 'div.paywall|div.art|div.art_src|div.art_link',
ld_google_webcache: 'div.paywall|div.article',
add_ext_link: 'div.paywall|div.article',
cs_code: 'for dev: check GitLab examples',
@ -458,6 +461,7 @@ function renderOptions() {
(sites_custom[key]['ld_json'] ? ' | ld_json' : '') +
(sites_custom[key]['ld_json_next'] ? ' | ld_json_next' : '') +
(sites_custom[key]['ld_json_url'] ? ' | ld_json_url' : '') +
(sites_custom[key]['ld_archive_is'] ? ' | ld_archive_is' : '') +
(sites_custom[key]['ld_google_webcache'] ? ' | ld_google_webcache' : '') +
(sites_custom[key]['add_ext_link'] && sites_custom[key]['add_ext_link_type'] ? ' | add_ext_link' : '') +
(sites_custom[key]['cs_code'] ? ' | cs_code' : '');

@ -2996,4 +2996,4 @@ var de_westfalen_medien_nofix_domains = ['muensterschezeitung.de', 'westfalen-bl
var fr_groupe_ebra_nofix_domains = ['bienpublic.com', 'dna.fr', 'estrepublicain.fr', 'lalsace.fr', 'ledauphine.com', 'lejsl.com', 'leprogres.fr', 'republicain-lorrain.fr', 'vosgesmatin.fr'];
var fr_indigo_nofix_domains = ['africaintelligence.com', 'africaintelligence.fr', 'glitz.paris', 'intelligenceonline.com', 'intelligenceonline.fr', 'lalettre.fr'];
var it_gedi_nofix_domains = ['gelocal.it', 'limesonline.com'];
var nofix_sites = ['11freunde.de', 'aamulehti.fi', 'abendblatt.de', 'aftenposten.no', 'aftonbladet.se', 'allgaeuer-zeitung.de', 'asahi.com', 'asiatimes.com', 'autosport.com', 'aviationweek.com', 'badische-zeitung.de', 'bhaskar.com', 'bloomberglaw.com', 'bloombergtax.com', 'bnef.com', 'bnn.de', 'borsen.dk', 'businessinsider.de', 'businessinsider.jp', 'businesslive.co.za', 'businesstimes.com.sg', 'caixin.com', 'caixinglobal.com', 'caravanmagazine.in', 'catalyst-journal.com', 'chegg.com', 'codesports.com.au', 'compactmag.com', 'courrierinternational.com', 'coursehero.com', 'deutsche-wirtschafts-nachrichten.de', 'die-glocke.de', 'dn.no', 'dn.se', 'elordenmundial.com', 'entrepreneur.com', 'epw.in', 'expresso.pt', 'falter.at', 'finance.si', 'franc-tireur.fr', 'ftchinese.com', 'ftchineselive.com', 'gamestar.de', 'geo.de', 'golem.de', 'gp.se', 'gva.be', 'handelsblatt.com', 'hbrarabic.com', 'hbrchina.org', 'hbrfrance.fr', 'heise.de', 'hs.fi', 'ilsole24ore.com', 'information.dk', 'investors.com', 'iltalehti.fi', 'jacobin.com', 'jeuneafrique.com', 'jungefreiheit.de', 'kleinezeitung.at', 'laverita.info', 'lavie.fr', 'lavozdegalicia.es', 'law360.co.uk', 'law360.com', 'le1hebdo.fr', 'leconomiste.com', 'lefilmfrancais.com', 'lemonde.fr', 'lequipe.fr', 'lesjours.fr', 'letemps.ch', 'liberation.fr', 'main-echo.de', 'mainpost.de', 'manager-magazin.de', 'medianama.com', 'mediapart.fr', 'milanofinanza.it', 'mittelbayerische.de', 'monde-diplomatique.fr', 'mondediplo.com', 'money.it', 'moneycontrol.com', 'moodys.com', 'morningstar.com', 'motorsport.com', 'moz.de', 'nachrichten.at', 'nationaljournal.com', 'nature.com', 'nbr.co.nz', 'news24.com', 'newslaundry.com', 'nn.de', 'nwzonline.de', 'observador.pt', 'ouest-france.fr', 'philonomist.com', 'pnp.de', 'politicopro.com', 'politiken.dk', 'pressreader.com', 'publico.pt', 'quillette.com', 'rbc.ru', 'republic.ru', 'rheinpfalz.de', 'risk.net', 'rnz.de', 'saechsische.de', 'sciencedirect.com', 'springer.com', 'statnews.com', 'stern.de', 
'stimme.de', 'straitstimes.com', 'streetinsider.com', 'substack.com', 'suedkurier.de', 'swp.de', 'taxation.co.uk', 'taxjournal.com', 'techcrunch.com', 'the-ken.com', 'theinformation.com', 'theinitium.com', 'themorningcontext.com', 'theparisreview.org', 'thestar.com.my', 'thewirechina.com', 'weltwoche.ch', 'weltwoche.de', 'wissenschaft.de', 'worldpoliticsreview.com', 'wz.de', 'ynet.co.il'].concat(de_funke_medien_nofix_domains, de_rp_aachen_medien_nofix_domains, de_westfalen_medien_nofix_domains, fr_groupe_ebra_nofix_domains, fr_indigo_nofix_domains, it_gedi_nofix_domains);
var nofix_sites = ['11freunde.de', 'aamulehti.fi', 'abendblatt.de', 'aftenposten.no', 'aftonbladet.se', 'allgaeuer-zeitung.de', 'asahi.com', 'asiatimes.com', 'autosport.com', 'aviationweek.com', 'badische-zeitung.de', 'bhaskar.com', 'bloomberglaw.com', 'bloombergtax.com', 'bnef.com', 'bnn.de', 'borsen.dk', 'businessinsider.de', 'businessinsider.jp', 'businesslive.co.za', 'businesstimes.com.sg', 'caixin.com', 'caixinglobal.com', 'caravanmagazine.in', 'catalyst-journal.com', 'chegg.com', 'codesports.com.au', 'compactmag.com', 'courrierinternational.com', 'coursehero.com', 'deutsche-wirtschafts-nachrichten.de', 'die-glocke.de', 'dn.no', 'dn.se', 'elordenmundial.com', 'entrepreneur.com', 'epw.in', 'expresso.pt', 'falter.at', 'finance.si', 'franc-tireur.fr', 'ftchinese.com', 'ftchineselive.com', 'gamestar.de', 'geo.de', 'golem.de', 'gp.se', 'gva.be', 'handelsblatt.com', 'hbrarabic.com', 'hbrchina.org', 'hbrfrance.fr', 'heise.de', 'hs.fi', 'ilsole24ore.com', 'information.dk', 'investors.com', 'iltalehti.fi', 'jacobin.com', 'jeuneafrique.com', 'jungefreiheit.de', 'kleinezeitung.at', 'laverita.info', 'lavie.fr', 'lavozdegalicia.es', 'law360.co.uk', 'law360.com', 'le1hebdo.fr', 'leconomiste.com', 'lefilmfrancais.com', 'lemonde.fr', 'lequipe.fr', 'lesjours.fr', 'letemps.ch', 'liberation.fr', 'libertiesjournal.com', 'main-echo.de', 'mainpost.de', 'manager-magazin.de', 'medianama.com', 'mediapart.fr', 'milanofinanza.it', 'mittelbayerische.de', 'monde-diplomatique.fr', 'mondediplo.com', 'money.it', 'moneycontrol.com', 'moodys.com', 'morningstar.com', 'motorsport.com', 'moz.de', 'nachrichten.at', 'nationaljournal.com', 'nature.com', 'nbr.co.nz', 'newcriterion.com', 'news24.com', 'newslaundry.com', 'nn.de', 'nwzonline.de', 'observador.pt', 'ouest-france.fr', 'philonomist.com', 'pnp.de', 'politicopro.com', 'politiken.dk', 'pressreader.com', 'publico.pt', 'quillette.com', 'rbc.ru', 'republic.ru', 'rheinpfalz.de', 'risk.net', 'rnz.de', 'saechsische.de', 'sciencedirect.com', 
'springer.com', 'statnews.com', 'stern.de', 'stimme.de', 'straitstimes.com', 'streetinsider.com', 'substack.com', 'suedkurier.de', 'swp.de', 'taxation.co.uk', 'taxjournal.com', 'techcrunch.com', 'the-ken.com', 'theinformation.com', 'theinitium.com', 'themorningcontext.com', 'theparisreview.org', 'thestar.com.my', 'thewirechina.com', 'weltwoche.ch', 'weltwoche.de', 'wissenschaft.de', 'worldpoliticsreview.com', 'wz.de', 'ynet.co.il'].concat(de_funke_medien_nofix_domains, de_rp_aachen_medien_nofix_domains, de_westfalen_medien_nofix_domains, fr_groupe_ebra_nofix_domains, fr_indigo_nofix_domains, it_gedi_nofix_domains);

Loading…
Cancel
Save