Add Correio & Gazeta do Povo

merge-requests/17/head
magnolia1234 7 months ago
parent a7e0b36800
commit 642ece39c5

@ -955,10 +955,12 @@ Grouped in options:\
##### Brazil
[CartaCapital](https://www.cartacapital.com.br) -
[Correio do Povo](https://www.correiodopovo.com.br) -
[Crusoé](https://crusoe.com.br) -
[Estado de Minas](https://www.em.com.br) -
[Exame](https://exame.com) -
[GaúchaZH](https://gauchazh.clicrbs.com.br) -
[Gazeta do Povo](https://www.gazetadopovo.com.br) -
[Grupo Abril](https://grupoabril.com.br) -
[O Estado de S. Paulo](https://estadao.com.br) -
[O Globo](https://oglobo.globo.com) -

@ -4,6 +4,8 @@ Updates (install signed xpi-file): https://gitlab.com/magnolia1234/bypass-paywal
Post-release
Add 3 more Hearst newspapers
Add Correiodopovo.com.br
Add Gazetadopovo.com.br
Add Ikz-online.de (Funke)
Remove Braunschweiger-zeitung.de (Funke; fix obsolete)
Fix Defector

@ -763,10 +763,9 @@ else if (matchDomain('faz.net')) {
let paywall = document.querySelector('#paywall-form-container-outer, section.atc-ContainerPaywall');
if (paywall) {
removeDOMElement(paywall);
let url = new URL(window.location.href);
let mUrl = new URL(url.pathname, 'https://m.faz.net/');
let url_mobile = 'https://m.faz.net' + window.location.pathname;
try {
fetch(mUrl)
fetch(url_mobile)
.then(response => {
if (response.ok) {
response.text().then(html => {
@ -786,7 +785,7 @@ else if (matchDomain('faz.net')) {
if (json_text && article_text) {
let pars = article_text.querySelectorAll('p.atc-TextParagraph');
removeDOMElement(...pars);
json_text = breakText_faz(json_text).split("\n\n");
json_text = breakText_headers(json_text).split("\n\n");
for (let p_text of json_text) {
let elem;
if (p_text.length < 80) {
@ -869,15 +868,17 @@ else if (matchDomain('freitag.de')) {
if (json_script) {
let json = JSON.parse(json_script.text);
if (json) {
let json_text = breakText(json.articleBody);
let json_text = breakText_headers(json.articleBody);
let pars = json_text.split(/\n\n/g);
if (json_text) {
removeDOMElement(...intro);
let article_new = document.createElement('div');
for (let par of pars) {
let par_new = document.createElement('p');
par_new.innerText = par;
article_new.appendChild(par_new);
if (!par.startsWith('Placeholder ')) {
let par_new = document.createElement('p');
par_new.innerText = par;
article_new.appendChild(par_new);
}
}
article.appendChild(article_new);
}
@ -886,7 +887,7 @@ else if (matchDomain('freitag.de')) {
let hidden_article = document.querySelector('div.o-paywall');
if (hidden_article) {
let par_first = true;
let pars = breakText(hidden_article.innerText).split(/\n\n/g);
let pars = breakText_headers(hidden_article.innerText).split(/\n\n/g);
for (let par of pars) {
let par_new = document.createElement('p');
let overlap = '';
@ -1096,7 +1097,7 @@ else if (matchDomain('nwzonline.de')) {
if (json_script) {
let json = JSON.parse(json_script.text);
if (json) {
let json_text = breakText(parseHtmlEntities(json.articleBody));
let json_text = breakText_headers(parseHtmlEntities(json.articleBody));
let content = document.querySelector('div.article-body');
if (json_text && content) {
content.innerHTML = '';
@ -3408,21 +3409,15 @@ else if (matchDomain('gauchazh.clicrbs.com.br')) {
hideDOMElement(...ads);
}
else if (matchDomain('ladiaria.com.uy')) {
if (window.location.search.startsWith('?display=amp')) {
csDoneOnce = true;
ampToHtml();
else if (matchDomain('gazetadopovo.com.br')) {
if (window.location.pathname.endsWith('/amp/')) {
amp_unhide_subscr_section('div.ads-amp, amp-embed', false);
} else {
let banners = document.querySelectorAll('div.softwall, div.subscribe-notice');
removeDOMElement(...banners);
let ads = document.querySelectorAll('div.c-ads');
hideDOMElement(...ads);
}
}
else if (matchDomain('latercera.com')) {
let subscr_banner = document.querySelector('.empty');
removeDOMElement(subscr_banner);
}
else if (matchDomain('globo.com')) {
if (matchDomain('valor.globo.com')) {
if (!window.location.pathname.startsWith('/google/amp/')) {
@ -3446,6 +3441,21 @@ else if (matchDomain('globo.com')) {
}
}
else if (matchDomain('ladiaria.com.uy')) {
if (window.location.search.startsWith('?display=amp')) {
csDoneOnce = true;
ampToHtml();
} else {
let banners = document.querySelectorAll('div.softwall, div.subscribe-notice');
removeDOMElement(...banners);
}
}
else if (matchDomain('latercera.com')) {
let subscr_banner = document.querySelector('.empty');
removeDOMElement(subscr_banner);
}
else if (matchDomain('revistaoeste.com')) {
if (window.location.pathname.startsWith('/revista/')) {
let intro = document.querySelector('div.is-locked');
@ -6236,16 +6246,17 @@ function findOverlap(a, b) {
return findOverlap(a, b.substring(0, b.length - 1));
}
function breakText(str) {
function breakText(str, headers = false) {
str = str.replace(/(?:^|[A-Za-z\"\“\)])(\.|\?|!)(?=[A-ZÖÜ\„\d][A-Za-zÀ-ÿ\„\d]{1,})/gm, "$&\n\n");
str = str.replace(/(([a-z]{2,}|[\"\“]))(?=[A-Z](?=[A-Za-zÀ-ÿ]+))/gm, "$&\n\n");
if (headers)
str = str.replace(/(([a-z]{2,}|[\"\“]))(?=[A-Z](?=[A-Za-zÀ-ÿ]+))/gm, "$&\n\n");
return str;
}
function breakText_faz(str) {
str = breakText(str);
function breakText_headers(str) {
str = breakText(str, true);
// exceptions: names with alternating lower/uppercase (no general fix)
let str_rep_arr = ['AstraZeneca', 'BaFin', 'BerlHG', 'BfArM', 'BilMoG', 'BioNTech', 'ChatGPT', 'DiGA', 'EuGH', 'FinTechRat', 'GlaxoSmithKline', 'IfSG', 'medRxiv', 'mmHg', 'OpenAI', 'PlosOne', 'StVO'];
let str_rep_arr = ['AstraZeneca', 'BaFin', 'BerlHG', 'BfArM', 'BilMoG', 'BioNTech', 'ChatGPT', 'DiGA', 'EuGH', 'FinTechRat', 'GlaxoSmithKline', 'IfSG', 'medRxiv', 'mmHg', 'OpenAI', 'PlosOne', 'StVO', 'TikTok'];
let str_rep_split;
let str_rep_src;
for (let str_rep of str_rep_arr) {

@ -51,5 +51,5 @@
"webRequestBlocking",
"*://*/*"
],
"version": "3.4.4.6"
"version": "3.4.4.7"
}

@ -134,11 +134,6 @@
"Connexionfrance.com": {
"domain": "connexionfrance.com"
},
"Correiodopovo.com.br": {
"allow_cookies": 1,
"block_regex": "paywall\\.correiodopovo\\.com\\.br",
"domain": "correiodopovo.com.br"
},
"Dailyherald.com": {
"allow_cookies": 1,
"block_regex": "\\.tinypass\\.com",
@ -254,12 +249,6 @@
"block_regex": "js\\.pelcro\\.com",
"domain": "frieze.com"
},
"Gazetadopovo.com.br": {
"allow_cookies": 1,
"amp_unhide": 1,
"block_regex": "\\.tinypass\\.com",
"domain": "gazetadopovo.com.br"
},
"Gazetaprawna.pl": {
"allow_cookies": 1,
"amp_redirect": "div.displayMode_simplePaywall",

@ -163,6 +163,7 @@
"*://*.commercialappeal.com/*",
"*://*.computerweekly.com/*",
"*://*.connaissancedesarts.com/*",
"*://*.correiodopovo.com.br/*",
"*://*.corriere.it/*",
"*://*.corriereadriatico.it/*",
"*://*.corrieredellosport.it/*",
@ -280,6 +281,7 @@
"*://*.ft.com/*",
"*://*.ftm.eu/*",
"*://*.ftm.nl/*",
"*://*.gazetadopovo.com.br/*",
"*://*.gazzetta.it/*",
"*://*.geelongadvertiser.com.au/*",
"*://*.gelderlander.nl/*",
@ -824,5 +826,5 @@
"*://*.wyleex.com/*",
"*://webcache.googleusercontent.com/*"
],
"version": "3.4.4.6"
"version": "3.4.4.7"
}

@ -407,6 +407,11 @@ var defaultSites = {
domain: "cmjornal.pt",
allow_cookies: 1
},
"Correio do Povo": {
domain: "correiodopovo.com.br",
allow_cookies: 1,
block_regex: /(paywall\.correiodopovo\.com\.br|cdn\.ampproject\.org\/v\d\/amp-access-.+\.js)/
},
"Corriere della Sera": {
domain: "corriere.it",
allow_cookies: 1,
@ -768,6 +773,11 @@ var defaultSites = {
allow_cookies: 1,
block_regex: /(\.piano\.io\/api\/tinypass\.min\.js|\.clicrbs\.com\.br\/paywall-api\/count\/)/
},
"Gazeta do Povo": {
domain: "gazetadopovo.com.br",
allow_cookies: 1,
block_regex: /(\.tinypass\.com\/|cdn\.cxense\.com\/|cdn\.ampproject\.org\/v\d\/amp-subscriptions-.+\.js)/
},
"Glassdoor (regwall)": {
domain: "glassdoor.com"
},
@ -2911,4 +2921,4 @@ var de_rp_aachen_medien_nofix_domains = ['aachener-nachrichten.de', 'aachener-ze
var fr_indigo_nofix_domains = ['africaintelligence.com', 'africaintelligence.fr', 'glitz.paris', 'intelligenceonline.com', 'intelligenceonline.fr', 'lalettre.fr'];
var it_gedi_nofix_domains = ['gelocal.it', 'huffingtonpost.it', 'limesonline.com'];
var nl_mediahuis_region_nofix_domains = ['gooieneemlander.nl', 'haarlemsdagblad.nl', 'ijmuidercourant.nl', 'leidschdagblad.nl', 'noordhollandsdagblad.nl'];
var nofix_sites = ['aamulehti.fi', 'aftenposten.no', 'aftonbladet.se', 'allgaeuer-zeitung.de', 'asahi.com', 'asiatimes.com', 'autosport.com', 'aviationweek.com', 'badische-zeitung.de', 'bild.de', 'bloomberglaw.com', 'bloombergtax.com', 'borsen.dk', 'businessgreen.com', 'businessinsider.de', 'businesslive.co.za', 'businesstimes.com.sg', 'caixin.com', 'caixinglobal.com', 'caravanmagazine.in', 'catalyst-journal.com', 'codesports.com.au', 'compactmag.com', 'courrierinternational.com', 'deutsche-wirtschafts-nachrichten.de', 'die-glocke.de', 'diepresse.com', 'dn.no', 'dn.se', 'elordenmundial.com', 'entrepreneur.com', 'epw.in', 'expresso.pt', 'falter.at', 'finance.si', 'ftchinese.com', 'ftchineselive.com', 'gamestar.de', 'geo.de', 'golem.de', 'handelsblatt.com', 'hbrchina.org', 'heise.de', 'hln.be', 'hs.fi', 'ilsole24ore.com', 'information.dk', 'investors.com', 'iltalehti.fi', 'jacobin.com', 'jeuneafrique.com', 'kleinezeitung.at', 'lavie.fr', 'lavozdegalicia.es', 'law360.co.uk', 'law360.com', 'le1hebdo.fr', 'leconomiste.com', 'lefilmfrancais.com', 'lequipe.fr', 'lesjours.fr', 'liberation.fr', 'limburger.nl', 'mainpost.de', 'manager-magazin.de', 'medianama.com', 'mediapart.fr', 'milanofinanza.it', 'mittelbayerische.de', 'monde-diplomatique.fr', 'mondediplo.com', 'moneycontrol.com', 'moodys.com', 'morningstar.com', 'moz.de', 'nachrichten.at', 'nationaljournal.com', 'nature.com', 'nbr.co.nz', 'newslaundry.com', 'nn.de', 'observador.pt', 'ouest-france.fr', 'philonomist.com', 'pnp.de', 'politicopro.com', 'politiken.dk', 'pressreader.com', 'publico.pt', 'quillette.com', 'republic.ru', 'rheinpfalz.de', 'risk.net', 'rnz.de', 'saechsische.de', 'schwarzwaelder-bote.de', 'sciencedirect.com', 'springer.com', 'statnews.com', 'stern.de', 'stimme.de', 'straitstimes.com', 'stratfor.com', 'substack.com', 'suedkurier.de', 'swp.de', 'techcrunch.com', 'the-ken.com', 'theinformation.com', 'theinitium.com', 'themorningcontext.com', 'theparisreview.org', 'thewirechina.com', 'vosgesmatin.fr', 'weltwoche.ch', 'weltwoche.de', 'weser-kurier.de', 'wiwo.de', 'worldpoliticsreview.com', 'ynet.co.il'].concat(be_mediahuis_nofix_domains, de_funke_medien_nofix_domains, de_rp_aachen_medien_nofix_domains, fr_indigo_nofix_domains, it_gedi_nofix_domains, nl_mediahuis_region_nofix_domains);
var nofix_sites = ['aamulehti.fi', 'aftenposten.no', 'aftonbladet.se', 'allgaeuer-zeitung.de', 'asahi.com', 'asiatimes.com', 'autosport.com', 'aviationweek.com', 'badische-zeitung.de', 'bild.de', 'bloomberglaw.com', 'bloombergtax.com', 'borsen.dk', 'businessgreen.com', 'businessinsider.de', 'businesslive.co.za', 'businesstimes.com.sg', 'caixin.com', 'caixinglobal.com', 'caravanmagazine.in', 'catalyst-journal.com', 'codesports.com.au', 'compactmag.com', 'courrierinternational.com', 'coursehero.com', 'deutsche-wirtschafts-nachrichten.de', 'die-glocke.de', 'diepresse.com', 'dn.no', 'dn.se', 'elordenmundial.com', 'entrepreneur.com', 'epw.in', 'expresso.pt', 'falter.at', 'finance.si', 'ftchinese.com', 'ftchineselive.com', 'gamestar.de', 'geo.de', 'golem.de', 'handelsblatt.com', 'hbrchina.org', 'heise.de', 'hln.be', 'hs.fi', 'ilsole24ore.com', 'information.dk', 'investors.com', 'iltalehti.fi', 'jacobin.com', 'jeuneafrique.com', 'kleinezeitung.at', 'lavie.fr', 'lavozdegalicia.es', 'law360.co.uk', 'law360.com', 'le1hebdo.fr', 'leconomiste.com', 'lefilmfrancais.com', 'lequipe.fr', 'lesjours.fr', 'liberation.fr', 'limburger.nl', 'mainpost.de', 'manager-magazin.de', 'medianama.com', 'mediapart.fr', 'milanofinanza.it', 'mittelbayerische.de', 'monde-diplomatique.fr', 'mondediplo.com', 'moneycontrol.com', 'moodys.com', 'morningstar.com', 'moz.de', 'nachrichten.at', 'nationaljournal.com', 'nature.com', 'nbr.co.nz', 'newslaundry.com', 'nn.de', 'observador.pt', 'ouest-france.fr', 'philonomist.com', 'pnp.de', 'politicopro.com', 'politiken.dk', 'pressreader.com', 'publico.pt', 'quillette.com', 'republic.ru', 'rheinpfalz.de', 'risk.net', 'rnz.de', 'saechsische.de', 'schwarzwaelder-bote.de', 'sciencedirect.com', 'springer.com', 'statnews.com', 'stern.de', 'stimme.de', 'straitstimes.com', 'stratfor.com', 'substack.com', 'suedkurier.de', 'swp.de', 'techcrunch.com', 'the-ken.com', 'theinformation.com', 'theinitium.com', 'themorningcontext.com', 'theparisreview.org', 'thewirechina.com', 'vosgesmatin.fr', 'weltwoche.ch', 'weltwoche.de', 'weser-kurier.de', 'wiwo.de', 'worldpoliticsreview.com', 'ynet.co.il'].concat(be_mediahuis_nofix_domains, de_funke_medien_nofix_domains, de_rp_aachen_medien_nofix_domains, fr_indigo_nofix_domains, it_gedi_nofix_domains, nl_mediahuis_region_nofix_domains);

@ -5,6 +5,12 @@
"block_regex": "(\\.cm\\.bloomberg\\.com\\/|assets\\.bwbx\\.io\\/s\\d\\/javelin\\/.+\\/transporter\\/)",
"upd_version": "3.2.7.1"
},
"Correio do Povo": {
"domain": "correiodopovo.com.br",
"allow_cookies": 1,
"block_regex": "(paywall\\.correiodopovo\\.com\\.br|cdn\\.ampproject\\.org\\/v\\d\\/amp-access-.+\\.js)",
"upd_version": "3.4.4.7"
},
"Defector": {
"domain": "defector.com",
"allow_cookies": 1,
@ -38,6 +44,13 @@
"ld_google_webcache": "div.article-teaser|article",
"upd_version": "3.4.2.3"
},
"Gazeta do Povo": {
"domain": "gazetadopovo.com.br",
"allow_cookies": 1,
"amp_unhide": 1,
"block_regex": "(\\.tinypass\\.com\\/|cdn\\.cxense\\.com\\/|cdn\\.ampproject\\.org\\/v\\d\\/amp-subscriptions-.+\\.js)",
"upd_version": "3.4.4.7"
},
"Groupe Nice-Matin": {
"domain": "###_fr_groupe_nice_matin",
"group": [

Loading…
Cancel
Save