feat: supporting all GMG sites using DeadspinExtractor

pull/17/head
Adam Pash 8 years ago
parent a73246306d
commit b65b0c98b0

7
dist/mercury.js vendored

@ -1114,6 +1114,11 @@ var Extractors = {
'www.littlethings.com': LittleThingsExtractor,
'www.politico.com': PoliticoExtractor,
'deadspin.com': DeadspinExtractor,
'jezebel.com': DeadspinExtractor,
'lifehacker.com': DeadspinExtractor,
'kotaku.com': DeadspinExtractor,
'gizmodo.com': DeadspinExtractor,
'jalopnik.com': DeadspinExtractor,
'www.broadwayworld.com': BroadwayWorldExtractor,
'www.apartmenttherapy.com': ApartmentTherapyExtractor
};
@ -1488,7 +1493,6 @@ function cleanHOnes(article, $) {
}
function removeAllButWhitelist($article) {
// $('*', article).each((index, node) => {
$article.find('*').each(function (index, node) {
node.attribs = _Reflect$ownKeys(node.attribs).reduce(function (acc, attr) {
if (WHITELIST_ATTRS_RE.test(attr)) {
@ -1513,7 +1517,6 @@ function cleanAttributes($article) {
// Grabbing the parent because at this point
// $article will be wrapped in a div which will
// have a score set on it.
console.log('HMM', $article.parent().length);
return removeAllButWhitelist($article.parent().length ? $article.parent() : $article);
}

File diff suppressed because one or more lines are too long

@ -32,6 +32,11 @@ const Extractors = {
'www.littlethings.com': LittleThingsExtractor,
'www.politico.com': PoliticoExtractor,
'deadspin.com': DeadspinExtractor,
'jezebel.com': DeadspinExtractor,
'lifehacker.com': DeadspinExtractor,
'kotaku.com': DeadspinExtractor,
'gizmodo.com': DeadspinExtractor,
'jalopnik.com': DeadspinExtractor,
'www.broadwayworld.com': BroadwayWorldExtractor,
'www.apartmenttherapy.com': ApartmentTherapyExtractor,
};

Loading…
Cancel
Save