You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
mercury-parser/src/extractors/custom/blogspot.com/index.js

41 lines
655 B
JavaScript

/**
 * Custom extractor definition for pages served from blogspot.com.
 *
 * Every field (content, author, title, datePublished) carries a list of
 * CSS selectors; the content field additionally declares selectors to
 * clean out and tag transforms to apply.
 * NOTE(review): how the consuming parser interprets these keys is not
 * visible in this file — confirm against the extractor runner.
 */
const BloggerExtractor = {
  domain: 'blogspot.com',

  content: {
    // Blogger does not put the post body in the initially loaded markup;
    // the complete content is nevertheless present inside a <noscript>
    // element, so that element is what gets selected.
    selectors: ['.post-content noscript'],

    // Selectors to strip from the extracted content (none at present).
    clean: [],

    // Rewrite the selected <noscript> tag as a <div>.
    transforms: { noscript: 'div' },
  },

  author: { selectors: ['.post-author-name'] },

  title: { selectors: ['h2.title'] },

  datePublished: { selectors: ['span.publishdate'] },
};

export default BloggerExtractor;