// mercury-parser/scripts/templates/custom-extractor.js
//
// 72 lines
// 1.3 KiB
// JavaScript

import template from './index';
/**
 * Build the scaffold for a new custom extractor module.
 *
 * The scaffold text declares an exported `CustomExtractor` object whose
 * `domain` field is filled with the given hostname, followed by empty
 * selector lists for title, author, content (plus empty `transforms` and
 * `clean` entries), date_published, lead_image_url, dek, next_page_url
 * and excerpt.
 *
 * NOTE(review): the text inside the template literal is runtime output, not
 * documentation -- the `//` lines in it are emitted into the generated file.
 * How whitespace in the literal is treated depends on the `template` tag from
 * './index', which is not visible here, so the literal is kept verbatim.
 *
 * @param {string} hostname - Value interpolated into the `domain` field
 *   (presumably a string such as a site's hostname; confirm against callers).
 * @returns {*} Whatever the `template` tag returns -- presumably the
 *   generated source text; confirm in './index'.
 */
export default function (hostname) {
  // Hand the literal to the tag first, then return the tagged result.
  const scaffold = template`
// Rename CustomExtractor
// to fit your publication
// (e.g., NYTimesExtractor)
export const CustomExtractor = {
domain: '${hostname}',
title: {
selectors: [
// enter title selectors
],
},
author: {
selectors: [
// enter author selectors
],
},
content: {
selectors: [
// enter content selectors
],
// Is there anything in the content you selected that needs transformed
// before it's consumable content? E.g., unusual lazy loaded images
transforms: {
},
// Is there anything that is in the result that shouldn't be?
// The clean selectors will remove anything that matches from
// the result
clean: [
]
},
date_published: {
selectors: [
// enter selectors
],
},
lead_image_url: {
selectors: [
// enter selectors
],
},
dek: {
selectors: [
// enter selectors
],
},
next_page_url: {
selectors: [
// enter selectors
],
},
excerpt: {
selectors: [
// enter selectors
],
},
}
`;
  return scaffold;
}