You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.
mercury-parser/src/extractors/generic/next-page-url/scoring/utils/score-cap-links.js

20 lines
500 B
JavaScript

import {
NEXT_LINK_TEXT_RE,
CAP_LINK_TEXT_RE,
} from '../constants';
/**
 * Score a candidate link based on "cap" link text (links like "last", etc.).
 *
 * A link whose text matches the cap pattern is probably a bad next-page
 * candidate, unless the same text also matches the "next" pattern, in
 * which case it is left alone.
 *
 * @param {string} linkData - Text tested against CAP_LINK_TEXT_RE and
 *   NEXT_LINK_TEXT_RE.
 * @returns {number} -65 when linkData matches the cap pattern but not the
 *   next pattern; 0 in every other case.
 */
export default function scoreCapLinks(linkData) {
  // Not a cap link at all: this heuristic contributes nothing.
  if (!CAP_LINK_TEXT_RE.test(linkData)) {
    return 0;
  }

  // A cap link like "last" that is also a "next" link is fine.
  if (NEXT_LINK_TEXT_RE.test(linkData)) {
    return 0;
  }

  // A cap link that is not also "next" is probably bad. Penalize.
  return -65;
}