You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
mercury-parser/src/extractors/generic/word-count/extractor.js

16 lines
355 B
JavaScript

import cheerio from 'cheerio';
import { normalizeSpaces } from 'utils/text';
/**
 * Generic extractor that reports how many words a piece of extracted
 * content contains.
 */
const GenericWordCountExtractor = {
  /**
   * Count the whitespace-separated words in the text of `content`.
   *
   * @param {Object} options
   * @param {string} options.content - Markup that is loaded with cheerio.
   * @returns {number} Number of non-empty whitespace-separated tokens in the
   *   text; 0 when there is no text at all.
   */
  extract({ content }) {
    const $ = cheerio.load(content);

    // Text is read from the first <div>. When the markup contains no <div>
    // the selection is empty and its text is '', so fall back to the text of
    // the whole document instead of reporting a bogus count.
    const $firstDiv = $('div').first();
    const $scope = $firstDiv.length > 0 ? $firstDiv : $.root();

    // NOTE(review): normalizeSpaces is defined in utils/text; presumably it
    // collapses runs of whitespace — the counting below does not rely on it.
    const text = normalizeSpaces($scope.text());

    // ''.split(/\s/) yields [''], which would count empty text as one word.
    // Splitting on whitespace runs and discarding empty tokens gives 0 for
    // empty input and ignores leading/trailing/repeated whitespace.
    return text.split(/\s+/).filter(Boolean).length;
  },
};
export default GenericWordCountExtractor;