import { load } from 'cheerio'; import { request } from '../lib'; import type { ParsingResult } from '../types'; export const crawl = (word: string): Promise => { return request({ protocol: 'https', hostname: 'www.diccionarios.com', path: `/diccionario/espanol/${encodeURIComponent(word)}`, }); }; export const parse = (html: string): ParsingResult => { const $ = load(html); $('.verdBold14 + .gris11 + .gris13').remove(); $('br + .gris13').remove(); $('.grisItalic13 + .gris13').remove(); $('font[class^="verd"]').remove(); $('font.gris11').remove(); $('font[class^="grisBold"]').remove(); $('font[class^="grisItalic"]').remove(); Array.from($('.gris13')).forEach((element) => { const children = $(element).find('.gris13'); if (children && children.length > 0) { children.remove(); } }); const definitions = Array.from($('.dcom-search-result .gris13')); return { definitions: definitions .map((definition) => $(definition).text().trim()) .filter(Boolean) .map((definition) => definition.replace(/\s+\.$/g, '')) .map((definition) => (definition.endsWith('.') ? definition : `${definition}.`)), exists: $('.wrapper > p > strong').text() !== 'No se ha encontrado la palabra exacta', }; };