diff --git a/src/HTMLNormalizer/HTMLNormalizer.ts b/src/HTMLNormalizer/HTMLNormalizer.ts
index 0701019ec7ab770929d411e627be69542ef900c1..c40abe5894e1ade6a581e6802059def8e1a16e7d 100644
--- a/src/HTMLNormalizer/HTMLNormalizer.ts
+++ b/src/HTMLNormalizer/HTMLNormalizer.ts
@@ -11,7 +11,7 @@ import {
   pruneOutlookElement,
 } from "./strategies/outlook";
 import { EMAIL_VENDORS } from "../constants";
-import { normalizeTextSpacings, removeSpacesAndLinebreaks } from "../utils";
+import { normalizeTextSpacings } from "../utils";
 import {
   amendGmailNodes,
   cleanupGMailElementAttributes,
@@ -125,7 +125,7 @@ export const printHtmlNode = (node: Node, depth: number): string => {
 
   switch (node.nodeType) {
     case TEXT_NODE: {
-      const text = removeSpacesAndLinebreaks(node.textContent);
+      const text = normalizeTextSpacings(node.textContent).trim();
       if (text.length) {
         result += "<TEXT>";
         result += text;
diff --git a/src/utils.ts b/src/utils.ts
index 3723902a1ebaa16ca517bffe227b0f90eafd1f78..6da5b6a8189e393345727710d897ce49454e03c1 100644
--- a/src/utils.ts
+++ b/src/utils.ts
@@ -1,9 +1,3 @@
-export const removeSpacesAndLinebreaks = (s: string): string => {
-  const removeSymbols = new RegExp(/[\r\n\v\s\u200B]+/g);
-
-  return s.replace(removeSymbols, "").trim();
-};
-
 export const normalizeTextSpacings = (s: string): string => {
   return s.replace(/[\r\n\v\s\u00A0]+/g, " ");
 };