Merge pull request #64 from ItsVipra/55-sanitize-html-special-characters

Sanitize html special characters
2024-11-21 19:13:03 +00:00 · 2023-08-01 11:00:21 +02:00 · 2023-08-01 11:00:21 +02:00 · d2a992eea2
commit d2a992eea2
parent a8904497c0 58a8404a8d
2 changed files with 28 additions and 1 deletions
--- a/src/libs/domhelpers.js
+++ b/src/libs/domhelpers.js
@ -85,3 +85,26 @@ export function insertAfter(insertion, target) {
 	//docs: https://developer.mozilla.org/en-US/docs/Web/API/Node/insertBefore#example_2
 	target.parentElement.insertBefore(insertion, target.nextSibling);
 }
+
+/**
+ * Turns HTML-escaped text into human-readable text.
+ * Uses DOMParser when one is available; otherwise decodes a fixed set of named entities.
+ * @param {string} input HTML Text
+ * @returns {string} The decoded text (the fallback leaves entities outside its table as-is)
+ */
+export function htmlDecode(input) {
+	if (typeof window === "undefined" || !window.DOMParser) {
+		const replacements = {
+			"&amp;": "&",
+			"&quot;": '"',
+			"&lt;": "<",
+			"&gt;": ">",
+			"&nbsp;": "", // NOTE(review): removed outright here, while DOMParser yields U+00A0 - confirm intent
+		};
+		// Decode in one pass so output is never rescanned: "&amp;lt;" must yield "&lt;", not "<".
+		return input.replace(/&(?:amp|quot|lt|gt|nbsp);/g, (entity) => replacements[entity]);
+	}
+
+	const doc = new DOMParser().parseFromString(input, "text/html");
+	return doc.documentElement.textContent;
+}
--- a/src/libs/pronouns.js
+++ b/src/libs/pronouns.js
@ -1,4 +1,5 @@
 import sanitizeHtml from "sanitize-html";
+import { htmlDecode } from "./domhelpers.js";

 const fieldMatchers = [/\bpro.*nouns?\b/i, /\bpronomen\b/i, /(i )?go(es)? by/i];
 const knownPronounUrls = [
@ -179,9 +180,12 @@ function sanitizePronouns(str) {
 	// Remove trailing characters that are used as separators.
 	str = str.replace(/[-| :/]+$/, "");

-	// Finally, remove leading and trailing whitespace.
+	// Remove leading and trailing whitespace.
 	str = str.trim();

+	// Finally, turn escaped characters (e.g. &amp;, &gt;) back into their original form.
+	str = htmlDecode(str);
+
 	// If the result is empty, return null, otherwise the empty string.
 	return str === "" ? null : str;
 }