1
0
mirror of https://git.tt-rss.org/git/tt-rss.git synced 2025-12-13 23:35:57 +00:00

sanitize: remove doctype properly, add experimental workaround against unnecessary html elements in sanitized data

This commit is contained in:
Andrew Dolgov
2013-10-06 11:08:15 +04:00
parent ae3851b1b5
commit f44d59992e

View File

@@ -2891,7 +2891,7 @@
}
}
$doc->removeChild($doc->firstChild); //remove doctype
$doc->removeChild($doc->doctype); //remove doctype
$doc = strip_harmful_tags($doc, $allowed_elements, $disallowed_attributes);
if ($highlight_words) {
@@ -2924,7 +2924,19 @@
}
}
$res = $doc->saveHTML();
$body = $doc->getElementsByTagName("body")->item(0);
if ($body) {
$div = $doc->createElement("div");
foreach ($body->childNodes as $child) {
$div->appendChild($child);
}
$res = $doc->saveXML($div);
} else {
$res = $doc->saveHTML();
}
return $res;
}