From 57da96485e0671fc34f2ea862b872af186ff043c Mon Sep 17 00:00:00 2001
From: Christian Schneider
Date: Mon, 2 Jul 2012 15:30:50 +0000
Subject: Improved cleanup handling for illegal characters in html, now handles utf-8 as well

---
 it_xml.class | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

(limited to 'it_xml.class')

diff --git a/it_xml.class b/it_xml.class
index f854682..c98b6eb 100644
--- a/it_xml.class
+++ b/it_xml.class
@@ -134,7 +134,7 @@ function _sanitize($xmldata, $isutf8 = null)
 
 	# If not utf-8, remove characters illegal for latin-1
 	if (!$isutf8 && preg_match('/[\x00-\x08\x0b-\x0c\x0e-\x1f\x80-\x9f]/', $xmldata))
-		$xmldata = it_html::latinize($xmldata);
+		$xmldata = it_html::_cleanup($xmldata, $isutf8 ? "utf-8" : "iso-8859-1");
 
 	return array($xmldata, $isutf8);
 }
-- 
cgit v1.2.3