From 7856adae233d2ddf2aed7d8f4a8c41069ec13006 Mon Sep 17 00:00:00 2001 From: Urban Müller Date: Wed, 14 Apr 2010 16:26:15 +0000 Subject: faster, commented --- it_xml.class | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) (limited to 'it_xml.class') diff --git a/it_xml.class b/it_xml.class index a861245..da02b00 100644 --- a/it_xml.class +++ b/it_xml.class @@ -133,7 +133,8 @@ function _sanitize($xmldata, $isutf8 = null) if ($isutf8 && preg_match('/[^\x80-\xff][\x80-\xff][^\x80-\xff]/', $xmldata)) $xmldata = preg_replace('/[\x80-\xff]{1,4}/e', "it_xml::_utf8_fix('\\0')", $xmldata); - if (!$isutf8) + # If not utf-8, remove characters illegal for latin-1 + if (!$isutf8 && preg_match('/[\x00-\x08\x0a-\x0c\x0e-\x1f\x80-\x9f]/', $xmldata)) $xmldata = it_html::latinize($xmldata); return array($xmldata, $isutf8); -- cgit v1.2.3