From ed1d212ae2daea5e4bd043417610177093e99f19 Mon Sep 17 00:00:00 2001 From: Aleksander Machniak <alec@alec.pl> Date: Sat, 16 Jan 2016 03:03:51 -0500 Subject: [PATCH] Improved SVG cleanup code --- program/lib/Roundcube/rcube_charset.php | 52 +++++++++++++++++++++++++++++++--------------------- 1 files changed, 31 insertions(+), 21 deletions(-) diff --git a/program/lib/Roundcube/rcube_charset.php b/program/lib/Roundcube/rcube_charset.php index beb2134..2d6d9d3 100644 --- a/program/lib/Roundcube/rcube_charset.php +++ b/program/lib/Roundcube/rcube_charset.php @@ -70,8 +70,8 @@ /** * Catch an error and throw an exception. * - * @param int Level of the error - * @param string Error message + * @param int $errno Level of the error + * @param string $errstr Error message */ public static function error_handler($errno, $errstr) { @@ -119,7 +119,7 @@ } // ISO-8859 else if (preg_match('/ISO8859([0-9]{0,2})/', $str, $m)) { - $iso = 'ISO-8859-' . ($m[1] ? $m[1] : 1); + $iso = 'ISO-8859-' . ($m[1] ?: 1); // some clients sends windows-1252 text as latin1, // it is safe to use windows-1252 for all latin1 $result = $iso == 'ISO-8859-1' ? 'WINDOWS-1252' : $iso; @@ -162,19 +162,19 @@ * Convert a string from one charset to another. * Uses mbstring and iconv functions if possible * - * @param string Input string - * @param string Suspected charset of the input string - * @param string Target charset to convert to; defaults to RCUBE_CHARSET + * @param string $str Input string + * @param string $from Suspected charset of the input string + * @param string $to Target charset to convert to; defaults to RCUBE_CHARSET * * @return string Converted string */ public static function convert($str, $from, $to = null) { - static $iconv_options = null; - static $mbstring_list = null; - static $mbstring_sch = null; + static $iconv_options = null; + static $mbstring_list = null; + static $mbstring_sch = null; - $to = empty($to) ? RCUBE_CHARSET : $to; + $to = empty($to) ? RCUBE_CHARSET : strtoupper($to); $from = self::parse_charset($from); // It is a common case when UTF-16 charset is used with US-ASCII content (#1488654) @@ -208,7 +208,8 @@ set_error_handler(array('rcube_charset', 'error_handler'), E_NOTICE); try { $out = iconv($from, $to . $iconv_options, $str); - } catch (ErrorException $e) { + } + catch (ErrorException $e) { $out = false; } restore_error_handler(); @@ -237,20 +238,29 @@ $aliases['US-ASCII'] = 'ASCII'; } - $mb_from = $aliases[$from] ? $aliases[$from] : $from; - $mb_to = $aliases[$to] ? $aliases[$to] : $to; + $mb_from = $aliases[$from] ?: $from; + $mb_to = $aliases[$to] ?: $to; // return if encoding found, string matches encoding and convert succeeded if (in_array($mb_from, $mbstring_list) && in_array($mb_to, $mbstring_list)) { - if (mb_check_encoding($str, $mb_from)) { - // Do the same as //IGNORE with iconv - mb_substitute_character('none'); - $out = mb_convert_encoding($str, $mb_to, $mb_from); - mb_substitute_character($mbstring_sch); + // Do the same as //IGNORE with iconv + mb_substitute_character('none'); - if ($out !== false) { - return $out; - } + // throw an exception if mbstring reports an illegal character in input + // using mb_check_encoding() is much slower + set_error_handler(array('rcube_charset', 'error_handler'), E_WARNING); + try { + $out = mb_convert_encoding($str, $mb_to, $mb_from); + } + catch (ErrorException $e) { + $out = false; + } + restore_error_handler(); + + mb_substitute_character($mbstring_sch); + + if ($out !== false) { + return $out; } } } -- Gitblit v1.9.1