rc2: program/lib/Roundcube/rcube

author	Charlie Root
date	Thu, 04 Jan 2018 15:52:31 -0500
parents
children

rev	line source
0 4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	1 <?php
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	2
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	3 /**
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	4 +-----------------------------------------------------------------------+
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	5 \| This file is part of the Roundcube Webmail client \|
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	6 \| Copyright (C) 2005-2012, The Roundcube Dev Team \|
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	7 \| Copyright (C) 2011-2012, Kolab Systems AG \|
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	8 \| Copyright (C) 2000 Edmund Grimley Evans <edmundo@rano.org> \|
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	9 \| \|
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	10 \| Licensed under the GNU General Public License version 3 or \|
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	11 \| any later version with exceptions for skins & plugins. \|
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	12 \| See the README file for a full license statement. \|
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	13 \| \|
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	14 \| PURPOSE: \|
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	15 \| Provide charset conversion functionality \|
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	16 +-----------------------------------------------------------------------+
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	17 \| Author: Thomas Bruederli <roundcube@gmail.com> \|
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	18 \| Author: Aleksander Machniak <alec@alec.pl> \|
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	19 +-----------------------------------------------------------------------+
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	20 */
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	21
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	22 /**
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	23 * Character sets conversion functionality
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	24 *
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	25 * @package Framework
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	26 * @subpackage Core
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	27 * @author Thomas Bruederli <roundcube@gmail.com>
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	28 * @author Aleksander Machniak <alec@alec.pl>
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	29 * @author Edmund Grimley Evans <edmundo@rano.org>
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	30 */
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	31 class rcube_charset
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	32 {
/**
 * Charset aliases; some of them are taken from the HTML5 spec.
 *
 * Keys are alias names reduced to the characters A-Z and 0-9 (the form
 * parse_charset() uses for its lookup); values are the charset names
 * to use instead.
 *
 * @var array
 */
public static $aliases = array(
    'USASCII'       => 'WINDOWS-1252',
    'ANSIX31101983' => 'WINDOWS-1252',
    'ANSIX341968'   => 'WINDOWS-1252',
    'UNKNOWN8BIT'   => 'ISO-8859-15',
    'UNKNOWN'       => 'ISO-8859-15',
    'USERDEFINED'   => 'ISO-8859-15',
    'KSC56011987'   => 'EUC-KR',
    'GB2312'        => 'GBK',
    'GB231280'      => 'GBK',
    'UNICODE'       => 'UTF-8',
    'UTF7IMAP'      => 'UTF7-IMAP',
    'TIS620'        => 'WINDOWS-874',
    'ISO88599'      => 'WINDOWS-1254',
    'ISO885911'     => 'WINDOWS-874',
    'MACROMAN'      => 'MACINTOSH',
    '77'            => 'MAC',
    '128'           => 'SHIFT-JIS',
    '129'           => 'CP949',
    '130'           => 'CP1361',
    '134'           => 'GBK',
    '136'           => 'BIG5',
    '161'           => 'WINDOWS-1253',
    '162'           => 'WINDOWS-1254',
    '163'           => 'WINDOWS-1258',
    '177'           => 'WINDOWS-1255',
    '178'           => 'WINDOWS-1256',
    '186'           => 'WINDOWS-1257',
    '204'           => 'WINDOWS-1251',
    '222'           => 'WINDOWS-874',
    '238'           => 'WINDOWS-1250',
    'MS950'         => 'CP950',
    'WINDOWS949'    => 'UHC',
);
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	68
/**
 * Windows code pages: numeric code page identifier => charset name.
 *
 * @var array
 */
public static $windows_codepages = array(
    37    => 'IBM037', // IBM EBCDIC US-Canada
    437   => 'IBM437', // OEM United States
    500   => 'IBM500', // IBM EBCDIC International
    708   => 'ASMO-708', // Arabic (ASMO 708)
    720   => 'DOS-720', // Arabic (Transparent ASMO); Arabic (DOS)
    737   => 'IBM737', // OEM Greek (formerly 437G); Greek (DOS)
    775   => 'IBM775', // OEM Baltic; Baltic (DOS)
    850   => 'IBM850', // OEM Multilingual Latin 1; Western European (DOS)
    852   => 'IBM852', // OEM Latin 2; Central European (DOS)
    855   => 'IBM855', // OEM Cyrillic (primarily Russian)
    857   => 'IBM857', // OEM Turkish; Turkish (DOS)
    858   => 'IBM00858', // OEM Multilingual Latin 1 + Euro symbol
    860   => 'IBM860', // OEM Portuguese; Portuguese (DOS)
    861   => 'IBM861', // OEM Icelandic; Icelandic (DOS)
    862   => 'DOS-862', // OEM Hebrew; Hebrew (DOS)
    863   => 'IBM863', // OEM French Canadian; French Canadian (DOS)
    864   => 'IBM864', // OEM Arabic; Arabic (864)
    865   => 'IBM865', // OEM Nordic; Nordic (DOS)
    866   => 'cp866', // OEM Russian; Cyrillic (DOS)
    869   => 'IBM869', // OEM Modern Greek; Greek, Modern (DOS)
    870   => 'IBM870', // IBM EBCDIC Multilingual/ROECE (Latin 2); IBM EBCDIC Multilingual Latin 2
    874   => 'windows-874', // ANSI/OEM Thai (ISO 8859-11); Thai (Windows)
    875   => 'cp875', // IBM EBCDIC Greek Modern
    932   => 'shift_jis', // ANSI/OEM Japanese; Japanese (Shift-JIS)
    936   => 'gb2312', // ANSI/OEM Simplified Chinese (PRC, Singapore); Chinese Simplified (GB2312)
    950   => 'big5', // ANSI/OEM Traditional Chinese (Taiwan; Hong Kong SAR, PRC); Chinese Traditional (Big5)
    1026  => 'IBM1026', // IBM EBCDIC Turkish (Latin 5)
    1047  => 'IBM01047', // IBM EBCDIC Latin 1/Open System
    1140  => 'IBM01140', // IBM EBCDIC US-Canada (037 + Euro symbol); IBM EBCDIC (US-Canada-Euro)
    1141  => 'IBM01141', // IBM EBCDIC Germany (20273 + Euro symbol); IBM EBCDIC (Germany-Euro)
    1142  => 'IBM01142', // IBM EBCDIC Denmark-Norway (20277 + Euro symbol); IBM EBCDIC (Denmark-Norway-Euro)
    1143  => 'IBM01143', // IBM EBCDIC Finland-Sweden (20278 + Euro symbol); IBM EBCDIC (Finland-Sweden-Euro)
    1144  => 'IBM01144', // IBM EBCDIC Italy (20280 + Euro symbol); IBM EBCDIC (Italy-Euro)
    1145  => 'IBM01145', // IBM EBCDIC Latin America-Spain (20284 + Euro symbol); IBM EBCDIC (Spain-Euro)
    1146  => 'IBM01146', // IBM EBCDIC United Kingdom (20285 + Euro symbol); IBM EBCDIC (UK-Euro)
    1147  => 'IBM01147', // IBM EBCDIC France (20297 + Euro symbol); IBM EBCDIC (France-Euro)
    1148  => 'IBM01148', // IBM EBCDIC International (500 + Euro symbol); IBM EBCDIC (International-Euro)
    1149  => 'IBM01149', // IBM EBCDIC Icelandic (20871 + Euro symbol); IBM EBCDIC (Icelandic-Euro)
    1200  => 'UTF-16', // Unicode UTF-16, little endian byte order (BMP of ISO 10646); available only to managed applications
    1201  => 'UTF-16BE', // Unicode UTF-16, big endian byte order; available only to managed applications
    1250  => 'windows-1250', // ANSI Central European; Central European (Windows)
    1251  => 'windows-1251', // ANSI Cyrillic; Cyrillic (Windows)
    1252  => 'windows-1252', // ANSI Latin 1; Western European (Windows)
    1253  => 'windows-1253', // ANSI Greek; Greek (Windows)
    1254  => 'windows-1254', // ANSI Turkish; Turkish (Windows)
    1255  => 'windows-1255', // ANSI Hebrew; Hebrew (Windows)
    1256  => 'windows-1256', // ANSI Arabic; Arabic (Windows)
    1257  => 'windows-1257', // ANSI Baltic; Baltic (Windows)
    1258  => 'windows-1258', // ANSI/OEM Vietnamese; Vietnamese (Windows)
    10000 => 'macintosh', // MAC Roman; Western European (Mac)
    12000 => 'UTF-32', // Unicode UTF-32, little endian byte order; available only to managed applications
    12001 => 'UTF-32BE', // Unicode UTF-32, big endian byte order; available only to managed applications
    20127 => 'US-ASCII', // US-ASCII (7-bit)
    20273 => 'IBM273', // IBM EBCDIC Germany
    20277 => 'IBM277', // IBM EBCDIC Denmark-Norway
    20278 => 'IBM278', // IBM EBCDIC Finland-Sweden
    20280 => 'IBM280', // IBM EBCDIC Italy
    20284 => 'IBM284', // IBM EBCDIC Latin America-Spain
    20285 => 'IBM285', // IBM EBCDIC United Kingdom
    20290 => 'IBM290', // IBM EBCDIC Japanese Katakana Extended
    20297 => 'IBM297', // IBM EBCDIC France
    20420 => 'IBM420', // IBM EBCDIC Arabic
    20423 => 'IBM423', // IBM EBCDIC Greek
    20424 => 'IBM424', // IBM EBCDIC Hebrew
    20838 => 'IBM-Thai', // IBM EBCDIC Thai
    20866 => 'koi8-r', // Russian (KOI8-R); Cyrillic (KOI8-R)
    20871 => 'IBM871', // IBM EBCDIC Icelandic
    20880 => 'IBM880', // IBM EBCDIC Cyrillic Russian
    20905 => 'IBM905', // IBM EBCDIC Turkish
    20924 => 'IBM00924', // IBM EBCDIC Latin 1/Open System (1047 + Euro symbol)
    20932 => 'EUC-JP', // Japanese (JIS 0208-1990 and 0212-1990)
    20936 => 'cp20936', // Simplified Chinese (GB2312); Chinese Simplified (GB2312-80)
    20949 => 'cp20949', // Korean Wansung
    21025 => 'cp1025', // IBM EBCDIC Cyrillic Serbian-Bulgarian
    21866 => 'koi8-u', // Ukrainian (KOI8-U); Cyrillic (KOI8-U)
    28591 => 'iso-8859-1', // ISO 8859-1 Latin 1; Western European (ISO)
    28592 => 'iso-8859-2', // ISO 8859-2 Central European; Central European (ISO)
    28593 => 'iso-8859-3', // ISO 8859-3 Latin 3
    28594 => 'iso-8859-4', // ISO 8859-4 Baltic
    28595 => 'iso-8859-5', // ISO 8859-5 Cyrillic
    28596 => 'iso-8859-6', // ISO 8859-6 Arabic
    28597 => 'iso-8859-7', // ISO 8859-7 Greek
    28598 => 'iso-8859-8', // ISO 8859-8 Hebrew; Hebrew (ISO-Visual)
    28599 => 'iso-8859-9', // ISO 8859-9 Turkish
    28603 => 'iso-8859-13', // ISO 8859-13 Estonian
    28605 => 'iso-8859-15', // ISO 8859-15 Latin 9
    38598 => 'iso-8859-8-i', // ISO 8859-8 Hebrew; Hebrew (ISO-Logical)
    50220 => 'iso-2022-jp', // ISO 2022 Japanese with no halfwidth Katakana; Japanese (JIS)
    50221 => 'csISO2022JP', // ISO 2022 Japanese with halfwidth Katakana; Japanese (JIS-Allow 1 byte Kana)
    50222 => 'iso-2022-jp', // ISO 2022 Japanese JIS X 0201-1989; Japanese (JIS-Allow 1 byte Kana - SO/SI)
    50225 => 'iso-2022-kr', // ISO 2022 Korean
    51932 => 'EUC-JP', // EUC Japanese
    51936 => 'EUC-CN', // EUC Simplified Chinese; Chinese Simplified (EUC)
    51949 => 'EUC-KR', // EUC Korean
    52936 => 'hz-gb-2312', // HZ-GB2312 Simplified Chinese; Chinese Simplified (HZ)
    54936 => 'GB18030', // Windows XP and later: GB18030 Simplified Chinese (4 byte); Chinese Simplified (GB18030)
    65000 => 'UTF-7',
    65001 => 'UTF-8',
);
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	174
/**
 * Error handler that turns a reported error into an ErrorException.
 *
 * @param int    $errno  Level of the error, used as the exception severity
 * @param string $errstr Error message, used as the exception message
 *
 * @throws ErrorException Always
 */
public static function error_handler($errno, $errstr)
{
    // The exception code is always 0; the error level goes into the severity
    $exception = new ErrorException($errstr, 0, $errno);

    throw $exception;
}
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	185
/**
 * Parse and validate charset name string (see #1485758).
 * Sometimes the charset string is malformed, and there are also charset
 * aliases, but strict names are needed for charset conversion
 * (especially for the utf8 class).
 *
 * Results are memoized per input string for the lifetime of the request.
 *
 * @param string $input Input charset name
 *
 * @return string|null The validated charset name, null for "binary"
 */
public static function parse_charset($input)
{
    static $charsets = array();

    // Use one string value both as cache key and as strtoupper() argument
    // (avoids passing null to strtoupper())
    $input = (string) $input;

    // array_key_exists() rather than isset(): a cached null (the result
    // for BINARY) must be served from the cache as well
    if (array_key_exists($input, $charsets)) {
        return $charsets[$input];
    }

    $charset = preg_replace(array(
            '/^[^0-9A-Z]+/',    // e.g. _ISO-8859-JP$SIO
            '/\$.*$/',          // e.g. _ISO-8859-JP$SIO
            '/UNICODE-1-1-*/',  // RFC1641/1642
            '/^X-/',            // X- prefix (e.g. X-ROMAN8 => ROMAN8)
        ), '', strtoupper($input));

    if ($charset == 'BINARY') {
        return $charsets[$input] = null;
    }

    // allow A-Z and 0-9 only
    $str = preg_replace('/[^A-Z0-9]/', '', $charset);

    if (isset(self::$aliases[$str])) {
        $result = self::$aliases[$str];
    }
    // UTF
    else if (preg_match('/U[A-Z][A-Z](7|8|16|32)(BE|LE)*/', $str, $m)) {
        // The byte-order suffix is optional; when it is missing preg_match()
        // leaves $m[2] unset, so it must not be read unconditionally
        $result = 'UTF-' . $m[1] . (isset($m[2]) ? $m[2] : '');
    }
    // ISO-8859
    else if (preg_match('/ISO8859([0-9]{0,2})/', $str, $m)) {
        // no (or zero) part number means ISO-8859-1
        $iso = 'ISO-8859-' . ($m[1] ?: 1);
        // some clients send windows-1252 text as latin1,
        // it is safe to use windows-1252 for all latin1
        $result = $iso == 'ISO-8859-1' ? 'WINDOWS-1252' : $iso;
    }
    // handle broken charset names e.g. WINDOWS-1250HTTP-EQUIVCONTENT-TYPE
    else if (preg_match('/(WIN|WINDOWS)([0-9]+)/', $str, $m)) {
        $result = 'WINDOWS-' . $m[2];
    }
    // LATIN
    else if (preg_match('/LATIN(.*)/', $str, $m)) {
        // LATIN suffix => ISO-8859 part number
        $latin_parts = array(
            '2' => 2, '3' => 3, '4' => 4, '5' => 9, '6' => 10,
            '7' => 13, '8' => 14, '9' => 15, '10' => 16,
            'ARABIC' => 6, 'CYRILLIC' => 5, 'GREEK' => 7, 'GREEK1' => 7, 'HEBREW' => 8
        );

        // some clients send windows-1252 text as latin1,
        // it is safe to use windows-1252 for all latin1
        if ($m[1] == 1) {
            $result = 'WINDOWS-1252';
        }
        // if iconv is not supported we need ISO labels, it's also safe for iconv
        else if (!empty($latin_parts[$m[1]])) {
            $result = 'ISO-8859-' . $latin_parts[$m[1]];
        }
        // iconv requires conversion of e.g. LATIN-1 to LATIN1
        else {
            $result = $str;
        }
    }
    else {
        $result = $charset;
    }

    $charsets[$input] = $result;

    return $result;
}
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	265
/**
 * Convert a string from one charset to another.
 *
 * Tries iconv first, then mbstring, and finally the bundled UTF-7
 * converters of this class. When no conversion is needed, or none of the
 * back-ends succeeds, the input string is returned unchanged.
 *
 * @param string $str  Input string
 * @param string $from Suspected charset of the input string
 * @param string $to   Target charset to convert to; defaults to RCUBE_CHARSET
 *
 * @return string Converted string, or the original string if it could not
 *                (or did not need to) be converted
 */
public static function convert($str, $from, $to = null)
{
    // Both probes are done once per request and cached:
    //   $iconv_options: null = not probed, false = iconv missing,
    //                   otherwise the option suffix to append to $to
    //   $mbstring_sc:   null = not probed, false = mbstring missing,
    //                   otherwise the substitute character to restore
    static $iconv_options = null;
    static $mbstring_sc   = null;

    $to   = empty($to) ? RCUBE_CHARSET : strtoupper($to);
    $from = self::parse_charset($from);

    // It is a common case when UTF-16 charset is used with US-ASCII content (#1488654)
    // In that case we can just skip the conversion (use UTF-8)
    if ($from == 'UTF-16' && !preg_match('/[^\x00-\x7F]/', $str)) {
        $from = 'UTF-8';
    }

    if ($from == $to || empty($str) || empty($from)) {
        return $str;
    }

    if ($iconv_options === null) {
        if (function_exists('iconv')) {
            // ignore characters not available in output charset
            $iconv_options = '//IGNORE';
            if (iconv('', $iconv_options, '') === false) {
                // iconv implementation does not support options
                $iconv_options = '';
            }
        }
        else {
            $iconv_options = false;
        }
    }

    // convert charset using iconv module
    if ($iconv_options !== false && $from != 'UTF7-IMAP' && $to != 'UTF7-IMAP'
        && $from !== 'ISO-2022-JP'
    ) {
        // throw an exception if iconv reports an illegal character in input
        // it means that input string has been truncated
        // NOTE(review): relies on rcube_charset::error_handler (defined
        // outside this method) throwing on the notice - confirm.
        set_error_handler(array('rcube_charset', 'error_handler'), E_NOTICE);
        try {
            $out = iconv($from, $to . $iconv_options, $str);
        }
        // Catch everything, so the error handler is always restored below.
        // Throwable only exists on PHP 7+, Exception covers older versions.
        catch (Throwable $e) {
            $out = false;
        }
        catch (Exception $e) {
            $out = false;
        }
        restore_error_handler();

        if ($out !== false) {
            return $out;
        }
    }

    if ($mbstring_sc === null) {
        $mbstring_sc = extension_loaded('mbstring') ? mb_substitute_character() : false;
    }

    // convert charset using mbstring module
    if ($mbstring_sc !== false) {
        // charset labels that mbstring knows under a different name
        $aliases = array(
            'WINDOWS-1257' => 'ISO-8859-13',
            'US-ASCII'     => 'ASCII',
            'ISO-2022-JP'  => 'ISO-2022-JP-MS',
        );

        // isset() avoids an "undefined index" notice for every charset
        // that has no alias (which is most of them)
        $mb_from = isset($aliases[$from]) ? $aliases[$from] : $from;
        $mb_to   = isset($aliases[$to]) ? $aliases[$to] : $to;

        // Do the same as //IGNORE with iconv
        mb_substitute_character('none');

        // throw an exception if mbstring reports an illegal character in input
        // using mb_check_encoding() is much slower
        set_error_handler(array('rcube_charset', 'error_handler'), E_WARNING);
        try {
            $out = mb_convert_encoding($str, $mb_to, $mb_from);
        }
        // Catch everything, so both the error handler and the substitute
        // character are always restored below.
        catch (Throwable $e) {
            $out = false;
        }
        catch (Exception $e) {
            $out = false;
        }
        restore_error_handler();

        mb_substitute_character($mbstring_sc);

        if ($out !== false) {
            return $out;
        }
    }

    // convert charset using bundled classes/functions
    if ($to == 'UTF-8') {
        if ($from == 'UTF7-IMAP') {
            if ($out = self::utf7imap_to_utf8($str)) {
                return $out;
            }
        }
        else if ($from == 'UTF-7') {
            if ($out = self::utf7_to_utf8($str)) {
                return $out;
            }
        }
    }

    // encode string for output
    if ($from == 'UTF-8') {
        // @TODO: we need a function for UTF-7 (RFC2152) conversion
        if ($to == 'UTF7-IMAP' || $to == 'UTF-7') {
            if ($out = self::utf8_to_utf7imap($str)) {
                return $out;
            }
        }
    }

    // $out is unset only when no back-end was attempted at all
    if (!isset($out)) {
        trigger_error("No suitable function found for '$from' to '$to' conversion");
    }

    // return original string
    return $str;
}
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	395
/**
 * Converts string from standard UTF-7 (RFC 2152) to UTF-8.
 *
 * Characters outside a shifted sequence are copied as-is. A "+" opens a
 * shifted sequence of Modified Base64 characters, which is decoded as
 * UTF-16 and converted with utf16_to_utf8(). A "-" directly after the
 * sequence is absorbed; any other terminating character is kept and
 * handled as a normal character. "+-" stands for a literal "+".
 *
 * @param string $str Input string (UTF-7)
 *
 * @return string Converted string (UTF-8)
 */
public static function utf7_to_utf8($str)
{
    // Modified Base64 alphabet: the standard Base64 set, including "/"
    $b64chars = 'ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/';

    $str   = strval($str);
    $u7len = strlen($str);
    $res   = '';
    $i     = 0;

    while ($i < $u7len) {
        $u7 = $str[$i++];

        // directly encoded character
        if ($u7 != '+') {
            $res .= $u7;
            continue;
        }

        // collect the whole Base64 run that follows the "+";
        // strspn() is byte-safe, so bytes >= 0x80 simply end the run
        $run = strspn($str, $b64chars, $i);
        $ch  = $run > 0 ? substr($str, $i, $run) : '';
        $i  += $run;

        // only an explicit "-" terminator is consumed, any other
        // character stays in place for the next loop iteration
        $dash = $i < $u7len && $str[$i] == '-';
        if ($dash) {
            $i++;
        }

        if ($ch == '') {
            // "+-" is the escape sequence for a literal plus sign;
            // a lone "+" with no Base64 data produces no output
            if ($dash) {
                $res .= '+';
            }

            continue;
        }

        $res .= self::utf16_to_utf8(base64_decode($ch));
    }

    return $res;
}
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	454
/**
 * Converts string from UTF-16 to UTF-8 (helper for utf-7 to utf-8 conversion)
 *
 * The input is read as a sequence of big-endian 16-bit code units without
 * a byte order mark. A high surrogate followed by a low surrogate is
 * combined into one code point and written as a 4-byte UTF-8 sequence.
 * An incomplete trailing byte (odd input length) is ignored.
 *
 * @param string $str Input string
 *
 * @return string The converted string
 */
public static function utf16_to_utf8($str)
{
    $str = strval($str);
    $len = strlen($str);
    $dec = '';

    // decode complete 16-bit units only, never read past the end
    $len -= $len % 2;

    for ($i = 0; $i < $len; $i += 2) {
        $c = ord($str[$i]) << 8 | ord($str[$i + 1]);

        // surrogate pair: merge both units into a single code point
        if ($c >= 0xD800 && $c <= 0xDBFF && $i + 3 < $len) {
            $low = ord($str[$i + 2]) << 8 | ord($str[$i + 3]);

            if ($low >= 0xDC00 && $low <= 0xDFFF) {
                $c  = 0x10000 + (($c - 0xD800) << 10) + ($low - 0xDC00);
                $i += 2;
            }
        }

        if ($c >= 0x0001 && $c <= 0x007F) {
            $dec .= chr($c);
        }
        else if ($c > 0xFFFF) {
            $dec .= chr(0xF0 | (($c >> 18) & 0x07));
            $dec .= chr(0x80 | (($c >> 12) & 0x3F));
            $dec .= chr(0x80 | (($c >> 6) & 0x3F));
            $dec .= chr(0x80 | (($c >> 0) & 0x3F));
        }
        else if ($c > 0x07FF) {
            // also reached by unpaired surrogates, encoded as before
            $dec .= chr(0xE0 | (($c >> 12) & 0x0F));
            $dec .= chr(0x80 | (($c >> 6) & 0x3F));
            $dec .= chr(0x80 | (($c >> 0) & 0x3F));
        }
        else {
            // U+0080..U+07FF; U+0000 also lands here and is written
            // as the two bytes 0xC0 0x80 (unchanged behavior)
            $dec .= chr(0xC0 | (($c >> 6) & 0x1F));
            $dec .= chr(0x80 | (($c >> 0) & 0x3F));
        }
    }

    return $dec;
}
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	485
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	486 /**
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	487 * Convert the data ($str) from RFC 2060's UTF-7 to UTF-8.
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	488 * If input data is invalid, return the original input string.
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	489 * RFC 2060 obviously intends the encoding to be unique (see
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	490 * point 5 in section 5.1.3), so we reject any non-canonical
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	491 * form, such as &ACY- (instead of &-) or &AMA-&AMA- (instead
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	492 * of &AMAAwA-).
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	493 *
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	494 * Translated from C to PHP by Thomas Bruederli <roundcube@gmail.com>
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	495 *
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	496 * @param string $str Input string (UTF7-IMAP)
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	497 *
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	498 * @return string Output string (UTF-8)
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	499 */
4681f974d28b vanilla 1.3.3 distro, I hope Charlie Root parents: diff changeset	500 public static function utf7imap_to_utf8($str)

0

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

1 <?php

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

2

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

3 /**

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

4 +-----------------------------------------------------------------------+

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

5 | This file is part of the Roundcube Webmail client |

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

9 | |

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

10 | Licensed under the GNU General Public License version 3 or |

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

11 | any later version with exceptions for skins & plugins. |

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

12 | See the README file for a full license statement. |

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

13 | |

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

14 | PURPOSE: |

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

15 | Provide charset conversion functionality |

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

16 +-----------------------------------------------------------------------+

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

17 | Author: Thomas Bruederli <roundcube@gmail.com> |

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

18 | Author: Aleksander Machniak <alec@alec.pl> |

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

19 +-----------------------------------------------------------------------+

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

20 */

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

21

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

22 /**

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

23 * Character sets conversion functionality

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

24 *

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

25 * @package Framework

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

26 * @subpackage Core

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

27 * @author Thomas Bruederli <roundcube@gmail.com>

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

28 * @author Aleksander Machniak <alec@alec.pl>

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

29 * @author Edmund Grimley Evans <edmundo@rano.org>

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

30 */

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

31 class rcube_charset

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

32 {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

33 // Aliases: some of them from HTML5 spec.

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

34 static public $aliases = array(

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

35 'USASCII' => 'WINDOWS-1252',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

36 'ANSIX31101983' => 'WINDOWS-1252',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

37 'ANSIX341968' => 'WINDOWS-1252',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

38 'UNKNOWN8BIT' => 'ISO-8859-15',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

39 'UNKNOWN' => 'ISO-8859-15',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

40 'USERDEFINED' => 'ISO-8859-15',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

41 'KSC56011987' => 'EUC-KR',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

42 'GB2312' => 'GBK',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

43 'GB231280' => 'GBK',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

44 'UNICODE' => 'UTF-8',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

45 'UTF7IMAP' => 'UTF7-IMAP',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

46 'TIS620' => 'WINDOWS-874',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

47 'ISO88599' => 'WINDOWS-1254',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

48 'ISO885911' => 'WINDOWS-874',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

49 'MACROMAN' => 'MACINTOSH',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

50 '77' => 'MAC',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

51 '128' => 'SHIFT-JIS',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

52 '129' => 'CP949',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

53 '130' => 'CP1361',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

54 '134' => 'GBK',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

55 '136' => 'BIG5',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

56 '161' => 'WINDOWS-1253',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

57 '162' => 'WINDOWS-1254',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

58 '163' => 'WINDOWS-1258',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

59 '177' => 'WINDOWS-1255',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

60 '178' => 'WINDOWS-1256',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

61 '186' => 'WINDOWS-1257',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

62 '204' => 'WINDOWS-1251',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

63 '222' => 'WINDOWS-874',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

64 '238' => 'WINDOWS-1250',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

65 'MS950' => 'CP950',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

66 'WINDOWS949' => 'UHC',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

67 );

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

68

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

69 /**

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

70 * Windows codepage numbers mapped to the corresponding charset names

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

71 *

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

72 * @var array

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

73 */

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

74 static public $windows_codepages = array(

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

75 37 => 'IBM037', // IBM EBCDIC US-Canada

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

76 437 => 'IBM437', // OEM United States

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

77 500 => 'IBM500', // IBM EBCDIC International

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

78 708 => 'ASMO-708', // Arabic (ASMO 708)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

79 720 => 'DOS-720', // Arabic (Transparent ASMO); Arabic (DOS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

80 737 => 'IBM737', // OEM Greek (formerly 437G); Greek (DOS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

81 775 => 'IBM775', // OEM Baltic; Baltic (DOS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

82 850 => 'IBM850', // OEM Multilingual Latin 1; Western European (DOS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

83 852 => 'IBM852', // OEM Latin 2; Central European (DOS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

84 855 => 'IBM855', // OEM Cyrillic (primarily Russian)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

85 857 => 'IBM857', // OEM Turkish; Turkish (DOS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

86 858 => 'IBM00858', // OEM Multilingual Latin 1 + Euro symbol

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

87 860 => 'IBM860', // OEM Portuguese; Portuguese (DOS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

88 861 => 'IBM861', // OEM Icelandic; Icelandic (DOS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

89 862 => 'DOS-862', // OEM Hebrew; Hebrew (DOS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

90 863 => 'IBM863', // OEM French Canadian; French Canadian (DOS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

91 864 => 'IBM864', // OEM Arabic; Arabic (864)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

92 865 => 'IBM865', // OEM Nordic; Nordic (DOS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

93 866 => 'cp866', // OEM Russian; Cyrillic (DOS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

94 869 => 'IBM869', // OEM Modern Greek; Greek, Modern (DOS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

95 870 => 'IBM870', // IBM EBCDIC Multilingual/ROECE (Latin 2); IBM EBCDIC Multilingual Latin 2

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

96 874 => 'windows-874', // ANSI/OEM Thai (ISO 8859-11); Thai (Windows)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

97 875 => 'cp875', // IBM EBCDIC Greek Modern

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

98 932 => 'shift_jis', // ANSI/OEM Japanese; Japanese (Shift-JIS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

99 936 => 'gb2312', // ANSI/OEM Simplified Chinese (PRC, Singapore); Chinese Simplified (GB2312)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

100 950 => 'big5', // ANSI/OEM Traditional Chinese (Taiwan; Hong Kong SAR, PRC); Chinese Traditional (Big5)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

101 1026 => 'IBM1026', // IBM EBCDIC Turkish (Latin 5)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

102 1047 => 'IBM01047', // IBM EBCDIC Latin 1/Open System

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

103 1140 => 'IBM01140', // IBM EBCDIC US-Canada (037 + Euro symbol); IBM EBCDIC (US-Canada-Euro)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

104 1141 => 'IBM01141', // IBM EBCDIC Germany (20273 + Euro symbol); IBM EBCDIC (Germany-Euro)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

105 1142 => 'IBM01142', // IBM EBCDIC Denmark-Norway (20277 + Euro symbol); IBM EBCDIC (Denmark-Norway-Euro)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

106 1143 => 'IBM01143', // IBM EBCDIC Finland-Sweden (20278 + Euro symbol); IBM EBCDIC (Finland-Sweden-Euro)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

107 1144 => 'IBM01144', // IBM EBCDIC Italy (20280 + Euro symbol); IBM EBCDIC (Italy-Euro)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

108 1145 => 'IBM01145', // IBM EBCDIC Latin America-Spain (20284 + Euro symbol); IBM EBCDIC (Spain-Euro)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

109 1146 => 'IBM01146', // IBM EBCDIC United Kingdom (20285 + Euro symbol); IBM EBCDIC (UK-Euro)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

110 1147 => 'IBM01147', // IBM EBCDIC France (20297 + Euro symbol); IBM EBCDIC (France-Euro)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

111 1148 => 'IBM01148', // IBM EBCDIC International (500 + Euro symbol); IBM EBCDIC (International-Euro)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

112 1149 => 'IBM01149', // IBM EBCDIC Icelandic (20871 + Euro symbol); IBM EBCDIC (Icelandic-Euro)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

113 1200 => 'UTF-16', // Unicode UTF-16, little endian byte order (BMP of ISO 10646); available only to managed applications

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

114 1201 => 'UTF-16BE', // Unicode UTF-16, big endian byte order; available only to managed applications

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

115 1250 => 'windows-1250', // ANSI Central European; Central European (Windows)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

116 1251 => 'windows-1251', // ANSI Cyrillic; Cyrillic (Windows)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

117 1252 => 'windows-1252', // ANSI Latin 1; Western European (Windows)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

118 1253 => 'windows-1253', // ANSI Greek; Greek (Windows)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

119 1254 => 'windows-1254', // ANSI Turkish; Turkish (Windows)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

120 1255 => 'windows-1255', // ANSI Hebrew; Hebrew (Windows)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

121 1256 => 'windows-1256', // ANSI Arabic; Arabic (Windows)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

122 1257 => 'windows-1257', // ANSI Baltic; Baltic (Windows)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

123 1258 => 'windows-1258', // ANSI/OEM Vietnamese; Vietnamese (Windows)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

124 10000 => 'macintosh', // MAC Roman; Western European (Mac)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

125 12000 => 'UTF-32', // Unicode UTF-32, little endian byte order; available only to managed applications

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

126 12001 => 'UTF-32BE', // Unicode UTF-32, big endian byte order; available only to managed applications

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

127 20127 => 'US-ASCII', // US-ASCII (7-bit)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

128 20273 => 'IBM273', // IBM EBCDIC Germany

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

129 20277 => 'IBM277', // IBM EBCDIC Denmark-Norway

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

130 20278 => 'IBM278', // IBM EBCDIC Finland-Sweden

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

131 20280 => 'IBM280', // IBM EBCDIC Italy

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

132 20284 => 'IBM284', // IBM EBCDIC Latin America-Spain

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

133 20285 => 'IBM285', // IBM EBCDIC United Kingdom

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

134 20290 => 'IBM290', // IBM EBCDIC Japanese Katakana Extended

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

135 20297 => 'IBM297', // IBM EBCDIC France

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

136 20420 => 'IBM420', // IBM EBCDIC Arabic

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

137 20423 => 'IBM423', // IBM EBCDIC Greek

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

138 20424 => 'IBM424', // IBM EBCDIC Hebrew

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

139 20838 => 'IBM-Thai', // IBM EBCDIC Thai

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

140 20866 => 'koi8-r', // Russian (KOI8-R); Cyrillic (KOI8-R)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

141 20871 => 'IBM871', // IBM EBCDIC Icelandic

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

142 20880 => 'IBM880', // IBM EBCDIC Cyrillic Russian

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

143 20905 => 'IBM905', // IBM EBCDIC Turkish

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

144 20924 => 'IBM00924', // IBM EBCDIC Latin 1/Open System (1047 + Euro symbol)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

145 20932 => 'EUC-JP', // Japanese (JIS 0208-1990 and 0212-1990)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

146 20936 => 'cp20936', // Simplified Chinese (GB2312); Chinese Simplified (GB2312-80)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

147 20949 => 'cp20949', // Korean Wansung

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

148 21025 => 'cp1025', // IBM EBCDIC Cyrillic Serbian-Bulgarian

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

149 21866 => 'koi8-u', // Ukrainian (KOI8-U); Cyrillic (KOI8-U)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

150 28591 => 'iso-8859-1', // ISO 8859-1 Latin 1; Western European (ISO)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

151 28592 => 'iso-8859-2', // ISO 8859-2 Central European; Central European (ISO)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

152 28593 => 'iso-8859-3', // ISO 8859-3 Latin 3

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

153 28594 => 'iso-8859-4', // ISO 8859-4 Baltic

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

154 28595 => 'iso-8859-5', // ISO 8859-5 Cyrillic

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

155 28596 => 'iso-8859-6', // ISO 8859-6 Arabic

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

156 28597 => 'iso-8859-7', // ISO 8859-7 Greek

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

157 28598 => 'iso-8859-8', // ISO 8859-8 Hebrew; Hebrew (ISO-Visual)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

158 28599 => 'iso-8859-9', // ISO 8859-9 Turkish

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

159 28603 => 'iso-8859-13', // ISO 8859-13 Estonian

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

160 28605 => 'iso-8859-15', // ISO 8859-15 Latin 9

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

161 38598 => 'iso-8859-8-i', // ISO 8859-8 Hebrew; Hebrew (ISO-Logical)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

162 50220 => 'iso-2022-jp', // ISO 2022 Japanese with no halfwidth Katakana; Japanese (JIS)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

163 50221 => 'csISO2022JP', // ISO 2022 Japanese with halfwidth Katakana; Japanese (JIS-Allow 1 byte Kana)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

164 50222 => 'iso-2022-jp', // ISO 2022 Japanese JIS X 0201-1989; Japanese (JIS-Allow 1 byte Kana - SO/SI)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

165 50225 => 'iso-2022-kr', // ISO 2022 Korean

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

166 51932 => 'EUC-JP', // EUC Japanese

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

167 51936 => 'EUC-CN', // EUC Simplified Chinese; Chinese Simplified (EUC)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

168 51949 => 'EUC-KR', // EUC Korean

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

169 52936 => 'hz-gb-2312', // HZ-GB2312 Simplified Chinese; Chinese Simplified (HZ)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

170 54936 => 'GB18030', // Windows XP and later: GB18030 Simplified Chinese (4 byte); Chinese Simplified (GB18030)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

171 65000 => 'UTF-7',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

172 65001 => 'UTF-8',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

173 );

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

174

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

175 /**

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

176 * Catch an error and throw an exception.

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

177 *

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

178 * @param int $errno Level of the error

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

179 * @param string $errstr Error message

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

180 */

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

public static function error_handler($errno, $errstr)
{
    // Wrap the reported error: the message is kept as-is, the exception
    // code is fixed at 0 and the error level becomes the severity.
    $exception = new ErrorException($errstr, 0, $errno);

    throw $exception;
}

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

185

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

186 /**

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

187 * Parse and validate charset name string (see #1485758).

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

188 * Sometimes charset string is malformed, there are also charset aliases

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

189 * but we need strict names for charset conversion (especially for the utf8 class)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

190 *

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

191 * @param string $input Input charset name

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

192 *

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

193 * @return string The validated charset name

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

194 */

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

public static function parse_charset($input)
{
    // Function-static cache of resolved names, keyed by the raw input string.
    // Note: isset() is false for a cached null (the BINARY case), so that
    // input is simply resolved again on each call.
    static $charsets = array();

    if (isset($charsets[$input])) {
        return $charsets[$input];
    }

    // Normalize case, then strip known garbage around the charset name
    $charset = preg_replace(array(
        '/^[^0-9A-Z]+/',    // e.g. _ISO-8859-JP$SIO
        '/\$.*$/',          // e.g. _ISO-8859-JP$SIO
        '/UNICODE-1-1-*/',  // RFC1641/1642
        '/^X-/',            // X- prefix (e.g. X-ROMAN8 => ROMAN8)
    ), '', strtoupper($input));

    if ($charset == 'BINARY') {
        return $charsets[$input] = null;
    }

    // allow A-Z and 0-9 only
    $str = preg_replace('/[^A-Z0-9]/', '', $charset);

    if (isset(self::$aliases[$str])) {
        $result = self::$aliases[$str];
    }
    // UTF
    else if (preg_match('/U[A-Z][A-Z](7|8|16|32)(BE|LE)*/', $str, $m)) {
        // The byte-order suffix is optional. When it is absent preg_match()
        // does not set $m[2] at all, so it must not be read unguarded.
        $result = 'UTF-' . $m[1] . (isset($m[2]) ? $m[2] : '');
    }
    // ISO-8859
    else if (preg_match('/ISO8859([0-9]{0,2})/', $str, $m)) {
        // a missing part number defaults to 1
        $iso = 'ISO-8859-' . ($m[1] ?: 1);
        // some clients send windows-1252 text as latin1,
        // it is safe to use windows-1252 for all latin1
        $result = $iso == 'ISO-8859-1' ? 'WINDOWS-1252' : $iso;
    }
    // handle broken charset names e.g. WINDOWS-1250HTTP-EQUIVCONTENT-TYPE
    else if (preg_match('/(WIN|WINDOWS)([0-9]+)/', $str, $m)) {
        $result = 'WINDOWS-' . $m[2];
    }
    // LATIN
    else if (preg_match('/LATIN(.*)/', $str, $m)) {
        // LATIN<suffix> => ISO-8859 part number
        $latin_parts = array(
            '2' => 2, '3' => 3, '4' => 4, '5' => 9, '6' => 10,
            '7' => 13, '8' => 14, '9' => 15, '10' => 16,
            'ARABIC' => 6, 'CYRILLIC' => 5, 'GREEK' => 7, 'GREEK1' => 7, 'HEBREW' => 8
        );

        // some clients send windows-1252 text as latin1,
        // it is safe to use windows-1252 for all latin1
        if ($m[1] == 1) {
            $result = 'WINDOWS-1252';
        }
        // if iconv is not supported we need ISO labels, it's also safe for iconv
        else if (!empty($latin_parts[$m[1]])) {
            $result = 'ISO-8859-' . $latin_parts[$m[1]];
        }
        // iconv requires conversion of e.g. LATIN-1 to LATIN1
        else {
            $result = $str;
        }
    }
    else {
        // nothing recognized: return the cleaned-up (upper-cased) name
        $result = $charset;
    }

    $charsets[$input] = $result;

    return $result;
}

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

265

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

266 /**

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

267 * Convert a string from one charset to another.

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

268 * Uses mbstring and iconv functions if possible

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

269 *

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

270 * @param string $str Input string

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

271 * @param string $from Suspected charset of the input string

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

272 * @param string $to Target charset to convert to; defaults to RCUBE_CHARSET

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

273 *

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

274 * @return string Converted string

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

275 */

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

276 public static function convert($str, $from, $to = null)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

277 {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

278 static $iconv_options = null;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

279 static $mbstring_sc = null;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

280

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

281 $to = empty($to) ? RCUBE_CHARSET : strtoupper($to);

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

282 $from = self::parse_charset($from);

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

283

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

284 // It is a common case when UTF-16 charset is used with US-ASCII content (#1488654)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

285 // In that case we can just skip the conversion (use UTF-8)

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

286 if ($from == 'UTF-16' && !preg_match('/[^\x00-\x7F]/', $str)) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

287 $from = 'UTF-8';

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

288 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

289

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

290 if ($from == $to || empty($str) || empty($from)) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

291 return $str;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

292 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

293

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

294 if ($iconv_options === null) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

295 if (function_exists('iconv')) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

296 // ignore characters not available in output charset

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

297 $iconv_options = '//IGNORE';

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

298 if (iconv('', $iconv_options, '') === false) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

299 // iconv implementation does not support options

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

300 $iconv_options = '';

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

301 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

302 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

303 else {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

304 $iconv_options = false;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

305 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

306 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

307

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

308 // convert charset using iconv module

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

309 if ($iconv_options !== false && $from != 'UTF7-IMAP' && $to != 'UTF7-IMAP'

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

310 && $from !== 'ISO-2022-JP'

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

311 ) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

312 // throw an exception if iconv reports an illegal character in input

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

313 // it means that input string has been truncated

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

314 set_error_handler(array('rcube_charset', 'error_handler'), E_NOTICE);

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

315 try {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

316 $out = iconv($from, $to . $iconv_options, $str);

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

317 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

318 catch (ErrorException $e) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

319 $out = false;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

320 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

321 restore_error_handler();

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

322

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

323 if ($out !== false) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

324 return $out;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

325 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

326 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

327

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

328 if ($mbstring_sc === null) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

329 $mbstring_sc = extension_loaded('mbstring') ? mb_substitute_character() : false;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

330 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

331

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

332 // convert charset using mbstring module

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

333 if ($mbstring_sc !== false) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

334 $aliases = array(

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

335 'WINDOWS-1257' => 'ISO-8859-13',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

336 'US-ASCII' => 'ASCII',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

337 'ISO-2022-JP' => 'ISO-2022-JP-MS',

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

338 );

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

339

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

340 $mb_from = $aliases[$from] ?: $from;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

341 $mb_to = $aliases[$to] ?: $to;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

342

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

343 // Do the same as //IGNORE with iconv

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

344 mb_substitute_character('none');

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

345

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

346 // throw an exception if mbstring reports an illegal character in input

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

347 // using mb_check_encoding() is much slower

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

348 set_error_handler(array('rcube_charset', 'error_handler'), E_WARNING);

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

349 try {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

350 $out = mb_convert_encoding($str, $mb_to, $mb_from);

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

351 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

352 catch (ErrorException $e) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

353 $out = false;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

354 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

355 restore_error_handler();

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

356

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

357 mb_substitute_character($mbstring_sc);

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

358

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

359 if ($out !== false) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

360 return $out;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

361 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

362 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

363

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

364 // convert charset using bundled classes/functions

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

365 if ($to == 'UTF-8') {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

366 if ($from == 'UTF7-IMAP') {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

367 if ($out = self::utf7imap_to_utf8($str)) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

368 return $out;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

369 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

370 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

371 else if ($from == 'UTF-7') {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

372 if ($out = self::utf7_to_utf8($str)) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

373 return $out;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

374 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

375 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

376 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

377

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

378 // encode string for output

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

379 if ($from == 'UTF-8') {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

380 // @TODO: we need a function for UTF-7 (RFC2152) conversion

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

381 if ($to == 'UTF7-IMAP' || $to == 'UTF-7') {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

382 if ($out = self::utf8_to_utf7imap($str)) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

383 return $out;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

384 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

385 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

386 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

387

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

388 if (!isset($out)) {

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

389 trigger_error("No suitable function found for '$from' to '$to' conversion");

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

390 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

391

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

392 // return original string

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

393 return $str;

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

394 }

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

395

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

/**
 * Converts string from standard UTF-7 (RFC 2152) to UTF-8.
 *
 * A '+' opens a run of modified-base64 characters (A-Z, a-z, 0-9, '+', '/')
 * that carries UTF-16BE code units. A '-' directly after the run closes it
 * and is absorbed; any other character also ends the run but is kept and
 * handled as ordinary text. The sequence "+-" stands for a literal '+'.
 * Bytes outside of base64 runs are copied to the output unchanged.
 *
 * @param string $str Input string (UTF-7)
 *
 * @return string Converted string (UTF-8)
 */
public static function utf7_to_utf8($str)
{
    // Modified base64 alphabet of RFC 2152 (standard base64 without '=' padding)
    $b64chars = 'ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/';

    // Normalize to string first so that the length matches what is indexed below
    $str = strval($str);
    $len = strlen($str);
    $res = '';
    $i   = 0;

    while ($i < $len) {
        $u7 = $str[$i++];

        // Directly encoded character
        if ($u7 != '+') {
            $res .= $u7;
            continue;
        }

        // Collect the base64 run that follows the shift character.
        // strspn() stops at the first byte outside the alphabet, which
        // includes all 8-bit bytes, so no lookup table is indexed out of range.
        $run_len = strspn($str, $b64chars, $i);
        $run     = $run_len ? substr($str, $i, $run_len) : '';
        $i      += $run_len;

        // Only '-' is absorbed as a terminator; every other character that
        // ends the run stays in the input and is processed by the next iteration
        $closed = $i < $len && $str[$i] == '-';
        if ($closed) {
            $i++;
        }

        if ($run === '') {
            // "+-" encodes a literal plus sign; a '+' followed by any other
            // non-base64 character is ill-formed and the '+' is dropped
            if ($closed) {
                $res .= '+';
            }

            continue;
        }

        $utf16 = base64_decode($run);

        // Malformed runs may decode to an odd number of bytes;
        // drop the dangling byte of the incomplete UTF-16 unit
        if (strlen($utf16) % 2) {
            $utf16 = substr($utf16, 0, -1);
        }

        $res .= self::utf16_to_utf8($utf16);
    }

    return $res;
}

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

454

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

/**
 * Converts string from UTF-16 to UTF-8 (helper for utf-7 to utf-8 conversion)
 *
 * The input is read as a sequence of big-endian 16-bit code units without
 * a byte order mark. A high surrogate directly followed by a low surrogate
 * is combined into one code point and written as a 4-byte UTF-8 sequence.
 * A trailing odd byte (incomplete code unit) is ignored.
 *
 * @param string $str Input string
 *
 * @return string The converted string
 */
public static function utf16_to_utf8($str)
{
    $str = strval($str);
    // Decode complete 16-bit units only, never read past the end of input
    $len = strlen($str) & ~1;
    $dec = '';

    for ($i = 0; $i < $len; $i += 2) {
        $c = ord($str[$i]) << 8 | ord($str[$i + 1]);

        // Surrogate pair: merge both halves into a single code point
        if ($c >= 0xD800 && $c <= 0xDBFF && $i + 3 < $len) {
            $low = ord($str[$i + 2]) << 8 | ord($str[$i + 3]);

            if ($low >= 0xDC00 && $low <= 0xDFFF) {
                $c  = 0x10000 + (($c - 0xD800) << 10) + ($low - 0xDC00);
                $i += 2;
            }
        }

        if ($c >= 0x0001 && $c <= 0x007F) {
            $dec .= chr($c);
        }
        else if ($c > 0xFFFF) {
            $dec .= chr(0xF0 | (($c >> 18) & 0x07));
            $dec .= chr(0x80 | (($c >> 12) & 0x3F));
            $dec .= chr(0x80 | (($c >> 6) & 0x3F));
            $dec .= chr(0x80 | (($c >> 0) & 0x3F));
        }
        else if ($c > 0x07FF) {
            // Note: an unpaired surrogate also ends up here and is
            // written as a plain 3-byte sequence, as before
            $dec .= chr(0xE0 | (($c >> 12) & 0x0F));
            $dec .= chr(0x80 | (($c >> 6) & 0x3F));
            $dec .= chr(0x80 | (($c >> 0) & 0x3F));
        }
        else {
            // Note: U+0000 is written as the two bytes C0 80 by this branch;
            // existing behavior, kept unchanged
            $dec .= chr(0xC0 | (($c >> 6) & 0x1F));
            $dec .= chr(0x80 | (($c >> 0) & 0x3F));
        }
    }

    return $dec;
}

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

485

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

/**
 * Convert the data ($str) from RFC 2060's UTF-7 to UTF-8.
 * If input data is invalid, return an empty string.
 * RFC 2060 obviously intends the encoding to be unique (see
 * point 5 in section 5.1.3), so we reject any non-canonical
 * form, such as &ACY- (instead of &-) or &AMA-&AMA- (instead
 * of &AMAAwA-).
 *
 * Note: decoded 16-bit units are written to the output one by one,
 * UTF-16 surrogate pairs are not combined into a single code point.
 *
 * Translated from C to PHP by Thomas Bruederli <roundcube@gmail.com>
 *
 * @param string $str Input string (UTF7-IMAP)
 *
 * @return string Output string (UTF-8), empty string on invalid input
 */
public static function utf7imap_to_utf8($str)
{
    // Value of every 7-bit character in the modified base64 alphabet
    // (A-Z, a-z, 0-9, '+' and ','), -1 for characters outside of it
    $Index_64 = array(
        -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
        -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
        -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,62, 63,-1,-1,-1,
        52,53,54,55, 56,57,58,59, 60,61,-1,-1, -1,-1,-1,-1,
        -1, 0, 1, 2,  3, 4, 5, 6,  7, 8, 9,10, 11,12,13,14,
        15,16,17,18, 19,20,21,22, 23,24,25,-1, -1,-1,-1,-1,
        -1,26,27,28, 29,30,31,32, 33,34,35,36, 37,38,39,40,
        41,42,43,44, 45,46,47,48, 49,50,51,-1, -1,-1,-1,-1
    );

    // Normalize to string first so that the length matches what is indexed below
    $str   = strval($str);
    $u7len = strlen($str);
    $p     = '';
    $err   = '';

    for ($i = 0; $u7len > 0; $i++, $u7len--) {
        $u7 = $str[$i];

        if ($u7 == '&') {
            $i++;
            $u7len--;

            // '&' is the last character: the BASE64 section is not
            // terminated and there is nothing more to read
            if ($u7len <= 0) {
                return $err;
            }

            $u7 = $str[$i];

            // "&-" stands for a literal ampersand
            if ($u7 == '-') {
                $p .= '&';
                continue;
            }

            // $ch collects the bits of the current 16-bit unit,
            // $k is the shift to apply to the next 6-bit value
            $ch = 0;
            $k  = 10;

            for (; $u7len > 0; $i++, $u7len--) {
                $u7 = $str[$i];

                // 8-bit or non-BASE64 character ends the section
                if ((ord($u7) & 0x80) || ($b = $Index_64[ord($u7)]) == -1) {
                    break;
                }

                if ($k > 0) {
                    $ch |= $b << $k;
                    $k  -= 6;
                }
                else {
                    // The 16-bit unit is complete, write it as UTF-8
                    $ch |= $b >> (-$k);

                    if ($ch < 0x80) {
                        // Printable US-ASCII must not be BASE64-encoded
                        if (0x20 <= $ch && $ch < 0x7f) {
                            return $err;
                        }

                        $p .= chr($ch);
                    }
                    else if ($ch < 0x800) {
                        $p .= chr(0xc0 | ($ch >> 6));
                        $p .= chr(0x80 | ($ch & 0x3f));
                    }
                    else {
                        $p .= chr(0xe0 | ($ch >> 12));
                        $p .= chr(0x80 | (($ch >> 6) & 0x3f));
                        $p .= chr(0x80 | ($ch & 0x3f));
                    }

                    // Carry the leftover low bits of $b over to the next unit
                    $ch = ($b << (16 + $k)) & 0xffff;
                    $k += 10;
                }
            }

            // Non-zero or too many extra bits
            if ($ch || $k < 6) {
                return $err;
            }

            // BASE64 not properly terminated
            if (!$u7len || $u7 != '-') {
                return $err;
            }

            // Adjacent BASE64 sections
            if ($u7len > 2 && $str[$i+1] == '&' && $str[$i+2] != '-') {
                return $err;
            }
        }
        // Not printable US-ASCII
        else if (ord($u7) < 0x20 || ord($u7) >= 0x7f) {
            return $err;
        }
        else {
            $p .= $u7;
        }
    }

    return $p;
}

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

593

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

/**
 * Encode a UTF-8 string as modified UTF-7 (the IMAP mailbox name
 * encoding described in RFC 2060).
 *
 * Printable ASCII (0x20-0x7E) is copied through unchanged, except that
 * a literal '&' is written as "&-". Every other character is written as
 * a 16-bit unit inside a "&...-" run of modified base64. Characters
 * above U+FFFF do not fit into 16 bits and are replaced by U+FFFE.
 *
 * Translated from C to PHP by Thomas Bruederli <roundcube@gmail.com>
 *
 * @param string $str Input string (UTF-8)
 *
 * @return string Output string (UTF7-IMAP), or an empty string
 *                if the input is not valid UTF-8
 */
public static function utf8_to_utf7imap($str)
{
    // Modified base64 alphabet: ',' takes the place of '/'
    $alphabet = 'ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+,';

    // Multi-byte lead bytes as:
    // array(exclusive upper bound, payload mask, number of continuation bytes)
    $lead_classes = array(
        array(0xe0, 0x1f, 1),
        array(0xf0, 0x0f, 2),
        array(0xf8, 0x07, 3),
        array(0xfc, 0x03, 4),
        array(0xfe, 0x01, 5),
    );

    $invalid   = '';
    $remaining = strlen($str);
    $pos       = 0;
    $out       = '';
    $in_base64 = false;
    $carry     = 0;  // bits of the previous unit not yet written out
    $shift     = 10; // right-shift that yields the next 6-bit group

    while ($remaining > 0) {
        $lead = ord($str[$pos]);

        if ($lead < 0x80) {
            // plain ASCII byte
            $code  = $lead;
            $extra = 0;
        }
        else if ($lead < 0xc2 || $lead >= 0xfe) {
            // stray continuation byte, overlong 2-byte lead, or 0xFE/0xFF
            return $invalid;
        }
        else {
            foreach ($lead_classes as $class) {
                if ($lead < $class[0]) {
                    $code  = $lead & $class[1];
                    $extra = $class[2];
                    break;
                }
            }
        }

        $pos++;
        $remaining--;

        // sequence is cut off by the end of the input
        if ($extra > $remaining) {
            return $invalid;
        }

        for ($j = 0; $j < $extra; $j++) {
            $byte = ord($str[$pos + $j]);

            // every continuation byte must look like 10xxxxxx
            if (($byte & 0xc0) != 0x80) {
                return $invalid;
            }

            $code = ($code << 6) | ($byte & 0x3f);
        }

        // reject values that would have fit into a shorter sequence
        if ($extra > 1 && !($code >> ($extra * 5 + 1))) {
            return $invalid;
        }

        $pos       += $extra;
        $remaining -= $extra;

        // Printable ASCII is emitted literally
        if ($code >= 0x20 && $code < 0x7f) {
            if ($in_base64) {
                // flush leftover bits and close the base64 run
                if ($shift > 10) {
                    $out .= $alphabet[$carry];
                }
                $out      .= '-';
                $in_base64 = false;
            }

            $out .= chr($code);

            // '&' opens a base64 run, so a literal one is written as "&-"
            if ($code == 0x26) {
                $out .= '-';
            }

            continue;
        }

        // Everything else is emitted as a 16-bit unit in base64
        if (!$in_base64) {
            $out      .= '&';
            $in_base64 = true;
            $carry     = 0;
            $shift     = 10;
        }

        if ($code & ~0xffff) {
            $code = 0xfffe;
        }

        // the first group combines the pending bits with the top bits of this unit
        $out   .= $alphabet[$carry | ($code >> $shift)];
        $shift -= 6;

        while ($shift >= 0) {
            $out   .= $alphabet[($code >> $shift) & 0x3f];
            $shift -= 6;
        }

        // keep the low bits that did not fill a whole 6-bit group
        $carry  = ($code << (-$shift)) & 0x3f;
        $shift += 16;
    }

    if ($in_base64) {
        if ($shift > 10) {
            $out .= $alphabet[$carry];
        }
        $out .= '-';
    }

    return $out;
}

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

723

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

/**
 * A method to guess character set of a string.
 *
 * Detection steps, first hit wins:
 *  1. Unicode byte order mark at the start of the string
 *  2. NUL-byte pattern of the first four bytes (UTF-16/UTF-32 without BOM)
 *  3. Language-specific charset priority list checked with mb_check_encoding()
 *  4. mb_detect_encoding() over the priority list plus all mbstring encodings
 *  5. UTF-8 validity check of the first 2048 bytes with a regular expression
 *
 * @param string $string   String
 * @param string $failover Default result for failover
 * @param string $language User language
 *
 * @return string Charset name
 */
public static function detect($string, $failover = null, $language = null)
{
    // Byte order marks. The UTF-32LE mark begins with the UTF-16LE one,
    // so the 4-byte marks have to be tested first.
    if (substr($string, 0, 4) == "\0\0\xFE\xFF") return 'UTF-32BE';  // Big Endian
    if (substr($string, 0, 4) == "\xFF\xFE\0\0") return 'UTF-32LE';  // Little Endian
    if (substr($string, 0, 2) == "\xFE\xFF")     return 'UTF-16BE';  // Big Endian
    if (substr($string, 0, 2) == "\xFF\xFE")     return 'UTF-16LE';  // Little Endian
    if (substr($string, 0, 3) == "\xEF\xBB\xBF") return 'UTF-8';

    // heuristics: these look at four bytes, so shorter input is skipped
    // (prevents "Uninitialized string offset" errors and bogus matches)
    if (strlen($string) >= 4) {
        if ($string[0] == "\0" && $string[1] == "\0" && $string[2] == "\0" && $string[3] != "\0") return 'UTF-32BE';
        if ($string[0] != "\0" && $string[1] == "\0" && $string[2] == "\0" && $string[3] == "\0") return 'UTF-32LE';
        if ($string[0] == "\0" && $string[1] != "\0" && $string[2] == "\0" && $string[3] != "\0") return 'UTF-16BE';
        if ($string[0] != "\0" && $string[1] == "\0" && $string[2] != "\0" && $string[3] == "\0") return 'UTF-16LE';
    }

    if (empty($language)) {
        $rcube    = rcube::get_instance();
        $language = $rcube->get_user_language();
    }

    // Prioritize charsets according to current language (#1485669).
    // Stays null for languages without a dedicated list.
    $prio = null;

    switch ($language) {
    case 'ja_JP':
        $prio = array('ISO-2022-JP', 'JIS', 'UTF-8', 'EUC-JP', 'eucJP-win', 'SJIS', 'SJIS-win');
        break;

    case 'zh_CN':
    case 'zh_TW':
        $prio = array('UTF-8', 'BIG-5', 'GB2312', 'EUC-TW');
        break;

    case 'ko_KR':
        $prio = array('UTF-8', 'EUC-KR', 'ISO-2022-KR');
        break;

    case 'ru_RU':
        $prio = array('UTF-8', 'WINDOWS-1251', 'KOI8-R');
        break;

    case 'tr_TR':
        $prio = array('UTF-8', 'ISO-8859-9', 'WINDOWS-1254');
        break;
    }

    // mb_detect_encoding() is not reliable for some charsets (#1490135)
    // use mb_check_encoding() to make charset priority lists really working
    if ($prio && function_exists('mb_check_encoding')) {
        foreach ($prio as $encoding) {
            if (mb_check_encoding($string, $encoding)) {
                return $encoding;
            }
        }
    }

    if (function_exists('mb_detect_encoding')) {
        if (!$prio) {
            $prio = array('UTF-8', 'SJIS', 'GB2312',
                'ISO-8859-1', 'ISO-8859-2', 'ISO-8859-3', 'ISO-8859-4',
                'ISO-8859-5', 'ISO-8859-6', 'ISO-8859-7', 'ISO-8859-8', 'ISO-8859-9',
                'ISO-8859-10', 'ISO-8859-13', 'ISO-8859-14', 'ISO-8859-15', 'ISO-8859-16',
                'WINDOWS-1252', 'WINDOWS-1251', 'EUC-JP', 'EUC-TW', 'KOI8-R', 'BIG-5',
                'ISO-2022-KR', 'ISO-2022-JP',
            );
        }

        // preferred charsets first, then everything else mbstring knows
        $encodings = array_unique(array_merge($prio, mb_list_encodings()));

        if ($encoding = mb_detect_encoding($string, $encodings)) {
            return $encoding;
        }
    }

    // No match, check for UTF-8
    // from http://w3.org/International/questions/qa-forms-utf-8.html
    // NOTE(review): only the first 2048 bytes are tested, so a multi-byte
    // character split at that boundary makes valid UTF-8 fail this check.
    if (preg_match('/\A(
        [\x09\x0A\x0D\x20-\x7E]
        | [\xC2-\xDF][\x80-\xBF]
        | \xE0[\xA0-\xBF][\x80-\xBF]
        | [\xE1-\xEC\xEE\xEF][\x80-\xBF]{2}
        | \xED[\x80-\x9F][\x80-\xBF]
        | \xF0[\x90-\xBF][\x80-\xBF]{2}
        | [\xF1-\xF3][\x80-\xBF]{3}
        | \xF4[\x80-\x8F][\x80-\xBF]{2}
        )*\z/xs', substr($string, 0, 2048))
    ) {
        return 'UTF-8';
    }

    return $failover;
}

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

822

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

/**
 * Removes non-unicode characters from input.
 *
 * Arrays are processed recursively, element by element, with their keys
 * preserved. Values that are not strings, and empty strings, are
 * returned untouched. Strings are filtered with mbstring when available,
 * then iconv, and finally with a byte-by-byte scanner written in PHP.
 *
 * @param mixed $input String or array.
 *
 * @return mixed String or array
 */
public static function clean($input)
{
    // arrays: clean every element, keep the keys
    if (is_array($input)) {
        $cleaned = array();

        foreach ($input as $key => $item) {
            $cleaned[$key] = self::clean($item);
        }

        return $cleaned;
    }

    if (!is_string($input) || $input == '') {
        return $input;
    }

    // iconv/mbstring are much faster (especially with long strings)
    if (function_exists('mb_convert_encoding')) {
        // drop invalid bytes instead of substituting them, then restore the setting
        $previous = mb_substitute_character();
        mb_substitute_character('none');
        $converted = mb_convert_encoding($input, 'UTF-8', 'UTF-8');
        mb_substitute_character($previous);

        if ($converted !== false) {
            return $converted;
        }
    }

    if (function_exists('iconv')) {
        $converted = @iconv('UTF-8', 'UTF-8//IGNORE', $input);

        if ($converted !== false) {
            return $converted;
        }
    }

    // Pure PHP fallback. The pattern accepts exactly one well-formed
    // multi-byte sequence; the leading empty alternative stands where the
    // single-byte (UTF8-1) case would be, as ASCII is handled separately.
    $pattern = '/^(' . implode('|', array(
        '',
        '[\xC2-\xDF][\x80-\xBF]',                       // UTF8-2
        '\xE0[\xA0-\xBF][\x80-\xBF]',                   // UTF8-3
        '[\xE1-\xEC][\x80-\xBF][\x80-\xBF]',            // UTF8-3
        '\xED[\x80-\x9F][\x80-\xBF]',                   // UTF8-3
        '[\xEE-\xEF][\x80-\xBF][\x80-\xBF]',            // UTF8-3
        '\xF0[\x90-\xBF][\x80-\xBF][\x80-\xBF]',        // UTF8-4
        '[\xF1-\xF3][\x80-\xBF][\x80-\xBF][\x80-\xBF]', // UTF8-4
        '\xF4[\x80-\x8F][\x80-\xBF][\x80-\xBF]',        // UTF8-4
    )) . ')$/';

    $result  = '';
    $pending = ''; // multi-byte sequence collected so far
    $length  = strlen($input);

    for ($pos = 0; $pos < $length; $pos++) {
        $byte = $input[$pos];
        $code = ord($byte);

        // continuation byte: extend the open sequence, drop it if there is none
        if ($code > 0x7F && $code < 0xC0) {
            if ($pending !== '') {
                $pending .= $byte;
            }
            continue;
        }

        // an ASCII byte or a new lead byte ends the open sequence;
        // it is kept only when well-formed
        if ($pending !== '') {
            if (preg_match($pattern, $pending)) {
                $result .= $pending;
            }
            $pending = '';
        }

        if ($code <= 0x7F) {
            // 1-byte character
            $result .= $byte;
        }
        else {
            // first byte of multibyte sequence
            $pending = $byte;
        }
    }

    // sequence still open at the end of the input
    if ($pending !== '' && preg_match($pattern, $pending)) {
        $result .= $pending;
    }

    return $result;
}

4681f974d28b vanilla 1.3.3 distro, I hope

Charlie Root

parents:

diff changeset

910 }

Mercurial > hg > rc2

annotate program/lib/Roundcube/rcube_charset.php @ 0:4681f974d28b