ICONV編碼與Windows 代碼頁的對應關係

    // Mapping from Windows code page identifiers (numeric key) to the encoding
    // name understood by iconv. An empty string marks a code page for which no
    // iconv equivalent is known; those rows carry "Yes" in the "Missing in ICONV?"
    // column.
    // NOTE(review): the declaration of `related` is not visible here -- presumably
    // an integer-keyed container of strings; confirm against the enclosing code.
    // NOTE(review): a few identifiers are assigned to more than one code page
    // (e.g. "ISO-2022-JP" for 50220 and 50222, "EUC-JP" for 20932 and 51932), so
    // the table cannot be inverted one-to-one.
    // -------------------------------------------------------------------------------------------------------------------------------------------------
    // codepage     ICONV identifier           Missing in ICONV?       Description
    // -------------------------------------------------------------------------------------------------------------------------------------------------
    related[37]     = "";                   // Yes                     IBM EBCDIC US-Canada
    related[437]    = "CP437";              //                         OEM United States
    related[500]    = "";                   // Yes                     IBM EBCDIC International
    related[708]    = "ISO-8859-6";         //                         Arabic (ASMO 708)
    related[709]    = "";                   // Yes                     Arabic (ASMO-449+, BCON V4)
    related[710]    = "";                   // Yes                     Arabic - Transparent Arabic
    related[720]    = "";                   // Yes                     Arabic (Transparent ASMO); Arabic (DOS)
    related[737]    = "CP737";              //                         OEM Greek (formerly 437G); Greek (DOS)
    related[775]    = "CP775";              //                         OEM Baltic; Baltic (DOS)
    related[850]    = "CP850";              //                         OEM Multilingual Latin 1; Western European (DOS)
    related[852]    = "CP852";              //                         OEM Latin 2; Central European (DOS)
    related[855]    = "CP855";              //                         OEM Cyrillic (primarily Russian)
    related[857]    = "CP857";              //                         OEM Turkish; Turkish (DOS)
    related[858]    = "CP858";              //                         OEM Multilingual Latin 1 + Euro symbol
    related[860]    = "CP860";              //                         OEM Portuguese; Portuguese (DOS)
    related[861]    = "CP861";              //                         OEM Icelandic; Icelandic (DOS)
    related[862]    = "CP862";              //                         OEM Hebrew; Hebrew (DOS)
    related[863]    = "CP863";              //                         OEM French Canadian; French Canadian (DOS)
    related[864]    = "CP864";              //                         OEM Arabic; Arabic (864)
    related[865]    = "CP865";              //                         OEM Nordic; Nordic (DOS)
    related[866]    = "CP866";              //                         OEM Russian; Cyrillic (DOS)
    related[869]    = "CP869";              //                         OEM Modern Greek; Greek, Modern (DOS)
    related[870]    = "";                   // Yes                     IBM EBCDIC Multilingual/ROECE (Latin 2); IBM EBCDIC Multilingual Latin 2
    related[874]    = "CP874";              //                         ANSI/OEM Thai (ISO 8859-11); Thai (Windows)
    related[875]    = "";                   // Yes                     IBM EBCDIC Greek Modern
    related[932]    = "CP932";              //                         ANSI/OEM Japanese; Japanese (Shift-JIS)
    related[936]    = "CP936";              //                         ANSI/OEM Simplified Chinese (PRC, Singapore); Chinese Simplified (GB2312)
    related[949]    = "CP949";              //                         ANSI/OEM Korean (Unified Hangul Code)
    related[950]    = "CP950";              //                         ANSI/OEM Traditional Chinese (Taiwan; Hong Kong SAR, PRC); Chinese Traditional (Big5)
    related[1026]   = "";                   // Yes                     IBM EBCDIC Turkish (Latin 5)
    related[1047]   = "";                   // Yes                     IBM EBCDIC Latin 1/Open System
    related[1140]   = "";                   // Yes                     IBM EBCDIC US-Canada (037 + Euro symbol); IBM EBCDIC (US-Canada-Euro)
    related[1141]   = "";                   // Yes                     IBM EBCDIC Germany (20273 + Euro symbol); IBM EBCDIC (Germany-Euro)
    related[1142]   = "";                   // Yes                     IBM EBCDIC Denmark-Norway (20277 + Euro symbol); IBM EBCDIC (Denmark-Norway-Euro)
    related[1143]   = "";                   // Yes                     IBM EBCDIC Finland-Sweden (20278 + Euro symbol); IBM EBCDIC (Finland-Sweden-Euro)
    related[1144]   = "";                   // Yes                     IBM EBCDIC Italy (20280 + Euro symbol); IBM EBCDIC (Italy-Euro)
    related[1145]   = "";                   // Yes                     IBM EBCDIC Latin America-Spain (20284 + Euro symbol); IBM EBCDIC (Spain-Euro)
    related[1146]   = "";                   // Yes                     IBM EBCDIC United Kingdom (20285 + Euro symbol); IBM EBCDIC (UK-Euro)
    related[1147]   = "";                   // Yes                     IBM EBCDIC France (20297 + Euro symbol); IBM EBCDIC (France-Euro)
    related[1148]   = "";                   // Yes                     IBM EBCDIC International (500 + Euro symbol); IBM EBCDIC (International-Euro)
    related[1149]   = "";                   // Yes                     IBM EBCDIC Icelandic (20871 + Euro symbol); IBM EBCDIC (Icelandic-Euro)
    related[1200]   = "UTF-16LE";           //                         Unicode UTF-16, little endian byte order (BMP of ISO 10646);
    related[1201]   = "UTF-16BE";           //                         Unicode UTF-16, big endian byte order;
    related[1250]   = "CP1250";             //                         ANSI Central European; Central European (Windows)
    related[1251]   = "CP1251";             //                         ANSI Cyrillic; Cyrillic (Windows)
    related[1252]   = "CP1252";             //                         ANSI Latin 1; Western European (Windows)
    related[1253]   = "CP1253";             //                         ANSI Greek; Greek (Windows)
    related[1254]   = "CP1254";             //                         ANSI Turkish; Turkish (Windows)
    related[1255]   = "CP1255";             //                         ANSI Hebrew; Hebrew (Windows)
    related[1256]   = "CP1256";             //                         ANSI Arabic; Arabic (Windows)
    related[1257]   = "CP1257";             //                         ANSI Baltic; Baltic (Windows)
    related[1258]   = "CP1258";             //                         ANSI/OEM Vietnamese; Vietnamese (Windows)
    related[1361]   = "CP1361";             //                         Korean (Johab)
    related[10000]  = "Macintosh";          //                         MAC Roman; Western European (Mac)
    related[10001]  = "";                   // Yes                     Japanese (Mac)
    related[10002]  = "";                   // Yes                     MAC Traditional Chinese (Big5); Chinese Traditional (Mac)
    related[10003]  = "";                   // Yes                     Korean (Mac)
    related[10004]  = "MacArabic";          //                         Arabic (Mac)
    related[10005]  = "MacHebrew";          //                         Hebrew (Mac)
    related[10006]  = "MacGreek";           //                         Greek (Mac)
    related[10007]  = "MacCyrillic";        //                         Cyrillic (Mac)
    related[10008]  = "";                   // Yes                     MAC Simplified Chinese (GB 2312); Chinese Simplified (Mac)
    related[10010]  = "MacRomania";         //                         Romanian (Mac)
    related[10017]  = "MacUkraine";         //                         Ukrainian (Mac)
    related[10021]  = "MacThai";            //                         Thai (Mac)
    related[10029]  = "MacCentralEurope";   //                         MAC Latin 2; Central European (Mac)
    related[10079]  = "MacIceland";         //                         Icelandic (Mac)
    related[10081]  = "MacTurkish";         //                         Turkish (Mac)
    related[10082]  = "MacCroatian";        //                         Croatian (Mac)
    related[12000]  = "UTF-32LE";           //                         Unicode UTF-32, little endian byte order
    related[12001]  = "UTF-32BE";           //                         Unicode UTF-32, big endian byte order
    related[20000]  = "";                   // Yes                     CNS Taiwan; Chinese Traditional (CNS)
    related[20001]  = "";                   // Yes                     TCA Taiwan
    related[20002]  = "";                   // Yes                     Eten Taiwan; Chinese Traditional (Eten)
    related[20003]  = "";                   // Yes                     IBM5550 Taiwan
    related[20004]  = "";                   // Yes                     TeleText Taiwan
    related[20005]  = "";                   // Yes                     Wang Taiwan
    related[20105]  = "";                   // Yes                     IA5 (IRV International Alphabet No. 5, 7-bit); Western European (IA5)
    related[20106]  = "";                   // Yes                     IA5 German (7-bit)
    related[20107]  = "";                   // Yes                     IA5 Swedish (7-bit)
    related[20108]  = "";                   // Yes                     IA5 Norwegian (7-bit)
    related[20127]  = "ASCII";              //                         US-ASCII (7-bit)
    related[20261]  = "";                   // Yes                     T.61
    related[20269]  = "";                   // Yes                     ISO 6937 Non-Spacing Accent
    related[20273]  = "";                   // Yes                     IBM EBCDIC Germany
    related[20277]  = "";                   // Yes                     IBM EBCDIC Denmark-Norway
    related[20278]  = "";                   // Yes                     IBM EBCDIC Finland-Sweden
    related[20280]  = "";                   // Yes                     IBM EBCDIC Italy
    related[20284]  = "";                   // Yes                     IBM EBCDIC Latin America-Spain
    related[20285]  = "";                   // Yes                     IBM EBCDIC United Kingdom
    related[20290]  = "";                   // Yes                     IBM EBCDIC Japanese Katakana Extended
    related[20297]  = "";                   // Yes                     IBM EBCDIC France
    related[20420]  = "";                   // Yes                     IBM EBCDIC Arabic
    related[20423]  = "";                   // Yes                     IBM EBCDIC Greek
    related[20424]  = "";                   // Yes                     IBM EBCDIC Hebrew
    related[20833]  = "";                   // Yes                     IBM EBCDIC Korean Extended
    related[20838]  = "";                   // Yes                     IBM EBCDIC Thai
    related[20866]  = "KOI8-R";             //                         Russian (KOI8-R); Cyrillic (KOI8-R)
    related[20871]  = "";                   // Yes                     IBM EBCDIC Icelandic
    related[20880]  = "";                   // Yes                     IBM EBCDIC Cyrillic Russian
    related[20905]  = "";                   // Yes                     IBM EBCDIC Turkish
    related[20924]  = "";                   // Yes                     IBM EBCDIC Latin 1/Open System (1047 + Euro symbol)
    related[20932]  = "EUC-JP";             //                         Japanese (JIS 0208-1990 and 0212-1990)
    related[20936]  = "GB2312";             //                         Simplified Chinese (GB2312); Chinese Simplified (GB2312-80)
    related[20949]  = "EUC-KR";             //                         Korean Wansung
    related[21025]  = "";                   // Yes                     IBM EBCDIC Cyrillic Serbian-Bulgarian
    related[21027]  = "";                   // Yes                     (deprecated)
    related[21866]  = "KOI8-U";             //                         Ukrainian (KOI8-U); Cyrillic (KOI8-U)
    related[28591]  = "ISO-8859-1";         //                         ISO 8859-1 Latin 1; Western European (ISO)
    related[28592]  = "ISO-8859-2";         //                         ISO 8859-2 Central European; Central European (ISO)
    related[28593]  = "ISO-8859-3";         //                         ISO 8859-3 Latin 3
    related[28594]  = "ISO-8859-4";         //                         ISO 8859-4 Baltic
    related[28595]  = "ISO-8859-5";         //                         ISO 8859-5 Cyrillic
    related[28596]  = "ISO-8859-6";         //                         ISO 8859-6 Arabic
    related[28597]  = "ISO-8859-7";         //                         ISO 8859-7 Greek
    related[28598]  = "ISO-8859-8";         //                         ISO 8859-8 Hebrew; Hebrew (ISO-Visual)
    related[28599]  = "ISO-8859-9";         //                         ISO 8859-9 Turkish
    related[28603]  = "ISO-8859-13";        //                         ISO 8859-13 Estonian
    related[28605]  = "ISO-8859-15";        //                         ISO 8859-15 Latin 9
    related[29001]  = "";                   // Yes                     Europa 3
    related[38598]  = "";                   // Yes                     ISO 8859-8 Hebrew; Hebrew (ISO-Logical)
    related[50220]  = "ISO-2022-JP";        //                         ISO 2022 Japanese with no halfwidth Katakana; Japanese (JIS)
    related[50221]  = "CP50221";            //                         ISO 2022 Japanese with halfwidth Katakana; Japanese (JIS-Allow 1 byte Kana)
    related[50222]  = "ISO-2022-JP";        //                         ISO 2022 Japanese JIS X 0201-1989; Japanese (JIS-Allow 1 byte Kana - SO/SI)
    related[50225]  = "ISO-2022-KR";        //                         ISO 2022 Korean
    related[50227]  = "ISO-2022-CN";        //                         ISO 2022 Simplified Chinese; Chinese Simplified (ISO 2022)
    related[50229]  = "";                   // Yes                     ISO 2022 Traditional Chinese
    related[50930]  = "";                   // Yes                     EBCDIC Japanese (Katakana) Extended
    related[50931]  = "";                   // Yes                     EBCDIC US-Canada and Japanese
    related[50933]  = "";                   // Yes                     EBCDIC Korean Extended and Korean
    related[50935]  = "";                   // Yes                     EBCDIC Simplified Chinese Extended and Simplified Chinese
    related[50936]  = "";                   // Yes                     EBCDIC Simplified Chinese
    related[50937]  = "";                   // Yes                     EBCDIC US-Canada and Traditional Chinese
    related[50939]  = "";                   // Yes                     EBCDIC Japanese (Latin) Extended and Japanese
    related[51932]  = "EUC-JP";             //                         EUC Japanese
    related[51936]  = "EUC-CN";             //                         EUC Simplified Chinese; Chinese Simplified (EUC)
    related[51949]  = "EUC-KR";             //                         EUC Korean
    related[51950]  = "EUC-TW";             //                         EUC Traditional Chinese
    related[52936]  = "HZ";                 //                         HZ-GB2312 Simplified Chinese; Chinese Simplified (HZ)
    related[54936]  = "GB18030";            //                         Windows XP and later: GB18030 Simplified Chinese (4 byte); Chinese Simplified (GB18030)
    related[57002]  = "";                   // Yes                     ISCII Devanagari
    related[57003]  = "";                   // Yes                     ISCII Bangla
    related[57004]  = "";                   // Yes                     ISCII Tamil
    related[57005]  = "";                   // Yes                     ISCII Telugu
    related[57006]  = "";                   // Yes                     ISCII Assamese
    related[57007]  = "";                   // Yes                     ISCII Odia
    related[57008]  = "";                   // Yes                     ISCII Kannada
    related[57009]  = "";                   // Yes                     ISCII Malayalam
    related[57010]  = "";                   // Yes                     ISCII Gujarati
    related[57011]  = "";                   // Yes                     ISCII Punjabi
    related[65000]  = "UTF-7";              //                         Unicode (UTF-7)
    related[65001]  = "UTF-8";              //                         Unicode (UTF-8)

以上是整理的 Windows 所支持的代碼頁(數字)與 iconv 編碼名的對應關係。iconv 不支持 IBM 的 EBCDIC 系列代碼頁;這些代碼頁非常老,基本可以不用再看。但除此之外,還是有一些代碼頁與編碼名對應不上,如果有誰知道更多的信息,請不吝賜教。

 

發表評論
所有評論
還沒有人評論,想成為第一個評論的人麼? 請在上方評論欄輸入並且點擊發布.
相關文章