/* * Code Set Converters for MICO * Copyright (C) 1997 Marcus Mueller & Thomas Holubar * Copyright (c) 1998-2010 by The Mico Team * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Library General Public * License as published by the Free Software Foundation; either * version 2 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Library General Public License for more details. * * You should have received a copy of the GNU Library General Public * License along with this library; if not, write to the Free * Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. * * For more information, visit the MICO Home Page at * http://www.mico.org/ * * date vers. name reason * 97/07/01 0.1 mueller CREATED */ #ifdef __COMO__ #pragma no_pch #endif // __COMO__ #include #include #include #include #include "uni_unicode.h" #include "uni_base64.h" #include "uni_strtypes.h" #include "uni_errors.h" #include "uni_conversion.h" #ifdef _WIN32 #pragma warning (disable: 4305 4309 4244 4018) // pragma warning (default: 4305 ) // turn on #endif // XXX workaround for multibyte char constants #define MBC(a,b,c,d) (((uni_ulong)(a)<<24) | ((uni_ulong)(b)<<16) | \ ((uni_ulong)(c)<< 8) | (uni_ulong)(d)) static const uni_ushort ebc2uniArray[] = /* beginning with 0x20 (32) */ { '\0', '\0', '\0', '\0', '\0', '\0', '\0', '\0', /* 0x20-0x27 ( 32- 39) */ '\0', '\0', '\0', '\0', '\0', '\0', '\0', '\0', /* 0x28-0x2F ( 40- 47) */ '\0', '\0', '\0', '\0', '\0', '\0', '\0', '\0', /* 0x30-0x37 ( 48- 55) */ '\0', '\0', '\0', '\0', '\0', '\0', '\0', '\0', /* 0x38-0x3F ( 56- 63) */ ' ' , '\0', '\0', '\0', '\0', '\0', '\0', '\0', /* 0x40-0x47 ( 64- 71) */ '\0', '\0', 0xA2, '.' , '<' , '(' , '+' , '|' , /* 0x48-0x4F ( 72- 79) */ '&' , '\0', '\0', '\0', '\0', '\0', '\0', '\0', /* 0x50-0x57 ( 80- 87) */ '\0', '\0', '!' , '$' , '*' , ')' , ';' , 0xAC, /* 0x58-0x5F ( 88- 95) */ '-' , '/' , '\0', '\0', '\0', '\0', '\0', '\0', /* 0x60-0x67 ( 96-103) */ '\0', '\0', '|' , ',' , '%' , '_' , '>' , '?' , /* 0x68-0x6F (104-111) */ '\0', '\0', '\0', '\0', '\0', '\0', '\0', '\0', /* 0x70-0x77 (112-119) */ '\0', '\0', ':' , '#' , '@' , 0x27, '=' , 0x22, /* 0x78-0x7F (120-127) */ '\0', 'a' , 'b' , 'c' , 'd' , 'e' , 'f' , 'g' , /* 0x80-0x87 (128-135) */ 'h' , 'i' , '\0', '{' , '\0', '\0', '\0', '\0', /* 0x88-0x8F (126-143) */ '\0', 'j' , 'k' , 'l' , 'm' , 'n' , 'o' , 'p' , /* 0x90-0x97 (144-151) */ 'q' , 'r' , '\0', '}' , '\0', '\0', '\0', '\0', /* 0x98-0x9F (152-159) */ '\0', 0xDF, 's' , 't' , 'u' , 'v' , 'w' , 'x' , /* 0xA0-0xA7 (160-167) */ 'y' , 'z' , '\0', '\0', '\0', '\0', '\0', '\0', /* 0xA8-0xAF (168-175) */ '\0', '\0', '\0', '\0', '\0', '\0', '\0', '\0', /* 0xB0-0xB7 (176-183) */ '\0', '\0', '\0', '\0', '\0', '\0', '\0', '\0', /* 0xB8-0xBF (184-191) */ '{' , 'A' , 'B' , 'C' , 'D' , 'E' , 'F' , 'G' , /* 0xC0-0xC7 (192-199) */ 'H' , 'I' , '\0', '\0', '\0', '\0', '\0', '\0', /* 0xC8-0xCF (200-207) */ '}' , 'J' , 'K' , 'L' , 'M' , 'N' , 'O' , 'P' , /* 0xD0-0xD7 (208-215) */ 'Q' , 'R' , '\0', '\0', '\0', '\0', '\0', '\0', /* 0xD8-0xDF (216-223) */ '\0', 0xDF, 'S' , 'T' , 'U' , 'V' , 'W' , 'X' , /* 0xE0-0xE7 (224-231) */ 'Y' , 'Z' , '\0', '\0', '\0', '\0', '\0', '\0', /* 0xE8-0xEF (232-239) */ '0' , '1' , '2' , '3' , '4' , '5' , '6' , '7' , /* 0xF0-0xF7 (240-247) */ '8' , '9' , '0' , '|' , '\0', '\0', '\0', '\0' /* 0xF8-0xFF (248-255) */ /* not std-EBCDIC are: 0x6A (|) , 0x6B (,), 0x8B ({), 0x9B (}), 0xA1 (0xDF), 0xC0 ({), 0xD0 (}), 0xE1 (0xDF) */ }; const uni_ushort iso22uniArray[] = /* beginning with 0xA0 (160) */ { 0xA0 , 0x0104, 0x02D8, 0x0141, /* 0xA0-0xA3 (160-163) */ 0xA4 , 0x013D, 0x015A, 0xA7 , /* 0xA4-0xA7 (164-167) */ 0xA8 , 0x0160, 0x015E, 0x0164, /* 0xA8-0xAB (168-171) */ 0x0179, 0xAD , 0x017D, 0x017B, /* 0xAC-0xAF (172-175) */ 0xB0 , 0x0105, 0x02DB, 0x0142, /* 0xB0-0xB3 (176-179) */ 0xB4 , 0x013E, 0x015B, 0x02C7, /* 0xB4-0xB7 (180-183) */ 0xB8 , 0x0161, 0x015F, 0x0165, /* 0xB8-0xBB (184-187) */ 0x017A, 0x02DD, 0x017E, 0x0176, /* 0xBC-0xBF (188-191) */ 0x0154, 0xC1 , 0xC2 , 0x0102, /* 0xC0-0xC3 (192-195) */ 0xC4 , 0x0139, 0x0106, 0xC7 , /* 0xC4-0xC7 (196-199) */ 0x010C, 0xC9 , 0x0118, 0xCB , /* 0xC8-0xCB (200-203) */ 0x011A, 0xCD , 0xCE , 0x010E, /* 0xCC-0xCF (204-207) */ 0x0110, 0x0143, 0x0147, 0xD3 , /* 0xD0-0xD3 (208-211) */ 0xD4 , 0x0150, 0xD6 , 0xD7 , /* 0xD8-0xD7 (202-215) */ 0x0154, 0x016E, 0xDA , 0x0170, /* 0xD8-0xDB (216-219) */ 0xDC , 0xDD , 0x0162, 0xDF , /* 0xDC-0xDF (220-223) */ 0x0155, 0xE1 , 0xE2 , 0x0103, /* 0xE0-0xE3 (224-227) */ 0xE4 , 0x013A, 0x0107, 0xE7 , /* 0xE4-0xE7 (228-231) */ 0x010D, 0xE9 , 0x0119, 0xEB , /* 0xE8-0xEB (232-235) */ 0x011B, 0xED , 0xEE , 0x010F, /* 0xEC-0xEF (236-239) */ 0x0111, 0x0144, 0x0148, 0xF3 , /* 0xF0-0xF3 (240-243) */ 0xF4 , 0x0151, 0xF6 , 0xF7 , /* 0xF4-0xF7 (244-247) */ 0x0159, 0x016F, 0xFA , 0x0171, /* 0xF8-0xFB (248-251) */ 0xFC , 0xFD , 0x0163, 0x02D9 /* 0xFC-0xFF (252-255) */ }; const uni_ushort iso32uniArray[] = /* beginning with 0xA0 (160) */ { 0xA0 , 0x0126, 0x02D8, 0xA3 , /* 0xA0-0xA3 (160-163) */ 0xA4 , '\0' , 0x0124, 0xA7 , /* 0xA4-0xA7 (164-167) */ 0xA8 , 0x0130, 0x015E, 0x011E, /* 0xA8-0xAB (168-171) */ 0x0134, 0xAD , '\0' , 0x017B, /* 0xAC-0xAF (172-175) */ 0xB0 , 0x0127, 0xB2 , 0xB3 , /* 0xB0-0xB3 (176-179) */ 0xB4 , 0xB5 , 0x0125, 0xB7 , /* 0xB4-0xB7 (180-183) */ 0xB8 , 0x0131, 0x015F, 0x011F, /* 0xB8-0xBB (184-187) */ 0x0135, 0xBD , '\0' , 0x017C, /* 0xBC-0xBF (188-191) */ 0xC0 , 0xC1 , 0xC2 , '\0' , /* 0xC0-0xC3 (192-195) */ 0xC4 , 0x010A, 0x0108, 0xC7 , /* 0xC4-0xC7 (196-199) */ 0xC8 , 0xC9 , 0xCA , 0xCB , /* 0xC8-0xCB (200-203) */ 0xCC , 0xCD , 0xCE , 0xCF , /* 0xCC-0xCF (204-207) */ '\0' , 0xD1 , 0xD2 , 0xD3 , /* 0xD0-0xD3 (208-211) */ 0xD4 , 0x0120, 0xD6 , 0xD7 , /* 0xD8-0xD7 (202-215) */ 0x011C, 0xD9 , 0xDA , 0xDB , /* 0xD8-0xDB (216-219) */ 0xDC , 0x016C, 0x015C, 0xDF , /* 0xDC-0xDF (220-223) */ 0xE0 , 0xE1 , 0xE2 , '\0' , /* 0xE0-0xE3 (224-227) */ 0xE4 , 0x010B, 0x0109, 0xE7 , /* 0xE4-0xE7 (228-231) */ 0xE8 , 0xE9 , 0xEA , 0xEB , /* 0xE8-0xEB (232-235) */ 0xEC , 0xED , 0xEE , 0xEF , /* 0xEC-0xEF (236-239) */ '\0' , 0xF1 , 0xF2 , 0xF3 , /* 0xF0-0xF3 (240-243) */ 0xF4 , 0x0121, 0xF6 , 0xF7 , /* 0xF4-0xF7 (244-247) */ 0x011D, 0xF9 , 0xFA , 0xFB , /* 0xF8-0xFB (248-251) */ 0xFC , 0x016D, 0x015D, 0x02D9 /* 0xFC-0xFF (252-255) */ }; const uni_ushort iso42uniArray[] = /* beginning with 0xA0 (160) */ { 0xA0 , 0x0104, 0x0138, 0x0156, /* 0xA0-0xA3 (160-163) */ 0xA4 , 0x0128, 0x013B, 0xA7 , /* 0xA4-0xA7 (164-167) */ 0xA8 , 0x0160, 0x0112, 0x0122, /* 0xA8-0xAB (168-171) */ 0x0166, 0xAD , 0x017D, 0x02C9, /* 0xAC-0xAF (172-175) */ 0xB0 , 0x0105, 0x02DB, 0x0157, /* 0xB0-0xB3 (176-179) */ 0xB4 , 0x0129, 0x013C, 0x02C7, /* 0xB4-0xB7 (180-183) */ 0xB8 , 0x0161, 0x0113, 0x0123, /* 0xB8-0xBB (184-187) */ 0x0167, 0x014A, 0x017E, 0x014B, /* 0xBC-0xBF (188-191) */ 0x0100, 0xC1 , 0xC2 , 0xC3 , /* 0xC0-0xC3 (192-195) */ 0xC4 , 0xC5 , 0xC6 , 0x012E, /* 0xC4-0xC7 (196-199) */ 0x010C, 0xC9 , 0x0118, 0xCB , /* 0xC8-0xCB (200-203) */ 0x0116, 0xCD , 0xCE , 0x012A, /* 0xCC-0xCF (204-207) */ 0x0110, 0x0145, 0x014C, 0x0136, /* 0xD0-0xD3 (208-211) */ 0xD4 , 0xD5 , 0xD6 , 0xD7 , /* 0xD8-0xD7 (202-215) */ 0xD8 , 0x0172, 0xDA , 0xDB , /* 0xD8-0xDB (216-219) */ 0xDC , 0x0168, 0x016A, 0xDF , /* 0xDC-0xDF (220-223) */ 0x0101, 0xE1 , 0xE2 , 0xE3 , /* 0xE0-0xE3 (224-227) */ 0xE4 , 0xE5 , 0xE6 , 0x012F, /* 0xE4-0xE7 (228-231) */ 0x010D, 0xE9 , 0x0119, 0xEB , /* 0xE8-0xEB (232-235) */ 0x0117, 0xED , 0xEE , 0x012B, /* 0xEC-0xEF (236-239) */ 0x0111, 0x0146, 0x014D, 0x0137, /* 0xF0-0xF3 (240-243) */ 0xF4 , 0xF5 , 0xF6 , 0xF7 , /* 0xF4-0xF7 (244-247) */ 0xF8 , 0x0173, 0xFA , 0xFB , /* 0xF8-0xFB (248-251) */ 0xFC , 0x0169, 0x016B, 0x02D9 /* 0xFC-0xFF (252-255) */ }; static const uni_ushort koi2uniArray[] = /* beginning with 0x80 (128) */ { 0x2500, 0x2502, 0x250C, 0x2510, /* 0x80-0x83 (128-131) */ 0x2514, 0x2518, 0x251C, 0x2524, /* 0x84-0x87 (132-135) */ 0x252C, 0x2534, 0x253C, 0x2580, /* 0x88-0x8B (136-139) */ 0x2584, 0x2588, 0x258C, 0x2590, /* 0x8C-0x8F (140-143) */ 0x2591, 0x2592, 0x2593, 0x2320, /* 0x90-0x93 (144-147) */ 0x220E, 0x2219, 0x221A, 0x2248, /* 0x94-0x97 (148-151) */ 0x2264, 0x2265, 0xA0 , 0x2321, /* 0x98-0x9B (152-155) */ 0xB0 , 0xB2 , 0xB7 , 0xF7 , /* 0x9C-0x9F (156-159) */ 0x2550, 0x2551, 0x2552, 0x0451, /* 0xA0-0xA3 (160-163) */ 0x2553, 0x2554, 0x2555, 0x2556, /* 0xA4-0xA7 (164-167) */ 0x2557, 0x2558, 0x2559, 0x255A, /* 0xA8-0xAB (168-171) */ 0x255B, 0x255C, 0x255D, 0x255E, /* 0xAC-0xAF (172-175) */ 0x255F, 0x2560, 0x2561, 0x0401, /* 0xB0-0xB3 (176-179) */ 0x2562, 0x2563, 0x2564, 0x2565, /* 0xB4-0xB7 (180-183) */ 0x2565, 0x2567, 0x2568, 0x2569, /* 0xB8-0xBB (184-187) */ 0x256A, 0x256B, 0x256C, 0xA9 , /* 0xBC-0xBF (188-191) */ 0x044E, 0x0430, 0x0431, 0x0446, /* 0xC0-0xC3 (192-195) */ 0x0434, 0x0435, 0x0444, 0x0433, /* 0xC4-0xC7 (196-199) */ 0x0445, 0x0438, 0x0439, 0x043A, /* 0xC8-0xCB (200-203) */ 0x043B, 0x043C, 0x043D, 0x043E, /* 0xCC-0xCF (204-207) */ 0x043F, 0x044F, 0x0440, 0x0441, /* 0xD0-0xD3 (208-211) */ 0x0442, 0x0443, 0x0436, 0x0432, /* 0xD8-0xD7 (202-215) */ 0x044C, 0x044B, 0x0437, 0x0448, /* 0xD8-0xDB (216-219) */ 0x044D, 0x0449, 0x0447, 0x044A, /* 0xDC-0xDF (220-223) */ 0x042E, 0x0410, 0x0411, 0x0426, /* 0xE0-0xE3 (224-227) */ 0x0414, 0x0415, 0x0424, 0x0413, /* 0xE4-0xE7 (228-231) */ 0x0425, 0x0418, 0x0419, 0x041A, /* 0xE8-0xEB (232-235) */ 0x041B, 0x041C, 0x041D, 0x041E, /* 0xEC-0xEF (236-239) */ 0x041F, 0x042F, 0x0420, 0x0421, /* 0xF0-0xF3 (240-243) */ 0x0422, 0x0423, 0x0416, 0x0412, /* 0xF4-0xF7 (244-247) */ 0x042C, 0x042B, 0x0417, 0x0428, /* 0xF8-0xFB (248-251) */ 0x042D, 0x0429, 0x0427, 0x042A /* 0xFC-0xFF (252-255) */ }; static const uni_ushort iso72uniArray[] = /* beginning with 0xA0 (160) */ { 0xA0 , 0x02BD, 0x02BC, 0xA3 , /* 0xA0-0xA3 (160-163) */ '\0' , '\0' , 0xA6 , 0xA7 , /* 0xA4-0xA7 (164-167) */ 0xA8 , 0xA9 , '\0' , 0xAB , /* 0xA8-0xAB (168-171) */ 0xAC , 0xAD , '\0' , 0xAF , /* 0xAC-0xAF (172-175) */ 0xB0 , 0xB1 , 0xB2 , 0xB3 , /* 0xB0-0xB3 (176-179) */ 0xB4 , 0x0385, 0x0386, 0xB7 , /* 0xB4-0xB7 (180-183) */ 0x0388, 0x0389, 0x038A, 0xBB , /* 0xB8-0xBB (184-187) */ 0x038C, 0xBD , 0x038E, 0x038F /* 0xBC-0xBF (188-191) */ }; const uni_ushort iso102uniArray[] = /* beginning with 0xA0 (160) */ { 0xA0 , 0x0104, 0x0112, 0x0122, /* 0xA0-0xA3 (160-163) */ 0x012A, 0x0128, 0x0136, 0xA7 , /* 0xA4-0xA7 (164-167) */ 0x0138, 0x0110, 0x0160, 0x0166, /* 0xA8-0xAB (168-171) */ 0x017D, 0x0335, 0x016A, 0x014A, /* 0xAC-0xAF (172-175) */ 0xB0 , 0x0105, 0x0113, 0x0123, /* 0xB0-0xB3 (176-179) */ 0x012B, 0x0129, 0x0137, 0xB7 , /* 0xB4-0xB7 (180-183) */ 0x013C, 0x0111, 0x0161, 0x0167, /* 0xB8-0xBB (184-187) */ 0x017E, 0x0336, 0x016B, 0x014B, /* 0xBC-0xBF (188-191) */ 0x0100, 0xC1 , 0xC2 , 0xC3 , /* 0xC0-0xC3 (192-195) */ 0xC4 , 0xC5 , 0xC6 , 0x012E, /* 0xC4-0xC7 (196-199) */ 0x010C, 0xC9 , 0x0118, 0xCB , /* 0xC8-0xCB (200-203) */ 0x0116, 0xCD , 0xCE , 0xCF , /* 0xCC-0xCF (204-207) */ 0xD0 , 0x0145, 0x014C, 0xD3 , /* 0xD0-0xD3 (208-211) */ 0xD4 , 0xD5 , 0xD6 , 0x0168, /* 0xD8-0xD7 (202-215) */ 0xD8 , 0x0172, 0xDA , 0xDB , /* 0xD8-0xDB (216-219) */ 0xDC , 0xDD , 0xDE , 0xDF , /* 0xDC-0xDF (220-223) */ 0x0101, 0xE1 , 0xE2 , 0xE3 , /* 0xE0-0xE3 (224-227) */ 0xE4 , 0xE5 , 0xE6 , 0x012F, /* 0xE4-0xE7 (228-231) */ 0x010D, 0xE9 , 0x0119, 0xEB , /* 0xE8-0xEB (232-235) */ 0x0117, 0xED , 0xEE , 0xEF , /* 0xEC-0xEF (236-239) */ 0xF0 , 0x0146, 0x014D, 0xF3 , /* 0xF0-0xF3 (240-243) */ 0xF4 , 0xF5 , 0xF6 , 0x0169, /* 0xF4-0xF7 (244-247) */ 0xF8 , 0x0173, 0xFA , 0xFB , /* 0xF8-0xFB (248-251) */ 0xFC , 0xFD , 0xFE , 0x0138 /* 0xFC-0xFF (252-255) */ }; static const uni_ushort win2uniArray[] = /* beginning with 0x80 (128) */ { '\0' , '\0' , 0x201A, 0x0192, /* 0x80-0x83 (128-131) */ 0x201E, 0x2026, 0x2020, 0x2021, /* 0x84-0x87 (132-135) */ 0x02C6, 0x2031, 0x0160, 0x2039, /* 0x88-0x8B (136-139) */ 0x0152, '\0' , '\0' , '\0' , /* 0x8C-0x8F (140-143) */ '\0' , 0x2018, 0x2019, 0x201C, /* 0x90-0x93 (144-147) */ 0x201D, 0x200E, 0x2013, 0x2014, /* 0x94-0x97 (148-151) */ 0x02DC, 0x2122, 0x0161, 0x20A0, /* 0x98-0x9B (152-155) */ 0x0153, '\0' , '\0' , 0x0118 /* 0x9C-0x9F (156-159) */ }; static const uni_ushort ibm2uniArray[] = /* beginning with 0x00 (0) */ { 0xFF , 0x263A, 0x263B, 0x2665, /* 0x00-0x03 ( 0- 3) */ 0x2666, 0x2663, 0x2660, 0x07 , /* 0x04-0x07 ( 4- 7) */ 0x08 , 0x09 , 0x0A , 0x0B , /* 0x08-0x0B ( 8- 11) */ 0x0C , 0x0D , 0x0E , 0x0F , /* 0x0C-0x0F ( 12- 15) */ 0x25B6, 0x25C0, 0x2195, 0x203C, /* 0x10-0x13 ( 16- 19) */ 0xB6 , 0xA7 , 0x2583, 0x21A8, /* 0x14-0x17 ( 20- 23) */ 0x2191, 0x2193, 0x2192, 0x2190, /* 0x18-0x1B ( 24- 27) */ 0x2319, 0x2194, 0x25B2, 0x25BC, /* 0x1C-0x1F ( 28- 31) */ }; const uni_ushort ibm4372uniArray[] = /* beginning with 0x80 (128) */ { 0xC7 , 0xFC , 0xE9 , 0xE2 , /* 0x80-0x83 (128-131) */ 0xE4 , 0xE0 , 0xE5 , 0xE7 , /* 0x84-0x87 (132-135) */ 0xEA , 0xEB , 0xE8 , 0xEF , /* 0x88-0x8B (136-139) */ 0xEE , 0xEC , 0xC4 , 0xC5 , /* 0x8C-0x8F (140-143) */ 0xC9 , 0xE6 , 0xC6 , 0xF4 , /* 0x90-0x93 (144-147) */ 0xF6 , 0xF2 , 0xFB , 0xF9 , /* 0x94-0x97 (148-151) */ 0xFF , 0xD6 , 0xDC , 0xA2 , /* 0x98-0x9B (152-155) */ 0xA3 , 0xA5 , '\0' , 0x0192, /* 0x9C-0x9F (156-159) */ 0xE1 , 0xED , 0xF3 , 0xFA , /* 0xA0-0xA3 (160-163) */ 0xF1 , 0xD1 , 0xAA , 0xBA , /* 0xA4-0xA7 (164-167) */ 0xBF , 0x2310, 0xAC , 0xBD , /* 0xA8-0xAB (168-171) */ 0xBC , 0xA1 , 0xAB , 0xBB , /* 0xAC-0xAF (172-175) */ 0x2591, 0x2592, 0x2593, 0x2502, /* 0xB0-0xB3 (176-179) */ 0x2524, 0x2561, 0x2562, 0x2556, /* 0xB4-0xB7 (180-183) */ 0x2555, 0x2563, 0x2551, 0x2557, /* 0xB8-0xBB (184-187) */ 0x255D, 0x255C, 0x255B, 0x2510, /* 0xBC-0xBF (188-191) */ 0x2514, 0x2534, 0x252C, 0x251C, /* 0xC0-0xC3 (192-195) */ 0x2520, 0x253C, 0x255E, 0x255F, /* 0xC4-0xC7 (196-199) */ 0x255A, 0x2554, 0x2569, 0x2566, /* 0xC8-0xCB (200-203) */ 0x2560, 0x2550, 0x256C, 0x2567, /* 0xCC-0xCF (204-207) */ 0x2568, 0x2561, 0x2565, 0x2559, /* 0xD0-0xD3 (208-211) */ 0x2558, 0x2552, 0x2553, 0x256B, /* 0xD8-0xD7 (202-215) */ 0x256A, 0x2518, 0x250C, 0x2588, /* 0xD8-0xDB (216-219) */ 0x2584, 0x258C, 0x2590, 0x2580, /* 0xDC-0xDF (220-223) */ 0x03B1, 0xDF , 0x0393, 0x03A0, /* 0xE0-0xE3 (224-227) */ 0x03A3, 0x03C3, 0xB5 , 0x03D2, /* 0xE4-0xE7 (228-231) */ 0x03A6, 0x0398, 0x03A9, 0x03B4, /* 0xE8-0xEB (232-235) */ 0x221E, 0x2205, 0x2208, 0x2229, /* 0xEC-0xEF (236-239) */ 0x2261, 0xB1 , 0x2265, 0x2264, /* 0xF0-0xF3 (240-243) */ 0x2320, 0x2321, 0xF7 , 0x2248, /* 0xF4-0xF7 (244-247) */ 0xB0 , 0xB7 , 0x2219, 0x221A, /* 0xF8-0xFB (248-251) */ 0x03B7, 0xB2 , 0x220E, 0xA0 /* 0xFC-0xFF (252-255) */ }; const uni_ushort ibm8502uniArray[] = /* beginning with 0x80 (128) */ { 0xC7 , 0xFC , 0xE9 , 0xE2 , /* 0x80-0x83 (128-131) */ 0xE4 , 0xE0 , 0xE5 , 0xE7 , /* 0x84-0x87 (132-135) */ 0xEA , 0xEB , 0xE8 , 0xEF , /* 0x88-0x8B (136-139) */ 0xEE , 0xEC , 0xC4 , 0xC5 , /* 0x8C-0x8F (140-143) */ 0xC9 , 0xE6 , 0xC6 , 0xF4 , /* 0x90-0x93 (144-147) */ 0xF6 , 0xF2 , 0xFB , 0xF9 , /* 0x94-0x97 (148-151) */ 0xFF , 0xD6 , 0xDC , 0xF8 , /* 0x98-0x9B (152-155) */ 0xA3 , 0xD8 , 0xD7 , 0x0192, /* 0x9C-0x9F (156-159) */ 0xE1 , 0xED , 0xF3 , 0xFA , /* 0xA0-0xA3 (160-163) */ 0xF1 , 0xD1 , 0xAA , 0xBA , /* 0xA4-0xA7 (164-167) */ 0xBF , 0xAE , 0xAC , 0xBD , /* 0xA8-0xAB (168-171) */ 0xBC , 0xA1 , 0xAB , 0xBB , /* 0xAC-0xAF (172-175) */ 0x2591, 0x2592, 0x2593, 0x2502, /* 0xB0-0xB3 (176-179) */ 0x2524, 0xC1 , 0xC2 , 0xC0 , /* 0xB4-0xB7 (180-183) */ 0xA9 , 0x2563, 0x2551, 0x2557, /* 0xB8-0xBB (184-187) */ 0x255D, 0xA2 , 0xA5 , 0x2510, /* 0xBC-0xBF (188-191) */ 0x2514, 0x2534, 0x252C, 0x251C, /* 0xC0-0xC3 (192-195) */ 0x2520, 0x253C, 0xE3 , 0xC3 , /* 0xC4-0xC7 (196-199) */ 0x255A, 0x2554, 0x2569, 0x2566, /* 0xC8-0xCB (200-203) */ 0x2560, 0x2550, 0x256C, 0xA4 , /* 0xCC-0xCF (204-207) */ 0xF0 , 0xD0 , 0xCA , 0xCB , /* 0xD0-0xD3 (208-211) */ 0xC8 , 0xB9 , 0xCD , 0xCE , /* 0xD8-0xD7 (202-215) */ 0xCF , 0x2518, 0x250C, 0x2588, /* 0xD8-0xDB (216-219) */ 0x2584, 0xA6 , 0xCC , 0x2580, /* 0xDC-0xDF (220-223) */ 0xD3 , 0xDF , 0xD4 , 0xD2 , /* 0xE0-0xE3 (224-227) */ 0xF5 , 0xD5 , 0xB5 , 0xF4 , /* 0xE4-0xE7 (228-231) */ 0xDE , 0xDA , 0x0155, 0x0170, /* 0xE8-0xEB (232-235) */ 0xFD , 0xDD , 0x0163, 0xB4 , /* 0xEC-0xEF (236-239) */ 0xAD , 0x02DD, 0x02DB, 0x02C7, /* 0xF0-0xF3 (240-243) */ 0x02D8, 0xA7 , 0xF7 , 0xD8 , /* 0xF4-0xF7 (244-247) */ 0xB0 , 0xA8 , 0x2219, 0x0171, /* 0xF8-0xFB (248-251) */ 0x0158, 0x0159, 0x220E, 0xA0 /* 0xFC-0xFF (252-255) */ }; const uni_ushort ibm8522uniArray[] = /* beginning with 0x80 (128) */ { 0xC7 , 0xFC , 0xE9 , 0xE2 , /* 0x80-0x83 (128-131) */ 0xE4 , 0x016F, 0x0107, 0xE7 , /* 0x84-0x87 (132-135) */ 0x0142, 0xEB , 0x0150, 0x0151, /* 0x88-0x8B (136-139) */ 0xEE , 0x0179, 0xC4 , 0x0106, /* 0x8C-0x8F (140-143) */ 0xC9 , 0x0139, 0x013A, 0xF4 , /* 0x90-0x93 (144-147) */ 0xF6 , 0x013D, 0x013E, 0x015A, /* 0x94-0x97 (148-151) */ 0x015B, 0xD6 , 0xDC , 0x0164, /* 0x98-0x9B (152-155) */ 0x0165, 0x0141, 0xD7 , 0x010D, /* 0x9C-0x9F (156-159) */ 0xE1 , 0xED , 0xF3 , 0xFA , /* 0xA0-0xA3 (160-163) */ 0x0104, 0x0105, 0x017D, 0x017E, /* 0xA4-0xA7 (164-167) */ 0x0118, 0x0119, 0xA0 , 0x017A, /* 0xA8-0xAB (168-171) */ 0x010C, 0x015F, 0xAB , 0xBB , /* 0xAC-0xAF (172-175) */ 0x2591, 0x2592, 0x2593, 0x2502, /* 0xB0-0xB3 (176-179) */ 0x2524, 0xC1 , 0xC2 , 0x011A, /* 0xB4-0xB7 (180-183) */ 0x015E, 0x2563, 0x2551, 0x2557, /* 0xB8-0xBB (184-187) */ 0x255D, 0x017B, 0x017C, 0x2510, /* 0xBC-0xBF (188-191) */ 0x2514, 0x2534, 0x252C, 0x251C, /* 0xC0-0xC3 (192-195) */ 0x2520, 0x253C, 0x0102, 0x0103, /* 0xC4-0xC7 (196-199) */ 0x255A, 0x2554, 0x2569, 0x2566, /* 0xC8-0xCB (200-203) */ 0x2560, 0x2550, 0x256C, 0xA4 , /* 0xCC-0xCF (204-207) */ 0x0111, 0x0110, 0x010E, 0xCB , /* 0xD0-0xD3 (208-211) */ 0x010F, 0x0147, 0xCD , 0xCE , /* 0xD8-0xD7 (202-215) */ 0x011B, 0x2518, 0x250C, 0x2588, /* 0xD8-0xDB (216-219) */ 0x2584, 0x0162, 0x016E, 0x2580, /* 0xDC-0xDF (220-223) */ 0xD3 , 0xDF , 0xD4 , 0x0143, /* 0xE0-0xE3 (224-227) */ 0x0144, 0x0148, 0x0160, 0x0161, /* 0xE4-0xE7 (228-231) */ 0x0154, 0xDA , 0x0155, 0x0170, /* 0xE8-0xEB (232-235) */ 0xFD , 0xDD , 0x0163, 0xB4 , /* 0xEC-0xEF (236-239) */ 0xAD , 0x02DD, 0x02DB, 0x02C7, /* 0xF0-0xF3 (240-243) */ 0x02D8, 0xA7 , 0xF7 , 0xD8 , /* 0xF4-0xF7 (244-247) */ 0xB0 , 0xA8 , 0x2219, 0x0171, /* 0xF8-0xFB (248-251) */ 0x0158, 0x0159, 0x220E, 0xA0 /* 0xFC-0xFF (252-255) */ }; const uni_ushort ibm8602uniArray[] = /* beginning with 0x80 (128) */ { 0xC7 , 0xFC , 0xE9 , 0xE2 , /* 0x80-0x83 (128-131) */ 0xE3 , 0xE0 , 0xC1 , 0xE7 , /* 0x84-0x87 (132-135) */ 0xEA , 0xCA , 0xE8 , 0xCD , /* 0x88-0x8B (136-139) */ 0xD4 , 0xEC , 0xC3 , 0xC2 , /* 0x8C-0x8F (140-143) */ 0xC9 , 0xC0 , 0xC8 , 0xF4 , /* 0x90-0x93 (144-147) */ 0xF5 , 0xF2 , 0xDA , 0xF9 , /* 0x94-0x97 (148-151) */ 0xCC , 0xD5 , 0xDC , 0xA2 , /* 0x98-0x9B (152-155) */ 0xA3 , 0xD9 , '\0' , 0xD3 , /* 0x9C-0x9F (156-159) */ 0xE1 , 0xED , 0xF3 , 0xFA , /* 0xA0-0xA3 (160-163) */ 0xF1 , 0xD1 , 0xAA , 0xBA , /* 0xA4-0xA7 (164-167) */ 0xBF , 0xD2 , 0xAC , 0xBD , /* 0xA8-0xAB (168-171) */ 0xBC , 0xA1 , 0xAB , 0xBB /* 0xAC-0xAF (172-175) */ }; const uni_ushort ibm8632uniArray[] = /* beginning with 0x80 (128) */ { 0xC7 , 0xFC , 0xE9 , 0xE2 , /* 0x80-0x83 (128-131) */ 0xC2 , 0xE0 , 0xB6 , 0xE7 , /* 0x84-0x87 (132-135) */ 0xEA , 0xEB , 0xE8 , 0xEF , /* 0x88-0x8B (136-139) */ 0xEE , 0x3D , 0xC0 , 0xA7 , /* 0x8C-0x8F (140-143) */ 0xC9 , 0xC8 , 0xCA , 0xF4 , /* 0x90-0x93 (144-147) */ 0xCB , 0xCF , 0xFB , 0xFA , /* 0x94-0x97 (148-151) */ 0xA4 , 0xD4 , 0xDC , 0xA2 , /* 0x98-0x9B (152-155) */ 0xA3 , 0xD9 , 0xDB , '\0' , /* 0x9C-0x9F (156-159) */ 0xA6 , 0xB4 , 0xF3 , 0xFA , /* 0xA0-0xA3 (160-163) */ 0xA8 , 0xB8 , 0xB3 , 0xAF , /* 0xA4-0xA7 (164-167) */ 0xCE , 0x2310, 0xAC , 0xBD , /* 0xA8-0xAB (168-171) */ 0xBC , 0xBE , 0xAB , 0xBB /* 0xAC-0xAF (172-175) */ }; const uni_ushort ibm8652uniArray[] = /* beginning with 0x97 (151) */ { 0xFA , /* 0x97 ( 151) */ 0xFF , 0xD6 , 0xDC , 0xF8 , /* 0x98-0x9B (152-155) */ 0xA3 , 0xD8 , '\0' , 0x0192, /* 0x9C-0x9F (156-159) */ 0xE1 , 0xED , 0xF3 , 0xFA , /* 0xA0-0xA3 (160-163) */ 0xF1 , 0xD1 , 0xAA , 0xBA , /* 0xA4-0xA7 (164-167) */ 0xBF , 0x2310, 0xAC , 0xBD , /* 0xA8-0xAB (168-171) */ 0xBC , 0xA1 , 0xAB , 0xA4 , /* 0xAC-0xAF (172-175) */ }; const uni_ushort ibm8662uniArray[] = /* beginning with 0x80 (128) */ { 0x0410, 0x0411, 0x0412, 0x0413, /* 0x80-0x83 (128-131) */ 0x0414, 0x0415, 0x0416, 0x0417, /* 0x84-0x87 (132-135) */ 0x0418, 0x0419, 0x041A, 0x041B, /* 0x88-0x8B (136-139) */ 0x041C, 0x041D, 0x041E, 0x041F, /* 0x8C-0x8F (140-143) */ 0x0420, 0x0421, 0x0422, 0x0423, /* 0x90-0x93 (144-147) */ 0x0424, 0x0425, 0x0426, 0x0427, /* 0x94-0x97 (148-151) */ 0x0428, 0x0429, 0x042A, 0x042B, /* 0x98-0x9B (152-155) */ 0x042C, 0x042D, 0x042E, 0x042F, /* 0x9C-0x9F (156-159) */ 0x0430, 0x0431, 0x0432, 0x0433, /* 0xA0-0xA3 (160-163) */ 0x0434, 0x0435, 0x0436, 0x0437, /* 0xA4-0xA7 (164-167) */ 0x0438, 0x0439, 0x043A, 0x043B, /* 0xA8-0xAB (168-171) */ 0x043C, 0x043D, 0x043E, 0x043F, /* 0xAC-0xAF (172-175) */ 0x2591, 0x2592, 0x2593, 0x2502, /* 0xB0-0xB3 (176-179) */ 0x2524, 0x2561, 0x2562, 0x2556, /* 0xB4-0xB7 (180-183) */ 0x2555, 0x2563, 0x2551, 0x2557, /* 0xB8-0xBB (184-187) */ 0x255D, 0x255C, 0x255B, 0x2510, /* 0xBC-0xBF (188-191) */ 0x2514, 0x2534, 0x252C, 0x251C, /* 0xC0-0xC3 (192-195) */ 0x2500, 0x253C, 0x255E, 0x255F, /* 0xC4-0xC7 (196-199) */ 0x255A, 0x2554, 0x2569, 0x2566, /* 0xC8-0xCB (200-203) */ 0x2560, 0x2550, 0x256C, 0x2567, /* 0xCC-0xCF (204-207) */ 0x2568, 0x2564, 0x2565, 0x2559, /* 0xD0-0xD3 (208-211) */ 0x2558, 0x2552, 0x2553, 0x256B, /* 0xD4-0xD7 (212-215) */ 0x256A, 0x2518, 0x250C, 0x2588, /* 0xD8-0xDB (216-219) */ 0x2584, 0x258C, 0x2590, 0x2580, /* 0xDC-0xDF (220-223) */ 0x0440, 0x0441, 0x0442, 0x0443, /* 0xE0-0xE3 (224-227) */ 0x0444, 0x0445, 0x0446, 0x0447, /* 0xE4-0xE7 (228-231) */ 0x0448, 0x0449, 0x044A, 0x044B, /* 0xE8-0xEB (232-235) */ 0x044C, 0x044D, 0x044E, 0x044F, /* 0xEC-0xEF (236-239) */ 0x0401, 0x0451, 0x0404, 0x0454, /* 0xF0-0xF3 (240-243) */ 0x0407, 0x0457, 0x040E, 0x045E, /* 0xF4-0xF7 (244-247) */ 0x00B0, 0x2219, 0x00B7, 0x221A, /* 0xF8-0xFB (248-251) */ 0x2116, 0x00A4, 0x25A0, 0x00A0, /* 0xFC-0xFF (252-255) */ }; static const uni_ushort macarr2uniArray[] = /* beginning with 0x1C ( 28) */ { 0x2190, 0x2192, 0x2191, 0x2193 /* 0x1C-0x1F ( 28- 31) */ }; static const uni_ushort mac2uniArray[] = /* beginning with 0xA0 (160) */ { 0xC4 , 0xC5 , 0xC7 , 0xC9 , /* 0x80-0x83 (128-131) */ 0xD1 , 0xD6 , 0xDC , 0xE1 , /* 0x84-0x87 (132-135) */ 0xE0 , 0xE2 , 0xE4 , 0xE3 , /* 0x88-0x8B (136-139) */ 0xE5 , 0xE7 , 0xE9 , 0xE8 , /* 0x8C-0x8F (140-143) */ 0xEA , 0xEB , 0xED , 0xEC , /* 0x90-0x93 (144-147) */ 0xEE , 0xEF , 0xF1 , 0xF3 , /* 0x94-0x97 (148-151) */ 0xF2 , 0xF4 , 0xF6 , 0xF5 , /* 0x98-0x9B (152-155) */ 0xFA , 0xF9 , 0xFB , 0xFC , /* 0x9C-0x9F (156-159) */ 0x2020, 0xB0 , 0xA2 , 0xA3 , /* 0xA0-0xA3 (160-163) */ 0xA7 , 0x220E, 0xB6 , 0xDF , /* 0xA4-0xA7 (164-167) */ 0xAE , 0xA9 , 0x2122, 0xB4 , /* 0xA8-0xAB (168-171) */ 0xA8 , 0x2260, 0xC6 , 0xD8 , /* 0xAC-0xAF (172-175) */ 0x221E, 0xB1 , 0x2264, 0x2265, /* 0xB0-0xB3 (176-179) */ 0xA5 , 0xB5 , 0x2202, 0x2211, /* 0xB4-0xB7 (180-183) */ 0x220F, 0x03C0, 0x222B, 0xAA , /* 0xB8-0xBB (184-187) */ 0xBA , 0x03A9, 0xE6 , 0xF8 , /* 0xBC-0xBF (188-191) */ 0xBF , 0xA1 , 0xAC , 0x221A, /* 0xC0-0xC3 (192-195) */ 0x0192, 0x2248, 0x2206, 0xAB , /* 0xC4-0xC7 (196-199) */ 0xBB , 0x2026, 0xA0 , 0xC0 , /* 0xC8-0xCB (200-203) */ 0xC3 , 0xD5 , 0x0152, 0x0153, /* 0xCC-0xCF (204-207) */ 0x2013, 0x2014, 0x201C, 0x201D, /* 0xD0-0xD3 (208-211) */ 0x2018, 0x2019, 0xF7 , 0x2205, /* 0xD8-0xD7 (202-215) */ 0xFF , 0x0178, 0x2215, 0xA4 , /* 0xD8-0xDB (216-219) */ 0x2039, 0x20A0, 0xFB01, 0xFB02, /* 0xDC-0xDF (220-223) */ 0x2021, 0xB7 , 0x201A, 0x201E, /* 0xE0-0xE3 (224-227) */ 0x2031, 0xC2 , 0xCA , 0xC1 , /* 0xE4-0xE7 (228-231) */ 0xCB , 0xC8 , 0xCD , 0xCE , /* 0xE8-0xEB (232-235) */ 0xCF , 0xCC , 0xD3 , 0xD4 , /* 0xEC-0xEF (236-239) */ '\0' , 0xD2 , 0xDA , 0xDB , /* 0xF0-0xF3 (240-243) */ 0xD9 , 0xB9 , 0x02C6, 0x02DC, /* 0xF4-0xF7 (244-247) */ 0x02C9, 0x02C7, 0x02D9, 0x02DA, /* 0xF8-0xFB (248-251) */ 0x02DB, 0x02DC, 0x02CE, 0x02D8 /* 0xFC-0xFF (252-255) */ }; const cconv uni_html2uniArray[] = { { MBC('A','E','l','i'), MBC('g',' ',' ',' '), 0x00C6 }, /* 001 */ { MBC('A','a','c','u'), MBC('t','e',' ',' '), 0x00C1 }, /* 002 */ { MBC('A','c','i','r'), MBC('c',' ',' ',' '), 0x00C2 }, /* 003 */ { MBC('A','g','r','a'), MBC('v','e',' ',' '), 0x00C0 }, /* 004 */ { MBC('A','r','i','n'), MBC('g',' ',' ',' '), 0x00C5 }, /* 005 */ { MBC('A','t','i','l'), MBC('d','e',' ',' '), 0x00C3 }, /* 006 */ { MBC('A','u','m','l'), MBC(' ',' ',' ',' '), 0x00C4 }, /* 007 */ { MBC('C','c','e','d'), MBC('i','l',' ',' '), 0x00C7 }, /* 008 */ { MBC('E','T','H',' '), MBC(' ',' ',' ',' '), 0x00D0 }, /* 009 */ { MBC('E','a','c','u'), MBC('t','e',' ',' '), 0x00C9 }, /* 010 */ { MBC('E','c','i','r'), MBC('c',' ',' ',' '), 0x00CA }, /* 011 */ { MBC('E','g','r','a'), MBC('v','e',' ',' '), 0x00C8 }, /* 012 */ { MBC('E','u','m','l'), MBC(' ',' ',' ',' '), 0x00CB }, /* 013 */ { MBC('I','a','c','u'), MBC('t','e',' ',' '), 0x00CD }, /* 014 */ { MBC('I','c','i','r'), MBC('c',' ',' ',' '), 0x00CE }, /* 015 */ { MBC('I','g','r','a'), MBC('v','e',' ',' '), 0x00CC }, /* 016 */ { MBC('I','u','m','l'), MBC(' ',' ',' ',' '), 0x00CF }, /* 017 */ { MBC('N','t','i','l'), MBC('d','e',' ',' '), 0x00D1 }, /* 018 */ { MBC('O','a','c','u'), MBC('t','e',' ',' '), 0x00D3 }, /* 019 */ { MBC('O','c','i','r'), MBC('c',' ',' ',' '), 0x00D4 }, /* 020 */ { MBC('O','g','r','a'), MBC('v','e',' ',' '), 0x00D2 }, /* 021 */ { MBC('O','s','l','a'), MBC('s','h',' ',' '), 0x00D8 }, /* 022 */ { MBC('O','t','i','l'), MBC('d','e',' ',' '), 0x00D5 }, /* 023 */ { MBC('O','u','m','l'), MBC(' ',' ',' ',' '), 0x00D6 }, /* 024 */ { MBC('U','a','c','u'), MBC('t','e',' ',' '), 0x00DA }, /* 025 */ { MBC('U','c','i','r'), MBC('c',' ',' ',' '), 0x00DB }, /* 026 */ { MBC('U','g','r','a'), MBC('v','e',' ',' '), 0x00D9 }, /* 027 */ { MBC('U','u','m','l'), MBC(' ',' ',' ',' '), 0x00DC }, /* 028 */ { MBC('T','H','O','R'), MBC('N',' ',' ',' '), 0x00DE }, /* 029 */ { MBC('Y','a','c','u'), MBC('t','e',' ',' '), 0x00DD }, /* 030 */ { MBC('a','a','c','u'), MBC('t','e',' ',' '), 0x00E1 }, /* 031 */ { MBC('a','c','i','r'), MBC('c',' ',' ',' '), 0x00E2 }, /* 032 */ { MBC('a','c','u','t'), MBC('e',' ',' ',' '), 0x00B4 }, /* 033 */ { MBC('a','e','l','i'), MBC('g',' ',' ',' '), 0x00E6 }, /* 034 */ { MBC('a','g','r','a'), MBC('v','e',' ',' '), 0x00E0 }, /* 035 */ { MBC('a','m','p',' '), MBC(' ',' ',' ',' '), 0x0026 }, /* 036 */ { MBC('a','r','i','n'), MBC('g',' ',' ',' '), 0x00E5 }, /* 037 */ { MBC('a','t','i','l'), MBC('d','e',' ',' '), 0x00E3 }, /* 038 */ { MBC('a','u','m','l'), MBC(' ',' ',' ',' '), 0x00E4 }, /* 039 */ { MBC('b','r','v','b'), MBC('a','r',' ',' '), 0x00A6 }, /* 040 */ { MBC('c','c','e','d'), MBC('i','l',' ',' '), 0x00E7 }, /* 041 */ { MBC('c','e','d','i'), MBC('l',' ',' ',' '), 0x00B8 }, /* 042 */ { MBC('c','e','n','t'), MBC(' ',' ',' ',' '), 0x00A2 }, /* 043 */ { MBC('c','o','p','y'), MBC(' ',' ',' ',' '), 0x00A9 }, /* 044 */ { MBC('c','u','r','r'), MBC('e','n','c','y'), 0x00A4 }, /* 045 */ { MBC('d','e','g',' '), MBC(' ',' ',' ',' '), 0x00B0 }, /* 046 */ { MBC('d','i','v','i'), MBC('d','e',' ',' '), 0x00F7 }, /* 047 */ { MBC('e','a','c','u'), MBC('t','e',' ',' '), 0x00E9 }, /* 048 */ { MBC('e','c','i','r'), MBC('c',' ',' ',' '), 0x00EA }, /* 049 */ { MBC('e','g','r','a'), MBC('v','e',' ',' '), 0x00E8 }, /* 050 */ { MBC('e','t','h',' '), MBC(' ',' ',' ',' '), 0x00F0 }, /* 051 */ { MBC('e','u','m','l'), MBC(' ',' ',' ',' '), 0x00EB }, /* 052 */ { MBC('f','r','a','c'), MBC('1','2',' ',' '), 0x00BD }, /* 053 */ { MBC('f','r','a','c'), MBC('1','4',' ',' '), 0x00BC }, /* 054 */ { MBC('f','r','a','c'), MBC('3','4',' ',' '), 0x00BE }, /* 055 */ { MBC('g','t',' ',' '), MBC(' ',' ',' ',' '), 0x003E }, /* 056 */ { MBC('i','a','c','u'), MBC('t','e',' ',' '), 0x00ED }, /* 057 */ { MBC('i','c','i','r'), MBC('c',' ',' ',' '), 0x00EE }, /* 058 */ { MBC('i','e','x','c'), MBC('l',' ',' ',' '), 0x00A1 }, /* 059 */ { MBC('i','g','r','a'), MBC('v','e',' ',' '), 0x00EC }, /* 060 */ { MBC('i','q','u','e'), MBC('s','t',' ',' '), 0x00BF }, /* 061 */ { MBC('i','u','m','l'), MBC(' ',' ',' ',' '), 0x00EF }, /* 062 */ { MBC('l','a','q','u'), MBC('o',' ',' ',' '), 0x00AB }, /* 063 */ { MBC('l','t',' ',' '), MBC(' ',' ',' ',' '), 0x003C }, /* 064 */ { MBC('m','a','c','r'), MBC(' ',' ',' ',' '), 0x00AF }, /* 065 */ { MBC('m','d','a','s'), MBC('h',' ',' ',' '), 0x2014 }, /* 066 */ { MBC('m','i','c','r'), MBC('o',' ',' ',' '), 0x00B5 }, /* 067 */ { MBC('m','i','d','d'), MBC('o','t',' ',' '), 0x00B7 }, /* 068 */ { MBC('n','b','s','p'), MBC(' ',' ',' ',' '), 0x00A0 }, /* 069 */ { MBC('n','d','a','s'), MBC('h',' ',' ',' '), 0x2013 }, /* 070 */ { MBC('n','o','t',' '), MBC(' ',' ',' ',' '), 0x00AC }, /* 071 */ { MBC('n','t','i','l'), MBC('d','e',' ',' '), 0x00F1 }, /* 072 */ { MBC('o','a','c','u'), MBC('t','e',' ',' '), 0x00F3 }, /* 073 */ { MBC('o','c','i','r'), MBC('c',' ',' ',' '), 0x00F4 }, /* 074 */ { MBC('o','g','r','a'), MBC('v','e',' ',' '), 0x00F2 }, /* 075 */ { MBC('o','r','d','f'), MBC(' ',' ',' ',' '), 0x00AA }, /* 076 */ { MBC('o','r','d','m'), MBC(' ',' ',' ',' '), 0x00AB }, /* 077 */ { MBC('o','s','l','a'), MBC('s','h',' ',' '), 0x00F8 }, /* 078 */ { MBC('o','t','i','l'), MBC('d','e',' ',' '), 0x00F5 }, /* 079 */ { MBC('o','u','m','l'), MBC(' ',' ',' ',' '), 0x00F6 }, /* 080 */ { MBC('p','a','r','a'), MBC(' ',' ',' ',' '), 0x00B6 }, /* 081 */ { MBC('p','l','u','s'), MBC('m','n',' ',' '), 0x00B1 }, /* 082 */ { MBC('p','o','u','n'), MBC('d',' ',' ',' '), 0x00A3 }, /* 083 */ { MBC('q','u','o','t'), MBC(' ',' ',' ',' '), 0x0022 }, /* 084 */ { MBC('r','a','q','u'), MBC('o',' ',' ',' '), 0x00BB }, /* 085 */ { MBC('r','e','g',' '), MBC(' ',' ',' ',' '), 0x00AE }, /* 086 */ { MBC('s','e','c','t'), MBC(' ',' ',' ',' '), 0x00A7 }, /* 087 */ { MBC('s','h','y',' '), MBC(' ',' ',' ',' '), 0x00AD }, /* 088 */ { MBC('s','u','p','1'), MBC(' ',' ',' ',' '), 0x00B9 }, /* 089 */ { MBC('s','u','p','2'), MBC(' ',' ',' ',' '), 0x00B2 }, /* 090 */ { MBC('s','u','p','3'), MBC(' ',' ',' ',' '), 0x00B3 }, /* 091 */ { MBC('s','z','l','i'), MBC('g',' ',' ',' '), 0x00DF }, /* 092 */ { MBC('t','h','o','r'), MBC('n',' ',' ',' '), 0x00FE }, /* 093 */ { MBC('t','i','m','e'), MBC('s',' ',' ',' '), 0x00D7 }, /* 094 */ { MBC('t','r','a','d'), MBC('e',' ',' ',' '), 0x2122 }, /* 095 */ { MBC('u','a','c','u'), MBC('t','e',' ',' '), 0x00DA }, /* 096 */ { MBC('u','c','i','r'), MBC('c',' ',' ',' '), 0x00DB }, /* 097 */ { MBC('u','g','r','a'), MBC('v','e',' ',' '), 0x00D9 }, /* 098 */ { MBC('u','m','l',' '), MBC(' ',' ',' ',' '), 0x00A8 }, /* 099 */ { MBC('u','u','m','l'), MBC(' ',' ',' ',' '), 0x00FC }, /* 100 */ { MBC('y','a','c','u'), MBC('t','e',' ',' '), 0x00FD }, /* 101 */ { MBC('y','e','n',' '), MBC(' ',' ',' ',' '), 0x00A5 }, /* 102 */ { MBC('y','u','m','l'), MBC(' ',' ',' ',' '), 0x00FF } /* 103 */ }; //static const uni_ushort iso52uniArray[] = /* beginning with 0x80 (128) */ //{ // 0xA0 , 0x0104, 0x02D8, 0x0141, /* 0xA0-0xA3 (160-163) */ // 0xA0 , 0x0104, 0x02D8, 0x0141, /* 0xA4-0xA7 (164-167) */ // '\0' , '\0' , '\0' , '\0' , /* 0xA8-0xAB (168-171) */ // '\0' , '\0' , '\0' , '\0' , /* 0xAC-0xAF (172-175) */ // // '\0' , '\0' , '\0' , '\0' , /* 0xB0-0xB3 (176-179) */ // '\0' , '\0' , '\0' , '\0' , /* 0xB4-0xB7 (180-183) */ // '\0' , '\0' , '\0' , '\0' , /* 0xB8-0xBB (184-187) */ // '\0' , '\0' , '\0' , '\0' , /* 0xBC-0xBF (188-191) */ // // '\0' , '\0' , '\0' , '\0' , /* 0xC0-0xC3 (192-195) */ // '\0' , '\0' , '\0' , '\0' , /* 0xC4-0xC7 (196-199) */ // '\0' , '\0' , '\0' , '\0' , /* 0xC8-0xCB (200-203) */ // '\0' , '\0' , '\0' , '\0' , /* 0xCC-0xCF (204-207) */ // // '\0' , '\0' , '\0' , '\0' , /* 0xD0-0xD3 (208-211) */ // '\0' , '\0' , '\0' , '\0' , /* 0xD8-0xD7 (202-215) */ // '\0' , '\0' , '\0' , '\0' , /* 0xD8-0xDB (216-219) */ // '\0' , '\0' , '\0' , '\0' , /* 0xDC-0xDF (220-223) */ // // '\0' , '\0' , '\0' , '\0' , /* 0xE0-0xE3 (224-227) */ // '\0' , '\0' , '\0' , '\0' , /* 0xE4-0xE7 (228-231) */ // '\0' , '\0' , '\0' , '\0' , /* 0xE8-0xEB (232-235) */ // '\0' , '\0' , '\0' , '\0' , /* 0xEC-0xEF (236-239) */ // // '\0' , '\0' , '\0' , '\0' , /* 0xF0-0xF3 (240-243) */ // '\0' , '\0' , '\0' , '\0' , /* 0xF4-0xF7 (244-247) */ // '\0' , '\0' , '\0' , '\0' , /* 0xF8-0xFB (248-251) */ // '\0' , '\0' , '\0' , '\0' /* 0xFC-0xFF (252-255) */ //}; const ctounitable uni_ebc2uniTable = { ebc2uniArray, 0x20 /* 32 */, sizeof(ebc2uniArray) / sizeof(uni_ushort) }; const ctounitable uni_iso22uniTable = { iso22uniArray, 0xA0 /* 160 */, sizeof(iso22uniArray) / sizeof(uni_ushort) }; const ctounitable uni_iso32uniTable = { iso32uniArray, 0xA0 /* 160 */, sizeof(iso32uniArray) / sizeof(uni_ushort) }; const ctounitable uni_iso42uniTable = { iso42uniArray, 0xA0 /* 160 */, sizeof(iso42uniArray) / sizeof(uni_ushort) }; const ctounitable uni_koi2uniTable = { koi2uniArray, 0x80 /* 128 */, sizeof(koi2uniArray) / sizeof(uni_ushort) }; const ctounitable uni_iso72uniTable = { iso72uniArray, 0xA0 /* 160 */, sizeof(iso72uniArray) / sizeof(uni_ushort) }; const ctounitable uni_iso102uniTable = { iso102uniArray, 0xA0 /* 160 */, sizeof(iso102uniArray) / sizeof(uni_ushort) }; const ctounitable uni_win2uniTable = { win2uniArray, 0x80 /* 128 */, sizeof(win2uniArray) / sizeof(uni_ushort) }; const ctounitable uni_ibm2uniTable = { ibm2uniArray, 0x00 /* 0 */, sizeof(ibm2uniArray) / sizeof(uni_ushort) }; const ctounitable uni_ibm4372uniTable = { ibm4372uniArray, 0x80 /* 128 */, sizeof(ibm4372uniArray) / sizeof(uni_ushort) }; const ctounitable uni_ibm8502uniTable = { ibm8502uniArray, 0x80 /* 128 */, sizeof(ibm8502uniArray) / sizeof(uni_ushort) }; const ctounitable uni_ibm8522uniTable = { ibm8522uniArray, 0x80 /* 128 */, sizeof(ibm8522uniArray) / sizeof(uni_ushort) }; const ctounitable uni_ibm8602uniTable = { ibm8602uniArray, 0x80 /* 128 */, sizeof(ibm8602uniArray) / sizeof(uni_ushort) }; const ctounitable uni_ibm8632uniTable = { ibm8632uniArray, 0x80 /* 128 */, sizeof(ibm8632uniArray) / sizeof(uni_ushort) }; const ctounitable uni_ibm8652uniTable = { ibm8652uniArray, 0x97 /* 151 */, sizeof(ibm8652uniArray) / sizeof(uni_ushort) }; const ctounitable uni_ibm8662uniTable = { ibm8662uniArray, 0x80 /* 128 */, sizeof(ibm8662uniArray) / sizeof(uni_ushort) }; const ctounitable uni_mac2uniTable = { mac2uniArray, 0x80 /* 128 */, sizeof(mac2uniArray) / sizeof(uni_ushort) }; const ctounitable uni_macarr2uniTable = { macarr2uniArray, 0x1C /* 28 */, sizeof(macarr2uniArray) / sizeof(uni_ushort) }; static const uni_ubyte html2uniSize = 103; static void toCRLF (char *utf8, uni_uword *di, const char *src, uni_uword *si, uni_uword chars, uni_ubyte line_type, uni_ubyte var_type) { uni_ulong c[2]; c[1]=0l; switch(var_type) { case BYTE_LENGTH : c[0] = (uni_ulong)src[*si]; if((*si)+1 < chars) c[1] = (uni_ulong)src[(*si)+1]; break; case SHORT_LENGTH : c[0] = ((uni_ushort*)src)[*si]; if((*si)+1 < chars) c[1] = ((uni_ushort*)src)[(*si)+1]; break; case LONG_LENGTH : c[0] = ((uni_ulong*)src)[*si]; if((*si)+1 < chars) c[1] = ((uni_ulong*)src)[(*si)+1]; break; } switch(c[0]) { case (uni_ulong)'\r' : utf8[*di] = '\r'; if(line_type==C_LINE_CR) { (*di)++; utf8[*di] = '\n'; } else if((line_type==C_LINE_LF)&&(c[1]==0x1A)) { (*si)++; (*di)++; utf8[*di] = '\n'; } break; case (uni_ulong)'\n' : if(line_type==C_LINE_LF) { utf8[*di] = '\r'; (*di)++; if(c[1]==0x1D) (*si)++; } utf8[*di] = '\n'; break; default: utf8[*di] = (char)src[*si]; } } static uni_ulong ScanHTML(register const char *src, uni_uword *length) { register char buffer[10]=" "; register uni_uword i, l = *length; register uni_ulong upper, lower; register uni_uword min, max, mid; if(src[0] == '#') { for(i=1,mid=0; ( (i 0) ) buffer[mid++] = src[i]; if(mid==0) return(0l); /* no number found */ if(i>=l) return(0l); /* reading past end */ if(src[i] != ';') return(0l); /* no terminating ';'-sign */ buffer[mid]='\0'; sscanf(buffer,"%lu", &upper); *length = i+1; return(upper); } for(i=0; ((i<9) && (src[i]!=';') && (i uni_html2uniArray[max].upper) return(0l); if(upper == uni_html2uniArray[max].upper) { if(lower == uni_html2uniArray[max].lower) { *length = l; return( (uni_ulong)uni_html2uniArray[max].unicode ); } else return(0l); } while(max-min > 1) { mid = (min+max)/2; if( upper < uni_html2uniArray[mid].upper ) max = mid; else if( upper > uni_html2uniArray[mid].upper ) min = mid; else /* upper == uni_html2uniArray[mid].upper */ { if(upper != MBC('f','r','a','c')) { if(lower == uni_html2uniArray[mid].lower) { *length = l; return( (uni_ulong)uni_html2uniArray[mid].unicode ); } return(0l); } /* upper == 'frac' */ switch(lower) { case MBC('1','2',' ',' ') : *length = l; return(0xBD); case MBC('1','4',' ',' ') : *length = l; return(0xBC); case MBC('3','4',' ',' ') : *length = l; return(0xBE); } return(0l); } } return(0l); } uni_slong uni_toUTF8 (char *utf8, const char *src, uni_uword chars, uni_ulong string_type, uni_ubyte line_type, uni_uword *written) { register uni_uword i, si, di; uni_ubyte read; short carry; uni_slong RC; int isquot, iscommand, trans; const ctounitable *table1, *table2, *table3; uni_ushort *utf16; uni_ulong *ucs4, c = 0; if(string_type == C_UTF8) { if(line_type == C_LINE_CRLF) { memcpy(utf8, src, chars); di=chars; } else for(si=di=0; si chars) { utf8[di]='\0'; *written = di+1; return(C_OK); } if(RC != C_OK) return(RC); assert(strlen(&utf8[di]) < UINT_MAX); di += (uni_uword)strlen(&utf8[di]); si += read; } while(carry!=0); else return(C_INVALID_FORMAT); } utf8[di] = '\0'; *written = di+1; return(C_OK); } if(string_type==C_UTF16 || string_type==C_UCS2) { utf16 = (uni_ushort*)src; for(si=di=0; si chars) { utf8[di]='\0'; *written = di+1; return(C_OK); } if(RC != C_OK) return(RC); assert(strlen(&utf8[di]) < UINT_MAX); di += (uni_uword)strlen(&utf8[di]); si += read; } } utf8[di] = '\0'; *written = di+1; return(C_OK); } if(string_type==C_UCS4) { ucs4 = (uni_ulong*)src; for(si=di=0; si' : if((read==1)||(read==6)) read++; else i=chars; break; case '<' : if(read==3) read++; else i=chars; break; case '/' : if(read==4) read++; else i=chars; break; default : if(read==2) { c = (uni_ubyte)src[i]; read++; } else i=chars; break; } } if(read==7) { si=i; utf8[di++] = '\033'; /* ESC */ utf8[di++] = '_'; utf8[di++] = c; } else { utf8[di++] = '\033'; /* ESC */ utf8[di++] = '<'; si++; iscommand=true; } } else { utf8[di++] = '<'; si++; } break; case '>': if(!isquot) iscommand=false; utf8[di++] = '>'; si++; break; case '"': if(iscommand) isquot = !isquot; utf8[di++] = '"'; si++; break; default: if((src[si]!='\n')&&(src[si]!='\r')) utf8[di]=src[si]; else toCRLF(utf8, &di, src, &si, chars, line_type, BYTE_LENGTH); di++; si++; } } utf8[di] = '\0'; *written = di+1; return(C_OK); } if(string_type == C_ISO8859_5) { for(si=di=0; si= table1->offset) && ((uni_ubyte)src[si] < table1->offset + table1->size) ) c = table1->array[ (uni_ubyte)src[si] - table1->offset ]; else if(table2 != NULL) { if( ((uni_ubyte)src[si] >= table2->offset) && ((uni_ubyte)src[si] < table2->offset + table2->size) ) c = table2->array[ (uni_ubyte)src[si] - table2->offset ]; else if(table3 != NULL) if( ((uni_ubyte)src[si] >= table3->offset) && ((uni_ubyte)src[si] < table3->offset + table3->size) ) c = table3->array[ (uni_ubyte)src[si] - table3->offset ]; } if( (c==0l) && (src[si]!='\0') ) c = C_UTF8_UNKNOWN; if(c < 0x80) if((src[si]!='\n')&&(src[si]!='\r')) utf8[di++] = (char)c; else toCRLF(utf8, &di, src, &si, chars, line_type, BYTE_LENGTH); else { RC = uni_ucs4toutf8(&utf8[di], c); if(RC != C_OK) return(RC); assert(strlen(&utf8[di]) < UINT_MAX); di += (uni_uword)strlen(&utf8[di]); } } utf8[di] = '\0'; *written = di+1; return(C_OK); }