X-Git-Url: http://git.efficios.com/?a=blobdiff_plain;f=binutils%2Fwinduni.c;h=36d699358b8ed715014932e99fabd30dd1acba75;hb=refs%2Fheads%2Fconcurrent-displaced-stepping-2020-04-01;hp=d79f47a3d7b5927e722d8bd1228e40965ad42b9d;hpb=ed288bb597072176e84fc8279707a3f2f475779b;p=deliverable%2Fbinutils-gdb.git diff --git a/binutils/winduni.c b/binutils/winduni.c index d79f47a3d7..36d699358b 100644 --- a/binutils/winduni.c +++ b/binutils/winduni.c @@ -1,12 +1,13 @@ /* winduni.c -- unicode support for the windres program. - Copyright 1997, 1998 Free Software Foundation, Inc. + Copyright (C) 1997-2020 Free Software Foundation, Inc. Written by Ian Lance Taylor, Cygnus Support. + Rewritten by Kai Tietz, Onevision. This file is part of GNU Binutils. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by - the Free Software Foundation; either version 2 of the License, or + the Free Software Foundation; either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, @@ -16,8 +17,9 @@ You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software - Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA - 02111-1307, USA. */ + Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston, MA + 02110-1301, USA. */ + /* This file contains unicode support routines for the windres program. Ideally, we would have generic unicode support which @@ -27,45 +29,268 @@ hosts, but that seems better than not really supporting unicode at all. */ +#include "sysdep.h" #include "bfd.h" +#include "libiberty.h" /* for xstrdup */ #include "bucomm.h" +/* Must be include before windows.h and winnls.h. */ +#if defined (_WIN32) || defined (__CYGWIN__) +#include +#include +#endif #include "winduni.h" +#include "safe-ctype.h" -#include +#if HAVE_ICONV +#include +#endif + +static rc_uint_type wind_WideCharToMultiByte (rc_uint_type, const unichar *, char *, rc_uint_type); +static rc_uint_type wind_MultiByteToWideChar (rc_uint_type, const char *, unichar *, rc_uint_type); +static int unichar_isascii (const unichar *, rc_uint_type); + +/* Convert an ASCII string to a unicode string. We just copy it, + expanding chars to shorts, rather than doing something intelligent. */ + +#if !defined (_WIN32) && !defined (__CYGWIN__) + +/* Codepages mapped. */ +static local_iconv_map codepages[] = +{ + { 0, "cp1252" }, + { 1, "WINDOWS-1252" }, + { 437, "MS-ANSI" }, + { 737, "MS-GREEK" }, + { 775, "WINBALTRIM" }, + { 850, "MS-ANSI" }, + { 852, "MS-EE" }, + { 857, "MS-TURK" }, + { 862, "CP862" }, + { 864, "CP864" }, + { 866, "MS-CYRL" }, + { 874, "WINDOWS-874" }, + { 932, "CP932" }, + { 936, "CP936" }, + { 949, "CP949" }, + { 950, "CP950" }, + { 1250, "WINDOWS-1250" }, + { 1251, "WINDOWS-1251" }, + { 1252, "WINDOWS-1252" }, + { 1253, "WINDOWS-1253" }, + { 1254, "WINDOWS-1254" }, + { 1255, "WINDOWS-1255" }, + { 1256, "WINDOWS-1256" }, + { 1257, "WINDOWS-1257" }, + { 1258, "WINDOWS-1258" }, + { CP_UTF7, "UTF-7" }, + { CP_UTF8, "UTF-8" }, + { CP_UTF16, "UTF-16LE" }, + { (rc_uint_type) -1, NULL } +}; + +/* Languages supported. */ +static const wind_language_t languages[] = +{ + { 0x0000, 437, 1252, "Neutral", "Neutral" }, + { 0x0401, 864, 1256, "Arabic", "Saudi Arabia" }, { 0x0402, 866, 1251, "Bulgarian", "Bulgaria" }, + { 0x0403, 850, 1252, "Catalan", "Spain" }, { 0x0404, 950, 950, "Chinese", "Taiwan" }, + { 0x0405, 852, 1250, "Czech", "Czech Republic" }, { 0x0406, 850, 1252, "Danish", "Denmark" }, + { 0x0407, 850, 1252, "German", "Germany" }, { 0x0408, 737, 1253, "Greek", "Greece" }, + { 0x0409, 437, 1252, "English", "United States" }, { 0x040A, 850, 1252, "Spanish - Traditional Sort", "Spain" }, + { 0x040B, 850, 1252, "Finnish", "Finland" }, { 0x040C, 850, 1252, "French", "France" }, + { 0x040D, 862, 1255, "Hebrew", "Israel" }, { 0x040E, 852, 1250, "Hungarian", "Hungary" }, + { 0x040F, 850, 1252, "Icelandic", "Iceland" }, { 0x0410, 850, 1252, "Italian", "Italy" }, + { 0x0411, 932, 932, "Japanese", "Japan" }, { 0x0412, 949, 949, "Korean", "Korea (south)" }, + { 0x0413, 850, 1252, "Dutch", "Netherlands" }, { 0x0414, 850, 1252, "Norwegian (Bokm\345l)", "Norway" }, + { 0x0415, 852, 1250, "Polish", "Poland" }, { 0x0416, 850, 1252, "Portuguese", "Brazil" }, + { 0x0418, 852, 1250, "Romanian", "Romania" }, { 0x0419, 866, 1251, "Russian", "Russia" }, + { 0x041A, 852, 1250, "Croatian", "Croatia" }, { 0x041B, 852, 1250, "Slovak", "Slovakia" }, + { 0x041C, 852, 1250, "Albanian", "Albania" }, { 0x041D, 850, 1252, "Swedish", "Sweden" }, + { 0x041E, 874, 874, "Thai", "Thailand" }, { 0x041F, 857, 1254, "Turkish", "Turkey" }, + { 0x0421, 850, 1252, "Indonesian", "Indonesia" }, { 0x0422, 866, 1251, "Ukrainian", "Ukraine" }, + { 0x0423, 866, 1251, "Belarusian", "Belarus" }, { 0x0424, 852, 1250, "Slovene", "Slovenia" }, + { 0x0425, 775, 1257, "Estonian", "Estonia" }, { 0x0426, 775, 1257, "Latvian", "Latvia" }, + { 0x0427, 775, 1257, "Lithuanian", "Lithuania" }, + { 0x0429, 864, 1256, "Arabic", "Farsi" }, { 0x042A,1258, 1258, "Vietnamese", "Vietnam" }, + { 0x042D, 850, 1252, "Basque", "Spain" }, + { 0x042F, 866, 1251, "Macedonian", "Former Yugoslav Republic of Macedonia" }, + { 0x0436, 850, 1252, "Afrikaans", "South Africa" }, + { 0x0438, 850, 1252, "Faroese", "Faroe Islands" }, + { 0x043C, 437, 1252, "Irish", "Ireland" }, + { 0x043E, 850, 1252, "Malay", "Malaysia" }, + { 0x0801, 864, 1256, "Arabic", "Iraq" }, + { 0x0804, 936, 936, "Chinese (People's republic of China)", "People's republic of China" }, + { 0x0807, 850, 1252, "German", "Switzerland" }, + { 0x0809, 850, 1252, "English", "United Kingdom" }, { 0x080A, 850, 1252, "Spanish", "Mexico" }, + { 0x080C, 850, 1252, "French", "Belgium" }, + { 0x0810, 850, 1252, "Italian", "Switzerland" }, + { 0x0813, 850, 1252, "Dutch", "Belgium" }, { 0x0814, 850, 1252, "Norwegian (Nynorsk)", "Norway" }, + { 0x0816, 850, 1252, "Portuguese", "Portugal" }, + { 0x081A, 852, 1252, "Serbian (latin)", "Yugoslavia" }, + { 0x081D, 850, 1252, "Swedish (Finland)", "Finland" }, + { 0x0C01, 864, 1256, "Arabic", "Egypt" }, + { 0x0C04, 950, 950, "Chinese", "Hong Kong" }, + { 0x0C07, 850, 1252, "German", "Austria" }, + { 0x0C09, 850, 1252, "English", "Australia" }, { 0x0C0A, 850, 1252, "Spanish - International Sort", "Spain" }, + { 0x0C0C, 850, 1252, "French", "Canada"}, + { 0x0C1A, 855, 1251, "Serbian (Cyrillic)", "Serbia" }, + { 0x1001, 864, 1256, "Arabic", "Libya" }, + { 0x1004, 936, 936, "Chinese", "Singapore" }, + { 0x1007, 850, 1252, "German", "Luxembourg" }, + { 0x1009, 850, 1252, "English", "Canada" }, + { 0x100A, 850, 1252, "Spanish", "Guatemala" }, + { 0x100C, 850, 1252, "French", "Switzerland" }, + { 0x1401, 864, 1256, "Arabic", "Algeria" }, + { 0x1407, 850, 1252, "German", "Liechtenstein" }, + { 0x1409, 850, 1252, "English", "New Zealand" }, { 0x140A, 850, 1252, "Spanish", "Costa Rica" }, + { 0x140C, 850, 1252, "French", "Luxembourg" }, + { 0x1801, 864, 1256, "Arabic", "Morocco" }, + { 0x1809, 850, 1252, "English", "Ireland" }, { 0x180A, 850, 1252, "Spanish", "Panama" }, + { 0x180C, 850, 1252, "French", "Monaco" }, + { 0x1C01, 864, 1256, "Arabic", "Tunisia" }, + { 0x1C09, 437, 1252, "English", "South Africa" }, { 0x1C0A, 850, 1252, "Spanish", "Dominican Republic" }, + { 0x2001, 864, 1256, "Arabic", "Oman" }, + { 0x2009, 850, 1252, "English", "Jamaica" }, { 0x200A, 850, 1252, "Spanish", "Venezuela" }, + { 0x2401, 864, 1256, "Arabic", "Yemen" }, + { 0x2409, 850, 1252, "English", "Caribbean" }, { 0x240A, 850, 1252, "Spanish", "Colombia" }, + { 0x2801, 864, 1256, "Arabic", "Syria" }, + { 0x2809, 850, 1252, "English", "Belize" }, { 0x280A, 850, 1252, "Spanish", "Peru" }, + { 0x2C01, 864, 1256, "Arabic", "Jordan" }, + { 0x2C09, 437, 1252, "English", "Trinidad & Tobago" },{ 0x2C0A, 850, 1252, "Spanish", "Argentina" }, + { 0x3001, 864, 1256, "Arabic", "Lebanon" }, + { 0x3009, 437, 1252, "English", "Zimbabwe" }, { 0x300A, 850, 1252, "Spanish", "Ecuador" }, + { 0x3401, 864, 1256, "Arabic", "Kuwait" }, + { 0x3409, 437, 1252, "English", "Philippines" }, { 0x340A, 850, 1252, "Spanish", "Chile" }, + { 0x3801, 864, 1256, "Arabic", "United Arab Emirates" }, + { 0x380A, 850, 1252, "Spanish", "Uruguay" }, + { 0x3C01, 864, 1256, "Arabic", "Bahrain" }, + { 0x3C0A, 850, 1252, "Spanish", "Paraguay" }, + { 0x4001, 864, 1256, "Arabic", "Qatar" }, + { 0x400A, 850, 1252, "Spanish", "Bolivia" }, + { 0x440A, 850, 1252, "Spanish", "El Salvador" }, + { 0x480A, 850, 1252, "Spanish", "Honduras" }, + { 0x4C0A, 850, 1252, "Spanish", "Nicaragua" }, + { 0x500A, 850, 1252, "Spanish", "Puerto Rico" }, + { (unsigned) -1, 0, 0, NULL, NULL } +}; -#ifdef _WIN32 -#include #endif +/* Specifies the default codepage to be used for unicode + transformations. By default this is CP_ACP. */ +rc_uint_type wind_default_codepage = CP_ACP; + +/* Specifies the currently used codepage for unicode + transformations. By default this is CP_ACP. */ +rc_uint_type wind_current_codepage = CP_ACP; + /* Convert an ASCII string to a unicode string. We just copy it, expanding chars to shorts, rather than doing something intelligent. */ void -unicode_from_ascii (length, unicode, ascii) - int *length; - unichar **unicode; - const char *ascii; +unicode_from_ascii (rc_uint_type *length, unichar **unicode, const char *ascii) { - int len; - const char *s; - unsigned short *w; + unicode_from_codepage (length, unicode, ascii, wind_current_codepage); +} - len = strlen (ascii); +/* Convert an ASCII string with length A_LENGTH to a unicode string. We just + copy it, expanding chars to shorts, rather than doing something intelligent. + This routine converts also \0 within a string. */ - if (length != NULL) - *length = len; +void +unicode_from_ascii_len (rc_uint_type *length, unichar **unicode, const char *ascii, rc_uint_type a_length) +{ + char *tmp, *p; + rc_uint_type tlen, elen, idx = 0; - *unicode = ((unichar *) res_alloc ((len + 1) * sizeof (unichar))); + *unicode = NULL; -#ifdef _WIN32 - /* FIXME: On Windows, we should be using MultiByteToWideChar to set - the length. */ - MultiByteToWideChar (CP_ACP, 0, ascii, len + 1, *unicode, len + 1); -#else - for (s = ascii, w = *unicode; *s != '\0'; s++, w++) - *w = *s & 0xff; - *w = 0; -#endif + if (!a_length) + { + if (length) + *length = 0; + return; + } + + /* Make sure we have zero terminated string. */ + p = tmp = (char *) xmalloc (a_length + 1); + memcpy (tmp, ascii, a_length); + tmp[a_length] = 0; + + while (a_length > 0) + { + unichar *utmp, *up; + + tlen = strlen (p); + + if (tlen > a_length) + tlen = a_length; + if (*p == 0) + { + /* Make room for one more character. */ + utmp = (unichar *) res_alloc (sizeof (unichar) * (idx + 1)); + if (idx > 0) + { + memcpy (utmp, *unicode, idx * sizeof (unichar)); + } + *unicode = utmp; + utmp[idx++] = 0; + --a_length; + p++; + continue; + } + utmp = NULL; + elen = 0; + elen = wind_MultiByteToWideChar (wind_current_codepage, p, NULL, 0); + if (elen) + { + utmp = ((unichar *) res_alloc (elen + sizeof (unichar) * 2)); + wind_MultiByteToWideChar (wind_current_codepage, p, utmp, elen); + elen /= sizeof (unichar); + elen --; + } + else + { + /* Make room for one more character. */ + utmp = (unichar *) res_alloc (sizeof (unichar) * (idx + 1)); + if (idx > 0) + { + memcpy (utmp, *unicode, idx * sizeof (unichar)); + } + *unicode = utmp; + utmp[idx++] = ((unichar) *p) & 0xff; + --a_length; + p++; + continue; + } + p += tlen; + a_length -= tlen; + + up = (unichar *) res_alloc (sizeof (unichar) * (idx + elen)); + if (idx > 0) + memcpy (up, *unicode, idx * sizeof (unichar)); + + *unicode = up; + if (elen) + memcpy (&up[idx], utmp, sizeof (unichar) * elen); + + idx += elen; + } + + if (length) + *length = idx; + + free (tmp); +} + +/* Convert an unicode string to an ASCII string. We just copy it, + shrink shorts to chars, rather than doing something intelligent. + Shorts with not within the char range are replaced by '_'. */ + +void +ascii_from_unicode (rc_uint_type *length, const unichar *unicode, char **ascii) +{ + codepage_from_unicode (length, unicode, ascii, wind_current_codepage); } /* Print the unicode string UNICODE to the file E. LENGTH is the @@ -74,10 +299,7 @@ unicode_from_ascii (length, unicode, ascii) some Windows function, probably WideCharToMultiByte. */ void -unicode_print (e, unicode, length) - FILE *e; - const unichar *unicode; - int length; +unicode_print (FILE *e, const unichar *unicode, rc_uint_type length) { while (1) { @@ -85,12 +307,12 @@ unicode_print (e, unicode, length) if (length == 0) return; - if (length > 0) + if ((bfd_signed_vma) length > 0) --length; ch = *unicode; - if (ch == 0 && length < 0) + if (ch == 0 && (bfd_signed_vma) length < 0) return; ++unicode; @@ -98,8 +320,10 @@ unicode_print (e, unicode, length) if ((ch & 0x7f) == ch) { if (ch == '\\') - fputs ("\\", e); - else if (isprint (ch)) + fputs ("\\\\", e); + else if (ch == '"') + fputs ("\"\"", e); + else if (ISPRINT (ch)) putc (ch, e); else { @@ -142,6 +366,542 @@ unicode_print (e, unicode, length) else if ((ch & 0xff) == ch) fprintf (e, "\\%03o", (unsigned int) ch); else - fprintf (e, "\\x%x", (unsigned int) ch); + fprintf (e, "\\x%04x", (unsigned int) ch); + } +} + +/* Print a unicode string to a file. */ + +void +ascii_print (FILE *e, const char *s, rc_uint_type length) +{ + while (1) + { + char ch; + + if (length == 0) + return; + if ((bfd_signed_vma) length > 0) + --length; + + ch = *s; + + if (ch == 0 && (bfd_signed_vma) length < 0) + return; + + ++s; + + if ((ch & 0x7f) == ch) + { + if (ch == '\\') + fputs ("\\\\", e); + else if (ch == '"') + fputs ("\"\"", e); + else if (ISPRINT (ch)) + putc (ch, e); + else + { + switch (ch) + { + case ESCAPE_A: + fputs ("\\a", e); + break; + + case ESCAPE_B: + fputs ("\\b", e); + break; + + case ESCAPE_F: + fputs ("\\f", e); + break; + + case ESCAPE_N: + fputs ("\\n", e); + break; + + case ESCAPE_R: + fputs ("\\r", e); + break; + + case ESCAPE_T: + fputs ("\\t", e); + break; + + case ESCAPE_V: + fputs ("\\v", e); + break; + + default: + fprintf (e, "\\%03o", (unsigned int) ch); + break; + } + } + } + else + fprintf (e, "\\%03o", (unsigned int) ch & 0xff); + } +} + +rc_uint_type +unichar_len (const unichar *unicode) +{ + rc_uint_type r = 0; + + if (unicode) + while (unicode[r] != 0) + r++; + else + --r; + return r; +} + +unichar * +unichar_dup (const unichar *unicode) +{ + unichar *r; + int len; + + if (! unicode) + return NULL; + for (len = 0; unicode[len] != 0; ++len) + ; + ++len; + r = ((unichar *) res_alloc (len * sizeof (unichar))); + memcpy (r, unicode, len * sizeof (unichar)); + return r; +} + +unichar * +unichar_dup_uppercase (const unichar *u) +{ + unichar *r = unichar_dup (u); + int i; + + if (! r) + return NULL; + + for (i = 0; r[i] != 0; ++i) + { + if (r[i] >= 'a' && r[i] <= 'z') + r[i] &= 0xdf; + } + return r; +} + +static int +unichar_isascii (const unichar *u, rc_uint_type len) +{ + rc_uint_type i; + + if ((bfd_signed_vma) len < 0) + { + if (u) + len = (rc_uint_type) unichar_len (u); + else + len = 0; + } + + for (i = 0; i < len; i++) + if ((u[i] & 0xff80) != 0) + return 0; + return 1; +} + +void +unicode_print_quoted (FILE *e, const unichar *u, rc_uint_type len) +{ + if (! unichar_isascii (u, len)) + fputc ('L', e); + fputc ('"', e); + unicode_print (e, u, len); + fputc ('"', e); +} + +int +unicode_is_valid_codepage (rc_uint_type cp) +{ + if ((cp & 0xffff) != cp) + return 0; + if (cp == CP_UTF16 || cp == CP_ACP) + return 1; + +#if !defined (_WIN32) && !defined (__CYGWIN__) + if (! wind_find_codepage_info (cp)) + return 0; + return 1; +#else + return !! IsValidCodePage ((UINT) cp); +#endif +} + +#if defined (_WIN32) || defined (__CYGWIN__) + +#define max_cp_string_len 6 + +static unsigned int +codepage_from_langid (unsigned short langid) +{ + char cp_string [max_cp_string_len]; + int c; + + memset (cp_string, 0, max_cp_string_len); + /* LOCALE_RETURN_NUMBER flag would avoid strtoul conversion, + but is unavailable on Win95. */ + c = GetLocaleInfoA (MAKELCID (langid, SORT_DEFAULT), + LOCALE_IDEFAULTANSICODEPAGE, + cp_string, max_cp_string_len); + /* If codepage data for an LCID is not installed on users's system, + GetLocaleInfo returns an empty string. Fall back to system ANSI + default. */ + if (c == 0) + return CP_ACP; + return strtoul (cp_string, 0, 10); +} + +static unsigned int +wincodepage_from_langid (unsigned short langid) +{ + char cp_string [max_cp_string_len]; + int c; + + memset (cp_string, 0, max_cp_string_len); + /* LOCALE_RETURN_NUMBER flag would avoid strtoul conversion, + but is unavailable on Win95. */ + c = GetLocaleInfoA (MAKELCID (langid, SORT_DEFAULT), + LOCALE_IDEFAULTCODEPAGE, + cp_string, max_cp_string_len); + /* If codepage data for an LCID is not installed on users's system, + GetLocaleInfo returns an empty string. Fall back to system ANSI + default. */ + if (c == 0) + return CP_OEM; + return strtoul (cp_string, 0, 10); +} + +static char * +lang_from_langid (unsigned short langid) +{ + char cp_string[261]; + int c; + + memset (cp_string, 0, 261); + c = GetLocaleInfoA (MAKELCID (langid, SORT_DEFAULT), + LOCALE_SENGLANGUAGE, + cp_string, 260); + /* If codepage data for an LCID is not installed on users's system, + GetLocaleInfo returns an empty string. Fall back to system ANSI + default. */ + if (c == 0) + strcpy (cp_string, "Neutral"); + return xstrdup (cp_string); +} + +static char * +country_from_langid (unsigned short langid) +{ + char cp_string[261]; + int c; + + memset (cp_string, 0, 261); + c = GetLocaleInfoA (MAKELCID (langid, SORT_DEFAULT), + LOCALE_SENGCOUNTRY, + cp_string, 260); + /* If codepage data for an LCID is not installed on users's system, + GetLocaleInfo returns an empty string. Fall back to system ANSI + default. */ + if (c == 0) + strcpy (cp_string, "Neutral"); + return xstrdup (cp_string); +} + +#endif + +const wind_language_t * +wind_find_language_by_id (unsigned id) +{ +#if !defined (_WIN32) && !defined (__CYGWIN__) + int i; + + if (! id) + return NULL; + for (i = 0; languages[i].id != (unsigned) -1 && languages[i].id != id; i++) + ; + if (languages[i].id == id) + return &languages[i]; + return NULL; +#else + static wind_language_t wl; + + wl.id = id; + wl.doscp = codepage_from_langid ((unsigned short) id); + wl.wincp = wincodepage_from_langid ((unsigned short) id); + wl.name = lang_from_langid ((unsigned short) id); + wl.country = country_from_langid ((unsigned short) id); + + return & wl; +#endif +} + +const local_iconv_map * +wind_find_codepage_info (unsigned cp) +{ +#if !defined (_WIN32) && !defined (__CYGWIN__) + int i; + + for (i = 0; codepages[i].codepage != (rc_uint_type) -1 && codepages[i].codepage != cp; i++) + ; + if (codepages[i].codepage == (rc_uint_type) -1) + return NULL; + return &codepages[i]; +#else + static local_iconv_map lim; + if (!unicode_is_valid_codepage (cp)) + return NULL; + lim.codepage = cp; + lim.iconv_name = ""; + return & lim; +#endif +} + +/* Convert an Codepage string to a unicode string. */ + +void +unicode_from_codepage (rc_uint_type *length, unichar **u, const char *src, rc_uint_type cp) +{ + rc_uint_type len; + + len = wind_MultiByteToWideChar (cp, src, NULL, 0); + if (len) + { + *u = ((unichar *) res_alloc (len)); + wind_MultiByteToWideChar (cp, src, *u, len); + } + /* Discount the trailing '/0'. If MultiByteToWideChar failed, + this will set *length to -1. */ + len -= sizeof (unichar); + + if (length != NULL) + *length = len / sizeof (unichar); +} + +/* Convert an unicode string to an codepage string. */ + +void +codepage_from_unicode (rc_uint_type *length, const unichar *unicode, char **ascii, rc_uint_type cp) +{ + rc_uint_type len; + + len = wind_WideCharToMultiByte (cp, unicode, NULL, 0); + if (len) + { + *ascii = (char *) res_alloc (len * sizeof (char)); + wind_WideCharToMultiByte (cp, unicode, *ascii, len); + } + /* Discount the trailing '/0'. If MultiByteToWideChar failed, + this will set *length to -1. */ + len--; + + if (length != NULL) + *length = len; +} + +#if defined (HAVE_ICONV) && !defined (_WIN32) && !defined (__CYGWIN__) +static int +iconv_onechar (iconv_t cd, ICONV_CONST char *s, char *d, int d_len, const char **n_s, char **n_d) +{ + int i; + + for (i = 1; i <= 32; i++) + { + char *tmp_d = d; + ICONV_CONST char *tmp_s = s; + size_t ret; + size_t s_left = (size_t) i; + size_t d_left = (size_t) d_len; + + ret = iconv (cd, & tmp_s, & s_left, & tmp_d, & d_left); + + if (ret != (size_t) -1) + { + *n_s = tmp_s; + *n_d = tmp_d; + return 0; + } + } + + return 1; +} + +static const char * +wind_iconv_cp (rc_uint_type cp) +{ + const local_iconv_map *lim = wind_find_codepage_info (cp); + + if (!lim) + return NULL; + return lim->iconv_name; +} +#endif /* HAVE_ICONV */ + +static rc_uint_type +wind_MultiByteToWideChar (rc_uint_type cp, const char *mb, + unichar *u, rc_uint_type u_len) +{ + rc_uint_type ret = 0; + +#if defined (_WIN32) || defined (__CYGWIN__) + rc_uint_type conv_flags = MB_PRECOMPOSED; + + /* MB_PRECOMPOSED is not allowed for UTF-7 or UTF-8. + MultiByteToWideChar will set the last error to + ERROR_INVALID_FLAGS if we do. */ + if (cp == CP_UTF8 || cp == CP_UTF7) + conv_flags = 0; + + ret = (rc_uint_type) MultiByteToWideChar (cp, conv_flags, + mb, -1, u, u_len); + /* Convert to bytes. */ + ret *= sizeof (unichar); + +#elif defined (HAVE_ICONV) + int first = 1; + char tmp[32]; + char *p_tmp; + const char *iconv_name = wind_iconv_cp (cp); + + if (!mb || !iconv_name) + return 0; + iconv_t cd = iconv_open ("UTF-16LE", iconv_name); + + while (1) + { + int iret; + const char *n_mb = ""; + char *n_tmp = ""; + + p_tmp = tmp; + iret = iconv_onechar (cd, (ICONV_CONST char *) mb, p_tmp, 32, & n_mb, & n_tmp); + if (first) + { + first = 0; + continue; + } + if (!iret) + { + size_t l_tmp = (size_t) (n_tmp - p_tmp); + + if (u) + { + if ((size_t) u_len < l_tmp) + break; + memcpy (u, tmp, l_tmp); + u += l_tmp/2; + u_len -= l_tmp; + } + ret += l_tmp; + } + else + break; + if (tmp[0] == 0 && tmp[1] == 0) + break; + mb = n_mb; } + iconv_close (cd); +#else + if (cp) + ret = 0; + ret = strlen (mb) + 1; + ret *= sizeof (unichar); + if (u != NULL && u_len != 0) + { + do + { + *u++ = ((unichar) *mb) & 0xff; + --u_len; mb++; + } + while (u_len != 0 && mb[-1] != 0); + } + if (u != NULL && u_len != 0) + *u = 0; +#endif + return ret; +} + +static rc_uint_type +wind_WideCharToMultiByte (rc_uint_type cp, const unichar *u, char *mb, rc_uint_type mb_len) +{ + rc_uint_type ret = 0; +#if defined (_WIN32) || defined (__CYGWIN__) + WINBOOL used_def = FALSE; + + ret = (rc_uint_type) WideCharToMultiByte (cp, 0, u, -1, mb, mb_len, + NULL, & used_def); +#elif defined (HAVE_ICONV) + int first = 1; + char tmp[32]; + char *p_tmp; + const char *iconv_name = wind_iconv_cp (cp); + + if (!u || !iconv_name) + return 0; + iconv_t cd = iconv_open (iconv_name, "UTF-16LE"); + + while (1) + { + int iret; + const char *n_u = ""; + char *n_tmp = ""; + + p_tmp = tmp; + iret = iconv_onechar (cd, (ICONV_CONST char *) u, p_tmp, 32, &n_u, & n_tmp); + if (first) + { + first = 0; + continue; + } + if (!iret) + { + size_t l_tmp = (size_t) (n_tmp - p_tmp); + + if (mb) + { + if ((size_t) mb_len < l_tmp) + break; + memcpy (mb, tmp, l_tmp); + mb += l_tmp; + mb_len -= l_tmp; + } + ret += l_tmp; + } + else + break; + if (u[0] == 0) + break; + u = (const unichar *) n_u; + } + iconv_close (cd); +#else + if (cp) + ret = 0; + + while (u[ret] != 0) + ++ret; + + ++ret; + + if (mb) + { + while (*u != 0 && mb_len != 0) + { + if (u[0] == (u[0] & 0x7f)) + *mb++ = (char) u[0]; + else + *mb++ = '_'; + ++u; --mb_len; + } + if (mb_len != 0) + *mb = 0; + } +#endif + return ret; }