|  | /* winduni.c -- unicode support for the windres program. | 
|  | Copyright (C) 1997-2024 Free Software Foundation, Inc. | 
|  | Written by Ian Lance Taylor, Cygnus Support. | 
|  | Rewritten by Kai Tietz, Onevision. | 
|  |  | 
|  | This file is part of GNU Binutils. | 
|  |  | 
|  | This program is free software; you can redistribute it and/or modify | 
|  | it under the terms of the GNU General Public License as published by | 
|  | the Free Software Foundation; either version 3 of the License, or | 
|  | (at your option) any later version. | 
|  |  | 
|  | This program is distributed in the hope that it will be useful, | 
|  | but WITHOUT ANY WARRANTY; without even the implied warranty of | 
|  | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the | 
|  | GNU General Public License for more details. | 
|  |  | 
|  | You should have received a copy of the GNU General Public License | 
|  | along with this program; if not, write to the Free Software | 
|  | Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston, MA | 
|  | 02110-1301, USA.  */ | 
|  |  | 
|  |  | 
|  | /* This file contains unicode support routines for the windres | 
|  | program.  Ideally, we would have generic unicode support which | 
|  | would work on all systems.  However, we don't.  Instead, on a | 
|  | Windows host, we are prepared to call some Windows routines.  This | 
|  | means that we will generate different output on Windows and Unix | 
|  | hosts, but that seems better than not really supporting unicode at | 
|  | all.  */ | 
|  |  | 
|  | #include "sysdep.h" | 
|  | #include "bfd.h" | 
|  | #include "libiberty.h" /* for xstrdup */ | 
|  | #include "bucomm.h" | 
|  | /* Must be include before windows.h and winnls.h.  */ | 
|  | #if defined (_WIN32) || defined (__CYGWIN__) | 
|  | #include <windows.h> | 
|  | #include <winnls.h> | 
|  | #endif | 
|  | #include "winduni.h" | 
|  | #include "safe-ctype.h" | 
|  |  | 
|  | #if HAVE_ICONV | 
|  | #include <iconv.h> | 
|  | #endif | 
|  |  | 
|  | static rc_uint_type wind_WideCharToMultiByte (rc_uint_type, const unichar *, char *, rc_uint_type); | 
|  | static rc_uint_type wind_MultiByteToWideChar (rc_uint_type, const char *, unichar *, rc_uint_type); | 
|  | static int unichar_isascii (const unichar *, rc_uint_type); | 
|  |  | 
|  | /* Convert an ASCII string to a unicode string.  We just copy it, | 
|  | expanding chars to shorts, rather than doing something intelligent.  */ | 
|  |  | 
|  | #if !defined (_WIN32) && !defined (__CYGWIN__) | 
|  |  | 
|  | /* Codepages mapped.  */ | 
|  | static local_iconv_map codepages[] = | 
|  | { | 
|  | { 0, "cp1252" }, | 
|  | { 1, "WINDOWS-1252" }, | 
|  | { 437, "MS-ANSI" }, | 
|  | { 737, "MS-GREEK" }, | 
|  | { 775, "WINBALTRIM" }, | 
|  | { 850, "MS-ANSI" }, | 
|  | { 852, "MS-EE" }, | 
|  | { 857, "MS-TURK" }, | 
|  | { 862, "CP862" }, | 
|  | { 864, "CP864" }, | 
|  | { 866, "MS-CYRL" }, | 
|  | { 874, "WINDOWS-874" }, | 
|  | { 932, "CP932" }, | 
|  | { 936, "CP936" }, | 
|  | { 949, "CP949" }, | 
|  | { 950, "CP950" }, | 
|  | { 1250, "WINDOWS-1250" }, | 
|  | { 1251, "WINDOWS-1251" }, | 
|  | { 1252, "WINDOWS-1252" }, | 
|  | { 1253, "WINDOWS-1253" }, | 
|  | { 1254, "WINDOWS-1254" }, | 
|  | { 1255, "WINDOWS-1255" }, | 
|  | { 1256, "WINDOWS-1256" }, | 
|  | { 1257, "WINDOWS-1257" }, | 
|  | { 1258, "WINDOWS-1258" }, | 
|  | { CP_UTF7, "UTF-7" }, | 
|  | { CP_UTF8, "UTF-8" }, | 
|  | { CP_UTF16, "UTF-16LE" }, | 
|  | { (rc_uint_type) -1, NULL } | 
|  | }; | 
|  |  | 
|  | /* Languages supported.  */ | 
|  | static const wind_language_t languages[] = | 
|  | { | 
|  | { 0x0000, 437, 1252, "Neutral", "Neutral" }, | 
|  | { 0x0401, 864, 1256, "Arabic", "Saudi Arabia" },    { 0x0402, 866, 1251, "Bulgarian", "Bulgaria" }, | 
|  | { 0x0403, 850, 1252, "Catalan", "Spain" },	      { 0x0404, 950,  950, "Chinese", "Taiwan" }, | 
|  | { 0x0405, 852, 1250, "Czech", "Czech Republic" },   { 0x0406, 850, 1252, "Danish", "Denmark" }, | 
|  | { 0x0407, 850, 1252, "German", "Germany" },	      { 0x0408, 737, 1253, "Greek", "Greece" }, | 
|  | { 0x0409, 437, 1252, "English", "United States" },  { 0x040A, 850, 1252, "Spanish - Traditional Sort", "Spain" }, | 
|  | { 0x040B, 850, 1252, "Finnish", "Finland" },	      { 0x040C, 850, 1252, "French", "France" }, | 
|  | { 0x040D, 862, 1255, "Hebrew", "Israel" },	      { 0x040E, 852, 1250, "Hungarian", "Hungary" }, | 
|  | { 0x040F, 850, 1252, "Icelandic", "Iceland" },      { 0x0410, 850, 1252, "Italian", "Italy" }, | 
|  | { 0x0411, 932,  932, "Japanese", "Japan" },	      { 0x0412, 949,  949, "Korean", "Korea (south)" }, | 
|  | { 0x0413, 850, 1252, "Dutch", "Netherlands" },      { 0x0414, 850, 1252, "Norwegian (Bokm\345l)", "Norway" }, | 
|  | { 0x0415, 852, 1250, "Polish", "Poland" },	      { 0x0416, 850, 1252, "Portuguese", "Brazil" }, | 
|  | { 0x0418, 852, 1250, "Romanian", "Romania" },	      { 0x0419, 866, 1251, "Russian", "Russia" }, | 
|  | { 0x041A, 852, 1250, "Croatian", "Croatia" },	      { 0x041B, 852, 1250, "Slovak", "Slovakia" }, | 
|  | { 0x041C, 852, 1250, "Albanian", "Albania" },	      { 0x041D, 850, 1252, "Swedish", "Sweden" }, | 
|  | { 0x041E, 874,  874, "Thai", "Thailand" },	      { 0x041F, 857, 1254, "Turkish", "Turkey" }, | 
|  | { 0x0421, 850, 1252, "Indonesian", "Indonesia" },   { 0x0422, 866, 1251, "Ukrainian", "Ukraine" }, | 
|  | { 0x0423, 866, 1251, "Belarusian", "Belarus" },     { 0x0424, 852, 1250, "Slovene", "Slovenia" }, | 
|  | { 0x0425, 775, 1257, "Estonian", "Estonia" },	      { 0x0426, 775, 1257, "Latvian", "Latvia" }, | 
|  | { 0x0427, 775, 1257, "Lithuanian", "Lithuania" }, | 
|  | { 0x0429, 864, 1256, "Arabic", "Farsi" },	      { 0x042A,1258, 1258, "Vietnamese", "Vietnam" }, | 
|  | { 0x042D, 850, 1252, "Basque", "Spain" }, | 
|  | { 0x042F, 866, 1251, "Macedonian", "Former Yugoslav Republic of Macedonia" }, | 
|  | { 0x0436, 850, 1252, "Afrikaans", "South Africa" }, | 
|  | { 0x0438, 850, 1252, "Faroese", "Faroe Islands" }, | 
|  | { 0x043C, 437, 1252, "Irish", "Ireland" }, | 
|  | { 0x043E, 850, 1252, "Malay", "Malaysia" }, | 
|  | { 0x0801, 864, 1256, "Arabic", "Iraq" }, | 
|  | { 0x0804, 936,  936, "Chinese (People's republic of China)", "People's republic of China" }, | 
|  | { 0x0807, 850, 1252, "German", "Switzerland" }, | 
|  | { 0x0809, 850, 1252, "English", "United Kingdom" }, { 0x080A, 850, 1252, "Spanish", "Mexico" }, | 
|  | { 0x080C, 850, 1252, "French", "Belgium" }, | 
|  | { 0x0810, 850, 1252, "Italian", "Switzerland" }, | 
|  | { 0x0813, 850, 1252, "Dutch", "Belgium" },	      { 0x0814, 850, 1252, "Norwegian (Nynorsk)", "Norway" }, | 
|  | { 0x0816, 850, 1252, "Portuguese", "Portugal" }, | 
|  | { 0x081A, 852, 1252, "Serbian (latin)", "Yugoslavia" }, | 
|  | { 0x081D, 850, 1252, "Swedish (Finland)", "Finland" }, | 
|  | { 0x0C01, 864, 1256, "Arabic", "Egypt" }, | 
|  | { 0x0C04, 950,  950, "Chinese", "Hong Kong" }, | 
|  | { 0x0C07, 850, 1252, "German", "Austria" }, | 
|  | { 0x0C09, 850, 1252, "English", "Australia" },      { 0x0C0A, 850, 1252, "Spanish - International Sort", "Spain" }, | 
|  | { 0x0C0C, 850, 1252, "French", "Canada"}, | 
|  | { 0x0C1A, 855, 1251, "Serbian (Cyrillic)", "Serbia" }, | 
|  | { 0x1001, 864, 1256, "Arabic", "Libya" }, | 
|  | { 0x1004, 936,  936, "Chinese", "Singapore" }, | 
|  | { 0x1007, 850, 1252, "German", "Luxembourg" }, | 
|  | { 0x1009, 850, 1252, "English", "Canada" }, | 
|  | { 0x100A, 850, 1252, "Spanish", "Guatemala" }, | 
|  | { 0x100C, 850, 1252, "French", "Switzerland" }, | 
|  | { 0x1401, 864, 1256, "Arabic", "Algeria" }, | 
|  | { 0x1407, 850, 1252, "German", "Liechtenstein" }, | 
|  | { 0x1409, 850, 1252, "English", "New Zealand" },    { 0x140A, 850, 1252, "Spanish", "Costa Rica" }, | 
|  | { 0x140C, 850, 1252, "French", "Luxembourg" }, | 
|  | { 0x1801, 864, 1256, "Arabic", "Morocco" }, | 
|  | { 0x1809, 850, 1252, "English", "Ireland" },	      { 0x180A, 850, 1252, "Spanish", "Panama" }, | 
|  | { 0x180C, 850, 1252, "French", "Monaco" }, | 
|  | { 0x1C01, 864, 1256, "Arabic", "Tunisia" }, | 
|  | { 0x1C09, 437, 1252, "English", "South Africa" },   { 0x1C0A, 850, 1252, "Spanish", "Dominican Republic" }, | 
|  | { 0x2001, 864, 1256, "Arabic", "Oman" }, | 
|  | { 0x2009, 850, 1252, "English", "Jamaica" },	      { 0x200A, 850, 1252, "Spanish", "Venezuela" }, | 
|  | { 0x2401, 864, 1256, "Arabic", "Yemen" }, | 
|  | { 0x2409, 850, 1252, "English", "Caribbean" },      { 0x240A, 850, 1252, "Spanish", "Colombia" }, | 
|  | { 0x2801, 864, 1256, "Arabic", "Syria" }, | 
|  | { 0x2809, 850, 1252, "English", "Belize" },	      { 0x280A, 850, 1252, "Spanish", "Peru" }, | 
|  | { 0x2C01, 864, 1256, "Arabic", "Jordan" }, | 
|  | { 0x2C09, 437, 1252, "English", "Trinidad & Tobago" },{ 0x2C0A, 850, 1252, "Spanish", "Argentina" }, | 
|  | { 0x3001, 864, 1256, "Arabic", "Lebanon" }, | 
|  | { 0x3009, 437, 1252, "English", "Zimbabwe" },	      { 0x300A, 850, 1252, "Spanish", "Ecuador" }, | 
|  | { 0x3401, 864, 1256, "Arabic", "Kuwait" }, | 
|  | { 0x3409, 437, 1252, "English", "Philippines" },    { 0x340A, 850, 1252, "Spanish", "Chile" }, | 
|  | { 0x3801, 864, 1256, "Arabic", "United Arab Emirates" }, | 
|  | { 0x380A, 850, 1252, "Spanish", "Uruguay" }, | 
|  | { 0x3C01, 864, 1256, "Arabic", "Bahrain" }, | 
|  | { 0x3C0A, 850, 1252, "Spanish", "Paraguay" }, | 
|  | { 0x4001, 864, 1256, "Arabic", "Qatar" }, | 
|  | { 0x400A, 850, 1252, "Spanish", "Bolivia" }, | 
|  | { 0x440A, 850, 1252, "Spanish", "El Salvador" }, | 
|  | { 0x480A, 850, 1252, "Spanish", "Honduras" }, | 
|  | { 0x4C0A, 850, 1252, "Spanish", "Nicaragua" }, | 
|  | { 0x500A, 850, 1252, "Spanish", "Puerto Rico" }, | 
|  | { (unsigned) -1,  0,      0, NULL, NULL } | 
|  | }; | 
|  |  | 
|  | #endif | 
|  |  | 
|  | /* Specifies the default codepage to be used for unicode | 
|  | transformations.  By default this is CP_ACP.  */ | 
|  | rc_uint_type wind_default_codepage = CP_ACP; | 
|  |  | 
|  | /* Specifies the currently used codepage for unicode | 
|  | transformations.  By default this is CP_ACP.  */ | 
|  | rc_uint_type wind_current_codepage = CP_ACP; | 
|  |  | 
|  | /* Convert an ASCII string to a unicode string.  We just copy it, | 
|  | expanding chars to shorts, rather than doing something intelligent.  */ | 
|  |  | 
|  | void | 
|  | unicode_from_ascii (rc_uint_type *length, unichar **unicode, const char *ascii) | 
|  | { | 
|  | unicode_from_codepage (length, unicode, ascii, wind_current_codepage); | 
|  | } | 
|  |  | 
|  | /* Convert an ASCII string with length A_LENGTH to a unicode string.  We just | 
|  | copy it, expanding chars to shorts, rather than doing something intelligent. | 
|  | This routine converts also \0 within a string.  */ | 
|  |  | 
|  | void | 
|  | unicode_from_ascii_len (rc_uint_type *length, unichar **unicode, const char *ascii, rc_uint_type a_length) | 
|  | { | 
|  | char *tmp, *p; | 
|  | rc_uint_type tlen, elen, idx = 0; | 
|  |  | 
|  | *unicode = NULL; | 
|  |  | 
|  | if (!a_length) | 
|  | { | 
|  | if (length) | 
|  | *length = 0; | 
|  | return; | 
|  | } | 
|  |  | 
|  | /* Make sure we have zero terminated string.  */ | 
|  | p = tmp = (char *) xmalloc (a_length + 1); | 
|  | memcpy (tmp, ascii, a_length); | 
|  | tmp[a_length] = 0; | 
|  |  | 
|  | while (a_length > 0) | 
|  | { | 
|  | unichar *utmp, *up; | 
|  |  | 
|  | tlen = strlen (p); | 
|  |  | 
|  | if (tlen > a_length) | 
|  | tlen = a_length; | 
|  | if (*p == 0) | 
|  | { | 
|  | /* Make room for one more character.  */ | 
|  | utmp = (unichar *) res_alloc (sizeof (unichar) * (idx + 1)); | 
|  | if (idx > 0) | 
|  | { | 
|  | memcpy (utmp, *unicode, idx * sizeof (unichar)); | 
|  | } | 
|  | *unicode = utmp; | 
|  | utmp[idx++] = 0; | 
|  | --a_length; | 
|  | p++; | 
|  | continue; | 
|  | } | 
|  | utmp = NULL; | 
|  | elen = 0; | 
|  | elen = wind_MultiByteToWideChar (wind_current_codepage, p, NULL, 0); | 
|  | if (elen) | 
|  | { | 
|  | utmp = ((unichar *) res_alloc (elen + sizeof (unichar) * 2)); | 
|  | wind_MultiByteToWideChar (wind_current_codepage, p, utmp, elen); | 
|  | elen /= sizeof (unichar); | 
|  | elen --; | 
|  | } | 
|  | else | 
|  | { | 
|  | /* Make room for one more character.  */ | 
|  | utmp = (unichar *) res_alloc (sizeof (unichar) * (idx + 1)); | 
|  | if (idx > 0) | 
|  | { | 
|  | memcpy (utmp, *unicode, idx * sizeof (unichar)); | 
|  | } | 
|  | *unicode = utmp; | 
|  | utmp[idx++] = ((unichar) *p) & 0xff; | 
|  | --a_length; | 
|  | p++; | 
|  | continue; | 
|  | } | 
|  | p += tlen; | 
|  | a_length -= tlen; | 
|  |  | 
|  | up = (unichar *) res_alloc (sizeof (unichar) * (idx + elen)); | 
|  | if (idx > 0) | 
|  | memcpy (up, *unicode, idx * sizeof (unichar)); | 
|  |  | 
|  | *unicode = up; | 
|  | if (elen) | 
|  | memcpy (&up[idx], utmp, sizeof (unichar) * elen); | 
|  |  | 
|  | idx += elen; | 
|  | } | 
|  |  | 
|  | if (length) | 
|  | *length = idx; | 
|  |  | 
|  | free (tmp); | 
|  | } | 
|  |  | 
|  | /* Convert an unicode string to an ASCII string.  We just copy it, | 
|  | shrink shorts to chars, rather than doing something intelligent. | 
|  | Shorts with not within the char range are replaced by '_'.  */ | 
|  |  | 
|  | void | 
|  | ascii_from_unicode (rc_uint_type *length, const unichar *unicode, char **ascii) | 
|  | { | 
|  | codepage_from_unicode (length, unicode, ascii, wind_current_codepage); | 
|  | } | 
|  |  | 
|  | /* Print the unicode string UNICODE to the file E.  LENGTH is the | 
|  | number of characters to print, or -1 if we should print until the | 
|  | end of the string.  FIXME: On a Windows host, we should be calling | 
|  | some Windows function, probably WideCharToMultiByte.  */ | 
|  |  | 
|  | void | 
|  | unicode_print (FILE *e, const unichar *unicode, rc_uint_type length) | 
|  | { | 
|  | while (1) | 
|  | { | 
|  | unichar ch; | 
|  |  | 
|  | if (length == 0) | 
|  | return; | 
|  | if ((bfd_signed_vma) length > 0) | 
|  | --length; | 
|  |  | 
|  | ch = *unicode; | 
|  |  | 
|  | if (ch == 0 && (bfd_signed_vma) length < 0) | 
|  | return; | 
|  |  | 
|  | ++unicode; | 
|  |  | 
|  | if ((ch & 0x7f) == ch) | 
|  | { | 
|  | if (ch == '\\') | 
|  | fputs ("\\\\", e); | 
|  | else if (ch == '"') | 
|  | fputs ("\"\"", e); | 
|  | else if (ISPRINT (ch)) | 
|  | putc (ch, e); | 
|  | else | 
|  | { | 
|  | switch (ch) | 
|  | { | 
|  | case ESCAPE_A: | 
|  | fputs ("\\a", e); | 
|  | break; | 
|  |  | 
|  | case ESCAPE_B: | 
|  | fputs ("\\b", e); | 
|  | break; | 
|  |  | 
|  | case ESCAPE_F: | 
|  | fputs ("\\f", e); | 
|  | break; | 
|  |  | 
|  | case ESCAPE_N: | 
|  | fputs ("\\n", e); | 
|  | break; | 
|  |  | 
|  | case ESCAPE_R: | 
|  | fputs ("\\r", e); | 
|  | break; | 
|  |  | 
|  | case ESCAPE_T: | 
|  | fputs ("\\t", e); | 
|  | break; | 
|  |  | 
|  | case ESCAPE_V: | 
|  | fputs ("\\v", e); | 
|  | break; | 
|  |  | 
|  | default: | 
|  | fprintf (e, "\\%03o", (unsigned int) ch); | 
|  | break; | 
|  | } | 
|  | } | 
|  | } | 
|  | else if ((ch & 0xff) == ch) | 
|  | fprintf (e, "\\%03o", (unsigned int) ch); | 
|  | else | 
|  | fprintf (e, "\\x%04x", (unsigned int) ch); | 
|  | } | 
|  | } | 
|  |  | 
|  | /* Print a unicode string to a file.  */ | 
|  |  | 
|  | void | 
|  | ascii_print (FILE *e, const char *s, rc_uint_type length) | 
|  | { | 
|  | while (1) | 
|  | { | 
|  | char ch; | 
|  |  | 
|  | if (length == 0) | 
|  | return; | 
|  | if ((bfd_signed_vma) length > 0) | 
|  | --length; | 
|  |  | 
|  | ch = *s; | 
|  |  | 
|  | if (ch == 0 && (bfd_signed_vma) length < 0) | 
|  | return; | 
|  |  | 
|  | ++s; | 
|  |  | 
|  | if ((ch & 0x7f) == ch) | 
|  | { | 
|  | if (ch == '\\') | 
|  | fputs ("\\\\", e); | 
|  | else if (ch == '"') | 
|  | fputs ("\"\"", e); | 
|  | else if (ISPRINT (ch)) | 
|  | putc (ch, e); | 
|  | else | 
|  | { | 
|  | switch (ch) | 
|  | { | 
|  | case ESCAPE_A: | 
|  | fputs ("\\a", e); | 
|  | break; | 
|  |  | 
|  | case ESCAPE_B: | 
|  | fputs ("\\b", e); | 
|  | break; | 
|  |  | 
|  | case ESCAPE_F: | 
|  | fputs ("\\f", e); | 
|  | break; | 
|  |  | 
|  | case ESCAPE_N: | 
|  | fputs ("\\n", e); | 
|  | break; | 
|  |  | 
|  | case ESCAPE_R: | 
|  | fputs ("\\r", e); | 
|  | break; | 
|  |  | 
|  | case ESCAPE_T: | 
|  | fputs ("\\t", e); | 
|  | break; | 
|  |  | 
|  | case ESCAPE_V: | 
|  | fputs ("\\v", e); | 
|  | break; | 
|  |  | 
|  | default: | 
|  | fprintf (e, "\\%03o", (unsigned int) ch); | 
|  | break; | 
|  | } | 
|  | } | 
|  | } | 
|  | else | 
|  | fprintf (e, "\\%03o", (unsigned int) ch & 0xff); | 
|  | } | 
|  | } | 
|  |  | 
|  | rc_uint_type | 
|  | unichar_len (const unichar *unicode) | 
|  | { | 
|  | rc_uint_type r = 0; | 
|  |  | 
|  | if (unicode) | 
|  | while (unicode[r] != 0) | 
|  | r++; | 
|  | else | 
|  | --r; | 
|  | return r; | 
|  | } | 
|  |  | 
|  | unichar * | 
|  | unichar_dup (const unichar *unicode) | 
|  | { | 
|  | unichar *r; | 
|  | int len; | 
|  |  | 
|  | if (! unicode) | 
|  | return NULL; | 
|  | for (len = 0; unicode[len] != 0; ++len) | 
|  | ; | 
|  | ++len; | 
|  | r = ((unichar *) res_alloc (len * sizeof (unichar))); | 
|  | memcpy (r, unicode, len * sizeof (unichar)); | 
|  | return r; | 
|  | } | 
|  |  | 
|  | unichar * | 
|  | unichar_dup_uppercase (const unichar *u) | 
|  | { | 
|  | unichar *r = unichar_dup (u); | 
|  | int i; | 
|  |  | 
|  | if (! r) | 
|  | return NULL; | 
|  |  | 
|  | for (i = 0; r[i] != 0; ++i) | 
|  | { | 
|  | if (r[i] >= 'a' && r[i] <= 'z') | 
|  | r[i] &= 0xdf; | 
|  | } | 
|  | return r; | 
|  | } | 
|  |  | 
|  | static int | 
|  | unichar_isascii (const unichar *u, rc_uint_type len) | 
|  | { | 
|  | rc_uint_type i; | 
|  |  | 
|  | if ((bfd_signed_vma) len < 0) | 
|  | { | 
|  | if (u) | 
|  | len = (rc_uint_type) unichar_len (u); | 
|  | else | 
|  | len = 0; | 
|  | } | 
|  |  | 
|  | for (i = 0; i < len; i++) | 
|  | if ((u[i] & 0xff80) != 0) | 
|  | return 0; | 
|  | return 1; | 
|  | } | 
|  |  | 
|  | void | 
|  | unicode_print_quoted (FILE *e, const unichar *u, rc_uint_type len) | 
|  | { | 
|  | if (! unichar_isascii (u, len)) | 
|  | fputc ('L', e); | 
|  | fputc ('"', e); | 
|  | unicode_print (e, u, len); | 
|  | fputc ('"', e); | 
|  | } | 
|  |  | 
|  | int | 
|  | unicode_is_valid_codepage (rc_uint_type cp) | 
|  | { | 
|  | if ((cp & 0xffff) != cp) | 
|  | return 0; | 
|  | if (cp == CP_UTF16 || cp == CP_ACP) | 
|  | return 1; | 
|  |  | 
|  | #if !defined (_WIN32) && !defined (__CYGWIN__) | 
|  | if (! wind_find_codepage_info (cp)) | 
|  | return 0; | 
|  | return 1; | 
|  | #else | 
|  | return !! IsValidCodePage ((UINT) cp); | 
|  | #endif | 
|  | } | 
|  |  | 
|  | #if defined (_WIN32) || defined (__CYGWIN__) | 
|  |  | 
|  | #define max_cp_string_len 6 | 
|  |  | 
|  | static unsigned int | 
|  | codepage_from_langid (unsigned short langid) | 
|  | { | 
|  | char cp_string [max_cp_string_len]; | 
|  | int c; | 
|  |  | 
|  | memset (cp_string, 0, max_cp_string_len); | 
|  | /* LOCALE_RETURN_NUMBER flag would avoid strtoul conversion, | 
|  | but is unavailable on Win95.  */ | 
|  | c = GetLocaleInfoA (MAKELCID (langid, SORT_DEFAULT), | 
|  | LOCALE_IDEFAULTANSICODEPAGE, | 
|  | cp_string, max_cp_string_len); | 
|  | /* If codepage data for an LCID is not installed on users's system, | 
|  | GetLocaleInfo returns an empty string.  Fall back to system ANSI | 
|  | default. */ | 
|  | if (c == 0) | 
|  | return CP_ACP; | 
|  | return strtoul (cp_string, 0, 10); | 
|  | } | 
|  |  | 
|  | static unsigned int | 
|  | wincodepage_from_langid (unsigned short langid) | 
|  | { | 
|  | char cp_string [max_cp_string_len]; | 
|  | int c; | 
|  |  | 
|  | memset (cp_string, 0, max_cp_string_len); | 
|  | /* LOCALE_RETURN_NUMBER flag would avoid strtoul conversion, | 
|  | but is unavailable on Win95.  */ | 
|  | c = GetLocaleInfoA (MAKELCID (langid, SORT_DEFAULT), | 
|  | LOCALE_IDEFAULTCODEPAGE, | 
|  | cp_string, max_cp_string_len); | 
|  | /* If codepage data for an LCID is not installed on users's system, | 
|  | GetLocaleInfo returns an empty string.  Fall back to system ANSI | 
|  | default. */ | 
|  | if (c == 0) | 
|  | return CP_OEM; | 
|  | return strtoul (cp_string, 0, 10); | 
|  | } | 
|  |  | 
|  | static char * | 
|  | lang_from_langid (unsigned short langid) | 
|  | { | 
|  | char cp_string[261]; | 
|  | int c; | 
|  |  | 
|  | memset (cp_string, 0, 261); | 
|  | c = GetLocaleInfoA (MAKELCID (langid, SORT_DEFAULT), | 
|  | LOCALE_SENGLANGUAGE, | 
|  | cp_string, 260); | 
|  | /* If codepage data for an LCID is not installed on users's system, | 
|  | GetLocaleInfo returns an empty string.  Fall back to system ANSI | 
|  | default. */ | 
|  | if (c == 0) | 
|  | strcpy (cp_string, "Neutral"); | 
|  | return xstrdup (cp_string); | 
|  | } | 
|  |  | 
|  | static char * | 
|  | country_from_langid (unsigned short langid) | 
|  | { | 
|  | char cp_string[261]; | 
|  | int c; | 
|  |  | 
|  | memset (cp_string, 0, 261); | 
|  | c = GetLocaleInfoA (MAKELCID (langid, SORT_DEFAULT), | 
|  | LOCALE_SENGCOUNTRY, | 
|  | cp_string, 260); | 
|  | /* If codepage data for an LCID is not installed on users's system, | 
|  | GetLocaleInfo returns an empty string.  Fall back to system ANSI | 
|  | default. */ | 
|  | if (c == 0) | 
|  | strcpy (cp_string, "Neutral"); | 
|  | return xstrdup (cp_string); | 
|  | } | 
|  |  | 
|  | #endif | 
|  |  | 
|  | const wind_language_t * | 
|  | wind_find_language_by_id (unsigned id) | 
|  | { | 
|  | #if !defined (_WIN32) && !defined (__CYGWIN__) | 
|  | int i; | 
|  |  | 
|  | if (! id) | 
|  | return NULL; | 
|  | for (i = 0; languages[i].id != (unsigned) -1 && languages[i].id != id; i++) | 
|  | ; | 
|  | if (languages[i].id == id) | 
|  | return &languages[i]; | 
|  | return NULL; | 
|  | #else | 
|  | static wind_language_t wl; | 
|  |  | 
|  | wl.id = id; | 
|  | wl.doscp = codepage_from_langid ((unsigned short) id); | 
|  | wl.wincp = wincodepage_from_langid ((unsigned short) id); | 
|  | wl.name = lang_from_langid ((unsigned short) id); | 
|  | wl.country = country_from_langid ((unsigned short) id); | 
|  |  | 
|  | return & wl; | 
|  | #endif | 
|  | } | 
|  |  | 
|  | const local_iconv_map * | 
|  | wind_find_codepage_info (unsigned cp) | 
|  | { | 
|  | #if !defined (_WIN32) && !defined (__CYGWIN__) | 
|  | int i; | 
|  |  | 
|  | for (i = 0; codepages[i].codepage != (rc_uint_type) -1 && codepages[i].codepage != cp; i++) | 
|  | ; | 
|  | if (codepages[i].codepage == (rc_uint_type) -1) | 
|  | return NULL; | 
|  | return &codepages[i]; | 
|  | #else | 
|  | static local_iconv_map lim; | 
|  | if (!unicode_is_valid_codepage (cp)) | 
|  | return NULL; | 
|  | lim.codepage = cp; | 
|  | lim.iconv_name = ""; | 
|  | return & lim; | 
|  | #endif | 
|  | } | 
|  |  | 
|  | /* Convert an Codepage string to a unicode string.  */ | 
|  |  | 
|  | void | 
|  | unicode_from_codepage (rc_uint_type *length, unichar **u, const char *src, rc_uint_type cp) | 
|  | { | 
|  | rc_uint_type len; | 
|  |  | 
|  | len = wind_MultiByteToWideChar (cp, src, NULL, 0); | 
|  | if (len) | 
|  | { | 
|  | *u = ((unichar *) res_alloc (len)); | 
|  | wind_MultiByteToWideChar (cp, src, *u, len); | 
|  | } | 
|  | /* Discount the trailing '/0'.  If MultiByteToWideChar failed, | 
|  | this will set *length to -1.  */ | 
|  | len -= sizeof (unichar); | 
|  |  | 
|  | if (length != NULL) | 
|  | *length = len / sizeof (unichar); | 
|  | } | 
|  |  | 
|  | /* Convert an unicode string to an codepage string.  */ | 
|  |  | 
|  | void | 
|  | codepage_from_unicode (rc_uint_type *length, const unichar *unicode, char **ascii, rc_uint_type cp) | 
|  | { | 
|  | rc_uint_type len; | 
|  |  | 
|  | len = wind_WideCharToMultiByte (cp, unicode, NULL, 0); | 
|  | if (len) | 
|  | { | 
|  | *ascii = (char *) res_alloc (len * sizeof (char)); | 
|  | wind_WideCharToMultiByte (cp, unicode, *ascii, len); | 
|  | } | 
|  | /* Discount the trailing '/0'.  If MultiByteToWideChar failed, | 
|  | this will set *length to -1.  */ | 
|  | len--; | 
|  |  | 
|  | if (length != NULL) | 
|  | *length = len; | 
|  | } | 
|  |  | 
|  | #if defined (HAVE_ICONV) && !defined (_WIN32) && !defined (__CYGWIN__) | 
|  | static int | 
|  | iconv_onechar (iconv_t cd, ICONV_CONST char *s, char *d, int d_len, const char **n_s, char **n_d) | 
|  | { | 
|  | int i; | 
|  |  | 
|  | for (i = 1; i <= 32; i++) | 
|  | { | 
|  | char *tmp_d = d; | 
|  | ICONV_CONST char *tmp_s = s; | 
|  | size_t ret; | 
|  | size_t s_left = (size_t) i; | 
|  | size_t d_left = (size_t) d_len; | 
|  |  | 
|  | ret = iconv (cd, & tmp_s, & s_left, & tmp_d, & d_left); | 
|  |  | 
|  | if (ret != (size_t) -1) | 
|  | { | 
|  | *n_s = tmp_s; | 
|  | *n_d = tmp_d; | 
|  | return 0; | 
|  | } | 
|  | } | 
|  |  | 
|  | return 1; | 
|  | } | 
|  |  | 
|  | static const char * | 
|  | wind_iconv_cp (rc_uint_type cp) | 
|  | { | 
|  | const local_iconv_map *lim = wind_find_codepage_info (cp); | 
|  |  | 
|  | if (!lim) | 
|  | return NULL; | 
|  | return lim->iconv_name; | 
|  | } | 
|  | #endif /* HAVE_ICONV */ | 
|  |  | 
|  | static rc_uint_type | 
|  | wind_MultiByteToWideChar (rc_uint_type cp, const char *mb, | 
|  | unichar *u, rc_uint_type u_len) | 
|  | { | 
|  | rc_uint_type ret = 0; | 
|  |  | 
|  | #if defined (_WIN32) || defined (__CYGWIN__) | 
|  | rc_uint_type conv_flags = MB_PRECOMPOSED; | 
|  |  | 
|  | /* MB_PRECOMPOSED is not allowed for UTF-7 or UTF-8. | 
|  | MultiByteToWideChar will set the last error to | 
|  | ERROR_INVALID_FLAGS if we do. */ | 
|  | if (cp == CP_UTF8 || cp == CP_UTF7) | 
|  | conv_flags = 0; | 
|  |  | 
|  | ret = (rc_uint_type) MultiByteToWideChar (cp, conv_flags, | 
|  | mb, -1, u, u_len); | 
|  | /* Convert to bytes. */ | 
|  | ret *= sizeof (unichar); | 
|  |  | 
|  | #elif defined (HAVE_ICONV) | 
|  | int first = 1; | 
|  | char tmp[32]; | 
|  | char *p_tmp; | 
|  | const char *iconv_name = wind_iconv_cp (cp); | 
|  |  | 
|  | if (!mb || !iconv_name) | 
|  | return 0; | 
|  | iconv_t cd = iconv_open ( | 
|  | #if WORDS_BIGENDIAN | 
|  | "UTF-16BE", | 
|  | #else | 
|  | "UTF-16LE", | 
|  | #endif | 
|  | iconv_name); | 
|  |  | 
|  | while (1) | 
|  | { | 
|  | int iret; | 
|  | const char *n_mb = ""; | 
|  | char *n_tmp = ""; | 
|  |  | 
|  | p_tmp = tmp; | 
|  | iret = iconv_onechar (cd, (ICONV_CONST char *) mb, p_tmp, 32, & n_mb, & n_tmp); | 
|  | if (first) | 
|  | { | 
|  | first = 0; | 
|  | continue; | 
|  | } | 
|  | if (!iret) | 
|  | { | 
|  | size_t l_tmp = (size_t) (n_tmp - p_tmp); | 
|  |  | 
|  | if (u) | 
|  | { | 
|  | if ((size_t) u_len < l_tmp) | 
|  | break; | 
|  | memcpy (u, tmp, l_tmp); | 
|  | u += l_tmp/2; | 
|  | u_len -= l_tmp; | 
|  | } | 
|  | ret += l_tmp; | 
|  | } | 
|  | else | 
|  | break; | 
|  | if (tmp[0] == 0 && tmp[1] == 0) | 
|  | break; | 
|  | mb = n_mb; | 
|  | } | 
|  | iconv_close (cd); | 
|  | #else | 
|  | if (cp) | 
|  | ret = 0; | 
|  | ret = strlen (mb) + 1; | 
|  | ret *= sizeof (unichar); | 
|  | if (u != NULL && u_len != 0) | 
|  | { | 
|  | do | 
|  | { | 
|  | *u++ = ((unichar) *mb) & 0xff; | 
|  | --u_len; mb++; | 
|  | } | 
|  | while (u_len != 0 && mb[-1] != 0); | 
|  | } | 
|  | if (u != NULL && u_len != 0) | 
|  | *u = 0; | 
|  | #endif | 
|  | return ret; | 
|  | } | 
|  |  | 
|  | static rc_uint_type | 
|  | wind_WideCharToMultiByte (rc_uint_type cp, const unichar *u, char *mb, rc_uint_type mb_len) | 
|  | { | 
|  | rc_uint_type ret = 0; | 
|  | #if defined (_WIN32) || defined (__CYGWIN__) | 
|  | WINBOOL used_def = false; | 
|  |  | 
|  | ret = (rc_uint_type) WideCharToMultiByte (cp, 0, u, -1, mb, mb_len, | 
|  | NULL, & used_def); | 
|  | #elif defined (HAVE_ICONV) | 
|  | int first = 1; | 
|  | char tmp[32]; | 
|  | char *p_tmp; | 
|  | const char *iconv_name = wind_iconv_cp (cp); | 
|  |  | 
|  | if (!u || !iconv_name) | 
|  | return 0; | 
|  | iconv_t cd = iconv_open (iconv_name, | 
|  | #if WORDS_BIGENDIAN | 
|  | "UTF-16BE" | 
|  | #else | 
|  | "UTF-16LE" | 
|  | #endif | 
|  | ); | 
|  |  | 
|  | while (1) | 
|  | { | 
|  | int iret; | 
|  | const char *n_u = ""; | 
|  | char *n_tmp = ""; | 
|  |  | 
|  | p_tmp = tmp; | 
|  | iret = iconv_onechar (cd, (ICONV_CONST char *) u, p_tmp, 32, &n_u, & n_tmp); | 
|  | if (first) | 
|  | { | 
|  | first = 0; | 
|  | continue; | 
|  | } | 
|  | if (!iret) | 
|  | { | 
|  | size_t l_tmp = (size_t) (n_tmp - p_tmp); | 
|  |  | 
|  | if (mb) | 
|  | { | 
|  | if ((size_t) mb_len < l_tmp) | 
|  | break; | 
|  | memcpy (mb, tmp, l_tmp); | 
|  | mb += l_tmp; | 
|  | mb_len -= l_tmp; | 
|  | } | 
|  | ret += l_tmp; | 
|  | } | 
|  | else | 
|  | break; | 
|  | if (u[0] == 0) | 
|  | break; | 
|  | u = (const unichar *) n_u; | 
|  | } | 
|  | iconv_close (cd); | 
|  | #else | 
|  | if (cp) | 
|  | ret = 0; | 
|  |  | 
|  | while (u[ret] != 0) | 
|  | ++ret; | 
|  |  | 
|  | ++ret; | 
|  |  | 
|  | if (mb) | 
|  | { | 
|  | while (*u != 0 && mb_len != 0) | 
|  | { | 
|  | if (u[0] == (u[0] & 0x7f)) | 
|  | *mb++ = (char) u[0]; | 
|  | else | 
|  | *mb++ = '_'; | 
|  | ++u; --mb_len; | 
|  | } | 
|  | if (mb_len != 0) | 
|  | *mb = 0; | 
|  | } | 
|  | #endif | 
|  | return ret; | 
|  | } |