4 * Copyright 1998 Bertho A. Stultiens
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
22 #include "wine/port.h"
31 #include "wine/unicode.h"
36 /* #define WANT_NEAR_INDICATION */
38 #ifdef WANT_NEAR_INDICATION
/*
 * make_print: helper that is only compiled when WANT_NEAR_INDICATION is defined.
 * NOTE(review): the body is not visible in this excerpt. Presumably it rewrites
 * str in place so it can be echoed safely in the " near '...'" diagnostic
 * suffix -- confirm against the full source.
 */
39 void make_print(char *str)
/*
 * generic_msg: shared back end for the parser diagnostics; writes one message
 * to stderr.
 *   s  - printf-style format string, expanded with ap
 *   t  - severity label shown in the prefix (callers pass "Error" or "Warning")
 *   n  - text near the reported position (callers pass parser_text)
 *        NOTE(review): appears to matter only under WANT_NEAR_INDICATION -- confirm
 *   ap - argument list matching s
 */
50 static void generic_msg(const char *s, const char *t, const char *n, va_list ap)
/* Prefix: "<input>:<line_number>:<char_number>: <label>: "; "stdin" is used when input_name is not set. */
52 fprintf(stderr, "%s:%d:%d: %s: ", input_name ? input_name : "stdin", line_number, char_number, t);
53 vfprintf(stderr, s, ap);
54 #ifdef WANT_NEAR_INDICATION
/* Optional suffix. NOTE(review): cpy is declared in lines not shown here; presumably a printable copy of n -- confirm. */
61 fprintf(stderr, " near '%s'", cpy);
/*
 * parser_error: report a parse error.
 * Forwards the printf-style format s and its variadic arguments to generic_msg()
 * with the label "Error" and parser_text as the nearby text.
 * NOTE(review): the returned int and any termination behaviour are in lines not
 * visible in this excerpt.
 */
69 int parser_error(const char *s, ...)
73 generic_msg(s, "Error", parser_text, ap);
/*
 * parser_warning: report a parse warning.
 * Forwards the printf-style format s and its variadic arguments to generic_msg()
 * with the label "Warning" and parser_text as the nearby text.
 * NOTE(review): the returned int is produced in lines not visible in this excerpt.
 */
79 int parser_warning(const char *s, ...)
83 generic_msg(s, "Warning", parser_text, ap);
/*
 * internal_error: report a condition that indicates a bug in the tool itself.
 *   file, line - source location of the failing check (callers pass __FILE__, __LINE__)
 *   s, ...     - printf-style message
 * Writes "Internal error (please report) <file> <line>: " followed by the
 * formatted message to stderr.
 * NOTE(review): callers place a dummy return after calling this, which suggests
 * it does not return -- confirm in the lines not shown.
 */
88 void internal_error(const char *file, int line, const char *s, ...)
92 fprintf(stderr, "Internal error (please report) %s %d: ", file, line);
93 vfprintf(stderr, s, ap);
/*
 * error: write "Error: " followed by the printf-style message s to stderr.
 * NOTE(review): xmalloc() and xrealloc() call this on allocation failure and then
 * carry on, so they seem to rely on it not returning -- confirm in the lines
 * not shown.
 */
98 void error(const char *s, ...)
102 fprintf(stderr, "Error: ");
103 vfprintf(stderr, s, ap);
/*
 * warning: write "Warning: " followed by the printf-style message s to stderr.
 */
108 void warning(const char *s, ...)
112 fprintf(stderr, "Warning: ");
113 vfprintf(stderr, s, ap);
/*
 * chat: informational output.
 * Writes "FYI: " followed by the printf-style message s to stderr, but only
 * when the DEBUGLEVEL_CHAT bit is set in debuglevel.
 */
117 void chat(const char *s, ...)
119 if(debuglevel & DEBUGLEVEL_CHAT)
123 fprintf(stderr, "FYI: ");
124 vfprintf(stderr, s, ap);
/*
 * dup_basename: build a heap-allocated name derived from name with the
 * extension ext removed.
 *   name - input file name; the last '/' is looked up
 *          (NOTE(review): presumably everything up to and including it is
 *          skipped -- the statement using slash is not visible here)
 *   ext  - extension to strip, compared case-insensitively against the tail of name
 * The buffer comes from xmalloc() and leaves room for 4 extra characters plus
 * the terminator, so a caller can append a short extension.
 */
129 char *dup_basename(const char *name, const char *ext)
132 int extlen = strlen(ext);
139 slash = strrchr(name, '/');
143 namelen = strlen(name);
145 /* +4 for later extension and +1 for '\0' */
146 base = xmalloc(namelen +4 +1);
/* NOTE(review): if namelen < extlen, name + namelen-extlen points before the
 * start of name, which is undefined behaviour. Unless a guard exists in the
 * lines not shown, the condition should also require namelen >= extlen. */
148 if(!strcasecmp(name + namelen-extlen, ext))
/* Cut the copy where the extension starts. */
150 base[namelen - extlen] = '\0';
/*
 * xmalloc: allocation wrapper that reports failure through error().
 *   size - number of bytes requested
 * NOTE(review): the allocation call, the failure test and the return are in
 * lines not visible in this excerpt.
 */
155 void *xmalloc(size_t size)
163 error("Virtual memory exhausted.\n");
/* Fill the new block with 0x55; presumably so that reads of uninitialised memory stand out -- confirm intent. */
165 memset(res, 0x55, size);
/*
 * xrealloc: realloc() wrapper that reports failure through error().
 *   p    - block to resize, passed straight to realloc()
 *   size - new size in bytes
 * NOTE(review): the failure test and the return are in lines not visible here.
 */
170 void *xrealloc(void *p, size_t size)
175 res = realloc(p, size);
178 error("Virtual memory exhausted.\n");
/*
 * xstrdup: duplicate the NUL-terminated string str into memory from xmalloc().
 * Returns the copy, which is the value strcpy() hands back.
 */
183 char *xstrdup(const char *str)
/* strlen() + 1 makes room for the terminator. */
188 s = xmalloc(strlen(str)+1);
189 return strcpy(s, str);
194 *****************************************************************************
195 * Function : compare_name_id
196 * Syntax : int compare_name_id(const name_id_t *n1, const name_id_t *n2)
201 *****************************************************************************
/*
 * compare_name_id: ordering function for two name_id_t values.
 * Two ordinals compare by numeric difference, two strings of the same kind
 * compare case-insensitively. Strings of mixed kind and unknown type
 * combinations are reported through internal_error().
 * NOTE(review): the results for the ordinal-versus-string cases are in lines
 * not visible in this excerpt.
 */
203 int compare_name_id(const name_id_t *n1, const name_id_t *n2)
205 if(n1->type == name_ord && n2->type == name_ord)
/* NOTE(review): a plain subtraction can overflow if i_name spans the full int range -- confirm the value range. */
207 return n1->name.i_name - n2->name.i_name;
209 else if(n1->type == name_str && n2->type == name_str)
/* Both names are char strings. */
211 if(n1->name.s_name->type == str_char
212 && n2->name.s_name->type == str_char)
214 return strcasecmp(n1->name.s_name->str.cstr, n2->name.s_name->str.cstr);
/* Both names are wide strings. */
216 else if(n1->name.s_name->type == str_unicode
217 && n2->name.s_name->type == str_unicode)
219 return strcmpiW(n1->name.s_name->str.wstr, n2->name.s_name->str.wstr);
223 internal_error(__FILE__, __LINE__, "Can't yet compare strings of mixed type\n");
226 else if(n1->type == name_ord && n2->type == name_str)
228 else if(n1->type == name_str && n2->type == name_ord)
231 internal_error(__FILE__, __LINE__, "Comparing name-ids with unknown types (%d, %d)\n",
234 return 0; /* Keep the compiler happy */
/*
 * convert_string: create a new string_t holding str converted to the kind
 * given by type.
 *   str      - source string; str->size characters are converted or copied
 *   type     - requested kind (str_char or str_unicode)
 *   codepage - codepage for the char side; 0 selects the UTF-8 routines
 * The result and its character buffer come from xmalloc(). The buffer holds
 * ret->size characters plus a terminating 0 that is not counted in ret->size.
 * When the kinds already match, the characters are copied unchanged.
 */
237 string_t *convert_string(const string_t *str, enum str_e type, int codepage)
/* No codepage table is looked up when codepage is 0. */
239 const union cptable *cptable = codepage ? wine_cp_get_table( codepage ) : NULL;
240 string_t *ret = xmalloc(sizeof(*ret));
/* A real conversion was requested but no codepage is available. */
243 if (!codepage && str->type != type)
244 parser_error( "Current language is Unicode only, cannot convert string\n" );
246 if((str->type == str_char) && (type == str_unicode))
248 ret->type = str_unicode;
/* First pass with a NULL destination only computes the required length. */
249 ret->size = cptable ? wine_cp_mbstowcs( cptable, 0, str->str.cstr, str->size, NULL, 0 )
250 : wine_utf8_mbstowcs( 0, str->str.cstr, str->size, NULL, 0 );
251 ret->str.wstr = xmalloc( (ret->size+1) * sizeof(WCHAR) );
/* Second pass converts for real and asks for invalid input to be reported. */
253 res = wine_cp_mbstowcs( cptable, MB_ERR_INVALID_CHARS, str->str.cstr, str->size,
254 ret->str.wstr, ret->size );
256 res = wine_utf8_mbstowcs( MB_ERR_INVALID_CHARS, str->str.cstr, str->size,
257 ret->str.wstr, ret->size );
/* NOTE(review): codepage is an int but is printed with %u, and the %.*s
 * precision must be an int -- confirm the type of str->size. */
259 parser_error( "Invalid character in string '%.*s' for codepage %u\n",
260 str->size, str->str.cstr, codepage );
261 ret->str.wstr[ret->size] = 0;
263 else if((str->type == str_unicode) && (type == str_char))
265 ret->type = str_char;
/* Same two-pass scheme in the other direction: measure, allocate, convert. */
266 ret->size = cptable ? wine_cp_wcstombs( cptable, 0, str->str.wstr, str->size, NULL, 0, NULL, NULL )
267 : wine_utf8_wcstombs( 0, str->str.wstr, str->size, NULL, 0 );
268 ret->str.cstr = xmalloc( ret->size + 1 );
270 wine_cp_wcstombs( cptable, 0, str->str.wstr, str->size, ret->str.cstr, ret->size, NULL, NULL );
272 wine_utf8_wcstombs( 0, str->str.wstr, str->size, ret->str.cstr, ret->size );
273 ret->str.cstr[ret->size] = 0;
/* Kinds already match: plain copy of the wide characters. */
275 else if(str->type == str_unicode)
277 ret->type = str_unicode;
278 ret->size = str->size;
279 ret->str.wstr = xmalloc(sizeof(WCHAR)*(ret->size+1));
280 memcpy( ret->str.wstr, str->str.wstr, ret->size * sizeof(WCHAR) );
281 ret->str.wstr[ret->size] = 0;
/* Kinds already match: plain copy of the bytes. */
283 else /* str->type == str_char */
285 ret->type = str_char;
286 ret->size = str->size;
287 ret->str.cstr = xmalloc( ret->size + 1 );
288 memcpy( ret->str.cstr, str->str.cstr, ret->size );
289 ret->str.cstr[ret->size] = 0;
/*
 * free_string: release the character buffer of str, picking the union member
 * that matches str->type.
 * NOTE(review): whether str itself is freed as well is decided in lines not
 * visible in this excerpt.
 */
295 void free_string(string_t *str)
297 if (str->type == str_unicode) free( str->str.wstr );
298 else free( str->str.cstr );
/*
 * check_unicode_conversion: verify that str_w converts back to str_a.
 *   str_a    - char string used as the reference
 *   str_w    - wide string to convert back
 *   codepage - codepage handed to convert_string()
 * str_w is converted to a char string and compared with str_a by size and by
 * bytes. The diagnostic dump below prints both strings and the round-trip
 * result as text and as hex values.
 * NOTE(review): the condition guarding the dump and the return value are in
 * lines not visible in this excerpt.
 */
303 int check_unicode_conversion( const string_t *str_a, const string_t *str_w, int codepage )
306 string_t *teststr = convert_string( str_w, str_char, codepage );
308 ok = (teststr->size == str_a->size && !memcmp( teststr->str.cstr, str_a->str.cstr, str_a->size ));
/* NOTE(review): %s needs a NUL-terminated buffer. convert_string() terminates
 * teststr, but nothing visible here guarantees that for str_a. */
314 fprintf( stderr, "Source: %s", str_a->str.cstr );
315 for (i = 0; i < str_a->size; i++)
316 fprintf( stderr, " %02x", (unsigned char)str_a->str.cstr[i] );
317 fprintf( stderr, "\nUnicode: " );
318 for (i = 0; i < str_w->size; i++)
319 fprintf( stderr, " %04x", str_w->str.wstr[i] );
320 fprintf( stderr, "\nBack: %s", teststr->str.cstr );
321 for (i = 0; i < teststr->size; i++)
322 fprintf( stderr, " %02x", (unsigned char)teststr->str.cstr[i] );
323 fprintf( stderr, "\n" );
/* The temporary conversion result is released before leaving. */
325 free_string( teststr );
/* Sublanguage id of a table entry; get_language_codepage() compares it with its
 * sublang argument and treats SUBLANG_NEUTRAL entries as the per-language default. */
333 unsigned short sublang;
337 /* language to codepage conversion table */
338 /* specific sublanguages need only be specified if their codepage */
339 /* differs from the default (SUBLANG_NEUTRAL) */
/*
 * Each entry is { language id, sublanguage id, codepage number }.
 * get_language_codepage() scans the whole table linearly, so entry order does
 * not affect the result.
 * NOTE(review): entries with codepage 0 presumably mark languages that have no
 * ANSI codepage (Unicode only); compare the "Unicode only" error raised by
 * convert_string() for codepage 0 -- confirm.
 */
340 static const struct lang2cp lang2cps[] =
342 { LANG_AFRIKAANS, SUBLANG_NEUTRAL, 1252 },
343 { LANG_ALBANIAN, SUBLANG_NEUTRAL, 1250 },
344 { LANG_ARABIC, SUBLANG_NEUTRAL, 1256 },
345 { LANG_ARMENIAN, SUBLANG_NEUTRAL, 0 },
346 { LANG_AZERI, SUBLANG_NEUTRAL, 1254 },
347 { LANG_AZERI, SUBLANG_AZERI_CYRILLIC, 1251 },
348 { LANG_BASQUE, SUBLANG_NEUTRAL, 1252 },
349 { LANG_BELARUSIAN, SUBLANG_NEUTRAL, 1251 },
351 { LANG_BRETON, SUBLANG_NEUTRAL, 1252 },
352 #endif /* LANG_BRETON */
353 { LANG_BULGARIAN, SUBLANG_NEUTRAL, 1251 },
354 { LANG_CATALAN, SUBLANG_NEUTRAL, 1252 },
355 { LANG_CHINESE, SUBLANG_NEUTRAL, 950 },
356 { LANG_CHINESE, SUBLANG_CHINESE_SINGAPORE, 936 },
357 { LANG_CHINESE, SUBLANG_CHINESE_SIMPLIFIED, 936 },
359 { LANG_CORNISH, SUBLANG_NEUTRAL, 1252 },
360 #endif /* LANG_CORNISH */
361 { LANG_CROATIAN, SUBLANG_NEUTRAL, 1250 },
362 { LANG_CZECH, SUBLANG_NEUTRAL, 1250 },
363 { LANG_DANISH, SUBLANG_NEUTRAL, 1252 },
364 { LANG_DIVEHI, SUBLANG_NEUTRAL, 0 },
365 { LANG_DUTCH, SUBLANG_NEUTRAL, 1252 },
366 { LANG_ENGLISH, SUBLANG_NEUTRAL, 1252 },
367 #ifdef LANG_ESPERANTO
368 { LANG_ESPERANTO, SUBLANG_NEUTRAL, 1252 },
369 #endif /* LANG_ESPERANTO */
370 { LANG_ESTONIAN, SUBLANG_NEUTRAL, 1257 },
371 { LANG_FAEROESE, SUBLANG_NEUTRAL, 1252 },
372 { LANG_FARSI, SUBLANG_NEUTRAL, 1256 },
373 { LANG_FINNISH, SUBLANG_NEUTRAL, 1252 },
374 { LANG_FRENCH, SUBLANG_NEUTRAL, 1252 },
376 { LANG_GAELIC, SUBLANG_NEUTRAL, 1252 },
377 #endif /* LANG_GAELIC */
378 { LANG_GALICIAN, SUBLANG_NEUTRAL, 1252 },
379 { LANG_GEORGIAN, SUBLANG_NEUTRAL, 0 },
380 { LANG_GERMAN, SUBLANG_NEUTRAL, 1252 },
381 { LANG_GREEK, SUBLANG_NEUTRAL, 1253 },
382 { LANG_GUJARATI, SUBLANG_NEUTRAL, 0 },
383 { LANG_HEBREW, SUBLANG_NEUTRAL, 1255 },
384 { LANG_HINDI, SUBLANG_NEUTRAL, 0 },
385 { LANG_HUNGARIAN, SUBLANG_NEUTRAL, 1250 },
386 { LANG_ICELANDIC, SUBLANG_NEUTRAL, 1252 },
387 { LANG_INDONESIAN, SUBLANG_NEUTRAL, 1252 },
388 { LANG_ITALIAN, SUBLANG_NEUTRAL, 1252 },
389 { LANG_JAPANESE, SUBLANG_NEUTRAL, 932 },
390 { LANG_KANNADA, SUBLANG_NEUTRAL, 0 },
391 { LANG_KAZAK, SUBLANG_NEUTRAL, 1251 },
392 { LANG_KONKANI, SUBLANG_NEUTRAL, 0 },
393 { LANG_KOREAN, SUBLANG_NEUTRAL, 949 },
394 { LANG_KYRGYZ, SUBLANG_NEUTRAL, 1251 },
395 { LANG_LATVIAN, SUBLANG_NEUTRAL, 1257 },
396 { LANG_LITHUANIAN, SUBLANG_NEUTRAL, 1257 },
397 { LANG_MACEDONIAN, SUBLANG_NEUTRAL, 1251 },
398 { LANG_MALAY, SUBLANG_NEUTRAL, 1252 },
399 { LANG_MARATHI, SUBLANG_NEUTRAL, 0 },
400 { LANG_MONGOLIAN, SUBLANG_NEUTRAL, 1251 },
401 { LANG_NEUTRAL, SUBLANG_NEUTRAL, 1252 },
402 { LANG_NORWEGIAN, SUBLANG_NEUTRAL, 1252 },
403 { LANG_POLISH, SUBLANG_NEUTRAL, 1250 },
404 { LANG_PORTUGUESE, SUBLANG_NEUTRAL, 1252 },
405 { LANG_PUNJABI, SUBLANG_NEUTRAL, 0 },
406 { LANG_ROMANIAN, SUBLANG_NEUTRAL, 1250 },
407 { LANG_RUSSIAN, SUBLANG_NEUTRAL, 1251 },
408 { LANG_SANSKRIT, SUBLANG_NEUTRAL, 0 },
409 { LANG_SERBIAN, SUBLANG_NEUTRAL, 1250 },
410 { LANG_SERBIAN, SUBLANG_SERBIAN_CYRILLIC, 1251 },
411 { LANG_SLOVAK, SUBLANG_NEUTRAL, 1250 },
412 { LANG_SLOVENIAN, SUBLANG_NEUTRAL, 1250 },
413 { LANG_SPANISH, SUBLANG_NEUTRAL, 1252 },
414 { LANG_SWAHILI, SUBLANG_NEUTRAL, 1252 },
415 { LANG_SWEDISH, SUBLANG_NEUTRAL, 1252 },
416 { LANG_SYRIAC, SUBLANG_NEUTRAL, 0 },
417 { LANG_TAMIL, SUBLANG_NEUTRAL, 0 },
418 { LANG_TATAR, SUBLANG_NEUTRAL, 1251 },
419 { LANG_TELUGU, SUBLANG_NEUTRAL, 0 },
420 { LANG_THAI, SUBLANG_NEUTRAL, 874 },
421 { LANG_TURKISH, SUBLANG_NEUTRAL, 1254 },
422 { LANG_UKRAINIAN, SUBLANG_NEUTRAL, 1251 },
423 { LANG_URDU, SUBLANG_NEUTRAL, 1256 },
424 { LANG_UZBEK, SUBLANG_NEUTRAL, 1254 },
425 { LANG_UZBEK, SUBLANG_UZBEK_CYRILLIC, 1251 },
426 { LANG_VIETNAMESE, SUBLANG_NEUTRAL, 1258 }
/* The last unconditional entry above has no trailing comma, so the optional
 * entries below each start with their own separating comma. */
428 , { LANG_WALON, SUBLANG_NEUTRAL, 1252 }
429 #endif /* LANG_WALON */
431 , { LANG_WELSH, SUBLANG_NEUTRAL, 1252 }
432 #endif /* LANG_WELSH */
/*
 * get_language_codepage: look up the codepage for a language/sublanguage pair
 * in lang2cps.
 *   lang    - language id to search for
 *   sublang - sublanguage id; an entry with exactly this value is looked for
 * If no entry matches sublang exactly, the language's SUBLANG_NEUTRAL entry is
 * used instead.
 * NOTE(review): cp stays -1 when lang is not in the table at all; how that is
 * reported to the caller is in lines not visible in this excerpt.
 */
435 int get_language_codepage( unsigned short lang, unsigned short sublang )
/* -1 means "nothing found yet" for both the exact match and the default. */
438 int cp = -1, defcp = -1;
440 for (i = 0; i < sizeof(lang2cps)/sizeof(lang2cps[0]); i++)
442 if (lang2cps[i].lang != lang) continue;
/* Exact sublanguage match (the statements taking it are not shown here). */
443 if (lang2cps[i].sublang == sublang)
/* Remember the neutral entry as the fallback for this language. */
448 if (lang2cps[i].sublang == SUBLANG_NEUTRAL) defcp = lang2cps[i].cp;
451 if (cp == -1) cp = defcp;
/* Every positive codepage in the table must have a conversion table available. */
452 assert( cp <= 0 || wine_cp_get_table(cp) );