2 * Wine internal Unicode definitions
4 * Copyright 2000 Alexandre Julliard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
21 #ifndef __WINE_UNICODE_H
22 #define __WINE_UNICODE_H
27 /* code page info common to SBCS and DBCS */
30 unsigned int codepage; /* codepage id */
31 unsigned int char_size; /* char size (1 or 2 bytes) */
32 WCHAR def_char; /* default char value (can be double-byte) */
33 WCHAR def_unicode_char; /* default Unicode char value */
34 const char *name; /* code page name */
40 const WCHAR *cp2uni; /* code page -> Unicode map */
41 const unsigned char *uni2cp_low; /* Unicode -> code page map */
42 const unsigned short *uni2cp_high;
48 const WCHAR *cp2uni; /* code page -> Unicode map */
49 const unsigned char *cp2uni_leadbytes;
50 const unsigned short *uni2cp_low; /* Unicode -> code page map */
51 const unsigned short *uni2cp_high;
52 unsigned char lead_bytes[12]; /* lead bytes ranges */
58 struct sbcs_table sbcs;
59 struct dbcs_table dbcs;
62 extern const union cptable *cp_get_table( unsigned int codepage );
63 extern const union cptable *cp_enum_table( unsigned int index );
65 extern int cp_mbstowcs( const union cptable *table, int flags,
66 const char *src, int srclen,
67 WCHAR *dst, int dstlen );
68 extern int cp_wcstombs( const union cptable *table, int flags,
69 const WCHAR *src, int srclen,
70 char *dst, int dstlen, const char *defchar, int *used );
71 extern int utf8_wcstombs( const WCHAR *src, int srclen, char *dst, int dstlen );
72 extern int utf8_mbstowcs( int flags, const char *src, int srclen, WCHAR *dst, int dstlen );
74 extern int strcmpiW( const WCHAR *str1, const WCHAR *str2 );
75 extern int strncmpiW( const WCHAR *str1, const WCHAR *str2, int n );
76 extern WCHAR *strstrW( const WCHAR *str, const WCHAR *sub );
77 extern long int strtolW( const WCHAR *nptr, WCHAR **endptr, int base );
78 extern unsigned long int strtoulW( const WCHAR *nptr, WCHAR **endptr, int base );
80 static inline int is_dbcs_leadbyte( const union cptable *table, unsigned char ch )
82 return (table->info.char_size == 2) && (table->dbcs.cp2uni_leadbytes[ch]);
85 static inline WCHAR tolowerW( WCHAR ch )
87 extern const WCHAR casemap_lower[];
88 return ch + casemap_lower[casemap_lower[ch >> 8] + (ch & 0xff)];
91 static inline WCHAR toupperW( WCHAR ch )
93 extern const WCHAR casemap_upper[];
94 return ch + casemap_upper[casemap_upper[ch >> 8] + (ch & 0xff)];
97 /* the character type contains the C1_* flags in the low 12 bits */
98 /* and the C2_* type in the high 4 bits */
99 static inline unsigned short get_char_typeW( WCHAR ch )
101 extern const unsigned short wctype_table[];
102 return wctype_table[wctype_table[ch >> 8] + (ch & 0xff)];
105 inline static int iscntrlW( WCHAR wc )
107 return get_char_typeW(wc) & C1_CNTRL;
110 inline static int ispunctW( WCHAR wc )
112 return get_char_typeW(wc) & C1_PUNCT;
115 inline static int isspaceW( WCHAR wc )
117 return get_char_typeW(wc) & C1_SPACE;
120 inline static int isdigitW( WCHAR wc )
122 return get_char_typeW(wc) & C1_DIGIT;
125 inline static int isxdigitW( WCHAR wc )
127 return get_char_typeW(wc) & C1_XDIGIT;
130 inline static int islowerW( WCHAR wc )
132 return get_char_typeW(wc) & C1_LOWER;
135 inline static int isupperW( WCHAR wc )
137 return get_char_typeW(wc) & C1_UPPER;
140 inline static int isalnumW( WCHAR wc )
142 return get_char_typeW(wc) & (C1_ALPHA|C1_DIGIT|C1_LOWER|C1_UPPER);
145 inline static int isalphaW( WCHAR wc )
147 return get_char_typeW(wc) & (C1_ALPHA|C1_LOWER|C1_UPPER);
150 inline static int isgraphW( WCHAR wc )
152 return get_char_typeW(wc) & (C1_ALPHA|C1_PUNCT|C1_DIGIT|C1_LOWER|C1_UPPER);
155 inline static int isprintW( WCHAR wc )
157 return get_char_typeW(wc) & (C1_ALPHA|C1_BLANK|C1_PUNCT|C1_DIGIT|C1_LOWER|C1_UPPER);
160 /* some useful string manipulation routines */
162 static inline unsigned int strlenW( const WCHAR *str )
164 #if defined(__i386__) && defined(__GNUC__)
166 __asm__ __volatile__( "cld\n\t"
170 : "=c" (res), "=&D" (dummy)
171 : "0" (0xffffffff), "1" (str), "a" (0) );
174 const WCHAR *s = str;
180 static inline WCHAR *strcpyW( WCHAR *dst, const WCHAR *src )
182 #if defined(__i386__) && defined(__GNUC__)
183 int dummy1, dummy2, dummy3;
184 __asm__ __volatile__( "cld\n"
187 "testw %%ax,%%ax\n\t"
189 : "=&S" (dummy1), "=&D" (dummy2), "=&a" (dummy3)
190 : "0" (src), "1" (dst)
194 while ((*p++ = *src++));
199 static inline int strcmpW( const WCHAR *str1, const WCHAR *str2 )
201 while (*str1 && (*str1 == *str2)) { str1++; str2++; }
202 return *str1 - *str2;
205 static inline int strncmpW( const WCHAR *str1, const WCHAR *str2, int n )
207 if (n <= 0) return 0;
208 while ((--n > 0) && *str1 && (*str1 == *str2)) { str1++; str2++; }
209 return *str1 - *str2;
212 static inline WCHAR *strncpyW( WCHAR *str1, const WCHAR *str2, int n )
215 while (n-- > 0) if (!(*str1++ = *str2++)) break;
216 while (n-- > 0) *str1++ = 0;
220 static inline WCHAR *strcatW( WCHAR *dst, const WCHAR *src )
222 strcpyW( dst + strlenW(dst), src );
226 static inline WCHAR *strchrW( const WCHAR *str, WCHAR ch )
228 for ( ; *str; str++) if (*str == ch) return (WCHAR *)str;
232 static inline WCHAR *strrchrW( const WCHAR *str, WCHAR ch )
235 for ( ; *str; str++) if (*str == ch) ret = (WCHAR *)str;
239 static inline WCHAR *strlwrW( WCHAR *str )
242 while ((*str = tolowerW(*str))) str++;
246 static inline WCHAR *struprW( WCHAR *str )
249 while ((*str = toupperW(*str))) str++;
253 static inline long int atolW( const WCHAR *str )
255 return strtolW( str, (WCHAR **)0, 10 );
258 static inline int atoiW( const WCHAR *str )
260 return (int)atolW( str );
263 #endif /* __WINE_UNICODE_H */