2 Unix SMB/CIFS implementation.
3 Character set conversion Extensions
4 Copyright (C) Igor Vergeichik <iverg@mail.ru> 2001
5 Copyright (C) Andrew Tridgell 2001
6 Copyright (C) Simo Sorce 2001
7 Copyright (C) Martin Pool 2003
9 This program is free software; you can redistribute it and/or modify
10 it under the terms of the GNU General Public License as published by
11 the Free Software Foundation; either version 2 of the License, or
12 (at your option) any later version.
14 This program is distributed in the hope that it will be useful,
15 but WITHOUT ANY WARRANTY; without even the implied warranty of
16 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 GNU General Public License for more details.
19 You should have received a copy of the GNU General Public License
20 along with this program; if not, write to the Free Software
21 Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
26 #endif /* HAVE_CONFIG_H */
35 #include <sys/param.h>
36 #ifdef HAVE_USABLE_ICONV
46 #include <netatalk/endian.h>
47 #include <atalk/logger.h>
48 #include <atalk/unicode.h>
49 #include "byteorder.h"
55 * @brief Character-set conversion routines built on our iconv.
57 * @note Samba's internal character set (at least in the 3.0 series)
58 * is always the same as the one for the Unix filesystem. It is
59 * <b>not</b> necessarily UTF-8 and may be different on machines that
60 * need i18n filenames to be compatible with Unix software. It does
61 * have to be a superset of ASCII. All multibyte sequences must start
62 * with a byte with the high bit set.
68 #define MAX_CHARSETS 10
70 #define CHECK_FLAGS(a,b) (((a)!=NULL) ? (*(a) & (b)) : 0 )
72 static atalk_iconv_t conv_handles[MAX_CHARSETS][MAX_CHARSETS];
73 static char* charset_names[MAX_CHARSETS];
74 static struct charset_functions* charsets[MAX_CHARSETS];
75 static char hexdig[] = "0123456789abcdef";
/*
 * Convert a single hexadecimal digit character to its value (0..15).
 *
 * Accepts '0'-'9', 'a'-'f' and 'A'-'F'.  Callers validate input with
 * isxdigit(), which admits upper-case digits too, so both cases must
 * decode to the same value.  The argument is cast to unsigned char before
 * being handed to the <ctype.h> functions, because passing a negative
 * plain char to them is undefined behaviour.
 *
 * The result is unspecified for characters that are not hex digits.
 * NOTE: the argument is evaluated more than once; do not pass an
 * expression with side effects.
 */
#define hextoint( c ) ( isdigit( (unsigned char)(c) ) \
                        ? (c) - '0' \
                        : tolower( (unsigned char)(c) ) - 'a' + 10 )
79 * Return the name of a charset to give to iconv().
81 static const char *charset_name(charset_t ch)
83 const char *ret = NULL;
85 if (ch == CH_UCS2) ret = "UCS-2";
86 else if (ch == CH_UNIX) ret = "LOCALE"; /*lp_unix_charset();*/
87 else if (ch == CH_MAC) ret = "MAC_ROMAN"; /*lp_display_charset();*/
88 else if (ch == CH_UTF8) ret = "UTF8";
89 else if (ch == CH_UTF8_MAC) ret = "UTF8-MAC";
92 ret = charset_names[ch];
94 #if defined(HAVE_NL_LANGINFO) && defined(CODESET)
95 if (ret && strcasecmp(ret, "LOCALE") == 0) {
96 const char *ln = NULL;
99 setlocale(LC_ALL, "");
101 ln = nl_langinfo(CODESET);
103 /* Check whether the charset name is supported
105 atalk_iconv_t handle = atalk_iconv_open(ln,"UCS-2");
106 if (handle == (atalk_iconv_t) -1) {
107 LOG(log_debug, logtype_default, "Locale charset '%s' unsupported, using ASCII instead", ln);
110 atalk_iconv_close(handle);
115 #else /* system doesn't have LOCALE support */
116 if (ch == CH_UNIX) ret = NULL;
119 if (!ret || !*ret) ret = "ASCII";
123 struct charset_functions* get_charset_functions (charset_t ch)
125 if (charsets[ch] != NULL)
128 charsets[ch] = find_charset_functions(charset_name(ch));
134 void lazy_initialize_conv(void)
136 static int initialized = 0;
144 charset_t add_charset(char* name)
146 static charset_t max_charset_t = NUM_CHARSETS-1;
147 charset_t cur_charset_t = max_charset_t+1;
150 lazy_initialize_conv();
152 for (c1=0; c1<=max_charset_t;c1++) {
153 if ( strcasecmp(name, charset_name(c1)) == 0)
157 if ( cur_charset_t >= MAX_CHARSETS ) {
158 LOG (log_debug, logtype_default, "Adding charset %s failed, too many charsets (max. %u allowed)",
160 return (charset_t) -1;
163 /* First try to set up the required conversions */
165 conv_handles[cur_charset_t][CH_UCS2] = atalk_iconv_open( charset_name(CH_UCS2), name);
166 if (conv_handles[cur_charset_t][CH_UCS2] == (atalk_iconv_t)-1) {
167 LOG(log_error, logtype_default, "Required conversion from %s to %s not supported",
168 name, charset_name(CH_UCS2));
169 conv_handles[cur_charset_t][CH_UCS2] = NULL;
170 return (charset_t) -1;
173 conv_handles[CH_UCS2][cur_charset_t] = atalk_iconv_open( name, charset_name(CH_UCS2));
174 if (conv_handles[CH_UCS2][cur_charset_t] == (atalk_iconv_t)-1) {
175 LOG(log_error, logtype_default, "Required conversion from %s to %s not supported",
176 charset_name(CH_UCS2), name);
177 conv_handles[CH_UCS2][cur_charset_t] = NULL;
178 return (charset_t) -1;
181 /* register the new charset_t name */
182 charset_names[cur_charset_t] = strdup(name);
184 charsets[cur_charset_t] = get_charset_functions (cur_charset_t);
188 LOG(log_debug, logtype_default, "Added charset %s with handle %u", name, cur_charset_t);
190 return (cur_charset_t);
194 * Initialize iconv conversion descriptors.
196 * This is called the first time it is needed, and also called again
197 * every time the configuration is reloaded, because the charset or
198 * codepage might have changed.
200 void init_iconv(void)
204 for (c1=0;c1<NUM_CHARSETS;c1++) {
205 const char *name = charset_name((charset_t)c1);
207 conv_handles[c1][CH_UCS2] = atalk_iconv_open( charset_name(CH_UCS2), name);
208 if (conv_handles[c1][CH_UCS2] == (atalk_iconv_t)-1) {
209 LOG(log_error, logtype_default, "Required conversion from %s to %s not supported",
210 name, charset_name(CH_UCS2));
211 conv_handles[c1][CH_UCS2] = NULL;
214 if (c1 != CH_UCS2) { /* avoid lost memory, make valgrind happy */
215 conv_handles[CH_UCS2][c1] = atalk_iconv_open( name, charset_name(CH_UCS2));
216 if (conv_handles[CH_UCS2][c1] == (atalk_iconv_t)-1) {
217 LOG(log_error, logtype_default, "Required conversion from %s to %s not supported",
218 charset_name(CH_UCS2), name);
219 conv_handles[CH_UCS2][c1] = NULL;
223 charsets[c1] = get_charset_functions (c1);
228 * Convert a string from one encoding to another, with error checking.
230 * @param src pointer to source string (multibyte or singlebyte)
231 * @param srclen length of the source string in bytes
232 * @param dest pointer to destination string (multibyte or singlebyte)
233 * @param destlen maximal length allowed for string
234 * @returns the number of bytes occupied in the destination
236 static size_t convert_string_internal(charset_t from, charset_t to,
237 void const *src, size_t srclen,
238 void *dest, size_t destlen)
242 const char* inbuf = (const char*)src;
243 char* outbuf = (char*)dest;
244 char* o_save = outbuf;
245 atalk_iconv_t descriptor;
247 if (srclen == (size_t)-1)
248 srclen = strlen(src)+1;
250 lazy_initialize_conv();
252 descriptor = conv_handles[from][to];
254 if (descriptor == (atalk_iconv_t)-1 || descriptor == (atalk_iconv_t)0) {
260 retval = atalk_iconv(descriptor, &inbuf, &i_len, &outbuf, &o_len);
261 if(retval==(size_t)-1) {
262 const char *reason="unknown error";
265 reason="Incomplete multibyte sequence";
268 reason="No more room";
271 reason="Illegal multibyte sequence";
274 LOG(log_debug, logtype_default,"Conversion error: %s",reason);
278 /* Terminate the string */
279 if (to == CH_UCS2 && destlen-o_len >= 2) {
280 o_save[destlen-o_len] = 0;
281 o_save[destlen-o_len+1] = 0;
283 else if ( to != CH_UCS2 && destlen-o_len > 0 )
284 o_save[destlen-o_len] = 0;
286 /* FIXME: what should we do here, string *might* be unterminated. E2BIG? */
289 return destlen-o_len;
293 size_t convert_string(charset_t from, charset_t to,
294 void const *src, size_t srclen,
295 void *dest, size_t destlen)
299 ucs2_t buffer[MAXPATHLEN];
300 ucs2_t buffer2[MAXPATHLEN];
303 lazy_initialize_conv();
305 /* convert from_set to UCS2 */
306 if ((size_t)(-1) == ( o_len = convert_string_internal( from, CH_UCS2, src, srclen,
307 (char*) buffer, sizeof(buffer))) ) {
308 LOG(log_error, logtype_default, "Conversion failed ( %s to CH_UCS2 )", charset_name(from));
312 /* Do pre/decomposition */
313 if ( ((!(charsets[to]) || !(charsets[to]->flags & CHARSET_DECOMPOSED)) &&
314 (!(charsets[from]) || (charsets[from]->flags & CHARSET_DECOMPOSED))))
316 if ((charsets[to] && charsets[to]->flags & CHARSET_DECOMPOSED) )
319 i_len = sizeof(buffer2);
322 switch (composition) {
328 if ( (size_t)-1 == (i_len = precompose_w(buffer, o_len, u, &i_len)) )
332 if ( (size_t)-1 == (i_len = decompose_w(buffer, o_len, u, &i_len)) )
337 /* Convert UCS2 to to_set */
338 if ((size_t)(-1) == ( o_len = convert_string_internal( CH_UCS2, to, (char*) u, i_len, dest, destlen)) ) {
339 LOG(log_error, logtype_default, "Conversion failed (CH_UCS2 to %s):%s", charset_name(to), strerror(errno));
349 * Convert between character sets, allocating a new buffer for the result.
351 * @param srclen length of source buffer.
352 * @param dest always set at least to NULL
353 * @note -1 is not accepted for srclen.
355 * @returns Size in bytes of the converted string; or -1 in case of error.
358 static size_t convert_string_allocate_internal(charset_t from, charset_t to,
359 void const *src, size_t srclen, char **dest)
361 size_t i_len, o_len, destlen;
363 const char *inbuf = (const char *)src;
364 char *outbuf = NULL, *ob = NULL;
365 atalk_iconv_t descriptor;
369 if (src == NULL || srclen == (size_t)-1)
372 lazy_initialize_conv();
374 descriptor = conv_handles[from][to];
376 if (descriptor == (atalk_iconv_t)-1 || descriptor == (atalk_iconv_t)0) {
377 /* conversion not supported, return -1*/
378 LOG(log_debug, logtype_default, "convert_string_allocate: conversion not supported!\n");
382 destlen = MAX(srclen, 512);
384 destlen = destlen * 2;
385 ob = (char *)realloc(ob, destlen);
387 LOG(log_debug, logtype_default,"convert_string_allocate: realloc failed!\n");
393 inbuf = src; /* this restarts the whole conversion if buffer needed to be increased */
396 retval = atalk_iconv(descriptor,
399 if(retval == (size_t)-1) {
400 const char *reason="unknown error";
403 reason="Incomplete multibyte sequence";
408 reason="Illegal multibyte sequence";
411 LOG(log_debug, logtype_default,"Conversion error: %s(%s)",reason,inbuf);
416 destlen = destlen - o_len;
418 /* Terminate the string */
419 if (to == CH_UCS2 && o_len >= 2) {
422 *dest = (char *)realloc(ob,destlen+2);
424 else if ( to != CH_UCS2 && o_len > 0 ) {
426 *dest = (char *)realloc(ob,destlen+1);
429 goto convert; /* realloc */
432 if (destlen && !*dest) {
433 LOG(log_debug, logtype_default, "convert_string_allocate: out of memory!\n");
442 size_t convert_string_allocate(charset_t from, charset_t to,
443 void const *src, size_t srclen,
448 ucs2_t buffer[MAXPATHLEN];
449 ucs2_t buffer2[MAXPATHLEN];
452 lazy_initialize_conv();
456 /* convert from_set to UCS2 */
457 if ((size_t)(-1) == ( o_len = convert_string_internal( from, CH_UCS2, src, srclen,
458 buffer, sizeof(buffer))) ) {
459 LOG(log_error, logtype_default, "Conversion failed ( %s to CH_UCS2 )", charset_name(from));
463 /* Do pre/decomposition */
464 if ( ((!(charsets[to]) || !(charsets[to]->flags & CHARSET_DECOMPOSED)) &&
465 (!(charsets[from]) || (charsets[from]->flags & CHARSET_DECOMPOSED))))
467 if ((charsets[to] && charsets[to]->flags & CHARSET_DECOMPOSED) )
470 i_len = sizeof(buffer2);
473 switch (composition) {
479 if ( (size_t)-1 == (i_len = precompose_w(buffer, o_len, u, &i_len)) )
483 if ( (size_t)-1 == (i_len = decompose_w(buffer, o_len, u, &i_len)) )
488 /* Convert UCS2 to to_set */
489 if ((size_t)(-1) == ( o_len = convert_string_allocate_internal( CH_UCS2, to, (char*)u, i_len, dest)) )
490 LOG(log_error, logtype_default, "Conversion failed (CH_UCS2 to %s):%s", charset_name(to), strerror(errno));
496 size_t charset_strupper(charset_t ch, const char *src, size_t srclen, char *dest, size_t destlen)
501 size = convert_string_allocate_internal(ch, CH_UCS2, src, srclen,
503 if (size == (size_t)-1) {
507 if (!strupper_w((ucs2_t *)buffer) && (dest == src)) {
512 size = convert_string_internal(CH_UCS2, ch, buffer, size, dest, destlen);
517 size_t charset_strlower(charset_t ch, const char *src, size_t srclen, char *dest, size_t destlen)
522 size = convert_string_allocate_internal(ch, CH_UCS2, src, srclen,
524 if (size == (size_t)-1) {
528 if (!strlower_w((ucs2_t *)buffer) && (dest == src)) {
533 size = convert_string_internal(CH_UCS2, ch, buffer, size, dest, destlen);
/*
 * Upper-case a string held in the CH_UNIX charset.
 * Thin wrapper: passes src/srclen/dest/destlen through unchanged to
 * charset_strupper() with the charset fixed to CH_UNIX, and returns
 * whatever that call returns.
 */
539 size_t unix_strupper(const char *src, size_t srclen, char *dest, size_t destlen)
541 return charset_strupper( CH_UNIX, src, srclen, dest, destlen);
/*
 * Lower-case a string held in the CH_UNIX charset.
 * Thin wrapper: passes src/srclen/dest/destlen through unchanged to
 * charset_strlower() with the charset fixed to CH_UNIX, and returns
 * whatever that call returns.
 */
544 size_t unix_strlower(const char *src, size_t srclen, char *dest, size_t destlen)
546 return charset_strlower( CH_UNIX, src, srclen, dest, destlen);
/*
 * Upper-case a string held in the CH_UTF8 charset.
 * Thin wrapper: passes src/srclen/dest/destlen through unchanged to
 * charset_strupper() with the charset fixed to CH_UTF8, and returns
 * whatever that call returns.
 */
549 size_t utf8_strupper(const char *src, size_t srclen, char *dest, size_t destlen)
551 return charset_strupper( CH_UTF8, src, srclen, dest, destlen);
/*
 * Lower-case a string held in the CH_UTF8 charset.
 * Thin wrapper: passes src/srclen/dest/destlen through unchanged to
 * charset_strlower() with the charset fixed to CH_UTF8, and returns
 * whatever that call returns.
 */
554 size_t utf8_strlower(const char *src, size_t srclen, char *dest, size_t destlen)
556 return charset_strlower( CH_UTF8, src, srclen, dest, destlen);
560 * Copy a string from a charset_t char* src to a UCS2 destination, allocating a buffer
562 * @param dest always set at least to NULL
564 * @returns The number of bytes occupied by the string in the destination
565 * or -1 in case of error.
568 size_t charset_to_ucs2_allocate(charset_t ch, ucs2_t **dest, const char *src)
570 size_t src_len = strlen(src);
573 return convert_string_allocate(ch, CH_UCS2, src, src_len, (char**) dest);
577 * Copy a string from a charset_t char* src to a UTF-8 destination, allocating a buffer
579 * @param dest always set at least to NULL
581 * @returns The number of bytes occupied by the string in the destination
584 size_t charset_to_utf8_allocate(charset_t ch, char **dest, const char *src)
586 size_t src_len = strlen(src);
589 return convert_string_allocate(ch, CH_UTF8, src, src_len, dest);
593 * Copy a string from a UCS2 src to a char * destination in charset ch, using the caller's buffer
595 * @param dest destination buffer supplied by the caller (destlen bytes)
597 * @returns The number of bytes occupied by the string in the destination
/*
 * Convert a UCS2 string into charset ch, writing into the caller-supplied
 * dest/destlen buffer; no allocation is requested here (contrast
 * ucs2_to_charset_allocate(), which takes a char **dest).
 * Returns the result of convert_string().
 */
600 size_t ucs2_to_charset(charset_t ch, const ucs2_t *src, char *dest, size_t destlen)
/* Source length in bytes: strlen_w(src) scaled by sizeof(ucs2_t); nothing is added for a terminator. */
602 size_t src_len = (strlen_w(src)) * sizeof(ucs2_t);
603 return convert_string(CH_UCS2, ch, src, src_len, dest, destlen);
607 size_t ucs2_to_charset_allocate(charset_t ch, char **dest, const ucs2_t *src)
609 size_t src_len = (strlen_w(src)) * sizeof(ucs2_t);
611 return convert_string_allocate(CH_UCS2, ch, src, src_len, dest);
615 * Copy a string from a UTF-8 src to a unix char * destination, allocating a buffer
617 * @param dest always set at least to NULL
619 * @returns The number of bytes occupied by the string in the destination
622 size_t utf8_to_charset_allocate(charset_t ch, char **dest, const char *src)
624 size_t src_len = strlen(src);
626 return convert_string_allocate(CH_UTF8, ch, src, src_len, dest);
629 size_t charset_precompose ( charset_t ch, char * src, size_t inlen, char * dst, size_t outlen)
632 ucs2_t u[MAXPATHLEN];
636 if ((size_t)(-1) == (len = convert_string_allocate_internal(ch, CH_UCS2, src, inlen, &buffer)) )
641 if ( (size_t)-1 == (ilen = precompose_w((ucs2_t *)buffer, len, u, &ilen)) ) {
646 if ((size_t)(-1) == (len = convert_string_internal( CH_UCS2, ch, (char*)u, ilen, dst, outlen)) ) {
656 size_t charset_decompose ( charset_t ch, char * src, size_t inlen, char * dst, size_t outlen)
659 ucs2_t u[MAXPATHLEN];
663 if ((size_t)(-1) == (len = convert_string_allocate_internal(ch, CH_UCS2, src, inlen, &buffer)) )
668 if ( (size_t)-1 == (ilen = decompose_w((ucs2_t *)buffer, len, u, &ilen)) ) {
673 if ((size_t)(-1) == (len = convert_string_internal( CH_UCS2, ch, (char*)u, ilen, dst, outlen)) ) {
/*
 * Precompose a UTF-8 string.
 * Thin wrapper: forwards src/inlen/dst/outlen unchanged to
 * charset_precompose() with the charset fixed to CH_UTF8 and returns
 * its result.
 */
683 size_t utf8_precompose ( char * src, size_t inlen, char * dst, size_t outlen)
685 return charset_precompose ( CH_UTF8, src, inlen, dst, outlen);
/*
 * Decompose a UTF-8 string.
 * Thin wrapper: forwards src/inlen/dst/outlen unchanged to
 * charset_decompose() with the charset fixed to CH_UTF8 and returns
 * its result.
 */
688 size_t utf8_decompose ( char * src, size_t inlen, char * dst, size_t outlen)
690 return charset_decompose ( CH_UTF8, src, inlen, dst, outlen);
/* Scratch buffer returned by debug_out(); overwritten on every call. */
static char debugbuf[ MAXPATHLEN +1 ];

/*
 * Render a byte sequence as a hex dump for debug logging.
 *
 * Each input byte becomes two lower-case hex digits followed by a dot,
 * e.g. the bytes 'a','b' give "61.62.".
 *
 * @param seq  bytes to dump (may be NULL, which yields an empty string)
 * @param len  number of bytes at seq
 * @returns    pointer to a static, NUL-terminated buffer holding the dump.
 *             The buffer is shared between calls, so the result must be
 *             consumed before debug_out() is called again.
 *
 * Output is truncated to what fits in the static buffer instead of
 * writing past its end, and len == 0 produces an empty string (the
 * loop bound no longer relies on len-1, which wraps for size_t 0).
 */
char * debug_out ( char * seq, size_t len)
{
    const unsigned char *in = (const unsigned char *) seq;
    char *out = debugbuf;
    size_t room = sizeof(debugbuf);
    size_t i;

    debugbuf[0] = '\0';
    if (in == NULL)
        return debugbuf;

    /* every byte needs 3 characters plus room for the trailing NUL */
    for (i = 0; i < len && room > 3; i++) {
        snprintf(out, room, "%2.2x.", (unsigned int) in[i]);
        out += 3;
        room -= 3;
    }

    return debugbuf;
}
715 * Convert from MB to UCS2 charset
717 * CONV_UNESCAPEHEX: ':XX' will be converted to a UCS2 character
718 * CONV_IGNORE: return the first convertible characters.
720 * This will *not* work if the destination charset is not multibyte, i.e. UCS2->UCS2 will fail
721 * The (un)escape scheme is not compatible with the old cap style escape. This is bad, we need it
722 * for e.g. HFS cdroms.
725 static size_t pull_charset_flags (charset_t from_set, charset_t cap_charset, char* src, size_t srclen, char* dest, size_t destlen, u_int16_t *flags)
727 size_t i_len, o_len, hlen;
728 size_t retval, j = 0;
729 const char* inbuf = (const char*)src;
730 char* outbuf = (char*)dest;
731 atalk_iconv_t descriptor;
732 atalk_iconv_t descriptor_cap;
737 if (srclen == (size_t)-1)
738 srclen = strlen(src)+1;
740 lazy_initialize_conv();
742 descriptor = conv_handles[from_set][CH_UCS2];
743 descriptor_cap = conv_handles[cap_charset][CH_UCS2];
745 if (descriptor == (atalk_iconv_t)-1 || descriptor == (atalk_iconv_t)0) {
754 if ( flags && (*flags & CONV_UNESCAPEHEX)) {
755 if ( NULL != (s = strchr ( inbuf, ':'))) {
756 j = i_len - (s - inbuf);
757 if ( 0 == (i_len = (s - inbuf)))
762 retval = atalk_iconv(descriptor, &inbuf, &i_len, &outbuf, &o_len);
763 if(retval==(size_t)-1) {
764 if (errno == EILSEQ && flags && (*flags & CONV_IGNORE)) {
765 *flags |= CONV_REQMANGLE;
766 return destlen-o_len;
773 if (j && flags && (*flags & CONV_UNESCAPEHEX )) {
774 /* we're at the start of a hex encoded ucs2 char */
780 isxdigit( *(inbuf+1)) && isxdigit( *(inbuf+2)) ) {
782 while ( *inbuf == ':' && j >=3 &&
783 isxdigit( *(inbuf+1)) && isxdigit( *(inbuf+2)) ) {
785 h[hlen] = hextoint( *inbuf ) << 4;
787 h[hlen++] |= hextoint( *inbuf );
791 h_buf = (const char*) h;
792 if ((size_t) -1 == (retval = atalk_iconv(descriptor_cap, &h_buf, &hlen, &outbuf, &o_len)) ) {
793 if (errno == EILSEQ && CHECK_FLAGS(flags, CONV_IGNORE)) {
794 *flags |= CONV_REQMANGLE;
795 return destlen-o_len;
803 /* We have an invalid :xx sequence */
804 if (CHECK_FLAGS(flags, CONV_IGNORE)) {
805 *flags |= CONV_REQMANGLE;
806 return destlen-o_len;
816 goto conversion_loop;
821 return destlen-o_len;
825 * Convert from UCS2 to MB charset
827 * CONV_ESCAPEDOTS: escape leading dots
828 * CONV_ESCAPEHEX: unconvertible characters and '/' will be escaped to :XX
829 * CONV_IGNORE: unconvertible characters will be replaced with '_'
831 * CONV_IGNORE and CONV_ESCAPEHEX can't work together. Should we check this ?
832 * This will *not* work if the destination charset is not multibyte, i.e. UCS2->UCS2 will fail
833 * The escape scheme is not compatible with the old cap style escape. This is bad, we need it
834 * for e.g. HFS cdroms.
838 static size_t push_charset_flags (charset_t to_set, charset_t cap_set, char* src, size_t srclen, char* dest, size_t destlen, u_int16_t *flags)
840 size_t i_len, o_len, i;
841 size_t retval, j = 0;
842 const char* inbuf = (const char*)src;
843 char* outbuf = (char*)dest;
844 atalk_iconv_t descriptor;
846 char *buf, *buf_save;
849 lazy_initialize_conv();
851 descriptor = conv_handles[CH_UCS2][to_set];
853 if (descriptor == (atalk_iconv_t)-1 || descriptor == (atalk_iconv_t)0) {
861 if ( SVAL(inbuf,0) == 0x002e && flags && (*flags & CONV_ESCAPEDOTS)) { /* 0x002e = . */
873 if (flags) *flags |= CONV_REQESCAPE;
877 if ( flags && (*flags & CONV_ESCAPEHEX)) {
878 for ( i = 0; i < i_len; i+=2) {
879 if ( SVAL((inbuf+i),0) == 0x002f) { /* 0x002f = / */
881 if ( 0 == ( i_len = i))
884 } else if ( SVAL(inbuf+i,0) == 0x003a) { /* 0x003a = : */
891 retval = atalk_iconv(descriptor, &inbuf, &i_len, &outbuf, &o_len);
892 if (retval==(size_t)-1) {
893 if (errno == EILSEQ && CHECK_FLAGS(flags, CONV_IGNORE)) {
894 *flags |= CONV_REQMANGLE;
895 return destlen -o_len;
897 else if ( errno == EILSEQ && flags && (*flags & CONV_ESCAPEHEX)) {
902 if ((size_t) -1 == (buflen = convert_string_allocate_internal(CH_UCS2, cap_set, inbuf, 2, &buf)) )
911 *outbuf++ = hexdig[ ( *buf & 0xf0 ) >> 4 ];
912 *outbuf++ = hexdig[ *buf & 0x0f ];
921 if (flags) *flags |= CONV_REQESCAPE;
923 goto conversion_loop;
930 if (j && flags && (*flags & CONV_ESCAPEHEX)) {
935 o_save[destlen -o_len] = ':';
936 o_save[destlen -o_len+1] = '2';
937 o_save[destlen -o_len+2] = 'f';
944 goto conversion_loop;
946 return destlen -o_len;
949 size_t convert_charset ( charset_t from_set, charset_t to_set, charset_t cap_charset, char* src, size_t src_len, char* dest, size_t dest_len, u_int16_t *flags)
953 ucs2_t buffer[MAXPATHLEN];
954 ucs2_t buffer2[MAXPATHLEN];
957 lazy_initialize_conv();
959 /* convert from_set to UCS2 */
960 if ((size_t)(-1) == ( o_len = pull_charset_flags( from_set, cap_charset, src, src_len,
961 (char *) buffer, sizeof(buffer), flags)) ) {
962 LOG(log_error, logtype_default, "Conversion failed ( %s to CH_UCS2 )", charset_name(from_set));
969 /* Do pre/decomposition */
970 if (CHECK_FLAGS(flags, CONV_PRECOMPOSE) ||
971 ((!(charsets[to_set]) || !(charsets[to_set]->flags & CHARSET_DECOMPOSED)) &&
972 (!(charsets[from_set]) || (charsets[from_set]->flags & CHARSET_DECOMPOSED))))
974 if (CHECK_FLAGS(flags, CONV_DECOMPOSE) || (charsets[to_set] && charsets[to_set]->flags & CHARSET_DECOMPOSED) )
977 i_len = sizeof(buffer2);
980 switch (composition) {
986 if ( (size_t)-1 == (i_len = precompose_w(buffer, o_len, u, &i_len)) )
990 if ( (size_t)-1 == (i_len = decompose_w(buffer, o_len, u, &i_len)) )
995 /* Do case conversions */
996 if (CHECK_FLAGS(flags, CONV_TOUPPER)) {
999 if (CHECK_FLAGS(flags, CONV_TOLOWER)) {
1003 /* Convert UCS2 to to_set */
1004 if ((size_t)(-1) == ( o_len = push_charset_flags( to_set, cap_charset, (char *)u, i_len, dest, dest_len, flags )) ) {
1005 LOG(log_error, logtype_default,
1006 "Conversion failed (CH_UCS2 to %s):%s", charset_name(to_set), strerror(errno));