2 Unix SMB/CIFS implementation.
3 Character set conversion Extensions
4 Copyright (C) Igor Vergeichik <iverg@mail.ru> 2001
5 Copyright (C) Andrew Tridgell 2001
6 Copyright (C) Simo Sorce 2001
7 Copyright (C) Martin Pool 2003
9 This program is free software; you can redistribute it and/or modify
10 it under the terms of the GNU General Public License as published by
11 the Free Software Foundation; either version 2 of the License, or
12 (at your option) any later version.
14 This program is distributed in the hope that it will be useful,
15 but WITHOUT ANY WARRANTY; without even the implied warranty of
16 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 GNU General Public License for more details.
19 You should have received a copy of the GNU General Public License
20 along with this program; if not, write to the Free Software
21 Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
26 #endif /* HAVE_CONFIG_H */
35 #include <sys/param.h>
36 #ifdef HAVE_USABLE_ICONV
46 #include <netatalk/endian.h>
47 #include <atalk/logger.h>
48 #include <atalk/unicode.h>
49 #include <atalk/util.h>
50 #include "byteorder.h"
56 * @brief Character-set conversion routines built on our iconv.
58 * @note Samba's internal character set (at least in the 3.0 series)
59 * is always the same as the one for the Unix filesystem. It is
60 * <b>not</b> necessarily UTF-8 and may be different on machines that
61 * need i18n filenames to be compatible with Unix software. It does
62 * have to be a superset of ASCII. All multibyte sequences must start
63 * with a byte with the high bit set.
/* Upper bound on the number of charset_t slots; it sizes every table below. */
69 #define MAX_CHARSETS 20
/* Yields the bits of (b) that are set in *(a), or 0 when the flags pointer (a) is NULL. */
71 #define CHECK_FLAGS(a,b) (((a)!=NULL) ? (*(a) & (b)) : 0 )
/* Conversion descriptors, looked up as conv_handles[from][to]. */
73 static atalk_iconv_t conv_handles[MAX_CHARSETS][MAX_CHARSETS];
/* Names of charsets registered at runtime; written by add_charset(), read by charset_name(). */
74 static char* charset_names[MAX_CHARSETS];
/* Per-charset function tables, filled on demand by get_charset_functions(). */
75 static struct charset_functions* charsets[MAX_CHARSETS];
/* Lowercase hex digits used by push_charset_flags() when emitting hex escapes. */
76 static char hexdig[] = "0123456789abcdef";
/*
 * Numeric value (0-15) of the hexadecimal digit character c.
 * c must already satisfy isxdigit().  Both letter cases are accepted,
 * because callers validate with isxdigit(), which admits 'A'-'F' as well
 * as 'a'-'f'.  The unsigned char casts keep the <ctype.h> calls defined
 * when plain char is signed and c is negative.
 * Note: c is evaluated more than once; do not pass expressions with
 * side effects.
 */
#define hextoint( c ) ( isdigit( (unsigned char)(c) ) ? (c) - '0' : tolower( (unsigned char)(c) ) - 'a' + 10 )
/*
 * Look up a charset name override in the process environment.
 * Only the two getenv() probes are visible in this view: ATALK_MAC_CHARSET
 * and ATALK_UNIX_CHARSET.  charset_name() calls this with CH_MAC and CH_UNIX.
 * NOTE(review): how `ch` selects between the two variables, and what is
 * returned when the variable is unset, is on lines not shown here - confirm.
 */
79 static char* read_charsets_from_env(charset_t ch)
85 if (( name = getenv( "ATALK_MAC_CHARSET" )) != NULL )
91 if (( name = getenv( "ATALK_UNIX_CHARSET" )) != NULL )
104 * Return the name of a charset to give to iconv().
/*
 * Resolve a charset_t to the charset name string handed to atalk_iconv_open().
 *  - CH_UCS2, CH_UTF8 and CH_UTF8_MAC map to fixed names.
 *  - CH_UNIX and CH_MAC are read through read_charsets_from_env() and cached
 *    in the static buffers unixname / macname.
 *  - charset_names[] supplies the name on the remaining path.
 *  - The special name "LOCALE" is replaced by the codeset of the current
 *    locale.
 * A missing or empty name ends up as "ASCII".
 */
106 static const char *charset_name(charset_t ch)
108 const char *ret = NULL;
/* One-time zeroing of the two caches; presumably guarded by `first` on a line not shown. */
109 static int first = 1;
110 static char macname[128];
111 static char unixname[128];
114 memset(macname, 0, sizeof(macname));
115 memset(unixname, 0, sizeof(unixname));
119 if (ch == CH_UCS2) ret = "UCS-2";
120 else if (ch == CH_UTF8) ret = "UTF8";
121 else if (ch == CH_UTF8_MAC) ret = "UTF8-MAC";
122 else if (ch == CH_UNIX) {
/* An empty cache means the environment has not been consulted yet. */
123 if (unixname[0] == '\0') {
124 ret = read_charsets_from_env(CH_UNIX);
/* NOTE(review): ret is copied without a visible NULL check - confirm the helper never returns NULL. */
125 strlcpy(unixname, ret, sizeof(unixname));
130 else if (ch == CH_MAC) {
131 if (macname[0] == '\0') {
132 ret = read_charsets_from_env(CH_MAC);
133 strlcpy(macname, ret, sizeof(macname));
/* Name recorded in charset_names[] (written by add_charset()). */
140 ret = charset_names[ch];
/*
 * "LOCALE" (compared case-insensitively) asks for the codeset of the
 * environment's locale.  setlocale(LC_ALL, "") changes the process-wide
 * locale as a side effect.  The codeset is accepted only if a conversion
 * handle between it and UCS-2 can be opened; the probe handle is closed
 * again and the codeset name is cached in unixname.
 */
143 if (ret && strcasecmp(ret, "LOCALE") == 0) {
144 const char *ln = NULL;
146 setlocale(LC_ALL, "");
147 ln = nl_langinfo(CODESET);
149 /* Check whether the charset name is supported
151 atalk_iconv_t handle = atalk_iconv_open(ln, "UCS-2");
152 if (handle == (atalk_iconv_t) -1) {
153 LOG(log_debug, logtype_default, "Locale charset '%s' unsupported, using ASCII instead", ln);
156 atalk_iconv_close(handle);
159 strlcpy(unixname, ln, sizeof(unixname));
163 #else /* system doesn't have LOCALE support */
/* In this preprocessor branch CH_UNIX gets no name here and falls through to the ASCII default. */
164 if (ch == CH_UNIX) ret = NULL;
/* Final fallback for a missing or empty name. */
167 if (!ret || !*ret) ret = "ASCII";
/*
 * Return the function table for charset `ch`, caching it in charsets[].
 * When the slot is still NULL it is filled by looking the table up by
 * name via find_charset_functions(charset_name(ch)).
 * (The return statements are on lines not shown in this view.)
 */
171 static struct charset_functions* get_charset_functions (charset_t ch)
173 if (charsets[ch] != NULL)
176 charsets[ch] = find_charset_functions(charset_name(ch));
/*
 * One-time initialisation hook called at the top of the conversion entry
 * points.  Only the `initialized` guard flag is visible here.
 * NOTE(review): presumably this calls init_iconv() on first use and then
 * sets the flag - confirm against the full body.
 */
182 static void lazy_initialize_conv(void)
184 static int initialized = 0;
/*
 * Register an additional charset by name and return its charset_t handle.
 * Returns (charset_t)-1 when the table is full or when either conversion
 * to/from UCS-2 cannot be opened.
 */
192 charset_t add_charset(const char* name)
/* Highest handle in use; starts at the last built-in charset.  The candidate slot is the next one. */
194 static charset_t max_charset_t = NUM_CHARSETS-1;
195 charset_t cur_charset_t = max_charset_t+1;
198 lazy_initialize_conv();
/* Case-insensitive scan of the charsets known so far; presumably returns the existing handle on a match (line not shown). */
200 for (c1=0; c1<=max_charset_t;c1++) {
201 if ( strcasecmp(name, charset_name(c1)) == 0)
/* No free slot left in the MAX_CHARSETS-sized tables. */
205 if ( cur_charset_t >= MAX_CHARSETS ) {
206 LOG (log_debug, logtype_default, "Adding charset %s failed, too many charsets (max. %u allowed)",
208 return (charset_t) -1;
211 /* First try to setup the required conversions */
/* Descriptor for converting from `name` to UCS-2, stored at [new][CH_UCS2]. */
213 conv_handles[cur_charset_t][CH_UCS2] = atalk_iconv_open( charset_name(CH_UCS2), name);
214 if (conv_handles[cur_charset_t][CH_UCS2] == (atalk_iconv_t)-1) {
215 LOG(log_error, logtype_default, "Required conversion from %s to %s not supported",
216 name, charset_name(CH_UCS2));
/* Failed descriptors are stored as NULL; the converters treat both -1 and 0 as "unavailable". */
217 conv_handles[cur_charset_t][CH_UCS2] = NULL;
218 return (charset_t) -1;
/* Descriptor for the opposite direction, UCS-2 to `name`. */
221 conv_handles[CH_UCS2][cur_charset_t] = atalk_iconv_open( name, charset_name(CH_UCS2));
222 if (conv_handles[CH_UCS2][cur_charset_t] == (atalk_iconv_t)-1) {
223 LOG(log_error, logtype_default, "Required conversion from %s to %s not supported",
224 charset_name(CH_UCS2), name);
225 conv_handles[CH_UCS2][cur_charset_t] = NULL;
/* NOTE(review): the first descriptor opened above is not visibly closed on this path - possible leak; confirm. */
226 return (charset_t) -1;
229 /* register the new charset_t name */
/* NOTE(review): the strdup() result is not visibly checked for NULL. */
230 charset_names[cur_charset_t] = strdup(name);
/* Must follow the name registration: the lookup goes through charset_name(), which reads charset_names[]. */
232 charsets[cur_charset_t] = get_charset_functions (cur_charset_t);
236 LOG(log_debug9, logtype_default, "Added charset %s with handle %u", name, cur_charset_t);
238 return (cur_charset_t);
242 * Initialize iconv conversion descriptors.
244 * This is called the first time it is needed, and also called again
245 * every time the configuration is reloaded, because the charset or
246 * codepage might have changed.
/*
 * Open the conversion descriptors between every built-in charset
 * (0 .. NUM_CHARSETS-1) and UCS-2, in both directions, and cache each
 * charset's function table.  A conversion that cannot be opened is logged
 * and stored as NULL.
 */
248 void init_iconv(void)
252 for (c1=0;c1<NUM_CHARSETS;c1++) {
253 const char *name = charset_name((charset_t)c1);
/* Direction: charset c1 to UCS-2. */
255 conv_handles[c1][CH_UCS2] = atalk_iconv_open( charset_name(CH_UCS2), name);
256 if (conv_handles[c1][CH_UCS2] == (atalk_iconv_t)-1) {
257 LOG(log_error, logtype_default, "Required conversion from %s to %s not supported",
258 name, charset_name(CH_UCS2));
259 conv_handles[c1][CH_UCS2] = NULL;
/* For c1 == CH_UCS2 the slot [CH_UCS2][CH_UCS2] was already filled just above; opening it again would overwrite that handle. */
262 if (c1 != CH_UCS2) { /* avoid lost memory, make valgrind happy */
/* Direction: UCS-2 to charset c1. */
263 conv_handles[CH_UCS2][c1] = atalk_iconv_open( name, charset_name(CH_UCS2));
264 if (conv_handles[CH_UCS2][c1] == (atalk_iconv_t)-1) {
265 LOG(log_error, logtype_default, "Required conversion from %s to %s not supported",
266 charset_name(CH_UCS2), name);
267 conv_handles[CH_UCS2][c1] = NULL;
271 charsets[c1] = get_charset_functions (c1);
/*
 * Terminate a converted string held in buf.
 * convert_string_internal() passes the unused space as `bytesleft` and the
 * number of bytes already written as `len`.  A UCS-2 target needs two free
 * bytes for its terminator, any other target needs one.
 * (The stores, the no-room path and the return value are on lines not
 * shown in this view.)
 */
278 static size_t add_null(charset_t to, char *buf, size_t bytesleft, size_t len)
280 /* Terminate the string */
281 if (to == CH_UCS2 && bytesleft >= 2) {
286 else if ( to != CH_UCS2 && bytesleft > 0 )
298 * Convert string from one encoding to another, making error checking etc
300 * @param src pointer to source string (multibyte or singlebyte)
301 * @param srclen length of the source string in bytes
302 * @param dest pointer to destination string (multibyte or singlebyte)
303 * @param destlen maximal length allowed for string
304 * @returns the number of bytes occupied in the destination
/*
 * Single conversion step from charset `from` to charset `to` using the
 * descriptor conv_handles[from][to], writing into the caller's buffer and
 * terminating the result through add_null().
 */
306 static size_t convert_string_internal(charset_t from, charset_t to,
307 void const *src, size_t srclen,
308 void *dest, size_t destlen)
312 const char* inbuf = (const char*)src;
313 char* outbuf = (char*)dest;
/* Remember the start of dest; outbuf is advanced by the conversion call. */
314 char* o_save = outbuf;
315 atalk_iconv_t descriptor;
317 /* Fixed based on Samba 3.0.6 */
/* srclen == -1 means "measure it": UCS-2 input is measured in 2-byte units, anything else with strlen(). */
318 if (srclen == (size_t)-1) {
319 if (from == CH_UCS2) {
320 srclen = (strlen_w((const ucs2_t *)src)) * 2;
322 srclen = strlen((const char *)src);
327 lazy_initialize_conv();
329 descriptor = conv_handles[from][to];
/* Both -1 and 0 (NULL) mark a conversion that could not be opened. */
331 if (descriptor == (atalk_iconv_t)-1 || descriptor == (atalk_iconv_t)0) {
337 retval = atalk_iconv(descriptor, &inbuf, &i_len, &outbuf, &o_len);
338 if(retval==(size_t)-1) {
/* The reason text is chosen per error case on lines not shown; it is only logged at debug level. */
339 const char *reason="unknown error";
342 reason="Incomplete multibyte sequence";
345 reason="No more room";
348 reason="Illegal multibyte sequence";
351 LOG(log_debug, logtype_default,"Conversion error: %s",reason);
355 /* Terminate the string */
/* o_len is the space still free in dest, so destlen - o_len is the number of bytes written. */
356 return add_null( to, o_save, o_len, destlen -o_len);
/*
 * Convert src from charset `from` to charset `to` into the caller's buffer.
 * The conversion is done in stages: `from` to UCS-2 in a stack buffer, an
 * optional Unicode decomposition or precomposition, then UCS-2 to `to`.
 * Each failed conversion stage is logged.
 */
360 size_t convert_string(charset_t from, charset_t to,
361 void const *src, size_t srclen,
362 void *dest, size_t destlen)
/* Fixed-size intermediates: each holds MAXPATHLEN UCS-2 units. */
366 ucs2_t buffer[MAXPATHLEN];
367 ucs2_t buffer2[MAXPATHLEN];
369 /* convert from_set to UCS2 */
370 if ((size_t)-1 == ( o_len = convert_string_internal( from, CH_UCS2, src, srclen,
371 (char*) buffer, sizeof(buffer))) ) {
372 LOG(log_error, logtype_default, "Conversion failed ( %s to CH_UCS2 )", charset_name(from));
376 /* Do pre/decomposition */
/* i_len is passed by address to the (de)composition call and then overwritten with that call's return value. */
377 i_len = sizeof(buffer2);
/* Decompose when the target charset is flagged CHARSET_DECOMPOSED. */
379 if (charsets[to] && (charsets[to]->flags & CHARSET_DECOMPOSED) ) {
380 if ( (size_t)-1 == (i_len = decompose_w(buffer, o_len, u, &i_len)) )
/* Otherwise precompose when the source charset has no function table or is flagged decomposed. */
383 else if (!charsets[from] || (charsets[from]->flags & CHARSET_DECOMPOSED)) {
384 if ( (size_t)-1 == (i_len = precompose_w(buffer, o_len, u, &i_len)) )
391 /* Convert UCS2 to to_set */
/* `u` is assigned on lines not shown; presumably it points at whichever buffer holds the current UCS-2 text. */
392 if ((size_t)(-1) == ( o_len = convert_string_internal( CH_UCS2, to, (char*) u, i_len, dest, destlen)) ) {
393 LOG(log_error, logtype_default, "Conversion failed (CH_UCS2 to %s):%s", charset_name(to), strerror(errno));
403 * Convert between character sets, allocating a new buffer for the result.
405 * @param srclen length of source buffer.
406 * @param dest always set at least to NULL
407 * @note -1 is not accepted for srclen.
409 * @returns Size in bytes of the converted string; or -1 in case of error.
/*
 * Single conversion step from `from` to `to` that allocates the output
 * buffer itself and hands it back through *dest.  The buffer is grown and
 * the conversion restarted from the beginning of src until the result fits.
 */
412 static size_t convert_string_allocate_internal(charset_t from, charset_t to,
413 void const *src, size_t srclen, char **dest)
415 size_t i_len, o_len, destlen;
417 const char *inbuf = (const char *)src;
418 char *outbuf = NULL, *ob = NULL;
419 atalk_iconv_t descriptor;
/* Unlike convert_string_internal(), an srclen of -1 is rejected here. */
423 if (src == NULL || srclen == (size_t)-1)
426 lazy_initialize_conv();
428 descriptor = conv_handles[from][to];
430 if (descriptor == (atalk_iconv_t)-1 || descriptor == (atalk_iconv_t)0) {
431 /* conversion not supported, return -1*/
432 LOG(log_debug, logtype_default, "convert_string_allocate: conversion not supported!");
/* Initial size guess; it is doubled before each allocation, including the first. */
436 destlen = MAX(srclen, 512);
438 destlen = destlen * 2;
439 outbuf = (char *)realloc(ob, destlen);
441 LOG(log_debug, logtype_default,"convert_string_allocate: realloc failed!");
447 inbuf = src; /* this restarts the whole conversion if buffer needed to be increased */
450 retval = atalk_iconv(descriptor,
453 if(retval == (size_t)-1) {
454 const char *reason="unknown error";
457 reason="Incomplete multibyte sequence";
462 reason="Illegal multibyte sequence";
/* NOTE(review): inbuf is logged with %s, but src is length-delimited and may be UCS-2 or lack a NUL - confirm this cannot read past the input. */
465 LOG(log_debug, logtype_default,"Conversion error: %s(%s)",reason,inbuf);
/* From here on destlen is the number of bytes written (allocated size minus free space). */
471 destlen = destlen - o_len;
473 /* Terminate the string */
/* Room for the terminator: 2 bytes for UCS-2, 1 byte otherwise; the buffer is then resized to exactly fit. */
474 if (to == CH_UCS2 && o_len >= 2) {
/* NOTE(review): if this realloc fails, ob is still allocated and is not visibly freed. */
477 *dest = (char *)realloc(ob,destlen+2);
479 else if ( to != CH_UCS2 && o_len > 0 ) {
481 *dest = (char *)realloc(ob,destlen+1);
/* No room left for the terminator: take another pass with a larger buffer. */
484 goto convert; /* realloc */
487 if (destlen && !*dest) {
488 LOG(log_debug, logtype_default, "convert_string_allocate: out of memory!");
/*
 * Allocating counterpart of convert_string(): `from` to UCS-2 in a stack
 * buffer, an optional decomposition or precomposition, then UCS-2 to `to`
 * into a buffer allocated by convert_string_allocate_internal() and
 * returned through dest.
 */
497 size_t convert_string_allocate(charset_t from, charset_t to,
498 void const *src, size_t srclen,
/* Fixed-size intermediates: each holds MAXPATHLEN UCS-2 units. */
503 ucs2_t buffer[MAXPATHLEN];
504 ucs2_t buffer2[MAXPATHLEN];
508 /* convert from_set to UCS2 */
509 if ((size_t)(-1) == ( o_len = convert_string_internal( from, CH_UCS2, src, srclen,
510 buffer, sizeof(buffer))) ) {
511 LOG(log_error, logtype_default, "Conversion failed ( %s to CH_UCS2 )", charset_name(from));
515 /* Do pre/decomposition */
/* i_len is passed by address to the (de)composition call and then overwritten with that call's return value. */
516 i_len = sizeof(buffer2);
/* Decompose when the target charset is flagged CHARSET_DECOMPOSED. */
518 if (charsets[to] && (charsets[to]->flags & CHARSET_DECOMPOSED) ) {
519 if ( (size_t)-1 == (i_len = decompose_w(buffer, o_len, u, &i_len)) )
/* Otherwise precompose when the source charset has no function table or is flagged decomposed. */
522 else if ( !charsets[from] || (charsets[from]->flags & CHARSET_DECOMPOSED) ) {
523 if ( (size_t)-1 == (i_len = precompose_w(buffer, o_len, u, &i_len)) )
531 /* Convert UCS2 to to_set */
532 if ((size_t)-1 == ( o_len = convert_string_allocate_internal( CH_UCS2, to, (char*)u, i_len, dest)) )
533 LOG(log_error, logtype_default, "Conversion failed (CH_UCS2 to %s):%s", charset_name(to), strerror(errno));
/*
 * Upper-case a string in charset `ch`: convert to UCS-2 in an allocated
 * buffer, apply strupper_w() in place, convert back into dest.
 */
539 size_t charset_strupper(charset_t ch, const char *src, size_t srclen, char *dest, size_t destlen)
544 size = convert_string_allocate_internal(ch, CH_UCS2, src, srclen,
546 if (size == (size_t)-1) {
/* Special case when strupper_w() returns 0 and the call is in place (dest == src); the branch body is not shown - presumably an early return, confirm. */
550 if (!strupper_w((ucs2_t *)buffer) && (dest == src)) {
555 size = convert_string_internal(CH_UCS2, ch, buffer, size, dest, destlen);
/*
 * Lower-case a string in charset `ch`: convert to UCS-2 in an allocated
 * buffer, apply strlower_w() in place, convert back into dest.
 */
560 size_t charset_strlower(charset_t ch, const char *src, size_t srclen, char *dest, size_t destlen)
565 size = convert_string_allocate_internal(ch, CH_UCS2, src, srclen,
567 if (size == (size_t)-1) {
/* Special case when strlower_w() returns 0 and the call is in place (dest == src); the branch body is not shown - presumably an early return, confirm. */
571 if (!strlower_w((ucs2_t *)buffer) && (dest == src)) {
576 size = convert_string_internal(CH_UCS2, ch, buffer, size, dest, destlen);
/* Upper-case a string in the CH_UNIX charset; forwards to charset_strupper(). */
582 size_t unix_strupper(const char *src, size_t srclen, char *dest, size_t destlen)
584 return charset_strupper( CH_UNIX, src, srclen, dest, destlen);
/* Lower-case a string in the CH_UNIX charset; forwards to charset_strlower(). */
587 size_t unix_strlower(const char *src, size_t srclen, char *dest, size_t destlen)
589 return charset_strlower( CH_UNIX, src, srclen, dest, destlen);
/* Upper-case a CH_UTF8 string; forwards to charset_strupper(). */
592 size_t utf8_strupper(const char *src, size_t srclen, char *dest, size_t destlen)
594 return charset_strupper( CH_UTF8, src, srclen, dest, destlen);
/* Lower-case a CH_UTF8 string; forwards to charset_strlower(). */
597 size_t utf8_strlower(const char *src, size_t srclen, char *dest, size_t destlen)
599 return charset_strlower( CH_UTF8, src, srclen, dest, destlen);
603 * Copy a string from a charset_t char* src to a UCS2 destination, allocating a buffer
605 * @param dest always set at least to NULL
607 * @returns The number of bytes occupied by the string in the destination
608 * or -1 in case of error.
/*
 * Convert the NUL-terminated string src from charset `ch` to UCS-2 in a
 * newly allocated buffer returned through dest.
 */
611 size_t charset_to_ucs2_allocate(charset_t ch, ucs2_t **dest, const char *src)
/* src must be non-NULL; the terminator is not included in the length handed on. */
613 size_t src_len = strlen(src);
616 return convert_string_allocate(ch, CH_UCS2, src, src_len, (char**) dest);
619 /** -----------------------------------
620 * Copy a string from a charset_t char* src to a UTF-8 destination, allocating a buffer
622 * @param dest always set at least to NULL
624 * @returns The number of bytes occupied by the string in the destination
/*
 * Convert the NUL-terminated string src from charset `ch` to CH_UTF8 in a
 * newly allocated buffer returned through dest.
 */
627 size_t charset_to_utf8_allocate(charset_t ch, char **dest, const char *src)
/* src must be non-NULL; the terminator is not included in the length handed on. */
629 size_t src_len = strlen(src);
632 return convert_string_allocate(ch, CH_UTF8, src, src_len, dest);
635 /** -----------------------------------
636 * Copy a string from a UCS2 src into a caller-supplied char * buffer in charset ch
638 * @param dest caller-supplied buffer of at least destlen bytes
640 * @returns The number of bytes occupied by the string in the destination
/*
 * Convert the UCS-2 string src to charset `ch`, writing into the
 * caller-supplied buffer dest of destlen bytes (nothing is allocated).
 */
643 size_t ucs2_to_charset(charset_t ch, const ucs2_t *src, char *dest, size_t destlen)
/* Length in bytes: the count returned by strlen_w() times the size of one UCS-2 unit. */
645 size_t src_len = (strlen_w(src)) * sizeof(ucs2_t);
646 return convert_string(CH_UCS2, ch, src, src_len, dest, destlen);
649 /* --------------------------------- */
/*
 * Convert the UCS-2 string src to charset `ch` in a newly allocated
 * buffer returned through dest.
 */
650 size_t ucs2_to_charset_allocate(charset_t ch, char **dest, const ucs2_t *src)
/* Length in bytes: the count returned by strlen_w() times the size of one UCS-2 unit. */
652 size_t src_len = (strlen_w(src)) * sizeof(ucs2_t);
654 return convert_string_allocate(CH_UCS2, ch, src, src_len, dest);
657 /** ---------------------------------
658 * Copy a string from a UTF-8 src to a char * destination in charset ch, allocating a buffer
660 * @param dest always set at least to NULL
662 * @returns The number of bytes occupied by the string in the destination
/*
 * Convert the NUL-terminated CH_UTF8 string src to charset `ch` in a
 * newly allocated buffer returned through dest.
 */
665 size_t utf8_to_charset_allocate(charset_t ch, char **dest, const char *src)
/* src must be non-NULL; the terminator is not included in the length handed on. */
667 size_t src_len = strlen(src);
669 return convert_string_allocate(CH_UTF8, ch, src, src_len, dest);
/*
 * Precompose a string in charset `ch`: convert src to UCS-2 in an
 * allocated buffer, run precompose_w() into the stack array u, then
 * convert the result back to `ch` into dst (outlen bytes).
 */
672 size_t charset_precompose ( charset_t ch, char * src, size_t inlen, char * dst, size_t outlen)
/* Fixed-size workspace for the precomposed text: MAXPATHLEN UCS-2 units. */
675 ucs2_t u[MAXPATHLEN];
679 if ((size_t)(-1) == (len = convert_string_allocate_internal(ch, CH_UCS2, src, inlen, &buffer)) )
/* ilen is passed by address and then overwritten with the call's return value; its initial value is set on a line not shown. */
684 if ( (size_t)-1 == (ilen = precompose_w((ucs2_t *)buffer, len, u, &ilen)) ) {
689 if ((size_t)(-1) == (len = convert_string_internal( CH_UCS2, ch, (char*)u, ilen, dst, outlen)) ) {
/*
 * Decompose a string in charset `ch`: convert src to UCS-2 in an
 * allocated buffer, run decompose_w() into the stack array u, then
 * convert the result back to `ch` into dst (outlen bytes).
 */
698 size_t charset_decompose ( charset_t ch, char * src, size_t inlen, char * dst, size_t outlen)
/* Fixed-size workspace for the decomposed text: MAXPATHLEN UCS-2 units. */
701 ucs2_t u[MAXPATHLEN];
705 if ((size_t)(-1) == (len = convert_string_allocate_internal(ch, CH_UCS2, src, inlen, &buffer)) )
/* ilen is passed by address and then overwritten with the call's return value; its initial value is set on a line not shown. */
710 if ( (size_t)-1 == (ilen = decompose_w((ucs2_t *)buffer, len, u, &ilen)) ) {
715 if ((size_t)(-1) == (len = convert_string_internal( CH_UCS2, ch, (char*)u, ilen, dst, outlen)) ) {
/* Precompose a CH_UTF8 string; forwards to charset_precompose(). */
724 size_t utf8_precompose ( char * src, size_t inlen, char * dst, size_t outlen)
726 return charset_precompose ( CH_UTF8, src, inlen, dst, outlen);
/* Decompose a CH_UTF8 string; forwards to charset_decompose(). */
729 size_t utf8_decompose ( char * src, size_t inlen, char * dst, size_t outlen)
731 return charset_decompose ( CH_UTF8, src, inlen, dst, outlen);
/* Scratch buffer returned by debug_out(); overwritten on every call. */
static char debugbuf[ MAXPATHLEN +1 ];

/**
 * Render a byte sequence as hex for log output, e.g. "01.ff." for the
 * bytes 0x01 0xff (two lowercase hex digits and a dot per input byte).
 *
 * @param seq  bytes to dump (need not be NUL-terminated); NULL is treated
 *             as an empty sequence
 * @param len  number of bytes at seq; 0 yields an empty string
 * @returns pointer to a static, NUL-terminated buffer.  The buffer is shared
 *          between calls, so the result must be consumed before the next
 *          call.  Output is truncated to what fits into the buffer.
 */
char * debug_out ( char * seq, size_t len)
{
    const unsigned char *p = (const unsigned char *) seq;
    char *q = debugbuf;
    size_t room = sizeof(debugbuf);
    size_t i;

    if (p == NULL)
        len = 0;

    /*
     * "i < len" instead of "i <= len-1": the latter wraps around for
     * len == 0.  Each byte needs three characters plus the terminator,
     * so stop as soon as fewer than four bytes are left in the buffer.
     */
    for (i = 0; i < len && room > 3; i++) {
        snprintf(q, room, "%2.2x.", p[i]);
        q += 3;
        room -= 3;
    }
    *q = '\0';

    return debugbuf;
}
758 * Convert from MB to UCS2 charset
760 * CONV_UNESCAPEHEX: ':XX' will be converted to a UCS2 character
761 * CONV_IGNORE: return the first convertible characters.
762 * CONV_FORCE: force conversion
764 * This will *not* work if the destination charset is not multibyte, i.e. UCS2->UCS2 will fail
765 * The (un)escape scheme is not compatible with the old CAP-style escape. This is bad, we need it
766 * for e.g. HFS cdroms.
/*
 * Convert src from charset from_set to UCS-2 in dest, honouring the
 * CONV_* option bits read from *flags.  Bytes decoded from ":xx" hex
 * escapes are converted with the cap_set descriptor instead.
 * Returns the number of bytes written to dest, or (size_t)-1.
 */
769 static size_t pull_charset_flags (charset_t from_set, charset_t cap_set, const char *src, size_t srclen, char* dest, size_t destlen, u_int16_t *flags)
/*
 * Snapshot of the caller's options; 0 when no flags pointer was given.
 * Every "*flags |= ..." below sits behind a test of an option bit, so it
 * is only reached when flags is non-NULL.
 */
771 const u_int16_t option = (flags ? *flags : 0);
774 const char* inbuf = (const char*)src;
776 atalk_iconv_t descriptor;
777 atalk_iconv_t descriptor_cap;
/* srclen == -1: measure src and include its terminating NUL in the conversion. */
779 if (srclen == (size_t)-1)
780 srclen = strlen(src) + 1;
782 descriptor = conv_handles[from_set][CH_UCS2];
783 descriptor_cap = conv_handles[cap_set][CH_UCS2];
/* Both -1 and 0 (NULL) mark a conversion that could not be opened. */
785 if (descriptor == (atalk_iconv_t)-1 || descriptor == (atalk_iconv_t)0) {
/* With CONV_UNESCAPEHEX, locate the next ':'; j ends up as its offset from inbuf (or i_len if none). */
794 if ((option & CONV_UNESCAPEHEX)) {
795 for (j = 0; j < i_len; ++j) {
796 if (inbuf[j] == ':') break;
803 atalk_iconv(descriptor, &inbuf, &i_len, &outbuf, &o_len) == (size_t)-1) {
804 if (errno == EILSEQ || errno == EINVAL) {
/* CONV_IGNORE: stop here, tell the caller mangling is required, and return the bytes written so far. */
806 if ((option & CONV_IGNORE)) {
807 *flags |= CONV_REQMANGLE;
808 return destlen - o_len;
/* CONV__EILSEQ: emit IGNORE_CHAR as a replacement UCS-2 unit. */
810 if ((option & CONV__EILSEQ)) {
815 *((ucs2_t *)outbuf) = (ucs2_t) IGNORE_CHAR; /**inbuf */
820 /* FIXME reset stat ? */
828 /* we're at the start on an hex encoded ucs2 char */
/* Collect a run of consecutive ":xx" escapes as raw bytes in h. */
833 while (i_len >= 3 && inbuf[0] == ':' &&
834 isxdigit(inbuf[1]) && isxdigit(inbuf[2])) {
835 h[hlen++] = (hextoint(inbuf[1]) << 4) | hextoint(inbuf[2]);
/* The decoded bytes are converted with the cap_set descriptor. */
840 const char *h_buf = h;
841 if (atalk_iconv(descriptor_cap, &h_buf, &hlen, &outbuf, &o_len) == (size_t)-1) {
844 if (errno == EILSEQ && (option & CONV_IGNORE)) {
845 *flags |= CONV_REQMANGLE;
846 return destlen - o_len;
851 /* We have an invalid :xx sequence */
853 if ((option & CONV_IGNORE)) {
854 *flags |= CONV_REQMANGLE;
855 return destlen - o_len;
/* Success requires that i_len + j is zero (nothing left over) unless CONV_FORCE is set. */
862 return (i_len + j == 0 || (option & CONV_FORCE)) ? destlen - o_len : (size_t)-1;
866 * Convert from UCS2 to MB charset
868 * CONV_ESCAPEDOTS: escape leading dots
869 * CONV_ESCAPEHEX: unconvertible characters and '/' will be escaped to :XX
870 * CONV_IGNORE: return the first convertible characters.
871 * CONV__EILSEQ: unconvertible characters will be replaced with '_'
872 * CONV_FORCE: force conversion
874 * CONV_IGNORE and CONV_ESCAPEHEX can't work together. Should we check this?
875 * This will *not* work if the destination charset is not multibyte, i.e. UCS2->UCS2 will fail
876 * The escape scheme is not compatible with the old CAP-style escape. This is bad, we need it
877 * for e.g. HFS cdroms.
/*
 * Convert UCS-2 text in src to charset to_set in dest, honouring the
 * CONV_* option bits read from *flags.  Characters that have to be
 * hex-escaped are converted with the cap_set descriptor and written as
 * hex digits.  Returns the number of bytes written, or (size_t)-1.
 */
881 static size_t push_charset_flags (charset_t to_set, charset_t cap_set, char* src, size_t srclen, char* dest, size_t destlen, u_int16_t *flags)
/*
 * Snapshot of the caller's options; 0 when no flags pointer was given.
 * The "*flags |= ..." stores visible below follow a test of an option
 * bit, which can only be set when flags is non-NULL.
 */
883 const u_int16_t option = (flags ? *flags : 0);
884 size_t i_len, o_len, i;
886 const char* inbuf = (const char*)src;
887 char* outbuf = (char*)dest;
888 atalk_iconv_t descriptor;
889 atalk_iconv_t descriptor_cap;
890 char escch; /* 150210: uninitialized OK, depends on j */
892 descriptor = conv_handles[CH_UCS2][to_set];
893 descriptor_cap = conv_handles[CH_UCS2][cap_set];
/* Both -1 and 0 (NULL) mark a conversion that could not be opened. */
895 if (descriptor == (atalk_iconv_t)-1 || descriptor == (atalk_iconv_t)0) {
/* CONV_ESCAPEDOTS: special handling when the first UCS-2 unit is '.'. */
903 if ((option & CONV_ESCAPEDOTS) &&
904 i_len >= 2 && SVAL(inbuf, 0) == 0x002e) { /* 0x002e = . */
915 *flags |= CONV_REQESCAPE;
/* CONV_ESCAPEHEX: scan the input two bytes (one UCS-2 unit) at a time for ':' and '/'. */
919 if ((option & CONV_ESCAPEHEX)) {
920 for (i = 0; i < i_len; i += 2) {
921 ucs2_t c = SVAL(inbuf, i);
923 case 0x003a: /* 0x003a = ':' */
924 if ( ! (option & CONV_ALLOW_COLON)) {
932 case 0x002f: /* 0x002f = '/' */
941 atalk_iconv(descriptor, &inbuf, &i_len, &outbuf, &o_len) == (size_t)-1) {
942 if (errno == EILSEQ) {
/* CONV_IGNORE: stop here, tell the caller mangling is required, and return the bytes written so far. */
943 if ((option & CONV_IGNORE)) {
944 *flags |= CONV_REQMANGLE;
945 return destlen - o_len;
947 if ((option & CONV_ESCAPEHEX)) {
/* Scratch buffer for the cap_set bytes; each byte costs three output characters (see the o_len check below). */
948 const size_t bufsiz = o_len / 3 + 1;
/* NOTE(review): the NULL check and the matching free(buf) are on lines not shown - confirm. */
949 char *buf = malloc(bufsiz);
/* Retry the cap_set conversion with a growing output size until it succeeds. */
955 for (buflen = 1; buflen <= bufsiz; ++buflen) {
958 if (atalk_iconv(descriptor_cap, &inbuf, &i, &b, &o) != (size_t)-1) {
961 } else if (errno != E2BIG) {
964 } else if (o < buflen) {
/* Not enough room in dest for the escaped form of all bytes. */
969 if (o_len < buflen * 3) {
/* Write each converted byte as two lowercase hex digits. */
976 for (i = 0; i < buflen; ++i) {
978 *outbuf++ = hexdig[(buf[i] >> 4) & 0x0f];
979 *outbuf++ = hexdig[buf[i] & 0x0f];
982 *flags |= CONV_REQESCAPE;
1008 * THIS SHOULD NEVER BE REACHED !!!
1009 * As a safety net I put in a ' ' here
/* Unconsumed input is reported as EINVAL. */
1021 if (i_len > 0) errno = EINVAL;
/* Success requires that i_len + j is zero (nothing left over) unless CONV_FORCE is set. */
1023 return (i_len + j == 0 || (option & CONV_FORCE)) ? destlen - o_len : (size_t)-1;
1027 * FIXME: the size handling is a mess; we really need malloc/free logic
1028 * dest size must be dest_len +2
1030 size_t convert_charset ( charset_t from_set, charset_t to_set, charset_t cap_charset, const char *src, size_t src_len, char *dest, size_t dest_len, u_int16_t *flags)
1032 size_t i_len, o_len;
1034 ucs2_t buffer[MAXPATHLEN +2];
1035 ucs2_t buffer2[MAXPATHLEN +2];
1037 lazy_initialize_conv();
1039 /* convert from_set to UCS2 */
1040 if ((size_t)(-1) == ( o_len = pull_charset_flags( from_set, cap_charset, src, src_len,
1041 (char *) buffer, sizeof(buffer) -2, flags)) ) {
1042 LOG(log_error, logtype_default, "Conversion failed ( %s to CH_UCS2 )", charset_name(from_set));
1049 /* Do pre/decomposition */
1050 i_len = sizeof(buffer2) -2;
1052 if (CHECK_FLAGS(flags, CONV_DECOMPOSE) || (charsets[to_set] && (charsets[to_set]->flags & CHARSET_DECOMPOSED)) ) {
1053 if ( (size_t)-1 == (i_len = decompose_w(buffer, o_len, u, &i_len)) )
1054 return (size_t)(-1);
1056 else if (CHECK_FLAGS(flags, CONV_PRECOMPOSE) || !charsets[from_set] || (charsets[from_set]->flags & CHARSET_DECOMPOSED)) {
1057 if ( (size_t)-1 == (i_len = precompose_w(buffer, o_len, u, &i_len)) )
1058 return (size_t)(-1);
1064 /* null terminate */
1068 /* Do case conversions */
1069 if (CHECK_FLAGS(flags, CONV_TOUPPER)) {
1072 else if (CHECK_FLAGS(flags, CONV_TOLOWER)) {
1076 /* Convert UCS2 to to_set */
1077 if ((size_t)(-1) == ( o_len = push_charset_flags( to_set, cap_charset, (char *)u, i_len, dest, dest_len, flags )) ) {
1078 LOG(log_error, logtype_default,
1079 "Conversion failed (CH_UCS2 to %s):%s", charset_name(to_set), strerror(errno));
1082 /* null terminate */