2 Unix SMB/CIFS implementation.
3 minimal iconv implementation
4 Copyright (C) Andrew Tridgell 2001
5 Copyright (C) Jelmer Vernooij 2002,2003
7 This program is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 2 of the License, or
10 (at your option) any later version.
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with this program; if not, write to the Free Software
19 Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
21 From samba 3.0 beta and GNU libiconv-1.8
22 It's bad but most of the time we can't use libc iconv service:
23 - it doesn't round trip for most encoding
24 - it doesn't know about Apple extension
29 #endif /* HAVE_CONFIG_H */
33 #include <netatalk/endian.h>
34 #include <atalk/unicode.h>
35 #include <atalk/logger.h>
36 #include <atalk/unicode.h>
37 #include "byteorder.h"
40 static size_t utf8_pull(void *,char **, size_t *, char **, size_t *);
41 static size_t utf8_push(void *,char **, size_t *, char **, size_t *);
43 struct charset_functions charset_utf8 =
49 CHARSET_VOLUME | CHARSET_MULTIBYTE | CHARSET_PRECOMPOSED
52 struct charset_functions charset_utf8_mac =
58 CHARSET_VOLUME | CHARSET_CLIENT | CHARSET_MULTIBYTE | CHARSET_DECOMPOSED
61 /* ------------------------ */
62 static size_t utf8_pull(void *cd, char **inbuf, size_t *inbytesleft,
63 char **outbuf, size_t *outbytesleft)
68 while (*inbytesleft >= 1 && *outbytesleft >= 2) {
69 unsigned char *c = (unsigned char *)*inbuf;
72 if ((c[0] & 0x80) == 0) {
74 } else if ((c[0] & 0xf0) == 0xe0) {
75 if (*inbytesleft < 3) {
76 LOG(log_debug, logtype_default, "short utf8 char");
79 uc = ((ucs2_t) (c[0] & 0x0f) << 12) | ((ucs2_t) (c[1] ^ 0x80) << 6) | (ucs2_t) (c[2] ^ 0x80);
81 } else if ((c[0] & 0xe0) == 0xc0) {
82 if (*inbytesleft < 2) {
83 LOG(log_debug, logtype_default, "short utf8 char");
86 uc = ((ucs2_t) (c[0] & 0x1f) << 6) | (ucs2_t) (c[1] ^ 0x80);
96 (*inbytesleft) -= len;
101 if (*inbytesleft > 0) {
113 /* ------------------------ */
114 static size_t utf8_push(void *cd, char **inbuf, size_t *inbytesleft,
115 char **outbuf, size_t *outbytesleft)
120 while (*inbytesleft >= 2 && *outbytesleft >= 1) {
121 unsigned char *c = (unsigned char *)*outbuf;
122 uc = SVAL((*inbuf),0);
126 if (*outbytesleft < 3) {
127 LOG(log_debug, logtype_default, "short utf8 write");
130 c[2] = 0x80 | (uc & 0x3f);
133 c[1] = 0x80 | (uc&0x3f);
138 } else if (uc >= 0x80) {
139 if (*outbytesleft < 2) {
140 LOG(log_debug, logtype_default, "short utf8 write");
143 c[1] = 0x80 | (uc&0x3f);
154 (*outbytesleft) -= len;
159 if (*inbytesleft == 1) {
164 if (*inbytesleft > 1) {