summaryrefslogtreecommitdiffabout
path: root/src/utf8conv.c
blob: 0318853ae257d5bd09717fe53f986e2367519ce7 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
/* This file is part of Idest.
   Copyright (C) 2016, 2017 Sergey Poznyakoff
 
   Idest is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3, or (at your option)
   any later version.
 
   Idest is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.
 
   You should have received a copy of the GNU General Public License
   along with Idest.  If not, see <http://www.gnu.org/licenses/>. */

#include "idest.h"
#include <limits.h>
#include <localcharset.h>
#ifdef HAVE_ICONV_H
# include <iconv.h>
#endif

#ifndef ICONV_CONST
# define ICONV_CONST
#endif

#ifndef HAVE_ICONV
# undef iconv_open
# define iconv_open(tocode, fromcode) ((iconv_t) -1)
# undef iconv
# define iconv(cd, inbuf, inbytesleft, outbuf, outbytesleft) ((size_t) 0)
# undef iconv_close
# define iconv_close(cd) 0
#endif

char const *charset;
char const *broken_8bit_charset;

static iconv_t conv_desc[] = { (iconv_t) -1, (iconv_t) -1, (iconv_t) -1 };

static iconv_t
utf8_init(int mode)
{
	if (!charset)
		charset = locale_charset();
	if (conv_desc[mode] == (iconv_t) -1) {
		switch (mode) {
		case idest_conv_decode:
			conv_desc[mode] = iconv_open(charset, "UTF-8");
			break;

		case idest_conv_encode:
			conv_desc[mode] = iconv_open("UTF-8", charset);
			break;

		case idest_conv_recode:
			conv_desc[mode] = iconv_open("UTF-8", broken_8bit_charset);
		}
	}
	return conv_desc[mode];
}

int
utf8_convert(int mode, char const *input, char **output)
{
	char ICONV_CONST *ib;
	char *bufptr, *ob;
	size_t inlen;
	size_t outlen;
	size_t rc;
	iconv_t cd = utf8_init(mode);
	
	if (cd == 0) {
		*output = xstrdup(input);
		return 0;
	} else if (cd == (iconv_t)-1)
		return -1;

	inlen = strlen(input) + 1;
	outlen = inlen * MB_LEN_MAX + 1;
	ob = bufptr = xmalloc(outlen);
	ib = (char ICONV_CONST *) input;
	rc = iconv(cd, &ib, &inlen, &ob, &outlen);
	if (rc == (size_t)-1) {
		free(bufptr);
		return -1;
	}

	*ob = 0;
	*output = bufptr;
	return 0;
}

Return to:

Send suggestions and report system problems to the System administrator.