1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
|
/* Conversions between Unicode and legacy encodings.
Copyright (C) 2002, 2005, 2007, 2009 Free Software Foundation, Inc.
This program is free software: you can redistribute it and/or modify it
under the terms of the GNU Lesser General Public License as published
by the Free Software Foundation; either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public License
along with this program. If not, see <http://www.gnu.org/licenses/>. */
#ifndef _UNICONV_H
#define _UNICONV_H
/* Get size_t. */
#include <stddef.h>
#include "unitypes.h"
/* Get enum iconv_ilseq_handler. */
#include <unistring/iconveh.h>
/* Get locale_charset() declaration. */
#include <unistring/localcharset.h>
#ifdef __cplusplus
extern "C" {
#endif
/* Converts an entire string, possibly including NUL bytes, from one encoding
to a Unicode encoding.
Converts a memory region given in encoding FROMCODE. FROMCODE is as for
iconv_open(3).
HANDLER is one of the enum iconv_ilseq_handler values declared in
<unistring/iconveh.h>. NOTE(review): presumably it selects how input that
cannot be converted is treated; confirm against that header.
The input is in the memory region between SRC (inclusive) and SRC + SRCLEN
(exclusive); SRC is a char pointer, so SRCLEN counts bytes.
If OFFSETS is not NULL, it should point to an array of SRCLEN integers; this
array is filled with offsets into the result, i.e. the character starting
at SRC[i] corresponds to the character starting at RESULT[OFFSETS[i]], where
RESULT is the returned string, and other offsets are set to (size_t)(-1).
RESULTBUF and *LENGTHP should initially be a scratch buffer and its size,
or RESULTBUF can be NULL.
May erase the contents of the memory at RESULTBUF.
If successful: The resulting Unicode string (non-NULL) is returned and its
length stored in *LENGTHP. The resulting string is RESULTBUF if no dynamic
memory allocation was necessary, or a freshly allocated memory block
otherwise. Callers therefore have to compare the return value with RESULTBUF
to find out whether a new block was handed to them. NOTE(review): such a
block is presumably to be released with free(); confirm.
In case of error: NULL is returned and errno is set. Particular errno
values: EINVAL, EILSEQ, ENOMEM. */
/* Variant whose result is made of uint8_t units. */
extern uint8_t *
u8_conv_from_encoding (const char *fromcode,
enum iconv_ilseq_handler handler,
const char *src, size_t srclen,
size_t *offsets,
uint8_t *resultbuf, size_t *lengthp);
/* Variant whose result is made of uint16_t units. */
extern uint16_t *
u16_conv_from_encoding (const char *fromcode,
enum iconv_ilseq_handler handler,
const char *src, size_t srclen,
size_t *offsets,
uint16_t *resultbuf, size_t *lengthp);
/* Variant whose result is made of uint32_t units. */
extern uint32_t *
u32_conv_from_encoding (const char *fromcode,
enum iconv_ilseq_handler handler,
const char *src, size_t srclen,
size_t *offsets,
uint32_t *resultbuf, size_t *lengthp);
/* Converts an entire Unicode string, possibly including NUL units, from a
Unicode encoding to a given encoding.
Converts a memory region to encoding TOCODE. TOCODE is as for
iconv_open(3).
HANDLER is one of the enum iconv_ilseq_handler values declared in
<unistring/iconveh.h>. NOTE(review): presumably it selects how characters
that cannot be represented in TOCODE are treated; confirm against that
header.
The input is in the memory region between SRC (inclusive) and SRC + SRCLEN
(exclusive); SRCLEN therefore counts units of SRC's element type, not bytes.
If OFFSETS is not NULL, it should point to an array of SRCLEN integers; this
array is filled with offsets into the result, i.e. the character starting
at SRC[i] corresponds to the character starting at RESULT[OFFSETS[i]], where
RESULT is the returned string, and other offsets are set to (size_t)(-1).
RESULTBUF and *LENGTHP should initially be a scratch buffer and its size,
or RESULTBUF can be NULL.
May erase the contents of the memory at RESULTBUF.
If successful: The resulting string (non-NULL) is returned and its length
stored in *LENGTHP. The resulting string is RESULTBUF if no dynamic memory
allocation was necessary, or a freshly allocated memory block otherwise.
Callers therefore have to compare the return value with RESULTBUF to find
out whether a new block was handed to them. NOTE(review): such a block is
presumably to be released with free(); confirm.
In case of error: NULL is returned and errno is set. Particular errno
values: EINVAL, EILSEQ, ENOMEM. */
/* Variant whose input is made of uint8_t units. */
extern char *
u8_conv_to_encoding (const char *tocode,
enum iconv_ilseq_handler handler,
const uint8_t *src, size_t srclen,
size_t *offsets,
char *resultbuf, size_t *lengthp);
/* Variant whose input is made of uint16_t units. */
extern char *
u16_conv_to_encoding (const char *tocode,
enum iconv_ilseq_handler handler,
const uint16_t *src, size_t srclen,
size_t *offsets,
char *resultbuf, size_t *lengthp);
/* Variant whose input is made of uint32_t units. */
extern char *
u32_conv_to_encoding (const char *tocode,
enum iconv_ilseq_handler handler,
const uint32_t *src, size_t srclen,
size_t *offsets,
char *resultbuf, size_t *lengthp);
/* Converts a NUL terminated string from a given encoding.
STRING is the NUL terminated input; FROMCODE names its encoding.
NOTE(review): FROMCODE is presumably as for iconv_open(3), like the FROMCODE
argument of the *_conv_from_encoding functions declared in this header;
confirm.
HANDLER is one of the enum iconv_ilseq_handler values declared in
<unistring/iconveh.h>. NOTE(review): presumably it selects how input that
cannot be converted is treated; confirm against that header.
The result is malloc allocated, or NULL (with errno set) in case of error.
A non-NULL result belongs to the caller, who releases it with free().
Particular errno values: EILSEQ, ENOMEM. */
/* Variant whose result is made of uint8_t units. */
extern uint8_t *
u8_strconv_from_encoding (const char *string,
const char *fromcode,
enum iconv_ilseq_handler handler);
/* Variant whose result is made of uint16_t units. */
extern uint16_t *
u16_strconv_from_encoding (const char *string,
const char *fromcode,
enum iconv_ilseq_handler handler);
/* Variant whose result is made of uint32_t units. */
extern uint32_t *
u32_strconv_from_encoding (const char *string,
const char *fromcode,
enum iconv_ilseq_handler handler);
/* Converts a NUL terminated string to a given encoding.
STRING is the NUL terminated input; TOCODE names the target encoding.
NOTE(review): TOCODE is presumably as for iconv_open(3), like the TOCODE
argument of the *_conv_to_encoding functions declared in this header;
confirm.
HANDLER is one of the enum iconv_ilseq_handler values declared in
<unistring/iconveh.h>. NOTE(review): presumably it selects how characters
that cannot be represented in TOCODE are treated; confirm against that
header.
The result is malloc allocated, or NULL (with errno set) in case of error.
A non-NULL result belongs to the caller, who releases it with free().
Particular errno values: EILSEQ, ENOMEM. */
/* Variant whose input is made of uint8_t units. */
extern char *
u8_strconv_to_encoding (const uint8_t *string,
const char *tocode,
enum iconv_ilseq_handler handler);
/* Variant whose input is made of uint16_t units. */
extern char *
u16_strconv_to_encoding (const uint16_t *string,
const char *tocode,
enum iconv_ilseq_handler handler);
/* Variant whose input is made of uint32_t units. */
extern char *
u32_strconv_to_encoding (const uint32_t *string,
const char *tocode,
enum iconv_ilseq_handler handler);
/* Converts a NUL terminated string from the locale encoding.
STRING is the NUL terminated input. No encoding name and no handler are
passed; the source encoding is the locale's.
NOTE(review): presumably the locale encoding is the one reported by
locale_charset() from <unistring/localcharset.h>; confirm.
The result is malloc allocated, or NULL (with errno set) in case of error.
A non-NULL result belongs to the caller, who releases it with free().
Particular errno values: ENOMEM. */
/* Variant whose result is made of uint8_t units. */
extern uint8_t *
u8_strconv_from_locale (const char *string);
/* Variant whose result is made of uint16_t units. */
extern uint16_t *
u16_strconv_from_locale (const char *string);
/* Variant whose result is made of uint32_t units. */
extern uint32_t *
u32_strconv_from_locale (const char *string);
/* Converts a NUL terminated string to the locale encoding.
STRING is the NUL terminated Unicode input. No encoding name and no handler
are passed; the target encoding is the locale's.
NOTE(review): presumably the locale encoding is the one reported by
locale_charset() from <unistring/localcharset.h>; confirm.
The result is malloc allocated, or NULL (with errno set) in case of error.
A non-NULL result belongs to the caller, who releases it with free().
Particular errno values: ENOMEM. */
/* Variant whose input is made of uint8_t units. */
extern char *
u8_strconv_to_locale (const uint8_t *string);
/* Variant whose input is made of uint16_t units. */
extern char *
u16_strconv_to_locale (const uint16_t *string);
/* Variant whose input is made of uint32_t units. */
extern char *
u32_strconv_to_locale (const uint32_t *string);
#ifdef __cplusplus
}
#endif
#endif /* _UNICONV_H */
|