1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
|
/* ****************************************************************************
* conv/utf8_to_wchar.c -- UTF-8 to `wchar_t`.
*
* Copyright (C) 2017 Thomas "Cakeisalie5" Touhey <thomas@touhey.fr>
*
* This file is part of the 'all/iconv' module in libcarrot, an experimental
* modular libc project.
*
* This file is free software: you can redistribute it and/or modify it under
* the terms of the GNU Lesser General Public License as published by the Free
* Software Foundation, either version 3 of the License, or (at your option)
* any later version.
*
* This file is distributed in the hope that it will be useful, but WITHOUT ANY
* WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
* FOR A PARTICULAR PURPOSE. See the GNU Lesser General Lesser Public License
* for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with this file. If not, see <http://www.gnu.org/licenses/>.
* ************************************************************************* */
#include "../iconv.h"
#define set_utf8_cookie(c_count, c_ini) { \
count = (c_count); \
val = (c_ini); }
/**
* __iconv_utf8_to_wchar:
* Convert one UTF-8 sequence to a wchar_t.
*
* @arg step the step data.
* @return the error code (0 if ok).
*/
int __iconv_utf8_to_wchar(struct __iconv_step *step)
{
int byte = *step->in;
wchar_t *out; wchar_t val;
int outleft;
/* Initialize the output. */
if (step->next) {
/* Next step input buffer. */
step->next->in = (void*)&val;
step->next->inleft = sizeof(wchar_t);
outleft = sizeof(wchar_t);
out = &val;
/* Next step output buffer. */
step->next->out = step->out;
step->next->outleft = step->outleft;
} else {
out = (wchar_t*)step->out;
outleft = step->outleft;
}
/* Check if too big. */
if (outleft < (int)sizeof(wchar_t))
return (I_E2BIG);
/* Check if it's special. */
if (byte & 0x80) {
unsigned char *in = (void*)step->in;
int count;
if (~byte & 0x40) {
/* error: not a starting byte! */
return (I_EILSEQ);
}
/* Make the cookie. */
if (~byte & 0x20)
set_utf8_cookie(1, byte & 0x1F)
else if (~byte & 0x10)
set_utf8_cookie(2, byte & 0x0F)
else if (~byte & 0x08)
set_utf8_cookie(3, byte & 0x07)
else if (~byte & 0x04)
set_utf8_cookie(4, byte & 0x03)
else if (~byte & 0x02)
set_utf8_cookie(5, byte & 0x01)
else {
/* error: not a valid starting byte */
return (I_EILSEQ);
}
/* Get the data. */
if (step->inleft - 1 < count)
return (I_EINVAL);
step->in += count;
step->inleft -= count;
while (--count) {
int byte = *++in;
if (~byte & 0x80 || byte & 0x40) {
/* not a valid continuation byte! */
return (I_EILSEQ);
}
val = (val << 6) | (byte & 0x3F);
}
} else val = byte;
/* Put into the final thing. */
*out = val;
/* Call next step, end otherwise. */
if (step->next)
return ((*step->next_func)(step->next));
return (0);
}
|