1/* Copyright (C) 2002-2023 Free Software Foundation, Inc.
2 This file is part of the GNU C Library.
3
4 The GNU C Library is free software; you can redistribute it and/or
5 modify it under the terms of the GNU Lesser General Public
6 License as published by the Free Software Foundation; either
7 version 2.1 of the License, or (at your option) any later version.
8
9 The GNU C Library is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 Lesser General Public License for more details.
13
14 You should have received a copy of the GNU Lesser General Public
15 License along with the GNU C Library; if not, see
16 <https://www.gnu.org/licenses/>. */
17
18#include <assert.h>
19#include <ctype.h>
20#include <string.h>
21#include "wcsmbsload.h"
22#include <dlfcn.h>
23#include <errno.h>
24#include <gconv.h>
25#include <stdlib.h>
26#include <string.h>
27#include <wchar.h>
28#include <wcsmbsload.h>
29
30#include <pointer_guard.h>
31
/* Fall back to EINVAL on configurations whose <errno.h> does not
   provide EILSEQ, so the error path below always has a value to set.  */
#if !defined EILSEQ
# define EILSEQ EINVAL
#endif
35
36
37size_t
38attribute_hidden
39__mbsrtowcs_l (wchar_t *dst, const char **src, size_t len, mbstate_t *ps,
40 locale_t l)
41{
42 struct __gconv_step_data data;
43 size_t result;
44 int status;
45 struct __gconv_step *towc;
46 size_t non_reversible;
47 const struct gconv_fcts *fcts;
48
49 /* Tell where we want the result. */
50 data.__invocation_counter = 0;
51 data.__internal_use = 1;
52 data.__flags = __GCONV_IS_LAST;
53 data.__statep = ps;
54
55 /* Get the conversion functions. */
56 fcts = get_gconv_fcts (l->__locales[LC_CTYPE]);
57
58 /* Get the structure with the function pointers. */
59 towc = fcts->towc;
60 __gconv_fct fct = towc->__fct;
61 if (towc->__shlib_handle != NULL)
62 PTR_DEMANGLE (fct);
63
64 /* We have to handle DST == NULL special. */
65 if (dst == NULL)
66 {
67 mbstate_t temp_state;
68 wchar_t buf[64]; /* Just an arbitrary size. */
69 const unsigned char *inbuf = (const unsigned char *) *src;
70 const unsigned char *srcend = inbuf + strlen (*src) + 1;
71
72 temp_state = *data.__statep;
73 data.__statep = &temp_state;
74
75 result = 0;
76 data.__outbufend = (unsigned char *) buf + sizeof (buf);
77 do
78 {
79 data.__outbuf = (unsigned char *) buf;
80
81 status = DL_CALL_FCT (fct, (towc, &data, &inbuf, srcend, NULL,
82 &non_reversible, 0, 1));
83
84 result += (wchar_t *) data.__outbuf - buf;
85 }
86 while (status == __GCONV_FULL_OUTPUT);
87
88 if (status == __GCONV_OK || status == __GCONV_EMPTY_INPUT)
89 {
90 /* There better should be a NUL wide char at the end. */
91 assert (((wchar_t *) data.__outbuf)[-1] == L'\0');
92 /* Don't count the NUL character in. */
93 --result;
94 }
95 }
96 else
97 {
98 /* This code is based on the safe assumption that all internal
99 multi-byte encodings use the NUL byte only to mark the end
100 of the string. */
101 const unsigned char *srcp = (const unsigned char *) *src;
102 const unsigned char *srcend;
103
104 data.__outbuf = (unsigned char *) dst;
105 data.__outbufend = data.__outbuf + len * sizeof (wchar_t);
106
107 status = __GCONV_FULL_OUTPUT;
108
109 while (len > 0)
110 {
111 /* Pessimistic guess as to how much input we can use. In the
112 worst case we need one input byte for one output wchar_t. */
113 srcend = srcp + __strnlen ((const char *) srcp, len) + 1;
114
115 status = DL_CALL_FCT (fct, (towc, &data, &srcp, srcend, NULL,
116 &non_reversible, 0, 1));
117 if ((status != __GCONV_EMPTY_INPUT
118 && status != __GCONV_INCOMPLETE_INPUT)
119 /* Not all input read. */
120 || srcp != srcend
121 /* Reached the end of the input. */
122 || srcend[-1] == '\0')
123 break;
124
125 len = (wchar_t *) data.__outbufend - (wchar_t *) data.__outbuf;
126 }
127
128 /* Make the end if the input known to the caller. */
129 *src = (const char *) srcp;
130
131 result = (wchar_t *) data.__outbuf - dst;
132
133 /* We have to determine whether the last character converted
134 is the NUL character. */
135 if ((status == __GCONV_OK || status == __GCONV_EMPTY_INPUT)
136 && ((wchar_t *) dst)[result - 1] == L'\0')
137 {
138 assert (result > 0);
139 assert (__mbsinit (data.__statep));
140 *src = NULL;
141 --result;
142 }
143 }
144
145 /* There must not be any problems with the conversion but illegal input
146 characters. */
147 assert (status == __GCONV_OK || status == __GCONV_EMPTY_INPUT
148 || status == __GCONV_ILLEGAL_INPUT
149 || status == __GCONV_INCOMPLETE_INPUT
150 || status == __GCONV_FULL_OUTPUT);
151
152 if (status != __GCONV_OK && status != __GCONV_FULL_OUTPUT
153 && status != __GCONV_EMPTY_INPUT && status != __GCONV_INCOMPLETE_INPUT)
154 {
155 result = (size_t) -1;
156 __set_errno (EILSEQ);
157 }
158
159 return result;
160}
161