1 | /* Copyright (C) 1997-2023 Free Software Foundation, Inc. |
2 | This file is part of the GNU C Library. |
3 | |
4 | The GNU C Library is free software; you can redistribute it and/or |
5 | modify it under the terms of the GNU Lesser General Public |
6 | License as published by the Free Software Foundation; either |
7 | version 2.1 of the License, or (at your option) any later version. |
8 | |
9 | The GNU C Library is distributed in the hope that it will be useful, |
10 | but WITHOUT ANY WARRANTY; without even the implied warranty of |
11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
12 | Lesser General Public License for more details. |
13 | |
14 | You should have received a copy of the GNU Lesser General Public |
15 | License along with the GNU C Library; if not, see |
16 | <https://www.gnu.org/licenses/>. */ |
17 | |
18 | #ifndef _GCONV_INT_H |
19 | #define _GCONV_INT_H 1 |
20 | |
21 | #include "gconv.h" |
22 | #include <stdlib.h> /* For alloca used in macro below. */ |
23 | #include <ctype.h> /* For __toupper_l used in macro below. */ |
24 | #include <string.h> /* For strlen et al used in macro below. */ |
25 | #include <libc-lock.h> |
26 | |
27 | __BEGIN_DECLS |
28 | |
29 | |
30 | /* One alias definition: simply a pair of strings, FROMNAME and TONAME. */ |
31 | struct gconv_alias |
32 | { |
33 | char *fromname; /* NOTE(review): presumably the alias spelling -- confirm. */ |
34 | char *toname; /* NOTE(review): presumably the name the alias stands for -- confirm. */ |
35 | }; |
36 | |
37 | |
38 | /* Structure describing one loaded shared object. Normally these are |
39 | objects that perform conversions, but as a special case the db shared |
40 | object is also handled. */ |
41 | struct __gconv_loaded_object |
42 | { |
43 | /* Name of the object. It must be the first structure element. */ |
44 | const char *name; |
45 | |
46 | /* Reference counter for the db functionality. If no conversion is |
47 | needed we unload the db library. */ |
48 | int counter; |
49 | |
50 | /* The handle for the shared object. */ |
51 | void *handle; |
52 | |
53 | /* Pointers to the functions the module defines. */ |
54 | __gconv_fct fct; |
55 | __gconv_init_fct init_fct; |
56 | __gconv_end_fct end_fct; |
57 | }; |
58 | |
59 | |
60 | /* Description of an available conversion module. The LEFT, SAME and RIGHT members link descriptions together, ordered by prefix as noted on each member. */ |
61 | struct gconv_module |
62 | { |
63 | const char *from_string; /* NOTE(review): presumably the source charset name -- confirm. */ |
64 | const char *to_string; /* NOTE(review): presumably the target charset name -- confirm. */ |
65 | |
66 | int cost_hi; /* The cost is kept in two parts. NOTE(review): presumably cost_hi is the more significant one -- confirm. */ |
67 | int cost_lo; |
68 | |
69 | const char *module_name; |
70 | |
71 | struct gconv_module *left; /* Prefix smaller. */ |
72 | struct gconv_module *same; /* List of entries with identical prefix. */ |
73 | struct gconv_module *right; /* Prefix larger. */ |
74 | }; |
75 | |
76 | |
77 | /* The specification of the conversion that needs to be performed. It is populated by __gconv_create_spec and read by __gconv_open. */ |
78 | struct gconv_spec |
79 | { |
80 | char *fromcode; /* Source charset name, with any suffix options removed. */ |
81 | char *tocode; /* Destination charset name, with any suffix options removed. */ |
82 | bool translit; /* True if the "TRANSLIT" suffix option was found in tocode. */ |
83 | bool ignore; /* True if the "IGNORE" suffix option was found in tocode. */ |
84 | }; |
85 | |
86 | /* Flags for the FLAGS argument of `__gconv_open'. Each flag is a distinct bit. */ |
87 | enum |
88 | { |
89 | GCONV_AVOID_NOCONV = 1 << 0 |
90 | }; |
91 | |
92 | /* Special return value: when GCONV_AVOID_NOCONV is set and no conversion |
93 | is needed, __GCONV_NULCONV should be returned. */ |
94 | enum |
95 | { |
96 | __GCONV_NULCONV = -1 |
97 | }; |
98 | |
99 | /* Global variables. All of them are declared attribute_hidden. */ |
100 | |
101 | /* Database of alias names. */ |
102 | extern void *__gconv_alias_db attribute_hidden; |
103 | |
104 | /* Available modules. NOTE(review): this used to be described as an array, but it is declared as a pointer to a gconv_module, whose left/same/right links suggest a tree -- confirm. */ |
105 | extern struct gconv_module *__gconv_modules_db attribute_hidden; |
106 | |
107 | /* Value of the GCONV_PATH environment variable. */ |
108 | extern const char *__gconv_path_envvar attribute_hidden; |
109 | |
110 | /* Lock for the conversion database content. */ |
111 | __libc_lock_define (extern, __gconv_lock attribute_hidden) |
112 | |
113 | |
/* Normalize the charset name STR for the gconv functions, which expect
   the name to be in upper case and complete, including the trailing
   slashes if necessary.

   The value of the expression is a NUL-terminated `char *' copy of STR
   with every character converted by __toupper_l in the C locale, and
   then:
     - if STR contains no '/', "//" followed by SUFFIX is appended;
     - if STR contains exactly one '/', a single '/' is appended and
       SUFFIX is not used;
     - if STR contains two or more '/', nothing is appended.

   The copy is obtained with __alloca, so it lives in the stack frame of
   the function that uses the macro: it must not be freed and must not be
   used after that function returns.  This is also why this is a macro
   and not a function.

   STR and SUFFIX must be non-null strings.  Each is evaluated exactly
   once, before any other local of the macro is declared, so arguments
   with side effects are safe and cannot accidentally refer to the
   macro's own locals.  */
#define norm_add_slashes(str,suffix) \
  ({ \
    const char *__nas_str = (str); \
    const char *__nas_suffix = (suffix); \
    const char *cp = __nas_str; \
    char *result; \
    char *tmp; \
    size_t cnt = 0; \
    const size_t suffix_len = strlen (__nas_suffix); \
    \
    /* Count the slashes; afterwards CP points at the terminating NUL.  */ \
    while (*cp != '\0') \
      if (*cp++ == '/') \
        ++cnt; \
    \
    /* Room for the name, up to two slashes, the suffix and the NUL.  */ \
    tmp = result = __alloca (cp - __nas_str + 3 + suffix_len); \
    cp = __nas_str; \
    while (*cp != '\0') \
      *tmp++ = __toupper_l (*cp++, _nl_C_locobj_ptr); \
    if (cnt < 2) \
      { \
        *tmp++ = '/'; \
        if (cnt < 1) \
          { \
            *tmp++ = '/'; \
            if (suffix_len != 0) \
              tmp = __mempcpy (tmp, __nas_suffix, suffix_len); \
          } \
      } \
    *tmp = '\0'; \
    result; \
  })
145 | |
146 | |
147 | /* Return in *HANDLE a descriptor for the transformation. The function expects |
148 | the specification of the transformation in the structure pointed to by |
149 | CONV_SPEC. It only reads *CONV_SPEC and does not take ownership of it. FLAGS takes the GCONV_* flag values (currently GCONV_AVOID_NOCONV). */ |
150 | extern int __gconv_open (struct gconv_spec *conv_spec, |
151 | __gconv_t *handle, int flags); |
152 | libc_hidden_proto (__gconv_open) |
153 | |
154 | /* This function accepts the charset names of the source and destination of the |
155 | conversion and populates *conv_spec with an equivalent conversion |
156 | specification that may later be used by __gconv_open. The charset names |
157 | might contain options in the form of suffixes that alter the conversion, |
158 | e.g. "ISO-10646/UTF-8/TRANSLIT". It processes the charset names, ignoring |
159 | and truncating any suffix options in fromcode, and processing and truncating |
160 | any suffix options in tocode. Supported suffix options ("TRANSLIT" or |
161 | "IGNORE"), when found in tocode, cause the corresponding flag in *conv_spec |
162 | to be set to true. Unrecognized suffix options are silently discarded. If |
163 | the function succeeds, it returns conv_spec back to the caller. It returns |
164 | NULL upon failure. */ |
165 | extern struct gconv_spec * |
166 | __gconv_create_spec (struct gconv_spec *conv_spec, const char *fromcode, |
167 | const char *tocode); |
168 | libc_hidden_proto (__gconv_create_spec) |
169 | |
170 | /* This function frees all heap memory allocated by __gconv_create_spec. NOTE(review): whether the gconv_spec structure itself is also released is not visible from this header -- confirm. */ |
171 | extern void |
172 | __gconv_destroy_spec (struct gconv_spec *conv_spec); |
173 | libc_hidden_proto (__gconv_destroy_spec) |
174 | |
175 | /* Free resources associated with transformation descriptor CD. */ |
176 | extern int __gconv_close (__gconv_t cd) |
177 | attribute_hidden; |
178 | |
179 | /* Transform input from the buffer starting at *INBUF according to the |
180 | rules described by CD and place the result in the buffer starting at *OUTBUF. |
181 | Return number of non-identical conversions in *IRREVERSIBLE if this pointer is not null. NOTE(review): this comment used to speak of *INBYTESLEFT and *OUTBYTESLEFT, which are not parameters here; |
182 | INBUFEND and OUTBUFEND presumably mark the ends of the input and output buffers -- confirm. */ |
183 | extern int __gconv (__gconv_t cd, const unsigned char **inbuf, |
184 | const unsigned char *inbufend, unsigned char **outbuf, |
185 | unsigned char *outbufend, size_t *irreversible) |
186 | attribute_hidden; |
187 | |
188 | /* Return in *HANDLE a pointer to an array with *NSTEPS elements describing |
189 | the single steps necessary for transformation from FROMSET to TOSET. Note that TOSET is the first parameter. */ |
190 | extern int __gconv_find_transform (const char *toset, const char *fromset, |
191 | struct __gconv_step **handle, |
192 | size_t *nsteps, int flags) |
193 | attribute_hidden; |
194 | |
195 | /* Search for transformation in cache data. Takes the same parameters as __gconv_find_transform. */ |
196 | extern int __gconv_lookup_cache (const char *toset, const char *fromset, |
197 | struct __gconv_step **handle, size_t *nsteps, |
198 | int flags) |
199 | attribute_hidden; |
200 | |
201 | /* Compare the two names for whether they are the same after alias |
202 | expansion. This function uses the cache and fails if none is |
203 | loaded. */ |
204 | extern int __gconv_compare_alias_cache (const char *name1, const char *name2, |
205 | int *result) |
206 | attribute_hidden; |
207 | |
208 | /* Free data associated with a step's structure. */ |
209 | extern void __gconv_release_step (struct __gconv_step *step) |
210 | attribute_hidden; |
211 | |
212 | /* Read all the configuration data and cache it if not done so already. */ |
213 | extern void __gconv_load_conf (void) attribute_hidden; |
214 | |
215 | /* Try to read module cache file. */ |
216 | extern int __gconv_load_cache (void) attribute_hidden; |
217 | |
218 | /* Retrieve pointer to internal cache. NOTE(review): unlike most declarations in this header, this accessor and the two below are not marked attribute_hidden; presumably they must stay reachable from outside libc -- confirm. */ |
219 | extern void *__gconv_get_cache (void); |
220 | |
221 | /* Retrieve pointer to internal module database. */ |
222 | extern struct gconv_module *__gconv_get_modules_db (void); |
223 | |
224 | /* Retrieve pointer to internal alias database. */ |
225 | extern void *__gconv_get_alias_db (void); |
226 | |
227 | /* Comparison function used to search for an alias. */ |
228 | extern int __gconv_alias_compare (const void *p1, const void *p2) |
229 | attribute_hidden; |
230 | |
231 | /* Clear references to the implementations of the NSTEPS transformation steps in STEPS, which might |
232 | cause the code to be unloaded. */ |
233 | extern int __gconv_close_transform (struct __gconv_step *steps, |
234 | size_t nsteps) |
235 | attribute_hidden; |
236 | |
237 | /* Free all resources allocated for the transformation record when |
238 | using the cache. */ |
239 | extern void __gconv_release_cache (struct __gconv_step *steps, size_t nsteps) |
240 | attribute_hidden; |
241 | |
242 | /* Load the shared object named by NAME. If it is already loaded, increment its reference |
243 | count. */ |
244 | extern struct __gconv_loaded_object *__gconv_find_shlib (const char *name) |
245 | attribute_hidden; |
246 | |
247 | /* Release the shared object HANDLE. If no further reference is available, unload |
248 | the object. */ |
249 | extern void __gconv_release_shlib (struct __gconv_loaded_object *handle) |
250 | attribute_hidden; |
251 | |
252 | /* Fill STEP with information about builtin module with NAME. */ |
253 | extern void __gconv_get_builtin_trans (const char *name, |
254 | struct __gconv_step *step) |
255 | attribute_hidden; |
256 | |
257 | /* Transliteration using the locale's data. */ |
258 | extern int __gconv_transliterate (struct __gconv_step *step, |
259 | struct __gconv_step_data *step_data, |
260 | const unsigned char *inbufstart, |
261 | const unsigned char **inbufp, |
262 | const unsigned char *inbufend, |
263 | unsigned char **outbufstart, |
264 | size_t *irreversible); |
265 | libc_hidden_proto (__gconv_transliterate) |
266 | |
267 | /* NOTE(review): the previous comment here ("If NAME is an codeset alias expand it.") does not match this signature, which has no NAME parameter. Presumably this compares NAME1 and NAME2 after alias expansion, like __gconv_compare_alias_cache -- confirm against the definition. */ |
268 | extern int __gconv_compare_alias (const char *name1, const char *name2) |
269 | attribute_hidden; |
270 | |
271 | |
/* Builtin transformations.  */
#ifdef _LIBC
/* Declare the builtin transformation function NAME.  Every builtin
   transformation has the same signature, so the declarations below are
   all generated from this one template.  */
# define __BUILTIN_TRANSFORM(Name) \
  extern int Name (struct __gconv_step *step, \
                   struct __gconv_step_data *data, \
                   const unsigned char **inbuf, \
                   const unsigned char *inbufend, \
                   unsigned char **outbufstart, size_t *irreversible, \
                   int do_flush, int consume_incomplete)

__BUILTIN_TRANSFORM (__gconv_transform_ascii_internal);
__BUILTIN_TRANSFORM (__gconv_transform_internal_ascii);
__BUILTIN_TRANSFORM (__gconv_transform_utf8_internal);
__BUILTIN_TRANSFORM (__gconv_transform_internal_utf8);
__BUILTIN_TRANSFORM (__gconv_transform_ucs2_internal);
__BUILTIN_TRANSFORM (__gconv_transform_internal_ucs2);
__BUILTIN_TRANSFORM (__gconv_transform_ucs2reverse_internal);
__BUILTIN_TRANSFORM (__gconv_transform_internal_ucs2reverse);
__BUILTIN_TRANSFORM (__gconv_transform_internal_ucs4);
__BUILTIN_TRANSFORM (__gconv_transform_ucs4_internal);
__BUILTIN_TRANSFORM (__gconv_transform_internal_ucs4le);
__BUILTIN_TRANSFORM (__gconv_transform_ucs4le_internal);
__BUILTIN_TRANSFORM (__gconv_transform_internal_utf16);
__BUILTIN_TRANSFORM (__gconv_transform_utf16_internal);
/* The template is only needed for the declarations above.  The name
   given here must match the #define exactly; otherwise the macro stays
   defined in every file that includes this header.  */
# undef __BUILTIN_TRANSFORM

/* Specialized conversion function for a single byte to INTERNAL, recognizing
   only ASCII characters.  */
extern wint_t __gconv_btwoc_ascii (struct __gconv_step *step, unsigned char c);

#endif
303 | |
304 | __END_DECLS |
305 | |
306 | #endif /* gconv_int.h */ |
307 | |