1 /* Copyright (C) 1996-2022 Free Software Foundation, Inc.
2    This file is part of the GNU C Library.
3 
4    The GNU C Library is free software; you can redistribute it and/or
5    modify it under the terms of the GNU Lesser General Public
6    License as published by the Free Software Foundation; either
7    version 2.1 of the License, or (at your option) any later version.
8 
9    The GNU C Library is distributed in the hope that it will be useful,
10    but WITHOUT ANY WARRANTY; without even the implied warranty of
11    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
12    Lesser General Public License for more details.
13 
14    You should have received a copy of the GNU Lesser General Public
15    License along with the GNU C Library; if not, see
16    <https://www.gnu.org/licenses/>.  */
17 
18 #include <assert.h>
19 #include <errno.h>
20 #include <locale.h>
21 #include <stdlib.h>
22 #include <string.h>
23 #include <unistd.h>
24 #ifdef _POSIX_MAPPED_FILES
25 # include <sys/mman.h>
26 #endif
27 
28 #include "localeinfo.h"
29 #include "../iconv/gconv_charset.h"
30 #include "../iconv/gconv_int.h"
31 
32 
#ifdef NL_CURRENT_INDIRECT
/* Declare the per-category data object _nl_C_CATEGORY for every category
   listed in categories.def.  The declarations are weak references, so a
   category whose data object is not present yields a zero address (see
   the table below).  */
# define DEFINE_CATEGORY(category, category_name, items, a) \
extern struct __locale_data _nl_C_##category; \
weak_extern (_nl_C_##category)
# include "categories.def"
# undef	DEFINE_CATEGORY

/* Array indexed by category of pointers to _nl_C_CATEGORY slots.
   Elements are zero for categories whose data is never used.  */
struct __locale_data *const _nl_C[] attribute_hidden =
  {
# define DEFINE_CATEGORY(category, category_name, items, a) \
    [category] = &_nl_C_##category,
# include "categories.def"
# undef	DEFINE_CATEGORY
  };
#else
/* Without NL_CURRENT_INDIRECT no separate table is built; _nl_C is
   simply the __locales member of _nl_C_locobj.  */
# define _nl_C		(_nl_C_locobj.__locales)
#endif
52 
53 
54 /* For each category we keep a list of records for the locale files
55    which are somehow addressed.  */
56 struct loaded_l10nfile *_nl_locale_file_list[__LC_LAST];
57 
58 const char _nl_default_locale_path[] attribute_hidden = COMPLOCALEDIR;
59 
/* Checks if the name is actually present, that is, not NULL and not
   empty.  Returns 1 if NAME points to a string with at least one
   character, 0 otherwise.  */
static inline int
name_present (const char *name)
{
  return name != NULL && name[0] != '\0';
}
67 
/* Checks that the locale name is neither extremely long, nor contains a
   ".." path component (to prevent directory traversal).

   NAME must be a non-NULL, NUL-terminated string.  Returns 1 if the name
   is acceptable and 0 if it has to be rejected.  A name is rejected when

     - it is longer than 255 bytes,
     - it contains ".." as a path component (alone, at the start, in the
       middle or at the end of the name), or
     - it contains a slash but does not start with one.  */
static inline int
valid_locale_name (const char *name)
{
  size_t namelen = strlen (name);

  /* Name too long.  The limit is arbitrary and prevents stack overflow
     issues later.  */
  if (__glibc_unlikely (namelen > 255))
    return 0;

  /* Directory traversal attempt: ".." in the middle of the name.  The
     pattern is deliberately not NUL-terminated; __memmem is given its
     exact length.  */
  static const char slashdot[4] = {'/', '.', '.', '/'};
  if (__glibc_unlikely (__memmem (name, namelen,
                                  slashdot, sizeof (slashdot)) != NULL))
    return 0;

  /* The name is exactly "..".  */
  if (namelen == 2 && __glibc_unlikely (name[0] == '.' && name[1] == '.'))
    return 0;

  /* The name starts with "../" or ends with "/..".  The length check
     keeps the name[namelen - 3] access inside the string.  */
  if (namelen >= 3
      && __glibc_unlikely (((name[0] == '.'
                             && name[1] == '.'
                             && name[2] == '/')
                            || (name[namelen - 3] == '/'
                                && name[namelen - 2] == '.'
                                && name[namelen - 1] == '.'))))
    return 0;

  /* If there is a slash in the name, it must start with one.  */
  if (__glibc_unlikely (memchr (name, '/', namelen) != NULL) && name[0] != '/')
    return 0;

  return 1;
}
99 
100 struct __locale_data *
_nl_find_locale(const char * locale_path,size_t locale_path_len,int category,const char ** name)101 _nl_find_locale (const char *locale_path, size_t locale_path_len,
102 		 int category, const char **name)
103 {
104   int mask;
105   /* Name of the locale for this category.  */
106   const char *cloc_name = *name;
107   const char *language;
108   const char *modifier;
109   const char *territory;
110   const char *codeset;
111   const char *normalized_codeset;
112   struct loaded_l10nfile *locale_file;
113 
114   if (cloc_name[0] == '\0')
115     {
116       /* The user decides which locale to use by setting environment
117 	 variables.  */
118       cloc_name = getenv ("LC_ALL");
119       if (!name_present (cloc_name))
120 	cloc_name = getenv (_nl_category_names_get (category));
121       if (!name_present (cloc_name))
122 	cloc_name = getenv ("LANG");
123       if (!name_present (cloc_name))
124 	cloc_name = _nl_C_name;
125     }
126 
127   /* We used to fall back to the C locale if the name contains a slash
128      character '/', but we now check for directory traversal in
129      valid_locale_name, so this is no longer necessary.  */
130 
131   if (__builtin_expect (strcmp (cloc_name, _nl_C_name), 1) == 0
132       || __builtin_expect (strcmp (cloc_name, _nl_POSIX_name), 1) == 0)
133     {
134       /* We need not load anything.  The needed data is contained in
135 	 the library itself.  */
136       *name = _nl_C_name;
137       return _nl_C[category];
138     }
139   else if (!valid_locale_name (cloc_name))
140     {
141       __set_errno (EINVAL);
142       return NULL;
143     }
144 
145   *name = cloc_name;
146 
147   /* We really have to load some data.  First we try the archive,
148      but only if there was no LOCPATH environment variable specified.  */
149   if (__glibc_likely (locale_path == NULL))
150     {
151       struct __locale_data *data
152 	= _nl_load_locale_from_archive (category, name);
153       if (__glibc_likely (data != NULL))
154 	return data;
155 
156       /* Nothing in the archive with the given name.  Expanding it as
157 	 an alias and retry.  */
158       cloc_name = _nl_expand_alias (*name);
159       if (cloc_name != NULL)
160 	{
161 	  data = _nl_load_locale_from_archive (category, &cloc_name);
162 	  if (__builtin_expect (data != NULL, 1))
163 	    return data;
164 	}
165 
166       /* Nothing in the archive.  Set the default path to search below.  */
167       locale_path = _nl_default_locale_path;
168       locale_path_len = sizeof _nl_default_locale_path;
169     }
170   else
171     /* We really have to load some data.  First see whether the name is
172        an alias.  Please note that this makes it impossible to have "C"
173        or "POSIX" as aliases.  */
174     cloc_name = _nl_expand_alias (*name);
175 
176   if (cloc_name == NULL)
177     /* It is no alias.  */
178     cloc_name = *name;
179 
180   /* Make a writable copy of the locale name.  */
181   char *loc_name = strdupa (cloc_name);
182 
183   /* LOCALE can consist of up to four recognized parts for the XPG syntax:
184 
185 		language[_territory[.codeset]][@modifier]
186 
187      Beside the first all of them are allowed to be missing.  If the
188      full specified locale is not found, the less specific one are
189      looked for.  The various part will be stripped off according to
190      the following order:
191 		(1) codeset
192 		(2) normalized codeset
193 		(3) territory
194 		(4) modifier
195    */
196   mask = _nl_explode_name (loc_name, &language, &modifier, &territory,
197 			   &codeset, &normalized_codeset);
198   if (mask == -1)
199     /* Memory allocate problem.  */
200     return NULL;
201 
202   /* If exactly this locale was already asked for we have an entry with
203      the complete name.  */
204   locale_file = _nl_make_l10nflist (&_nl_locale_file_list[category],
205 				    locale_path, locale_path_len, mask,
206 				    language, territory, codeset,
207 				    normalized_codeset, modifier,
208 				    _nl_category_names_get (category), 0);
209 
210   if (locale_file == NULL)
211     {
212       /* Find status record for addressed locale file.  We have to search
213 	 through all directories in the locale path.  */
214       locale_file = _nl_make_l10nflist (&_nl_locale_file_list[category],
215 					locale_path, locale_path_len, mask,
216 					language, territory, codeset,
217 					normalized_codeset, modifier,
218 					_nl_category_names_get (category), 1);
219       if (locale_file == NULL)
220 	/* This means we are out of core.  */
221 	return NULL;
222     }
223 
224   /* The space for normalized_codeset is dynamically allocated.  Free it.  */
225   if (mask & XPG_NORM_CODESET)
226     free ((void *) normalized_codeset);
227 
228   if (locale_file->decided == 0)
229     _nl_load_locale (locale_file, category);
230 
231   if (locale_file->data == NULL)
232     {
233       int cnt;
234       for (cnt = 0; locale_file->successor[cnt] != NULL; ++cnt)
235 	{
236 	  if (locale_file->successor[cnt]->decided == 0)
237 	    _nl_load_locale (locale_file->successor[cnt], category);
238 	  if (locale_file->successor[cnt]->data != NULL)
239 	    break;
240 	}
241       /* Move the entry we found (or NULL) to the first place of
242 	 successors.  */
243       locale_file->successor[0] = locale_file->successor[cnt];
244       locale_file = locale_file->successor[cnt];
245 
246       if (locale_file == NULL)
247 	return NULL;
248     }
249 
250   /* The LC_CTYPE category allows to check whether a locale is really
251      usable.  If the locale name contains a charset name and the
252      charset name used in the locale (present in the LC_CTYPE data) is
253      not the same (after resolving aliases etc) we reject the locale
254      since using it would irritate users expecting the charset named
255      in the locale name.  */
256   if (codeset != NULL)
257     {
258       /* Get the codeset information from the locale file.  */
259       static const int codeset_idx[] =
260 	{
261 	  [__LC_CTYPE] = _NL_ITEM_INDEX (CODESET),
262 	  [__LC_NUMERIC] = _NL_ITEM_INDEX (_NL_NUMERIC_CODESET),
263 	  [__LC_TIME] = _NL_ITEM_INDEX (_NL_TIME_CODESET),
264 	  [__LC_COLLATE] = _NL_ITEM_INDEX (_NL_COLLATE_CODESET),
265 	  [__LC_MONETARY] = _NL_ITEM_INDEX (_NL_MONETARY_CODESET),
266 	  [__LC_MESSAGES] = _NL_ITEM_INDEX (_NL_MESSAGES_CODESET),
267 	  [__LC_PAPER] = _NL_ITEM_INDEX (_NL_PAPER_CODESET),
268 	  [__LC_NAME] = _NL_ITEM_INDEX (_NL_NAME_CODESET),
269 	  [__LC_ADDRESS] = _NL_ITEM_INDEX (_NL_ADDRESS_CODESET),
270 	  [__LC_TELEPHONE] = _NL_ITEM_INDEX (_NL_TELEPHONE_CODESET),
271 	  [__LC_MEASUREMENT] = _NL_ITEM_INDEX (_NL_MEASUREMENT_CODESET),
272 	  [__LC_IDENTIFICATION] = _NL_ITEM_INDEX (_NL_IDENTIFICATION_CODESET)
273 	};
274       const struct __locale_data *data;
275       const char *locale_codeset;
276       char *clocale_codeset;
277       char *ccodeset;
278 
279       data = (const struct __locale_data *) locale_file->data;
280       locale_codeset =
281 	(const char *) data->values[codeset_idx[category]].string;
282       assert (locale_codeset != NULL);
283       /* Note the length of the allocated memory: +3 for up to two slashes
284 	 and the NUL byte.  */
285       clocale_codeset = (char *) alloca (strlen (locale_codeset) + 3);
286       strip (clocale_codeset, locale_codeset);
287 
288       ccodeset = (char *) alloca (strlen (codeset) + 3);
289       strip (ccodeset, codeset);
290 
291       if (__gconv_compare_alias (upstr (ccodeset, ccodeset),
292 				 upstr (clocale_codeset,
293 					clocale_codeset)) != 0)
294 	/* The codesets are not identical, don't use the locale.  */
295 	return NULL;
296     }
297 
298   /* Determine the locale name for which loading succeeded.  This
299      information comes from the file name.  The form is
300      <path>/<locale>/LC_foo.  We must extract the <locale> part.  */
301   if (((const struct __locale_data *) locale_file->data)->name == NULL)
302     {
303       char *cp, *endp;
304 
305       endp = strrchr (locale_file->filename, '/');
306       cp = endp - 1;
307       while (cp[-1] != '/')
308 	--cp;
309       ((struct __locale_data *) locale_file->data)->name
310 	= __strndup (cp, endp - cp);
311     }
312 
313   /* Determine whether the user wants transliteration or not.  */
314   if (modifier != NULL
315       && __strcasecmp_l (modifier, "TRANSLIT", _nl_C_locobj_ptr) == 0)
316     ((struct __locale_data *) locale_file->data)->use_translit = 1;
317 
318   /* Increment the usage count.  */
319   if (((const struct __locale_data *) locale_file->data)->usage_count
320       < MAX_USAGE_COUNT)
321     ++((struct __locale_data *) locale_file->data)->usage_count;
322 
323   return (struct __locale_data *) locale_file->data;
324 }
325 
326 
327 /* Calling this function assumes the lock for handling global locale data
328    is acquired.  */
329 void
_nl_remove_locale(int locale,struct __locale_data * data)330 _nl_remove_locale (int locale, struct __locale_data *data)
331 {
332   if (--data->usage_count == 0)
333     {
334       if (data->alloc != ld_archive)
335 	{
336 	  /* First search the entry in the list of loaded files.  */
337 	  struct loaded_l10nfile *ptr = _nl_locale_file_list[locale];
338 
339 	  /* Search for the entry.  It must be in the list.  Otherwise it
340 	     is a bug and we crash badly.  */
341 	  while ((struct __locale_data *) ptr->data != data)
342 	    ptr = ptr->next;
343 
344 	  /* Mark the data as not available anymore.  So when the data has
345 	     to be used again it is reloaded.  */
346 	  ptr->decided = 0;
347 	  ptr->data = NULL;
348 	}
349 
350       /* This does the real work.  */
351       _nl_unload_locale (locale, data);
352     }
353 }
354